hoang14 committed on
Commit
43000e1
1 Parent(s): 0d100ad

Create README.md

Browse files
Files changed (1) hide show
  1. README.md +31 -0
README.md ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ DATASET = "task-focus + sample from remain datasets"
2
+
3
+ DATASET_FORMAT = 'input-output'
4
+
5
+ PER_DEVICE_TRAIN_BATCH_SIZE = 2
6
+
7
+ GRADIENT_ACCUMULATION_STEPS = 4
8
+
9
+ LEARNING_RATE = 0.0003
10
+
11
+ LR_SCHEDULER_TYPE = 'cosine'
12
+
13
+ WARMUP_RATIO = 0.03
14
+
15
+ LORA_R = 192
16
+
17
+ LORA_ALPHA = 32
18
+
19
+ LORA_DROPOUT = 0.1
20
+
21
+ TRAIN_ON_SOURCE = False
22
+
23
+ SOURCE_MAX_LENGTH = 1024
24
+
25
+ TARGET_MAX_LENGTH = 1024
26
+
27
+ LOGGING_STEPS = 20
28
+
29
+ SAVE_STEPS = 100
30
+
31
+ SAVE_TOTAL_LIMIT = 4