racai-andrei committed on
Commit 8af97e9 · 1 Parent(s): bc67776

Delete parameters.json

Files changed (1)
  1. parameters.json +0 -51
parameters.json DELETED
@@ -1,51 +0,0 @@
- {
- "force": true,
- "dump_path": "distilmulti-bert-base-ro_dir/checkpoints",
- "data_file": "data/binarized_text_merged.bert-base-ro-cased.bin",
- "student_type": "distilbert",
- "student_config": "training_configs/distilbert-base-uncased.json",
- "student_pretrained_weights": "distilmulti-bert-base-ro_dir/distilmulti-bert-base-ro.pth",
- "teacher_type": "bert",
- "teacher_name": "bert-base-ro-cased",
- "temperature": 2.0,
- "alpha_ce": 0.65,
- "alpha_mlm": 0.25,
- "alpha_clm": 0.0,
- "alpha_mse": 0.0,
- "alpha_cos": 0.1,
- "mlm": true,
- "mlm_mask_prop": 0.15,
- "word_mask": 0.8,
- "word_keep": 0.1,
- "word_rand": 0.1,
- "mlm_smoothing": 0.7,
- "token_counts": "data/token_counts.bert-base-ro.pickle",
- "restrict_ce_to_mask": false,
- "freeze_pos_embs": true,
- "freeze_token_type_embds": false,
- "n_epoch": 3,
- "batch_size": 8,
- "group_by_size": true,
- "gradient_accumulation_steps": 32,
- "warmup_prop": 0.05,
- "weight_decay": 0.005,
- "learning_rate": 0.0005,
- "adam_epsilon": 1e-06,
- "max_grad_norm": 5.0,
- "initializer_range": 0.02,
- "fp16": true,
- "fp16_opt_level": "O1",
- "n_gpu": 1,
- "local_rank": 0,
- "seed": 56,
- "log_interval": 500,
- "checkpoint_interval": 4000,
- "n_nodes": 1,
- "node_id": 0,
- "global_rank": 0,
- "world_size": 1,
- "n_gpu_per_node": 1,
- "multi_gpu": false,
- "is_master": true,
- "multi_node": false
- }
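
For context, the deleted file holds knowledge-distillation hyperparameters ("temperature", the "alpha_*" loss weights, masking proportions). Below is a minimal sketch, not the original training script, of how such weights are typically combined in a DistilBERT-style distillation step; the tensor names (student_logits, teacher_logits, labels, student_hidden, teacher_hidden) are placeholders, and the alpha_clm / alpha_mse terms are omitted because they are 0.0 in this config.

# Hypothetical illustration of the loss weighting implied by parameters.json.
import torch
import torch.nn.functional as F

temperature = 2.0
alpha_ce, alpha_mlm, alpha_cos = 0.65, 0.25, 0.1

def distillation_loss(student_logits, teacher_logits, labels, student_hidden, teacher_hidden):
    # Soft-target term (alpha_ce): KL divergence between temperature-scaled
    # student and teacher distributions, rescaled by temperature**2.
    loss_ce = F.kl_div(
        F.log_softmax(student_logits / temperature, dim=-1),
        F.softmax(teacher_logits / temperature, dim=-1),
        reduction="batchmean",
    ) * (temperature ** 2)
    # Hard-target term (alpha_mlm): regular masked-LM cross-entropy on the labels.
    loss_mlm = F.cross_entropy(
        student_logits.view(-1, student_logits.size(-1)),
        labels.view(-1),
        ignore_index=-100,
    )
    # Hidden-state alignment term (alpha_cos): cosine loss pulling the student's
    # representations toward the teacher's.
    target = torch.ones(student_hidden.size(0), device=student_hidden.device)
    loss_cos = F.cosine_embedding_loss(student_hidden, teacher_hidden, target)
    return alpha_ce * loss_ce + alpha_mlm * loss_mlm + alpha_cos * loss_cos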