dreeven committed on
Commit
ace156e
·
1 Parent(s): b2ea088

End of training

Browse files
README.md CHANGED
@@ -39,7 +39,7 @@ The following hyperparameters were used during training:
39
  - seed: 42
40
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
41
  - lr_scheduler_type: linear
42
- - num_epochs: 100
43
 
44
  ### Training results
45
 
 
39
  - seed: 42
40
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
41
  - lr_scheduler_type: linear
42
+ - num_epochs: 350
43
 
44
  ### Training results
45
 
runs/Jul27_05-31-40_cdr2647.int.cedar.computecanada.ca/events.out.tfevents.1690461107.cdr2647.int.cedar.computecanada.ca.108270.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a87706f2e0d451333557e217f7410bc7b8c64cb341ef33aa4a5b3f6b948cc9e1
3
- size 30507
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cf57391e2d6673693742240bb7a5b5e4a472291562773dbfeb4bc7300f74ea0
3
+ size 30861
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 512,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 512
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 1024,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 1024
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,