damienbenveniste committed on
Commit
e71c099
·
verified ·
1 Parent(s): e2d7e11

Training in progress, step 125

Browse files
config.json CHANGED
@@ -3,8 +3,10 @@
3
  "architectures": [
4
  "MistralForSequenceClassification"
5
  ],
 
6
  "bos_token_id": 1,
7
  "eos_token_id": 2,
 
8
  "hidden_act": "silu",
9
  "hidden_size": 768,
10
  "initializer_range": 0.02,
@@ -20,7 +22,7 @@
20
  "sliding_window": 768,
21
  "tie_word_embeddings": false,
22
  "torch_dtype": "float32",
23
- "transformers_version": "4.35.2",
24
  "use_cache": true,
25
  "vocab_size": 32000
26
  }
 
3
  "architectures": [
4
  "MistralForSequenceClassification"
5
  ],
6
+ "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 2,
9
+ "head_dim": 48,
10
  "hidden_act": "silu",
11
  "hidden_size": 768,
12
  "initializer_range": 0.02,
 
22
  "sliding_window": 768,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "float32",
25
+ "transformers_version": "4.44.2",
26
  "use_cache": true,
27
  "vocab_size": 32000
28
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87c3d9e4c849616fb721fa88f241470c321c56c0f1ad30d540075740237e784f
3
  size 239899848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e02d7fb650b0d80e4b4c573b72abb01167d69aeda6ca8c733ba34ef89c4bbbb
3
  size 239899848
tokenizer.json CHANGED
@@ -36,23 +36,13 @@
36
  "special": true
37
  }
38
  ],
39
- "normalizer": {
40
- "type": "Sequence",
41
- "normalizers": [
42
- {
43
- "type": "Prepend",
44
- "prepend": "▁"
45
- },
46
- {
47
- "type": "Replace",
48
- "pattern": {
49
- "String": " "
50
- },
51
- "content": "▁"
52
- }
53
- ]
54
  },
55
- "pre_tokenizer": null,
56
  "post_processor": {
57
  "type": "TemplateProcessing",
58
  "single": [
@@ -139,6 +129,7 @@
139
  "end_of_word_suffix": null,
140
  "fuse_unk": true,
141
  "byte_fallback": true,
 
142
  "vocab": {
143
  "<unk>": 0,
144
  "<s>": 1,
 
36
  "special": true
37
  }
38
  ],
39
+ "normalizer": null,
40
+ "pre_tokenizer": {
41
+ "type": "Metaspace",
42
+ "replacement": "▁",
43
+ "prepend_scheme": "first",
44
+ "split": false
 
 
 
 
 
 
 
 
 
45
  },
 
46
  "post_processor": {
47
  "type": "TemplateProcessing",
48
  "single": [
 
129
  "end_of_word_suffix": null,
130
  "fuse_unk": true,
131
  "byte_fallback": true,
132
+ "ignore_merges": false,
133
  "vocab": {
134
  "<unk>": 0,
135
  "<s>": 1,
tokenizer_config.json CHANGED
@@ -1,4 +1,7 @@
1
  {
 
 
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<unk>",
@@ -29,8 +32,8 @@
29
  "bos_token": "<s>",
30
  "clean_up_tokenization_spaces": false,
31
  "eos_token": "</s>",
32
- "legacy": true,
33
- "max_length": 30000,
34
  "model_max_length": 1000000000000000019884624838656,
35
  "pad_to_multiple_of": null,
36
  "pad_token": "</s>",
 
1
  {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "add_prefix_space": null,
5
  "added_tokens_decoder": {
6
  "0": {
7
  "content": "<unk>",
 
32
  "bos_token": "<s>",
33
  "clean_up_tokenization_spaces": false,
34
  "eos_token": "</s>",
35
+ "legacy": false,
36
+ "max_length": 512,
37
  "model_max_length": 1000000000000000019884624838656,
38
  "pad_to_multiple_of": null,
39
  "pad_token": "</s>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e2bb060d61518375f44121ee4894d0fc41e84753f635b4c2502ca6d8770b8f1
3
- size 4536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e74ef77809653d0f2da60c9bed7aed627936675cd46d134fdae657da36847a97
3
+ size 5176