Commit
·
245b41b
1
Parent(s):
70bae09
Training in progress, epoch 1
Browse files
- added_tokens.json +4 -0
- config.json +1 -1
- model.safetensors +2 -2
- runs/Dec18_12-23-38_a0b19801e9d5/events.out.tfevents.1702902237.a0b19801e9d5.3244.7 +3 -0
- runs/Dec18_12-24-17_a0b19801e9d5/events.out.tfevents.1702902262.a0b19801e9d5.3244.8 +3 -0
- runs/Dec18_12-32-54_a0b19801e9d5/events.out.tfevents.1702902779.a0b19801e9d5.3244.9 +3 -0
- runs/Dec18_12-37-33_a0b19801e9d5/events.out.tfevents.1702903057.a0b19801e9d5.3244.10 +3 -0
- special_tokens_map.json +16 -0
- tokenizer.json +18 -0
- tokenizer_config.json +20 -0
- training_args.bin +1 -1
added_tokens.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<English>": 50258,
|
3 |
+
"<Korean>": 50257
|
4 |
+
}
|
config.json
CHANGED
@@ -42,5 +42,5 @@
|
|
42 |
"torch_dtype": "float32",
|
43 |
"transformers_version": "4.35.2",
|
44 |
"use_cache": true,
|
45 |
-
"vocab_size":
|
46 |
}
|
|
|
42 |
"torch_dtype": "float32",
|
43 |
"transformers_version": "4.35.2",
|
44 |
"use_cache": true,
|
45 |
+
"vocab_size": 50259
|
46 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65425e2f42c3924afa3ff76d108ec0393264cefd6b7a9728ad28df98878aa009
|
3 |
+
size 327664072
|
runs/Dec18_12-23-38_a0b19801e9d5/events.out.tfevents.1702902237.a0b19801e9d5.3244.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8738b8f7d0fd4059419dc8f8d90d65d7e8e55152fc5e1e9822e2f59a841f91fc
|
3 |
+
size 4585
|
runs/Dec18_12-24-17_a0b19801e9d5/events.out.tfevents.1702902262.a0b19801e9d5.3244.8
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0268673e515e85e75c9999917a4842e241c073f3cc307a0b8af7a33b9f93e464
|
3 |
+
size 5213
|
runs/Dec18_12-32-54_a0b19801e9d5/events.out.tfevents.1702902779.a0b19801e9d5.3244.9
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5bd0c9b9625328d29b313221c635ca145ea3647bc09ad7e2effa3df784f43b8
|
3 |
+
size 4585
|
runs/Dec18_12-37-33_a0b19801e9d5/events.out.tfevents.1702903057.a0b19801e9d5.3244.10
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67cfaf6806867c0d062ff4386bca6ce6ca0a2c8d3ffc3f98497fc1daf23a0d73
|
3 |
+
size 7451
|
special_tokens_map.json
CHANGED
@@ -1,4 +1,20 @@
|
|
1 |
{
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2 |
"bos_token": "<|endoftext|>",
|
3 |
"eos_token": "<|endoftext|>",
|
4 |
"pad_token": "<|endoftext|>",
|
|
|
1 |
{
|
2 |
+
"additional_special_tokens": [
|
3 |
+
{
|
4 |
+
"content": "<Korean>",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false
|
9 |
+
},
|
10 |
+
{
|
11 |
+
"content": "<English>",
|
12 |
+
"lstrip": false,
|
13 |
+
"normalized": false,
|
14 |
+
"rstrip": false,
|
15 |
+
"single_word": false
|
16 |
+
}
|
17 |
+
],
|
18 |
"bos_token": "<|endoftext|>",
|
19 |
"eos_token": "<|endoftext|>",
|
20 |
"pad_token": "<|endoftext|>",
|
tokenizer.json
CHANGED
@@ -25,6 +25,24 @@
|
|
25 |
"rstrip": false,
|
26 |
"normalized": true,
|
27 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
28 |
}
|
29 |
],
|
30 |
"normalizer": null,
|
|
|
25 |
"rstrip": false,
|
26 |
"normalized": true,
|
27 |
"special": true
|
28 |
+
},
|
29 |
+
{
|
30 |
+
"id": 50257,
|
31 |
+
"content": "<Korean>",
|
32 |
+
"single_word": false,
|
33 |
+
"lstrip": false,
|
34 |
+
"rstrip": false,
|
35 |
+
"normalized": false,
|
36 |
+
"special": true
|
37 |
+
},
|
38 |
+
{
|
39 |
+
"id": 50258,
|
40 |
+
"content": "<English>",
|
41 |
+
"single_word": false,
|
42 |
+
"lstrip": false,
|
43 |
+
"rstrip": false,
|
44 |
+
"normalized": false,
|
45 |
+
"special": true
|
46 |
}
|
47 |
],
|
48 |
"normalizer": null,
|
tokenizer_config.json
CHANGED
@@ -8,8 +8,28 @@
|
|
8 |
"rstrip": false,
|
9 |
"single_word": false,
|
10 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
11 |
}
|
12 |
},
|
|
|
|
|
|
|
|
|
13 |
"bos_token": "<|endoftext|>",
|
14 |
"clean_up_tokenization_spaces": true,
|
15 |
"eos_token": "<|endoftext|>",
|
|
|
8 |
"rstrip": false,
|
9 |
"single_word": false,
|
10 |
"special": true
|
11 |
+
},
|
12 |
+
"50257": {
|
13 |
+
"content": "<Korean>",
|
14 |
+
"lstrip": false,
|
15 |
+
"normalized": false,
|
16 |
+
"rstrip": false,
|
17 |
+
"single_word": false,
|
18 |
+
"special": true
|
19 |
+
},
|
20 |
+
"50258": {
|
21 |
+
"content": "<English>",
|
22 |
+
"lstrip": false,
|
23 |
+
"normalized": false,
|
24 |
+
"rstrip": false,
|
25 |
+
"single_word": false,
|
26 |
+
"special": true
|
27 |
}
|
28 |
},
|
29 |
+
"additional_special_tokens": [
|
30 |
+
"<Korean>",
|
31 |
+
"<English>"
|
32 |
+
],
|
33 |
"bos_token": "<|endoftext|>",
|
34 |
"clean_up_tokenization_spaces": true,
|
35 |
"eos_token": "<|endoftext|>",
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cd05ea9dfe6c6eeeb3e0d3bb2947a05305fbf2109d158fec6f3b1c2a6a570d5
|
3 |
size 4600
|