Saving weights and logs of step 5000
Browse files
- config.json +1 -1
- events.out.tfevents.1640186853.t1v-n-ccbf3e94-w-0.1752357.3.v2 +3 -0
- flax_model.msgpack +1 -1
- run_w5.sh +2 -2
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"RobertaForMaskedLM"
|
5 |
],
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "./",
|
3 |
"architectures": [
|
4 |
"RobertaForMaskedLM"
|
5 |
],
|
events.out.tfevents.1640186853.t1v-n-ccbf3e94-w-0.1752357.3.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b704dcdc54412f4a6883f964ca3cc45da8651d27f71d251eb2bb04304acb6b
|
3 |
+
size 228246
|
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 498796983
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c0ef99d6b6e1a47ad00474100dd3a3c9c17c8cec41fde77b1252184054f2168
|
3 |
size 498796983
|
run_w5.sh
CHANGED
@@ -3,8 +3,8 @@
|
|
3 |
--model_type="roberta" \
|
4 |
--config_name="./" \
|
5 |
--tokenizer_name="./" \
|
6 |
-
--train_file="/mnt/disks/flaxdisk/
|
7 |
-
--validation_file="/mnt/disks/flaxdisk/
|
8 |
--max_seq_length="128" \
|
9 |
--weight_decay="0.01" \
|
10 |
--per_device_train_batch_size="128" \
|
|
|
3 |
--model_type="roberta" \
|
4 |
--config_name="./" \
|
5 |
--tokenizer_name="./" \
|
6 |
+
--train_file="/mnt/disks/flaxdisk/NCC_small/data/train-shard-0001-of-0001.json" \
|
7 |
+
--validation_file="/mnt/disks/flaxdisk/NCC_small/data/validation-shard-0001-of-0001.json" \
|
8 |
--max_seq_length="128" \
|
9 |
--weight_decay="0.01" \
|
10 |
--per_device_train_batch_size="128" \
|