Training in progress, step 125
Browse files- benchmarks.shelve.bak +2 -2
- benchmarks.shelve.dat +0 -0
- benchmarks.shelve.dir +2 -2
- logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8, warmup_ratio=0.1/events.out.tfevents.1727027042.1c1a426a2fee +3 -0
- logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8/events.out.tfevents.1727026091.1c1a426a2fee +3 -0
- logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8/events.out.tfevents.1727026979.1c1a426a2fee +0 -0
- model.safetensors +1 -1
- training_args.bin +1 -1
benchmarks.shelve.bak
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
'teacher', (0, 13436)
|
2 |
-
'distily_tinyBenchmarks/logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8', (13824,
|
3 |
-
'logis/teacher', (27648,
|
|
|
1 |
'teacher', (0, 13436)
|
2 |
+
'distily_tinyBenchmarks/logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8', (13824, 448)
|
3 |
+
'logis/teacher', (27648, 448)
|
benchmarks.shelve.dat
CHANGED
Binary files a/benchmarks.shelve.dat and b/benchmarks.shelve.dat differ
|
|
benchmarks.shelve.dir
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
'teacher', (0, 13436)
|
2 |
-
'distily_tinyBenchmarks/logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8', (13824,
|
3 |
-
'logis/teacher', (27648,
|
|
|
1 |
'teacher', (0, 13436)
|
2 |
+
'distily_tinyBenchmarks/logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8', (13824, 448)
|
3 |
+
'logis/teacher', (27648, 448)
|
logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8, warmup_ratio=0.1/events.out.tfevents.1727027042.1c1a426a2fee
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e25ccdd0021f36ebd92ac4e946cc9ac8cf15a8773cea8eaa9b56d433b538fa7
|
3 |
+
size 9199
|
logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8/events.out.tfevents.1727026091.1c1a426a2fee
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:737e88e22d14bdb28dc024f0db7d4a04276d19b98956856b1dc267ae69124d0f
|
3 |
+
size 511
|
logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8/events.out.tfevents.1727026979.1c1a426a2fee
ADDED
File without changes
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 325669528
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db9e2804f336617d31f89b54279052b1d16570381c6c703c5a8f76b581be9374
|
3 |
size 325669528
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5688
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c160784e6306b46c5f159ce424ff2114c638bddc9a4fedcb0074202ba9e6621
|
3 |
size 5688
|