lapp0 commited on
Commit
ab8e9a5
·
verified ·
1 Parent(s): 681429a

Training in progress, step 125

Browse files
benchmarks.shelve.bak CHANGED
@@ -1,3 +1,4 @@
1
  'teacher', (0, 13436)
2
  'distily_tinyBenchmarks/logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8', (13824, 448)
3
  'logis/teacher', (27648, 448)
 
 
1
  'teacher', (0, 13436)
2
  'distily_tinyBenchmarks/logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8', (13824, 448)
3
  'logis/teacher', (27648, 448)
4
+ 'distily_tinyBenchmarks/logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8, warmup_ratio=0.1', (41472, 448)
benchmarks.shelve.dat CHANGED
Binary files a/benchmarks.shelve.dat and b/benchmarks.shelve.dat differ
 
benchmarks.shelve.dir CHANGED
@@ -1,3 +1,4 @@
1
  'teacher', (0, 13436)
2
  'distily_tinyBenchmarks/logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8', (13824, 448)
3
  'logis/teacher', (27648, 448)
 
 
1
  'teacher', (0, 13436)
2
  'distily_tinyBenchmarks/logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8', (13824, 448)
3
  'logis/teacher', (27648, 448)
4
+ 'distily_tinyBenchmarks/logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8, warmup_ratio=0.1', (41472, 448)
logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8, warmup_ratio=0.1/events.out.tfevents.1727027678.1c1a426a2fee ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b975f74ccba1b3ee1db3870dfb7833adaa613431b4e57d772a290207eb697d38
3
+ size 511
logs/harness_benchmarks=tinyBenchmarks, learning_rate=0.0001, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8, warmup_ratio=0.1/events.out.tfevents.1727028505.1c1a426a2fee ADDED
File without changes
logs/harness_benchmarks=tinyBenchmarks, learning_rate=5e-05, lr_scheduler_kwargs=__power___0.7___lr_end___2e-05_, lr_scheduler_type=polynomial, per_device_train_batch_size=8/events.out.tfevents.1727028561.1c1a426a2fee ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ca6861b734eea2bd17b0d0f62385e313032c1595bbbd5fcc024ef3152b47503
3
+ size 9160
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db9e2804f336617d31f89b54279052b1d16570381c6c703c5a8f76b581be9374
3
  size 325669528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c024fbbddc1e8a8bfbd824fa9879a31110848613d8a486329849c18b6c97d4d
3
  size 325669528
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c160784e6306b46c5f159ce424ff2114c638bddc9a4fedcb0074202ba9e6621
3
- size 5688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e1058fc06d8c6819fe512ee297f98cd7b3c2b58c8a87a4ddce8a838e68eb05a
3
+ size 5624