photonmz commited on
Commit
945d036
·
0 Parent(s):

Initial commit

Browse files
.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
checkpoints/epoch_10.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9120ed17f0c15b9d8afec43161a7b7ea2efecd6df42743a2cf25e90ff488be69
3
+ size 9938341609
checkpoints/epoch_20.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a887b12720ec4c107c87f2064c279d25f276621163606cc74fbcb768eb987121
3
+ size 9938341609
checkpoints/epoch_latest.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:843e5811c55bd6cdfbb33b97eec5b9a56fe68f8baa2f400f7f69009724329c6f
3
+ size 9938247015
checkpoints/results.jsonl ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"image_to_text_mean_rank": 150.0776568587935, "image_to_text_median_rank": 11.0, "image_to_text_R@1": 0.08706166868198308, "image_to_text_R@5": 0.32715302969232835, "image_to_text_R@10": 0.4866317345156523, "text_to_image_mean_rank": 106.41354292623942, "text_to_image_median_rank": 11.0, "text_to_image_R@1": 0.09095794706435577, "text_to_image_R@5": 0.32567513099556633, "text_to_image_R@10": 0.4874378610775225, "clip_val_loss": 0.832438588142395, "epoch": 1, "num_samples": 7443}
2
+ {"image_to_text_mean_rank": 123.40131667338439, "image_to_text_median_rank": 10.0, "image_to_text_R@1": 0.10506516189708451, "image_to_text_R@5": 0.3556361682117426, "image_to_text_R@10": 0.5230417842267903, "text_to_image_mean_rank": 89.46903130458149, "text_to_image_median_rank": 9.0, "text_to_image_R@1": 0.10090017466075507, "text_to_image_R@5": 0.35832325675130994, "text_to_image_R@10": 0.5253258094854225, "clip_val_loss": 0.7709452509880066, "epoch": 2, "num_samples": 7443}
3
+ {"image_to_text_mean_rank": 121.00591159478705, "image_to_text_median_rank": 9.0, "image_to_text_R@1": 0.10143759236866855, "image_to_text_R@5": 0.36705629450490396, "image_to_text_R@10": 0.5406422141609566, "text_to_image_mean_rank": 80.4937525191455, "text_to_image_median_rank": 9.0, "text_to_image_R@1": 0.10143759236866855, "text_to_image_R@5": 0.3666532312239688, "text_to_image_R@10": 0.541851404003762, "clip_val_loss": 0.7330073714256287, "epoch": 3, "num_samples": 7443}
4
+ {"image_to_text_mean_rank": 119.51914550584442, "image_to_text_median_rank": 9.0, "image_to_text_R@1": 0.1099019212683058, "image_to_text_R@5": 0.37820771194410857, "image_to_text_R@10": 0.5417170495767836, "text_to_image_mean_rank": 83.68896950154507, "text_to_image_median_rank": 9.0, "text_to_image_R@1": 0.11003627569528417, "text_to_image_R@5": 0.3779390030901518, "text_to_image_R@10": 0.5472255810828967, "clip_val_loss": 0.7334970831871033, "epoch": 4, "num_samples": 7443}
5
+ {"image_to_text_mean_rank": 112.08235926373774, "image_to_text_median_rank": 8.0, "image_to_text_R@1": 0.10788660486363026, "image_to_text_R@5": 0.3882842939674862, "image_to_text_R@10": 0.5593174795109499, "text_to_image_mean_rank": 77.26225984146177, "text_to_image_median_rank": 8.0, "text_to_image_R@1": 0.11191723767298133, "text_to_image_R@5": 0.3878812306865511, "text_to_image_R@10": 0.5531371758699449, "clip_val_loss": 0.710077702999115, "epoch": 5, "num_samples": 7443}
6
+ {"image_to_text_mean_rank": 110.78704823323929, "image_to_text_median_rank": 9.0, "image_to_text_R@1": 0.11057369340319763, "image_to_text_R@5": 0.38492543329302703, "image_to_text_R@10": 0.5543463657127502, "text_to_image_mean_rank": 74.08464328899638, "text_to_image_median_rank": 8.0, "text_to_image_R@1": 0.11460432621254871, "text_to_image_R@5": 0.39164315464194543, "text_to_image_R@10": 0.5625419857584307, "clip_val_loss": 0.6953209638595581, "epoch": 6, "num_samples": 7443}
7
+ {"image_to_text_mean_rank": 108.28483138519414, "image_to_text_median_rank": 8.0, "image_to_text_R@1": 0.11164852881902458, "image_to_text_R@5": 0.3944645976084912, "image_to_text_R@10": 0.5699314792422411, "text_to_image_mean_rank": 71.48354158269515, "text_to_image_median_rank": 8.0, "text_to_image_R@1": 0.11608222490931076, "text_to_image_R@5": 0.40037619239553945, "text_to_image_R@10": 0.5671100362756953, "clip_val_loss": 0.680811882019043, "epoch": 7, "num_samples": 7443}
8
+ {"image_to_text_mean_rank": 95.73035066505442, "image_to_text_median_rank": 8.0, "image_to_text_R@1": 0.1185006045949214, "image_to_text_R@5": 0.3984952304178423, "image_to_text_R@10": 0.5716780867929598, "text_to_image_mean_rank": 66.8242644095123, "text_to_image_median_rank": 8.0, "text_to_image_R@1": 0.12118769313448878, "text_to_image_R@5": 0.40252586322719336, "text_to_image_R@10": 0.5779927448609432, "clip_val_loss": 0.6552522778511047, "epoch": 8, "num_samples": 7443}
9
+ {"image_to_text_mean_rank": 107.53835818890232, "image_to_text_median_rank": 8.0, "image_to_text_R@1": 0.11514174392046218, "image_to_text_R@5": 0.40870616686819833, "image_to_text_R@10": 0.5857853016256885, "text_to_image_mean_rank": 68.347843611447, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.12575574365175332, "text_to_image_R@5": 0.4169017869138788, "text_to_image_R@10": 0.5906220609969098, "clip_val_loss": 0.6697020530700684, "epoch": 9, "num_samples": 7443}
10
+ {"image_to_text_mean_rank": 92.24949617089884, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.1275023512024721, "image_to_text_R@5": 0.4194545210264678, "image_to_text_R@10": 0.5955931747951095, "text_to_image_mean_rank": 62.04151551793632, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.12562138922477495, "text_to_image_R@5": 0.4265753056563214, "text_to_image_R@10": 0.5949214026602176, "clip_val_loss": 0.640340268611908, "epoch": 10, "num_samples": 7443}
11
+ {"image_to_text_mean_rank": 105.58739755474943, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.12521832594383986, "image_to_text_R@5": 0.4233507994088405, "image_to_text_R@10": 0.5978772000537418, "text_to_image_mean_rank": 65.34609700389628, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.12400913610103453, "text_to_image_R@5": 0.42039500201531643, "text_to_image_R@10": 0.5933091495364772, "clip_val_loss": 0.663438618183136, "epoch": 11, "num_samples": 7443}
12
+ {"image_to_text_mean_rank": 90.01813784764208, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.1266962246406019, "image_to_text_R@5": 0.4311433561735859, "image_to_text_R@10": 0.6095660352008598, "text_to_image_mean_rank": 58.37444578798871, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.1309955663039097, "text_to_image_R@5": 0.43624882439876395, "text_to_image_R@10": 0.6121187693134489, "clip_val_loss": 0.6251317858695984, "epoch": 12, "num_samples": 7443}
13
+ {"image_to_text_mean_rank": 100.03157329033992, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.1336826548434771, "image_to_text_R@5": 0.4350396345559586, "image_to_text_R@10": 0.6117157060325138, "text_to_image_mean_rank": 60.34569394061534, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.13784764207980654, "text_to_image_R@5": 0.43893591293833134, "text_to_image_R@10": 0.6117157060325138, "clip_val_loss": 0.6327502727508545, "epoch": 13, "num_samples": 7443}
14
+ {"image_to_text_mean_rank": 81.72376729813247, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.13825070536074163, "image_to_text_R@5": 0.4396076850732232, "image_to_text_R@10": 0.6203143893591294, "text_to_image_mean_rank": 52.97635362085181, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.13086121187693134, "text_to_image_R@5": 0.4429665457476824, "text_to_image_R@10": 0.6113126427515787, "clip_val_loss": 0.6010527610778809, "epoch": 14, "num_samples": 7443}
15
+ {"image_to_text_mean_rank": 89.35617358591966, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.13784764207980654, "image_to_text_R@5": 0.4460566975681849, "image_to_text_R@10": 0.6208518070670429, "text_to_image_mean_rank": 57.76676071476555, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.1379819965067849, "text_to_image_R@5": 0.44780330511890365, "text_to_image_R@10": 0.6238076044605669, "clip_val_loss": 0.6247494220733643, "epoch": 15, "num_samples": 7443}
16
+ {"image_to_text_mean_rank": 82.66008329974473, "image_to_text_median_rank": 6.0, "image_to_text_R@1": 0.14564019884455193, "image_to_text_R@5": 0.45425231761386536, "image_to_text_R@10": 0.6337498320569662, "text_to_image_mean_rank": 54.96345559586188, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.14241569259707107, "text_to_image_R@5": 0.45640198844551927, "text_to_image_R@10": 0.634018540910923, "clip_val_loss": 0.605738639831543, "epoch": 16, "num_samples": 7443}
17
+ {"image_to_text_mean_rank": 81.23552331049308, "image_to_text_median_rank": 6.0, "image_to_text_R@1": 0.14429665457476823, "image_to_text_R@5": 0.46123874781674057, "image_to_text_R@10": 0.6415423888217117, "text_to_image_mean_rank": 52.43678624210668, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.14940212279994625, "text_to_image_R@5": 0.46688163374983205, "text_to_image_R@10": 0.6393927179900578, "clip_val_loss": 0.5852788090705872, "epoch": 17, "num_samples": 7443}
18
+ {"image_to_text_mean_rank": 74.80545478973532, "image_to_text_median_rank": 6.0, "image_to_text_R@1": 0.14644632540642213, "image_to_text_R@5": 0.4726588741099019, "image_to_text_R@10": 0.648931882305522, "text_to_image_mean_rank": 49.20609969098482, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.15558242644095122, "text_to_image_R@5": 0.4809888485825608, "text_to_image_R@10": 0.6497380088673922, "clip_val_loss": 0.5786479115486145, "epoch": 18, "num_samples": 7443}
19
+ {"image_to_text_mean_rank": 77.01074835415827, "image_to_text_median_rank": 6.0, "image_to_text_R@1": 0.15934435039634556, "image_to_text_R@5": 0.4821980384253661, "image_to_text_R@10": 0.6596802364637915, "text_to_image_mean_rank": 48.961708988311166, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.1574633884186484, "text_to_image_R@5": 0.4831385194142147, "text_to_image_R@10": 0.6604863630256617, "clip_val_loss": 0.5690401196479797, "epoch": 19, "num_samples": 7443}
20
+ {"image_to_text_mean_rank": 79.00806126561871, "image_to_text_median_rank": 6.0, "image_to_text_R@1": 0.1652559451833938, "image_to_text_R@5": 0.4987236329437055, "image_to_text_R@10": 0.6753997044202606, "text_to_image_mean_rank": 49.19145505844418, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.163509337632675, "text_to_image_R@5": 0.4909310761789601, "text_to_image_R@10": 0.6658605401047965, "clip_val_loss": 0.5861181616783142, "epoch": 20, "num_samples": 7443}
21
+ {"image_to_text_mean_rank": 83.14644632540642, "image_to_text_median_rank": 5.0, "image_to_text_R@1": 0.17103318554346367, "image_to_text_R@5": 0.5083971516861481, "image_to_text_R@10": 0.6786242106677415, "text_to_image_mean_rank": 50.80988848582561, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.16901786913878813, "text_to_image_R@5": 0.49442429128039767, "text_to_image_R@10": 0.6706972994760177, "clip_val_loss": 0.592087984085083, "epoch": 21, "num_samples": 7443}
22
+ {"image_to_text_mean_rank": 76.7769716512159, "image_to_text_median_rank": 5.0, "image_to_text_R@1": 0.18110976756684133, "image_to_text_R@5": 0.5168614805857853, "image_to_text_R@10": 0.6881633749832057, "text_to_image_mean_rank": 51.414617761655244, "text_to_image_median_rank": 5.0, "text_to_image_R@1": 0.17318285637511757, "text_to_image_R@5": 0.510949885798737, "text_to_image_R@10": 0.6810425903533521, "clip_val_loss": 0.5895509123802185, "epoch": 22, "num_samples": 7443}
23
+ {"image_to_text_mean_rank": 80.9969098481795, "image_to_text_median_rank": 5.0, "image_to_text_R@1": 0.18084105871288458, "image_to_text_R@5": 0.532043530834341, "image_to_text_R@10": 0.698105602579605, "text_to_image_mean_rank": 48.64987236329437, "text_to_image_median_rank": 5.0, "text_to_image_R@1": 0.18742442563482467, "text_to_image_R@5": 0.5194142146983743, "text_to_image_R@10": 0.6864167674324869, "clip_val_loss": 0.5935105085372925, "epoch": 23, "num_samples": 7443}
24
+ {"image_to_text_mean_rank": 81.97930941824534, "image_to_text_median_rank": 5.0, "image_to_text_R@1": 0.19387343812978639, "image_to_text_R@5": 0.5449415558242644, "image_to_text_R@10": 0.7092570200188096, "text_to_image_mean_rank": 49.71624345022168, "text_to_image_median_rank": 5.0, "text_to_image_R@1": 0.19266424828698106, "text_to_image_R@5": 0.529490796721752, "text_to_image_R@10": 0.6960902861749295, "clip_val_loss": 0.6055031418800354, "epoch": 24, "num_samples": 7443}
25
+ {"image_to_text_mean_rank": 69.55878006180303, "image_to_text_median_rank": 5.0, "image_to_text_R@1": 0.19172376729813248, "image_to_text_R@5": 0.5446728469703077, "image_to_text_R@10": 0.7085852478839177, "text_to_image_mean_rank": 46.23216444981862, "text_to_image_median_rank": 5.0, "text_to_image_R@1": 0.196291817815397, "text_to_image_R@5": 0.5415826951498052, "text_to_image_R@10": 0.7018675265349993, "clip_val_loss": 0.5871114730834961, "epoch": 25, "num_samples": 7443}
26
+ {"image_to_text_mean_rank": 79.41152760983475, "image_to_text_median_rank": 4.0, "image_to_text_R@1": 0.20099422275963993, "image_to_text_R@5": 0.5602579604997985, "image_to_text_R@10": 0.7255139056831923, "text_to_image_mean_rank": 48.719333602042184, "text_to_image_median_rank": 5.0, "text_to_image_R@1": 0.20489050114201263, "text_to_image_R@5": 0.5538089480048367, "text_to_image_R@10": 0.7128845895472256, "clip_val_loss": 0.5863779187202454, "epoch": 26, "num_samples": 7443}
27
+ {"image_to_text_mean_rank": 75.5820233776703, "image_to_text_median_rank": 4.0, "image_to_text_R@1": 0.21133951363697434, "image_to_text_R@5": 0.5689909982533925, "image_to_text_R@10": 0.7241703614134086, "text_to_image_mean_rank": 49.841193067311565, "text_to_image_median_rank": 4.0, "text_to_image_R@1": 0.2110708047830176, "text_to_image_R@5": 0.559720542791885, "text_to_image_R@10": 0.7150342603788795, "clip_val_loss": 0.5865182876586914, "epoch": 27, "num_samples": 7443}
28
+ {"image_to_text_mean_rank": 74.15262662904743, "image_to_text_median_rank": 4.0, "image_to_text_R@1": 0.21819158941287115, "image_to_text_R@5": 0.5689909982533925, "image_to_text_R@10": 0.7249764879752788, "text_to_image_mean_rank": 51.40386940749698, "text_to_image_median_rank": 4.0, "text_to_image_R@1": 0.21523579201934703, "text_to_image_R@5": 0.5640198844551928, "text_to_image_R@10": 0.7183931210533387, "clip_val_loss": 0.5956308245658875, "epoch": 28, "num_samples": 7443}
29
+ {"image_to_text_mean_rank": 77.1198441488647, "image_to_text_median_rank": 4.0, "image_to_text_R@1": 0.21416095660352008, "image_to_text_R@5": 0.5681848716915222, "image_to_text_R@10": 0.7298132473465001, "text_to_image_mean_rank": 52.97568184871692, "text_to_image_median_rank": 4.0, "text_to_image_R@1": 0.21899771597474138, "text_to_image_R@5": 0.5645573021631063, "text_to_image_R@10": 0.7210802095929061, "clip_val_loss": 0.5956435799598694, "epoch": 29, "num_samples": 7443}
30
+ {"image_to_text_mean_rank": 76.52747548031708, "image_to_text_median_rank": 4.0, "image_to_text_R@1": 0.21738546285100094, "image_to_text_R@5": 0.571006314658068, "image_to_text_R@10": 0.7284697030767163, "text_to_image_mean_rank": 53.000940480988845, "text_to_image_median_rank": 4.0, "text_to_image_R@1": 0.21899771597474138, "text_to_image_R@5": 0.5653634287249765, "text_to_image_R@10": 0.7189305387612522, "clip_val_loss": 0.594023585319519, "epoch": 30, "num_samples": 7443}
out.log ADDED
The diff for this file is too large to render. See raw diff
 
params.txt ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ accum_freq: 1
2
+ aug_cfg: {}
3
+ batch_size: 32
4
+ beta1: 0.9
5
+ beta2: 0.999
6
+ cache_dir: None
7
+ checkpoint_path: ./logs/2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16/checkpoints
8
+ coca_caption_loss_weight: 2.0
9
+ coca_contrastive_loss_weight: 1.0
10
+ copy_codebase: False
11
+ csv_caption_key: title
12
+ csv_img_key: filepath
13
+ csv_separator:
14
+ dataset_resampled: False
15
+ dataset_type: hf
16
+ ddp_static_graph: False
17
+ debug: False
18
+ delete_previous_checkpoint: False
19
+ device: cuda
20
+ dist_backend: None
21
+ dist_url: None
22
+ distill: False
23
+ distill_model: None
24
+ distill_pretrained: None
25
+ distributed: False
26
+ epochs: 30
27
+ epochs_cooldown: None
28
+ eps: 1e-08
29
+ force_custom_text: False
30
+ force_image_size: None
31
+ force_patch_dropout: None
32
+ force_quick_gelu: False
33
+ gather_with_grad: False
34
+ grad_checkpointing: False
35
+ grad_clip_norm: None
36
+ hf_dataset: photonmz/opi_function_packed
37
+ horovod: False
38
+ image_interpolation: None
39
+ image_mean: None
40
+ image_resize_mode: None
41
+ image_std: None
42
+ imagenet_v2: None
43
+ imagenet_val: None
44
+ local_loss: False
45
+ local_rank: 0
46
+ lock_image: False
47
+ lock_image_freeze_bn_stats: False
48
+ lock_image_unlocked_groups: 0
49
+ lock_text: False
50
+ lock_text_freeze_layer_norm: False
51
+ lock_text_unlocked_layers: 0
52
+ log_every_n_steps: 100
53
+ log_level: 20
54
+ log_local: False
55
+ log_path: ./logs/2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16/out.log
56
+ logs: ./logs/
57
+ loss_dist_impl: None
58
+ lr: 0.0002
59
+ lr_cooldown_end: 0.0
60
+ lr_cooldown_power: 1.0
61
+ lr_scheduler: cosine
62
+ model: crisp_1
63
+ momentum: None
64
+ name: 2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16
65
+ no_set_device_rank: False
66
+ opt: adamw
67
+ precision: amp_bfloat16
68
+ pretrained:
69
+ pretrained_image: False
70
+ rank: 0
71
+ remote_sync: None
72
+ remote_sync_frequency: 300
73
+ remote_sync_protocol: s3
74
+ report_to: wandb
75
+ resume: None
76
+ save_frequency: 1
77
+ save_most_recent: True
78
+ seed: 0
79
+ siglip: False
80
+ skip_scheduler: False
81
+ tensorboard: False
82
+ tensorboard_path:
83
+ torchcompile: False
84
+ torchscript: False
85
+ trace: False
86
+ train_data: stub
87
+ train_data_upsampling_factors: None
88
+ train_num_samples: None
89
+ use_bn_sync: False
90
+ use_bnb_linear: None
91
+ val_data: stub
92
+ val_frequency: 1
93
+ val_num_samples: None
94
+ wandb: True
95
+ wandb_notes:
96
+ wandb_project_name: open-clip
97
+ warmup: 10000
98
+ wd: 0.1
99
+ workers: 1
100
+ world_size: 1
101
+ zeroshot_frequency: 1