Commit
·
945d036
0
Parent(s):
Initial commit
Browse files- .gitattributes +35 -0
- checkpoints/epoch_10.pt +3 -0
- checkpoints/epoch_20.pt +3 -0
- checkpoints/epoch_latest.pt +3 -0
- checkpoints/results.jsonl +30 -0
- out.log +0 -0
- params.txt +101 -0
.gitattributes
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
28 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
29 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
30 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
31 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
32 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
33 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
checkpoints/epoch_10.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9120ed17f0c15b9d8afec43161a7b7ea2efecd6df42743a2cf25e90ff488be69
|
3 |
+
size 9938341609
|
checkpoints/epoch_20.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a887b12720ec4c107c87f2064c279d25f276621163606cc74fbcb768eb987121
|
3 |
+
size 9938341609
|
checkpoints/epoch_latest.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:843e5811c55bd6cdfbb33b97eec5b9a56fe68f8baa2f400f7f69009724329c6f
|
3 |
+
size 9938247015
|
checkpoints/results.jsonl
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"image_to_text_mean_rank": 150.0776568587935, "image_to_text_median_rank": 11.0, "image_to_text_R@1": 0.08706166868198308, "image_to_text_R@5": 0.32715302969232835, "image_to_text_R@10": 0.4866317345156523, "text_to_image_mean_rank": 106.41354292623942, "text_to_image_median_rank": 11.0, "text_to_image_R@1": 0.09095794706435577, "text_to_image_R@5": 0.32567513099556633, "text_to_image_R@10": 0.4874378610775225, "clip_val_loss": 0.832438588142395, "epoch": 1, "num_samples": 7443}
|
2 |
+
{"image_to_text_mean_rank": 123.40131667338439, "image_to_text_median_rank": 10.0, "image_to_text_R@1": 0.10506516189708451, "image_to_text_R@5": 0.3556361682117426, "image_to_text_R@10": 0.5230417842267903, "text_to_image_mean_rank": 89.46903130458149, "text_to_image_median_rank": 9.0, "text_to_image_R@1": 0.10090017466075507, "text_to_image_R@5": 0.35832325675130994, "text_to_image_R@10": 0.5253258094854225, "clip_val_loss": 0.7709452509880066, "epoch": 2, "num_samples": 7443}
|
3 |
+
{"image_to_text_mean_rank": 121.00591159478705, "image_to_text_median_rank": 9.0, "image_to_text_R@1": 0.10143759236866855, "image_to_text_R@5": 0.36705629450490396, "image_to_text_R@10": 0.5406422141609566, "text_to_image_mean_rank": 80.4937525191455, "text_to_image_median_rank": 9.0, "text_to_image_R@1": 0.10143759236866855, "text_to_image_R@5": 0.3666532312239688, "text_to_image_R@10": 0.541851404003762, "clip_val_loss": 0.7330073714256287, "epoch": 3, "num_samples": 7443}
|
4 |
+
{"image_to_text_mean_rank": 119.51914550584442, "image_to_text_median_rank": 9.0, "image_to_text_R@1": 0.1099019212683058, "image_to_text_R@5": 0.37820771194410857, "image_to_text_R@10": 0.5417170495767836, "text_to_image_mean_rank": 83.68896950154507, "text_to_image_median_rank": 9.0, "text_to_image_R@1": 0.11003627569528417, "text_to_image_R@5": 0.3779390030901518, "text_to_image_R@10": 0.5472255810828967, "clip_val_loss": 0.7334970831871033, "epoch": 4, "num_samples": 7443}
|
5 |
+
{"image_to_text_mean_rank": 112.08235926373774, "image_to_text_median_rank": 8.0, "image_to_text_R@1": 0.10788660486363026, "image_to_text_R@5": 0.3882842939674862, "image_to_text_R@10": 0.5593174795109499, "text_to_image_mean_rank": 77.26225984146177, "text_to_image_median_rank": 8.0, "text_to_image_R@1": 0.11191723767298133, "text_to_image_R@5": 0.3878812306865511, "text_to_image_R@10": 0.5531371758699449, "clip_val_loss": 0.710077702999115, "epoch": 5, "num_samples": 7443}
|
6 |
+
{"image_to_text_mean_rank": 110.78704823323929, "image_to_text_median_rank": 9.0, "image_to_text_R@1": 0.11057369340319763, "image_to_text_R@5": 0.38492543329302703, "image_to_text_R@10": 0.5543463657127502, "text_to_image_mean_rank": 74.08464328899638, "text_to_image_median_rank": 8.0, "text_to_image_R@1": 0.11460432621254871, "text_to_image_R@5": 0.39164315464194543, "text_to_image_R@10": 0.5625419857584307, "clip_val_loss": 0.6953209638595581, "epoch": 6, "num_samples": 7443}
|
7 |
+
{"image_to_text_mean_rank": 108.28483138519414, "image_to_text_median_rank": 8.0, "image_to_text_R@1": 0.11164852881902458, "image_to_text_R@5": 0.3944645976084912, "image_to_text_R@10": 0.5699314792422411, "text_to_image_mean_rank": 71.48354158269515, "text_to_image_median_rank": 8.0, "text_to_image_R@1": 0.11608222490931076, "text_to_image_R@5": 0.40037619239553945, "text_to_image_R@10": 0.5671100362756953, "clip_val_loss": 0.680811882019043, "epoch": 7, "num_samples": 7443}
|
8 |
+
{"image_to_text_mean_rank": 95.73035066505442, "image_to_text_median_rank": 8.0, "image_to_text_R@1": 0.1185006045949214, "image_to_text_R@5": 0.3984952304178423, "image_to_text_R@10": 0.5716780867929598, "text_to_image_mean_rank": 66.8242644095123, "text_to_image_median_rank": 8.0, "text_to_image_R@1": 0.12118769313448878, "text_to_image_R@5": 0.40252586322719336, "text_to_image_R@10": 0.5779927448609432, "clip_val_loss": 0.6552522778511047, "epoch": 8, "num_samples": 7443}
|
9 |
+
{"image_to_text_mean_rank": 107.53835818890232, "image_to_text_median_rank": 8.0, "image_to_text_R@1": 0.11514174392046218, "image_to_text_R@5": 0.40870616686819833, "image_to_text_R@10": 0.5857853016256885, "text_to_image_mean_rank": 68.347843611447, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.12575574365175332, "text_to_image_R@5": 0.4169017869138788, "text_to_image_R@10": 0.5906220609969098, "clip_val_loss": 0.6697020530700684, "epoch": 9, "num_samples": 7443}
|
10 |
+
{"image_to_text_mean_rank": 92.24949617089884, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.1275023512024721, "image_to_text_R@5": 0.4194545210264678, "image_to_text_R@10": 0.5955931747951095, "text_to_image_mean_rank": 62.04151551793632, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.12562138922477495, "text_to_image_R@5": 0.4265753056563214, "text_to_image_R@10": 0.5949214026602176, "clip_val_loss": 0.640340268611908, "epoch": 10, "num_samples": 7443}
|
11 |
+
{"image_to_text_mean_rank": 105.58739755474943, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.12521832594383986, "image_to_text_R@5": 0.4233507994088405, "image_to_text_R@10": 0.5978772000537418, "text_to_image_mean_rank": 65.34609700389628, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.12400913610103453, "text_to_image_R@5": 0.42039500201531643, "text_to_image_R@10": 0.5933091495364772, "clip_val_loss": 0.663438618183136, "epoch": 11, "num_samples": 7443}
|
12 |
+
{"image_to_text_mean_rank": 90.01813784764208, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.1266962246406019, "image_to_text_R@5": 0.4311433561735859, "image_to_text_R@10": 0.6095660352008598, "text_to_image_mean_rank": 58.37444578798871, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.1309955663039097, "text_to_image_R@5": 0.43624882439876395, "text_to_image_R@10": 0.6121187693134489, "clip_val_loss": 0.6251317858695984, "epoch": 12, "num_samples": 7443}
|
13 |
+
{"image_to_text_mean_rank": 100.03157329033992, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.1336826548434771, "image_to_text_R@5": 0.4350396345559586, "image_to_text_R@10": 0.6117157060325138, "text_to_image_mean_rank": 60.34569394061534, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.13784764207980654, "text_to_image_R@5": 0.43893591293833134, "text_to_image_R@10": 0.6117157060325138, "clip_val_loss": 0.6327502727508545, "epoch": 13, "num_samples": 7443}
|
14 |
+
{"image_to_text_mean_rank": 81.72376729813247, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.13825070536074163, "image_to_text_R@5": 0.4396076850732232, "image_to_text_R@10": 0.6203143893591294, "text_to_image_mean_rank": 52.97635362085181, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.13086121187693134, "text_to_image_R@5": 0.4429665457476824, "text_to_image_R@10": 0.6113126427515787, "clip_val_loss": 0.6010527610778809, "epoch": 14, "num_samples": 7443}
|
15 |
+
{"image_to_text_mean_rank": 89.35617358591966, "image_to_text_median_rank": 7.0, "image_to_text_R@1": 0.13784764207980654, "image_to_text_R@5": 0.4460566975681849, "image_to_text_R@10": 0.6208518070670429, "text_to_image_mean_rank": 57.76676071476555, "text_to_image_median_rank": 7.0, "text_to_image_R@1": 0.1379819965067849, "text_to_image_R@5": 0.44780330511890365, "text_to_image_R@10": 0.6238076044605669, "clip_val_loss": 0.6247494220733643, "epoch": 15, "num_samples": 7443}
|
16 |
+
{"image_to_text_mean_rank": 82.66008329974473, "image_to_text_median_rank": 6.0, "image_to_text_R@1": 0.14564019884455193, "image_to_text_R@5": 0.45425231761386536, "image_to_text_R@10": 0.6337498320569662, "text_to_image_mean_rank": 54.96345559586188, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.14241569259707107, "text_to_image_R@5": 0.45640198844551927, "text_to_image_R@10": 0.634018540910923, "clip_val_loss": 0.605738639831543, "epoch": 16, "num_samples": 7443}
|
17 |
+
{"image_to_text_mean_rank": 81.23552331049308, "image_to_text_median_rank": 6.0, "image_to_text_R@1": 0.14429665457476823, "image_to_text_R@5": 0.46123874781674057, "image_to_text_R@10": 0.6415423888217117, "text_to_image_mean_rank": 52.43678624210668, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.14940212279994625, "text_to_image_R@5": 0.46688163374983205, "text_to_image_R@10": 0.6393927179900578, "clip_val_loss": 0.5852788090705872, "epoch": 17, "num_samples": 7443}
|
18 |
+
{"image_to_text_mean_rank": 74.80545478973532, "image_to_text_median_rank": 6.0, "image_to_text_R@1": 0.14644632540642213, "image_to_text_R@5": 0.4726588741099019, "image_to_text_R@10": 0.648931882305522, "text_to_image_mean_rank": 49.20609969098482, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.15558242644095122, "text_to_image_R@5": 0.4809888485825608, "text_to_image_R@10": 0.6497380088673922, "clip_val_loss": 0.5786479115486145, "epoch": 18, "num_samples": 7443}
|
19 |
+
{"image_to_text_mean_rank": 77.01074835415827, "image_to_text_median_rank": 6.0, "image_to_text_R@1": 0.15934435039634556, "image_to_text_R@5": 0.4821980384253661, "image_to_text_R@10": 0.6596802364637915, "text_to_image_mean_rank": 48.961708988311166, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.1574633884186484, "text_to_image_R@5": 0.4831385194142147, "text_to_image_R@10": 0.6604863630256617, "clip_val_loss": 0.5690401196479797, "epoch": 19, "num_samples": 7443}
|
20 |
+
{"image_to_text_mean_rank": 79.00806126561871, "image_to_text_median_rank": 6.0, "image_to_text_R@1": 0.1652559451833938, "image_to_text_R@5": 0.4987236329437055, "image_to_text_R@10": 0.6753997044202606, "text_to_image_mean_rank": 49.19145505844418, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.163509337632675, "text_to_image_R@5": 0.4909310761789601, "text_to_image_R@10": 0.6658605401047965, "clip_val_loss": 0.5861181616783142, "epoch": 20, "num_samples": 7443}
|
21 |
+
{"image_to_text_mean_rank": 83.14644632540642, "image_to_text_median_rank": 5.0, "image_to_text_R@1": 0.17103318554346367, "image_to_text_R@5": 0.5083971516861481, "image_to_text_R@10": 0.6786242106677415, "text_to_image_mean_rank": 50.80988848582561, "text_to_image_median_rank": 6.0, "text_to_image_R@1": 0.16901786913878813, "text_to_image_R@5": 0.49442429128039767, "text_to_image_R@10": 0.6706972994760177, "clip_val_loss": 0.592087984085083, "epoch": 21, "num_samples": 7443}
|
22 |
+
{"image_to_text_mean_rank": 76.7769716512159, "image_to_text_median_rank": 5.0, "image_to_text_R@1": 0.18110976756684133, "image_to_text_R@5": 0.5168614805857853, "image_to_text_R@10": 0.6881633749832057, "text_to_image_mean_rank": 51.414617761655244, "text_to_image_median_rank": 5.0, "text_to_image_R@1": 0.17318285637511757, "text_to_image_R@5": 0.510949885798737, "text_to_image_R@10": 0.6810425903533521, "clip_val_loss": 0.5895509123802185, "epoch": 22, "num_samples": 7443}
|
23 |
+
{"image_to_text_mean_rank": 80.9969098481795, "image_to_text_median_rank": 5.0, "image_to_text_R@1": 0.18084105871288458, "image_to_text_R@5": 0.532043530834341, "image_to_text_R@10": 0.698105602579605, "text_to_image_mean_rank": 48.64987236329437, "text_to_image_median_rank": 5.0, "text_to_image_R@1": 0.18742442563482467, "text_to_image_R@5": 0.5194142146983743, "text_to_image_R@10": 0.6864167674324869, "clip_val_loss": 0.5935105085372925, "epoch": 23, "num_samples": 7443}
|
24 |
+
{"image_to_text_mean_rank": 81.97930941824534, "image_to_text_median_rank": 5.0, "image_to_text_R@1": 0.19387343812978639, "image_to_text_R@5": 0.5449415558242644, "image_to_text_R@10": 0.7092570200188096, "text_to_image_mean_rank": 49.71624345022168, "text_to_image_median_rank": 5.0, "text_to_image_R@1": 0.19266424828698106, "text_to_image_R@5": 0.529490796721752, "text_to_image_R@10": 0.6960902861749295, "clip_val_loss": 0.6055031418800354, "epoch": 24, "num_samples": 7443}
|
25 |
+
{"image_to_text_mean_rank": 69.55878006180303, "image_to_text_median_rank": 5.0, "image_to_text_R@1": 0.19172376729813248, "image_to_text_R@5": 0.5446728469703077, "image_to_text_R@10": 0.7085852478839177, "text_to_image_mean_rank": 46.23216444981862, "text_to_image_median_rank": 5.0, "text_to_image_R@1": 0.196291817815397, "text_to_image_R@5": 0.5415826951498052, "text_to_image_R@10": 0.7018675265349993, "clip_val_loss": 0.5871114730834961, "epoch": 25, "num_samples": 7443}
|
26 |
+
{"image_to_text_mean_rank": 79.41152760983475, "image_to_text_median_rank": 4.0, "image_to_text_R@1": 0.20099422275963993, "image_to_text_R@5": 0.5602579604997985, "image_to_text_R@10": 0.7255139056831923, "text_to_image_mean_rank": 48.719333602042184, "text_to_image_median_rank": 5.0, "text_to_image_R@1": 0.20489050114201263, "text_to_image_R@5": 0.5538089480048367, "text_to_image_R@10": 0.7128845895472256, "clip_val_loss": 0.5863779187202454, "epoch": 26, "num_samples": 7443}
|
27 |
+
{"image_to_text_mean_rank": 75.5820233776703, "image_to_text_median_rank": 4.0, "image_to_text_R@1": 0.21133951363697434, "image_to_text_R@5": 0.5689909982533925, "image_to_text_R@10": 0.7241703614134086, "text_to_image_mean_rank": 49.841193067311565, "text_to_image_median_rank": 4.0, "text_to_image_R@1": 0.2110708047830176, "text_to_image_R@5": 0.559720542791885, "text_to_image_R@10": 0.7150342603788795, "clip_val_loss": 0.5865182876586914, "epoch": 27, "num_samples": 7443}
|
28 |
+
{"image_to_text_mean_rank": 74.15262662904743, "image_to_text_median_rank": 4.0, "image_to_text_R@1": 0.21819158941287115, "image_to_text_R@5": 0.5689909982533925, "image_to_text_R@10": 0.7249764879752788, "text_to_image_mean_rank": 51.40386940749698, "text_to_image_median_rank": 4.0, "text_to_image_R@1": 0.21523579201934703, "text_to_image_R@5": 0.5640198844551928, "text_to_image_R@10": 0.7183931210533387, "clip_val_loss": 0.5956308245658875, "epoch": 28, "num_samples": 7443}
|
29 |
+
{"image_to_text_mean_rank": 77.1198441488647, "image_to_text_median_rank": 4.0, "image_to_text_R@1": 0.21416095660352008, "image_to_text_R@5": 0.5681848716915222, "image_to_text_R@10": 0.7298132473465001, "text_to_image_mean_rank": 52.97568184871692, "text_to_image_median_rank": 4.0, "text_to_image_R@1": 0.21899771597474138, "text_to_image_R@5": 0.5645573021631063, "text_to_image_R@10": 0.7210802095929061, "clip_val_loss": 0.5956435799598694, "epoch": 29, "num_samples": 7443}
|
30 |
+
{"image_to_text_mean_rank": 76.52747548031708, "image_to_text_median_rank": 4.0, "image_to_text_R@1": 0.21738546285100094, "image_to_text_R@5": 0.571006314658068, "image_to_text_R@10": 0.7284697030767163, "text_to_image_mean_rank": 53.000940480988845, "text_to_image_median_rank": 4.0, "text_to_image_R@1": 0.21899771597474138, "text_to_image_R@5": 0.5653634287249765, "text_to_image_R@10": 0.7189305387612522, "clip_val_loss": 0.594023585319519, "epoch": 30, "num_samples": 7443}
|
out.log
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params.txt
ADDED
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
accum_freq: 1
|
2 |
+
aug_cfg: {}
|
3 |
+
batch_size: 32
|
4 |
+
beta1: 0.9
|
5 |
+
beta2: 0.999
|
6 |
+
cache_dir: None
|
7 |
+
checkpoint_path: ./logs/2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16/checkpoints
|
8 |
+
coca_caption_loss_weight: 2.0
|
9 |
+
coca_contrastive_loss_weight: 1.0
|
10 |
+
copy_codebase: False
|
11 |
+
csv_caption_key: title
|
12 |
+
csv_img_key: filepath
|
13 |
+
csv_separator:
|
14 |
+
dataset_resampled: False
|
15 |
+
dataset_type: hf
|
16 |
+
ddp_static_graph: False
|
17 |
+
debug: False
|
18 |
+
delete_previous_checkpoint: False
|
19 |
+
device: cuda
|
20 |
+
dist_backend: None
|
21 |
+
dist_url: None
|
22 |
+
distill: False
|
23 |
+
distill_model: None
|
24 |
+
distill_pretrained: None
|
25 |
+
distributed: False
|
26 |
+
epochs: 30
|
27 |
+
epochs_cooldown: None
|
28 |
+
eps: 1e-08
|
29 |
+
force_custom_text: False
|
30 |
+
force_image_size: None
|
31 |
+
force_patch_dropout: None
|
32 |
+
force_quick_gelu: False
|
33 |
+
gather_with_grad: False
|
34 |
+
grad_checkpointing: False
|
35 |
+
grad_clip_norm: None
|
36 |
+
hf_dataset: photonmz/opi_function_packed
|
37 |
+
horovod: False
|
38 |
+
image_interpolation: None
|
39 |
+
image_mean: None
|
40 |
+
image_resize_mode: None
|
41 |
+
image_std: None
|
42 |
+
imagenet_v2: None
|
43 |
+
imagenet_val: None
|
44 |
+
local_loss: False
|
45 |
+
local_rank: 0
|
46 |
+
lock_image: False
|
47 |
+
lock_image_freeze_bn_stats: False
|
48 |
+
lock_image_unlocked_groups: 0
|
49 |
+
lock_text: False
|
50 |
+
lock_text_freeze_layer_norm: False
|
51 |
+
lock_text_unlocked_layers: 0
|
52 |
+
log_every_n_steps: 100
|
53 |
+
log_level: 20
|
54 |
+
log_local: False
|
55 |
+
log_path: ./logs/2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16/out.log
|
56 |
+
logs: ./logs/
|
57 |
+
loss_dist_impl: None
|
58 |
+
lr: 0.0002
|
59 |
+
lr_cooldown_end: 0.0
|
60 |
+
lr_cooldown_power: 1.0
|
61 |
+
lr_scheduler: cosine
|
62 |
+
model: crisp_1
|
63 |
+
momentum: None
|
64 |
+
name: 2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16
|
65 |
+
no_set_device_rank: False
|
66 |
+
opt: adamw
|
67 |
+
precision: amp_bfloat16
|
68 |
+
pretrained:
|
69 |
+
pretrained_image: False
|
70 |
+
rank: 0
|
71 |
+
remote_sync: None
|
72 |
+
remote_sync_frequency: 300
|
73 |
+
remote_sync_protocol: s3
|
74 |
+
report_to: wandb
|
75 |
+
resume: None
|
76 |
+
save_frequency: 1
|
77 |
+
save_most_recent: True
|
78 |
+
seed: 0
|
79 |
+
siglip: False
|
80 |
+
skip_scheduler: False
|
81 |
+
tensorboard: False
|
82 |
+
tensorboard_path:
|
83 |
+
torchcompile: False
|
84 |
+
torchscript: False
|
85 |
+
trace: False
|
86 |
+
train_data: stub
|
87 |
+
train_data_upsampling_factors: None
|
88 |
+
train_num_samples: None
|
89 |
+
use_bn_sync: False
|
90 |
+
use_bnb_linear: None
|
91 |
+
val_data: stub
|
92 |
+
val_frequency: 1
|
93 |
+
val_num_samples: None
|
94 |
+
wandb: True
|
95 |
+
wandb_notes:
|
96 |
+
wandb_project_name: open-clip
|
97 |
+
warmup: 10000
|
98 |
+
wd: 0.1
|
99 |
+
workers: 1
|
100 |
+
world_size: 1
|
101 |
+
zeroshot_frequency: 1
|