hsuvaskakoty
committed on
Push model using huggingface_hub.
Browse files
- README.md +13 -8
- model.safetensors +1 -1
- model_head.pkl +1 -1
README.md
CHANGED
@@ -198,12 +198,12 @@ preds = model(" Interviews: Interviews WN:Story preparation/Office hours:Frank
|
|
198 |
| 3 | 7 |
|
199 |
|
200 |
### Training Hyperparameters
|
201 |
-
- batch_size: (8,
|
202 |
-
- num_epochs: (
|
203 |
- max_steps: -1
|
204 |
- sampling_strategy: oversampling
|
205 |
-
- body_learning_rate: (
|
206 |
-
- head_learning_rate:
|
207 |
- loss: CosineSimilarityLoss
|
208 |
- distance_metric: cosine_distance
|
209 |
- margin: 0.25
|
@@ -219,10 +219,15 @@ preds = model(" Interviews: Interviews WN:Story preparation/Office hours:Frank
|
|
219 |
| Epoch | Step | Training Loss | Validation Loss |
|
220 |
|:------:|:----:|:-------------:|:---------------:|
|
221 |
| 0.0035 | 1 | 0.1819 | - |
|
222 |
-
| 1.0381 | 300 | 0.
|
223 |
-
| 2.0761 | 600 | 0.
|
224 |
-
| 3.1142 | 900 | 0.
|
225 |
-
| 4.1522 | 1200 | 0.
|
|
|
|
|
|
|
|
|
|
|
226 |
|
227 |
### Framework Versions
|
228 |
- Python: 3.10.12
|
|
|
198 |
| 3 | 7 |
|
199 |
|
200 |
### Training Hyperparameters
|
201 |
+
- batch_size: (8, 4)
|
202 |
+
- num_epochs: (10, 10)
|
203 |
- max_steps: -1
|
204 |
- sampling_strategy: oversampling
|
205 |
+
- body_learning_rate: (0.0005, 0.0005)
|
206 |
+
- head_learning_rate: 1e-05
|
207 |
- loss: CosineSimilarityLoss
|
208 |
- distance_metric: cosine_distance
|
209 |
- margin: 0.25
|
|
|
219 |
| Epoch | Step | Training Loss | Validation Loss |
|
220 |
|:------:|:----:|:-------------:|:---------------:|
|
221 |
| 0.0035 | 1 | 0.1819 | - |
|
222 |
+
| 1.0381 | 300 | 0.1617 | 0.5 |
|
223 |
+
| 2.0761 | 600 | 0.2718 | 0.5000 |
|
224 |
+
| 3.1142 | 900 | 0.2721 | 0.5 |
|
225 |
+
| 4.1522 | 1200 | 0.2615 | 0.5 |
|
226 |
+
| 5.1903 | 1500 | 0.2572 | 0.5000 |
|
227 |
+
| 6.2284 | 1800 | 0.2571 | 0.5 |
|
228 |
+
| 7.2664 | 2100 | 0.254 | 0.5 |
|
229 |
+
| 8.3045 | 2400 | 0.2562 | 0.5000 |
|
230 |
+
| 9.3426 | 2700 | 0.2542 | 0.5000 |
|
231 |
|
232 |
### Framework Versions
|
233 |
- Python: 3.10.12
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 133462128
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6295a27359e599257963ff195f1e8084b4524b368b110a5805a869ba8697c255
|
3 |
size 133462128
|
model_head.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13175
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:513671b63f320ca50a3b61233abf3ca31c9e4d23d830fd988fcc4b7924f289c9
|
3 |
size 13175
|