Add new SentenceTransformer model
Browse files
- README.md +14 -15
- model.safetensors +1 -1
README.md
CHANGED
@@ -202,7 +202,6 @@ You can finetune this model on your own dataset.
|
|
202 |
#### Non-Default Hyperparameters
|
203 |
|
204 |
- `per_device_train_batch_size`: 256
|
205 |
-
- `learning_rate`: 1e-05
|
206 |
- `warmup_ratio`: 0.1
|
207 |
- `fp16`: True
|
208 |
- `batch_sampler`: no_duplicates
|
@@ -221,7 +220,7 @@ You can finetune this model on your own dataset.
|
|
221 |
- `gradient_accumulation_steps`: 1
|
222 |
- `eval_accumulation_steps`: None
|
223 |
- `torch_empty_cache_steps`: None
|
224 |
-
- `learning_rate`: 1e-05
|
225 |
- `weight_decay`: 0.0
|
226 |
- `adam_beta1`: 0.9
|
227 |
- `adam_beta2`: 0.999
|
@@ -330,19 +329,19 @@ You can finetune this model on your own dataset.
|
|
330 |
### Training Logs
|
331 |
| Epoch | Step | Training Loss |
|
332 |
|:------:|:----:|:-------------:|
|
333 |
-
| 0.2273 | 10 | 1.
|
334 |
-
| 0.4545 | 20 | 1.
|
335 |
-
| 0.6818 | 30 | 0.
|
336 |
-
| 0.9091 | 40 | 0.
|
337 |
-
| 1.1364 | 50 | 1.
|
338 |
-
| 1.3636 | 60 | 0.
|
339 |
-
| 1.5909 | 70 |
|
340 |
-
| 1.8182 | 80 | 0.
|
341 |
-
| 2.0455 | 90 | 0.
|
342 |
-
| 2.2727 | 100 |
|
343 |
-
| 2.5 | 110 | 0.
|
344 |
-
| 2.7273 | 120 | 0.
|
345 |
-
| 2.9545 | 130 | 0.
|
346 |
|
347 |
|
348 |
### Framework Versions
|
|
|
202 |
#### Non-Default Hyperparameters
|
203 |
|
204 |
- `per_device_train_batch_size`: 256
|
|
|
205 |
- `warmup_ratio`: 0.1
|
206 |
- `fp16`: True
|
207 |
- `batch_sampler`: no_duplicates
|
|
|
220 |
- `gradient_accumulation_steps`: 1
|
221 |
- `eval_accumulation_steps`: None
|
222 |
- `torch_empty_cache_steps`: None
|
223 |
+
- `learning_rate`: 5e-05
|
224 |
- `weight_decay`: 0.0
|
225 |
- `adam_beta1`: 0.9
|
226 |
- `adam_beta2`: 0.999
|
|
|
329 |
### Training Logs
|
330 |
| Epoch | Step | Training Loss |
|
331 |
|:------:|:----:|:-------------:|
|
332 |
+
| 0.2273 | 10 | 1.6158 |
|
333 |
+
| 0.4545 | 20 | 1.1681 |
|
334 |
+
| 0.6818 | 30 | 0.8775 |
|
335 |
+
| 0.9091 | 40 | 0.7628 |
|
336 |
+
| 1.1364 | 50 | 1.0154 |
|
337 |
+
| 1.3636 | 60 | 0.7048 |
|
338 |
+
| 1.5909 | 70 | 0.7981 |
|
339 |
+
| 1.8182 | 80 | 0.6322 |
|
340 |
+
| 2.0455 | 90 | 0.4916 |
|
341 |
+
| 2.2727 | 100 | 0.8441 |
|
342 |
+
| 2.5 | 110 | 0.6697 |
|
343 |
+
| 2.7273 | 120 | 0.5358 |
|
344 |
+
| 2.9545 | 130 | 0.5111 |
|
345 |
|
346 |
|
347 |
### Framework Versions
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 437951328
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b94852c6a04ca84b6478f9b3af75a7bff023c8ae5ed7db43464461ca19e98ea0
|
3 |
size 437951328
|