Shankhdhar committed on
Commit
4b10c16
·
verified ·
1 Parent(s): eb3d321

Add SetFit model

Browse files
Files changed (4) hide show
  1. README.md +19 -109
  2. config_setfit.json +2 -2
  3. model.safetensors +1 -1
  4. model_head.pkl +1 -1
README.md CHANGED
@@ -143,7 +143,7 @@ preds = model("what are the colors available in air jordan 4")
143
 
144
  ### Training Hyperparameters
145
  - batch_size: (16, 16)
146
- - num_epochs: (4, 4)
147
  - max_steps: -1
148
  - sampling_strategy: oversampling
149
  - body_learning_rate: (2e-05, 1e-05)
@@ -162,126 +162,36 @@ preds = model("what are the colors available in air jordan 4")
162
  | Epoch | Step | Training Loss | Validation Loss |
163
  |:------:|:----:|:-------------:|:---------------:|
164
  | 0.0007 | 1 | 0.1501 | - |
165
- | 0.0333 | 50 | 0.1693 | - |
166
- | 0.0667 | 100 | 0.0692 | - |
167
- | 0.1 | 150 | 0.0311 | - |
168
- | 0.1333 | 200 | 0.0182 | - |
169
- | 0.1667 | 250 | 0.0033 | - |
170
- | 0.2 | 300 | 0.0025 | - |
171
- | 0.2333 | 350 | 0.0013 | - |
172
- | 0.2667 | 400 | 0.0008 | - |
173
- | 0.3 | 450 | 0.0011 | - |
174
- | 0.3333 | 500 | 0.0005 | - |
175
- | 0.3667 | 550 | 0.0005 | - |
176
- | 0.4 | 600 | 0.0003 | - |
177
  | 0.4333 | 650 | 0.0002 | - |
178
  | 0.4667 | 700 | 0.0003 | - |
179
- | 0.5 | 750 | 0.0003 | - |
180
- | 0.5333 | 800 | 0.0004 | - |
181
- | 0.5667 | 850 | 0.0003 | - |
182
  | 0.6 | 900 | 0.0002 | - |
183
- | 0.6333 | 950 | 0.0001 | - |
184
  | 0.6667 | 1000 | 0.0001 | - |
185
  | 0.7 | 1050 | 0.0001 | - |
186
  | 0.7333 | 1100 | 0.0002 | - |
187
- | 0.7667 | 1150 | 0.0002 | - |
188
  | 0.8 | 1200 | 0.0001 | - |
189
  | 0.8333 | 1250 | 0.0001 | - |
190
- | 0.8667 | 1300 | 0.0001 | - |
191
  | 0.9 | 1350 | 0.0001 | - |
192
  | 0.9333 | 1400 | 0.0002 | - |
193
  | 0.9667 | 1450 | 0.0001 | - |
194
  | 1.0 | 1500 | 0.0002 | - |
195
- | 1.0333 | 1550 | 0.0001 | - |
196
- | 1.0667 | 1600 | 0.0001 | - |
197
- | 1.1 | 1650 | 0.0001 | - |
198
- | 1.1333 | 1700 | 0.0001 | - |
199
- | 1.1667 | 1750 | 0.0002 | - |
200
- | 1.2 | 1800 | 0.0001 | - |
201
- | 1.2333 | 1850 | 0.0001 | - |
202
- | 1.2667 | 1900 | 0.0001 | - |
203
- | 1.3 | 1950 | 0.0001 | - |
204
- | 1.3333 | 2000 | 0.0001 | - |
205
- | 1.3667 | 2050 | 0.0001 | - |
206
- | 1.4 | 2100 | 0.0001 | - |
207
- | 1.4333 | 2150 | 0.0001 | - |
208
- | 1.4667 | 2200 | 0.0001 | - |
209
- | 1.5 | 2250 | 0.0001 | - |
210
- | 1.5333 | 2300 | 0.0001 | - |
211
- | 1.5667 | 2350 | 0.0001 | - |
212
- | 1.6 | 2400 | 0.0 | - |
213
- | 1.6333 | 2450 | 0.0001 | - |
214
- | 1.6667 | 2500 | 0.0001 | - |
215
- | 1.7 | 2550 | 0.0 | - |
216
- | 1.7333 | 2600 | 0.0001 | - |
217
- | 1.7667 | 2650 | 0.0001 | - |
218
- | 1.8 | 2700 | 0.0001 | - |
219
- | 1.8333 | 2750 | 0.0001 | - |
220
- | 1.8667 | 2800 | 0.0001 | - |
221
- | 1.9 | 2850 | 0.0 | - |
222
- | 1.9333 | 2900 | 0.0001 | - |
223
- | 1.9667 | 2950 | 0.0 | - |
224
- | 2.0 | 3000 | 0.0 | - |
225
- | 2.0333 | 3050 | 0.0001 | - |
226
- | 2.0667 | 3100 | 0.0 | - |
227
- | 2.1 | 3150 | 0.0001 | - |
228
- | 2.1333 | 3200 | 0.0001 | - |
229
- | 2.1667 | 3250 | 0.0 | - |
230
- | 2.2 | 3300 | 0.0001 | - |
231
- | 2.2333 | 3350 | 0.0001 | - |
232
- | 2.2667 | 3400 | 0.0001 | - |
233
- | 2.3 | 3450 | 0.0 | - |
234
- | 2.3333 | 3500 | 0.0001 | - |
235
- | 2.3667 | 3550 | 0.0 | - |
236
- | 2.4 | 3600 | 0.0 | - |
237
- | 2.4333 | 3650 | 0.0 | - |
238
- | 2.4667 | 3700 | 0.0001 | - |
239
- | 2.5 | 3750 | 0.0 | - |
240
- | 2.5333 | 3800 | 0.0001 | - |
241
- | 2.5667 | 3850 | 0.0 | - |
242
- | 2.6 | 3900 | 0.0001 | - |
243
- | 2.6333 | 3950 | 0.0 | - |
244
- | 2.6667 | 4000 | 0.0001 | - |
245
- | 2.7 | 4050 | 0.0001 | - |
246
- | 2.7333 | 4100 | 0.0 | - |
247
- | 2.7667 | 4150 | 0.0 | - |
248
- | 2.8 | 4200 | 0.0 | - |
249
- | 2.8333 | 4250 | 0.0 | - |
250
- | 2.8667 | 4300 | 0.0 | - |
251
- | 2.9 | 4350 | 0.0 | - |
252
- | 2.9333 | 4400 | 0.0 | - |
253
- | 2.9667 | 4450 | 0.0001 | - |
254
- | 3.0 | 4500 | 0.0 | - |
255
- | 3.0333 | 4550 | 0.0001 | - |
256
- | 3.0667 | 4600 | 0.0 | - |
257
- | 3.1 | 4650 | 0.0 | - |
258
- | 3.1333 | 4700 | 0.0001 | - |
259
- | 3.1667 | 4750 | 0.0 | - |
260
- | 3.2 | 4800 | 0.0 | - |
261
- | 3.2333 | 4850 | 0.0 | - |
262
- | 3.2667 | 4900 | 0.0 | - |
263
- | 3.3 | 4950 | 0.0001 | - |
264
- | 3.3333 | 5000 | 0.0 | - |
265
- | 3.3667 | 5050 | 0.0 | - |
266
- | 3.4 | 5100 | 0.0001 | - |
267
- | 3.4333 | 5150 | 0.0 | - |
268
- | 3.4667 | 5200 | 0.0 | - |
269
- | 3.5 | 5250 | 0.0001 | - |
270
- | 3.5333 | 5300 | 0.0 | - |
271
- | 3.5667 | 5350 | 0.0 | - |
272
- | 3.6 | 5400 | 0.0 | - |
273
- | 3.6333 | 5450 | 0.0 | - |
274
- | 3.6667 | 5500 | 0.0 | - |
275
- | 3.7 | 5550 | 0.0001 | - |
276
- | 3.7333 | 5600 | 0.0 | - |
277
- | 3.7667 | 5650 | 0.0 | - |
278
- | 3.8 | 5700 | 0.0 | - |
279
- | 3.8333 | 5750 | 0.0 | - |
280
- | 3.8667 | 5800 | 0.0 | - |
281
- | 3.9 | 5850 | 0.0 | - |
282
- | 3.9333 | 5900 | 0.0 | - |
283
- | 3.9667 | 5950 | 0.0001 | - |
284
- | 4.0 | 6000 | 0.0 | - |
285
 
286
  ### Framework Versions
287
  - Python: 3.9.16
 
143
 
144
  ### Training Hyperparameters
145
  - batch_size: (16, 16)
146
+ - num_epochs: (1, 1)
147
  - max_steps: -1
148
  - sampling_strategy: oversampling
149
  - body_learning_rate: (2e-05, 1e-05)
 
162
  | Epoch | Step | Training Loss | Validation Loss |
163
  |:------:|:----:|:-------------:|:---------------:|
164
  | 0.0007 | 1 | 0.1501 | - |
165
+ | 0.0333 | 50 | 0.1076 | - |
166
+ | 0.0667 | 100 | 0.01 | - |
167
+ | 0.1 | 150 | 0.0023 | - |
168
+ | 0.1333 | 200 | 0.0008 | - |
169
+ | 0.1667 | 250 | 0.0007 | - |
170
+ | 0.2 | 300 | 0.0005 | - |
171
+ | 0.2333 | 350 | 0.0005 | - |
172
+ | 0.2667 | 400 | 0.0003 | - |
173
+ | 0.3 | 450 | 0.0005 | - |
174
+ | 0.3333 | 500 | 0.0003 | - |
175
+ | 0.3667 | 550 | 0.0003 | - |
176
+ | 0.4 | 600 | 0.0002 | - |
177
  | 0.4333 | 650 | 0.0002 | - |
178
  | 0.4667 | 700 | 0.0003 | - |
179
+ | 0.5 | 750 | 0.0002 | - |
180
+ | 0.5333 | 800 | 0.0002 | - |
181
+ | 0.5667 | 850 | 0.0002 | - |
182
  | 0.6 | 900 | 0.0002 | - |
183
+ | 0.6333 | 950 | 0.0002 | - |
184
  | 0.6667 | 1000 | 0.0001 | - |
185
  | 0.7 | 1050 | 0.0001 | - |
186
  | 0.7333 | 1100 | 0.0002 | - |
187
+ | 0.7667 | 1150 | 0.0001 | - |
188
  | 0.8 | 1200 | 0.0001 | - |
189
  | 0.8333 | 1250 | 0.0001 | - |
190
+ | 0.8667 | 1300 | 0.0002 | - |
191
  | 0.9 | 1350 | 0.0001 | - |
192
  | 0.9333 | 1400 | 0.0002 | - |
193
  | 0.9667 | 1450 | 0.0001 | - |
194
  | 1.0 | 1500 | 0.0002 | - |
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
195
 
196
  ### Framework Versions
197
  - Python: 3.9.16
config_setfit.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "labels": [
3
  "complaints",
4
  "order tracking",
@@ -6,6 +7,5 @@
6
  "product discoveribility",
7
  "product faq",
8
  "product policy"
9
- ],
10
- "normalize_embeddings": false
11
  }
 
1
  {
2
+ "normalize_embeddings": false,
3
  "labels": [
4
  "complaints",
5
  "order tracking",
 
7
  "product discoveribility",
8
  "product faq",
9
  "product policy"
10
+ ]
 
11
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae03ac1345d3ba6c609f184a07acf7265b5deee425cd424ce18ec3f74561823b
3
  size 437967672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6422d3ea83098d1f7e94cc8aed3489a2e6a3990ee34cdd519a308c98e63356ee
3
  size 437967672
model_head.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c7f26962d0c6ba43552743b68ebd7babd714d75d7a6158192612125e28b2b8c
3
  size 38311
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3731e8ff606284061a188661326d908304d2514b60b7a453926fbb6f55e0f840
3
  size 38311