Training in progress epoch 0

Browse files

Files changed (4)

README.md +5 -149
config.json +1 -1
tf_model.h5 +1 -1
tokenizer_config.json +4 -0

README.md CHANGED

@@ -1,6 +1,4 @@
 ---
-license: apache-2.0
-base_model: t5-small
 tags:
 - generated_from_keras_callback
 model-index:
@@ -13,11 +11,11 @@ probably proofread and complete it, then remove this comment. -->
 # tarsssss/eng-jagoy-t5-002
-This model is a fine-tuned version of [t5-small](https://huggingface.co/t5-small) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Train Loss: 4.7104
-- Validation Loss: 5.2694
-- Epoch: 142
 ## Model description
@@ -43,149 +41,7 @@ The following hyperparameters were used during training:
 | Train Loss | Validation Loss | Epoch |
 |:----------:|:---------------:|:-----:|
-| 7.9230     | 7.4880          | 0     |
-| 7.4261     | 7.2365          | 1     |
-| 7.2130     | 7.0830          | 2     |
-| 7.0761     | 6.9717          | 3     |
-| 6.9678     | 6.8724          | 4     |
-| 6.8904     | 6.7979          | 5     |
-| 6.8053     | 6.7267          | 6     |
-| 6.7518     | 6.6660          | 7     |
-| 6.6899     | 6.6093          | 8     |
-| 6.6337     | 6.5595          | 9     |
-| 6.5867     | 6.5166          | 10    |
-| 6.5419     | 6.4748          | 11    |
-| 6.5020     | 6.4362          | 12    |
-| 6.4560     | 6.3967          | 13    |
-| 6.4189     | 6.3589          | 14    |
-| 6.3782     | 6.3209          | 15    |
-| 6.3324     | 6.2874          | 16    |
-| 6.2983     | 6.2530          | 17    |
-| 6.2466     | 6.2201          | 18    |
-| 6.2155     | 6.1900          | 19    |
-| 6.1906     | 6.1594          | 20    |
-| 6.1562     | 6.1335          | 21    |
-| 6.1244     | 6.1083          | 22    |
-| 6.1023     | 6.0840          | 23    |
-| 6.0687     | 6.0593          | 24    |
-| 6.0526     | 6.0386          | 25    |
-| 6.0281     | 6.0160          | 26    |
-| 5.9981     | 5.9931          | 27    |
-| 5.9756     | 5.9769          | 28    |
-| 5.9500     | 5.9537          | 29    |
-| 5.9325     | 5.9356          | 30    |
-| 5.9008     | 5.9193          | 31    |
-| 5.8793     | 5.9051          | 32    |
-| 5.8718     | 5.8847          | 33    |
-| 5.8474     | 5.8641          | 34    |
-| 5.8370     | 5.8531          | 35    |
-| 5.8135     | 5.8424          | 36    |
-| 5.7981     | 5.8243          | 37    |
-| 5.7759     | 5.8142          | 38    |
-| 5.7582     | 5.8050          | 39    |
-| 5.7482     | 5.7910          | 40    |
-| 5.7354     | 5.7740          | 41    |
-| 5.7066     | 5.7762          | 42    |
-| 5.6981     | 5.7576          | 43    |
-| 5.6797     | 5.7470          | 44    |
-| 5.6631     | 5.7400          | 45    |
-| 5.6511     | 5.7255          | 46    |
-| 5.6433     | 5.7211          | 47    |
-| 5.6196     | 5.7050          | 48    |
-| 5.6173     | 5.6980          | 49    |
-| 5.5903     | 5.6902          | 50    |
-| 5.5723     | 5.6808          | 51    |
-| 5.5701     | 5.6754          | 52    |
-| 5.5537     | 5.6724          | 53    |
-| 5.5478     | 5.6545          | 54    |
-| 5.5182     | 5.6566          | 55    |
-| 5.5112     | 5.6417          | 56    |
-| 5.4994     | 5.6290          | 57    |
-| 5.4895     | 5.6216          | 58    |
-| 5.4610     | 5.6147          | 59    |
-| 5.4567     | 5.6035          | 60    |
-| 5.4433     | 5.5957          | 61    |
-| 5.4386     | 5.5855          | 62    |
-| 5.4253     | 5.5851          | 63    |
-| 5.4214     | 5.5804          | 64    |
-| 5.4117     | 5.5714          | 65    |
-| 5.3940     | 5.5632          | 66    |
-| 5.3756     | 5.5616          | 67    |
-| 5.3668     | 5.5540          | 68    |
-| 5.3483     | 5.5465          | 69    |
-| 5.3523     | 5.5380          | 70    |
-| 5.3367     | 5.5371          | 71    |
-| 5.3398     | 5.5187          | 72    |
-| 5.3236     | 5.5241          | 73    |
-| 5.3003     | 5.5139          | 74    |
-| 5.3053     | 5.5093          | 75    |
-| 5.2933     | 5.5120          | 76    |
-| 5.2735     | 5.5064          | 77    |
-| 5.2715     | 5.4971          | 78    |
-| 5.2476     | 5.4956          | 79    |
-| 5.2534     | 5.4750          | 80    |
-| 5.2274     | 5.4845          | 81    |
-| 5.2343     | 5.4761          | 82    |
-| 5.2161     | 5.4686          | 83    |
-| 5.1994     | 5.4656          | 84    |
-| 5.1993     | 5.4551          | 85    |
-| 5.1786     | 5.4680          | 86    |
-| 5.1800     | 5.4557          | 87    |
-| 5.1552     | 5.4460          | 88    |
-| 5.1547     | 5.4377          | 89    |
-| 5.1450     | 5.4365          | 90    |
-| 5.1429     | 5.4228          | 91    |
-| 5.1303     | 5.4245          | 92    |
-| 5.1164     | 5.4177          | 93    |
-| 5.1200     | 5.4135          | 94    |
-| 5.1115     | 5.4120          | 95    |
-| 5.0928     | 5.3963          | 96    |
-| 5.0825     | 5.3945          | 97    |
-| 5.0760     | 5.4078          | 98    |
-| 5.0733     | 5.3935          | 99    |
-| 5.0611     | 5.3944          | 100   |
-| 5.0457     | 5.3882          | 101   |
-| 5.0296     | 5.3774          | 102   |
-| 5.0311     | 5.3812          | 103   |
-| 5.0189     | 5.3756          | 104   |
-| 5.0076     | 5.3756          | 105   |
-| 5.0037     | 5.3751          | 106   |
-| 4.9992     | 5.3582          | 107   |
-| 4.9774     | 5.3603          | 108   |
-| 4.9789     | 5.3679          | 109   |
-| 4.9717     | 5.3566          | 110   |
-| 4.9684     | 5.3489          | 111   |
-| 4.9578     | 5.3454          | 112   |
-| 4.9519     | 5.3457          | 113   |
-| 4.9327     | 5.3380          | 114   |
-| 4.9413     | 5.3324          | 115   |
-| 4.9093     | 5.3461          | 116   |
-| 4.9126     | 5.3269          | 117   |
-| 4.9096     | 5.3283          | 118   |
-| 4.8899     | 5.3252          | 119   |
-| 4.8936     | 5.3227          | 120   |
-| 4.8873     | 5.3213          | 121   |
-| 4.8657     | 5.3216          | 122   |
-| 4.8581     | 5.3195          | 123   |
-| 4.8619     | 5.3218          | 124   |
-| 4.8534     | 5.3062          | 125   |
-| 4.8466     | 5.3037          | 126   |
-| 4.8239     | 5.3075          | 127   |
-| 4.8287     | 5.3052          | 128   |
-| 4.8165     | 5.2992          | 129   |
-| 4.8136     | 5.2968          | 130   |
-| 4.8005     | 5.2902          | 131   |
-| 4.7898     | 5.2949          | 132   |
-| 4.7949     | 5.2858          | 133   |
-| 4.7786     | 5.2868          | 134   |
-| 4.7706     | 5.2928          | 135   |
-| 4.7579     | 5.2866          | 136   |
-| 4.7477     | 5.2772          | 137   |
-| 4.7517     | 5.2827          | 138   |
-| 4.7391     | 5.2849          | 139   |
-| 4.7268     | 5.2823          | 140   |
-| 4.7275     | 5.2832          | 141   |
-| 4.7104     | 5.2694          | 142   |
 ### Framework versions

 ---
 tags:
 - generated_from_keras_callback
 model-index:
 # tarsssss/eng-jagoy-t5-002
+This model was trained from scratch on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Train Loss: 4.8828
+- Validation Loss: 4.4230
+- Epoch: 0
 ## Model description
 | Train Loss | Validation Loss | Epoch |
 |:----------:|:---------------:|:-----:|
+| 4.8828     | 4.4230          | 0     |
 ### Framework versions

config.json CHANGED

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "t5-small",
   "architectures": [
     "T5ForConditionalGeneration"
   ],

 {
+  "_name_or_path": "./eng-jagoy-t5-002",
   "architectures": [
     "T5ForConditionalGeneration"
   ],

tf_model.h5 CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b85344689c0acb3d4ede8ce58079a92f9af7d98bdbd95ea1ff7158e9e3f9ba25
 size 373902664

 version https://git-lfs.github.com/spec/v1
+oid sha256:fecdab4ca7e83d87db3bc3aa082cbfdabf14dbad513f2e95b68884523e3651ba
 size 373902664

tokenizer_config.json CHANGED

@@ -104,8 +104,12 @@
   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 100,
   "model_max_length": 512,
   "pad_token": "<pad>",
   "tokenizer_class": "T5Tokenizer",
   "unk_token": "<unk>"
 }

   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 100,
+  "max_length": 128,
   "model_max_length": 512,
   "pad_token": "<pad>",
+  "stride": 0,
   "tokenizer_class": "T5Tokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
   "unk_token": "<unk>"
 }