Trained the model with a better BERT model and more epochs
Browse files
notebooks/classify_sentiment_with_bert.ipynb
CHANGED
@@ -191,7 +191,7 @@
|
|
191 |
"source": [
|
192 |
"#@title Choose a BERT model to fine-tune\n",
|
193 |
"\n",
|
194 |
-
"bert_model_name = 'small_bert/bert_en_uncased_L-
|
195 |
"\n",
|
196 |
"map_name_to_handle = {\n",
|
197 |
" 'bert_en_uncased_L-12_H-768_A-12':\n",
|
@@ -467,7 +467,7 @@
|
|
467 |
},
|
468 |
"outputs": [],
|
469 |
"source": [
|
470 |
-
"epochs =
|
471 |
"steps_per_epoch = len(train_ds)\n",
|
472 |
"num_train_steps = steps_per_epoch * epochs\n",
|
473 |
"num_warmup_steps = int(0.1*num_train_steps)\n",
|
|
|
191 |
"source": [
|
192 |
"#@title Choose a BERT model to fine-tune\n",
|
193 |
"\n",
|
194 |
+
"bert_model_name = 'small_bert/bert_en_uncased_L-10_H-512_A-8' #@param [\"bert_en_uncased_L-12_H-768_A-12\", \"bert_en_cased_L-12_H-768_A-12\", \"bert_multi_cased_L-12_H-768_A-12\", \"small_bert/bert_en_uncased_L-2_H-128_A-2\", \"small_bert/bert_en_uncased_L-2_H-256_A-4\", \"small_bert/bert_en_uncased_L-2_H-512_A-8\", \"small_bert/bert_en_uncased_L-2_H-768_A-12\", \"small_bert/bert_en_uncased_L-4_H-128_A-2\", \"small_bert/bert_en_uncased_L-4_H-256_A-4\", \"small_bert/bert_en_uncased_L-4_H-512_A-8\", \"small_bert/bert_en_uncased_L-4_H-768_A-12\", \"small_bert/bert_en_uncased_L-6_H-128_A-2\", \"small_bert/bert_en_uncased_L-6_H-256_A-4\", \"small_bert/bert_en_uncased_L-6_H-512_A-8\", \"small_bert/bert_en_uncased_L-6_H-768_A-12\", \"small_bert/bert_en_uncased_L-8_H-128_A-2\", \"small_bert/bert_en_uncased_L-8_H-256_A-4\", \"small_bert/bert_en_uncased_L-8_H-512_A-8\", \"small_bert/bert_en_uncased_L-8_H-768_A-12\", \"small_bert/bert_en_uncased_L-10_H-128_A-2\", \"small_bert/bert_en_uncased_L-10_H-256_A-4\", \"small_bert/bert_en_uncased_L-10_H-512_A-8\", \"small_bert/bert_en_uncased_L-10_H-768_A-12\", \"small_bert/bert_en_uncased_L-12_H-128_A-2\", \"small_bert/bert_en_uncased_L-12_H-256_A-4\", \"small_bert/bert_en_uncased_L-12_H-512_A-8\", \"small_bert/bert_en_uncased_L-12_H-768_A-12\", \"albert_en_base\", \"electra_small\", \"electra_base\", \"experts_pubmed\", \"experts_wiki_books\", \"talking-heads_base\"]\n",
|
195 |
"\n",
|
196 |
"map_name_to_handle = {\n",
|
197 |
" 'bert_en_uncased_L-12_H-768_A-12':\n",
|
|
|
467 |
},
|
468 |
"outputs": [],
|
469 |
"source": [
|
470 |
+
"epochs = 5\n",
|
471 |
"steps_per_epoch = len(train_ds)\n",
|
472 |
"num_train_steps = steps_per_epoch * epochs\n",
|
473 |
"num_warmup_steps = int(0.1*num_train_steps)\n",
|