Use model_settings.py
train.py CHANGED
@@ -5,6 +5,7 @@ from keras.models import Sequential
 from keras.layers import Embedding, Dense, Dropout, Flatten, PReLU
 from keras.preprocessing.text import Tokenizer
 from keras_self_attention import SeqSelfAttention, SeqWeightedAttention
+from model_settings import *


 with open("dataset.json", "r") as f:  # TODO: move the outputs into a separate file, so it would be "key": 0, "key2": 1 etc
@@ -14,7 +15,6 @@ dset_size = len(dset)

 tokenizer = Tokenizer()  # a tokenizer is a thing to split text into words, it might have some other stuff like making all the letters lowercase, etc.
 tokenizer.fit_on_texts(list(dset.keys()))

-emb_size = 128  # how big are the word vectors in the input (how much information can be fit into one word)
 vocab_size = len(tokenizer.get_vocabulary())
 inp_len = 10  # limit of the input length, after 10 words the

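For context, the emb_size constant removed from train.py presumably now lives in the new model_settings.py that this commit imports. A minimal sketch of what that file likely contains, based only on the value dropped in this diff (the filename is confirmed by the import; any settings beyond emb_size would be an assumption):

# model_settings.py -- hypothetical sketch; only emb_size is confirmed by this diff
emb_size = 128  # how big are the word vectors in the input (how much information can be fit into one word)

Because train.py uses `from model_settings import *`, the name emb_size is pulled into its namespace unchanged, so the rest of the training script keeps working without further edits; vocab_size and inp_len remain defined in train.py per this diff.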