ierhon
/

neural-chatbot

ierhon committed on Jul 29, 2023

Commit

8ceb723

1 Parent(s): d12bf65

sleepy hon forgot how to use a tokenizer

Files changed (1) hide show

train.py CHANGED Viewed

@@ -33,7 +33,7 @@ X = [] # we're loading the training data into input X
 y = [] # and output y
 for line, key in enumerate(dset):
-    tokens = tokenizer.tokenize(key)
     X.append(numpy.array((list(tokens)+[0,]*inp_len)[:inp_len])) # refusing to use pad_sequences for an unspecified reason and creating the worst line of code
     output_array = np.zeros(dset_size)
     output_array[line] = 1 # 0 0 0 1 0 0 0 0 0, the neuron of the each line activates in the correct response

 y = [] # and output y
 for line, key in enumerate(dset):
+    tokens = tokenizer.texts_to_sequences([key,])[0]
     X.append(numpy.array((list(tokens)+[0,]*inp_len)[:inp_len])) # refusing to use pad_sequences for an unspecified reason and creating the worst line of code
     output_array = np.zeros(dset_size)
     output_array[line] = 1 # 0 0 0 1 0 0 0 0 0, the neuron of the each line activates in the correct response