fix: fix the ambiguous naming of "load_dataset"
Browse files
app.py
CHANGED
@@ -29,7 +29,7 @@ def get_tweet(data):
|
|
29 |
labels = [get_label(x['label']) for x in data]
|
30 |
return tweets, labels
|
31 |
|
32 |
-
def load_dataset():
|
33 |
dataset = load_dataset("dair-ai/emotion")
|
34 |
train = dataset['train']
|
35 |
val = dataset['validation']
|
@@ -37,7 +37,7 @@ def load_dataset():
|
|
37 |
return train, val, test
|
38 |
|
39 |
|
40 |
-
train, val, test = load_dataset()
|
41 |
tweets, labels = get_tweet(train)
|
42 |
tokenizer = Tokenizer(num_words=10000,oov_token='<UNK>')
|
43 |
tokenizer.fit_on_texts(tweets)
|
@@ -83,7 +83,7 @@ def load_model():
|
|
83 |
_ = model.evaluate(test_seq, test_labels)
|
84 |
i = random.randint(0, len(test_labels) - 1)
|
85 |
print('Sentence:', test_tweets[i])
|
86 |
-
print('Emotion:', index_to_class[test_labels[i]])
|
87 |
p = model.predict(np.expand_dims(test_seq[i],axis=0))[0]
|
88 |
pred_class = index_to_class[np.argmax(p).astype('uint8')]
|
89 |
|
|
|
29 |
labels = [get_label(x['label']) for x in data]
|
30 |
return tweets, labels
|
31 |
|
32 |
+
def get_train_val_test_sets():
|
33 |
dataset = load_dataset("dair-ai/emotion")
|
34 |
train = dataset['train']
|
35 |
val = dataset['validation']
|
|
|
37 |
return train, val, test
|
38 |
|
39 |
|
40 |
+
train, val, test = get_train_val_test_sets()
|
41 |
tweets, labels = get_tweet(train)
|
42 |
tokenizer = Tokenizer(num_words=10000,oov_token='<UNK>')
|
43 |
tokenizer.fit_on_texts(tweets)
|
|
|
83 |
_ = model.evaluate(test_seq, test_labels)
|
84 |
i = random.randint(0, len(test_labels) - 1)
|
85 |
print('Sentence:', test_tweets[i])
|
86 |
+
print('Emotion:', index_to_class[test_labels[i]])
|
87 |
p = model.predict(np.expand_dims(test_seq[i],axis=0))[0]
|
88 |
pred_class = index_to_class[np.argmax(p).astype('uint8')]
|
89 |
|