nishantguvvada committed
Commit: efb91fe
Parent: 2f89c4d

Update app.py

Files changed (1): app.py (+6, -7)
app.py CHANGED
@@ -1,4 +1,5 @@
 import streamlit as st
+import pickle
 import tensorflow as tf
 import cv2
 import numpy as np
@@ -64,15 +65,13 @@ def standardize(inputs):
 )
 
 # Choose the most frequent words from the vocabulary & remove punctuation etc.
-tokenizer = TextVectorization(
-    max_tokens=VOCAB_SIZE,
-    standardize=standardize,
-    output_sequence_length=MAX_CAPTION_LEN,
-)
+file = open('./tokenizer.txt', 'rb')
+tokenizer = pickle.load(file)
+
 
 # Lookup table: Word -> Index
 word_to_index = StringLookup(
-    mask_token="", vocabulary=tokenizer.get_vocabulary()
+    mask_token="", vocabulary=tokenizer
 )
 
 
@@ -102,7 +101,7 @@ def predict_caption(file):
     chosen_id = tf.random.categorical([top_probs], 1)[0].numpy()
     predicted_id = top_idxs.numpy()[chosen_id][0]
 
-    result.append(tokenizer.get_vocabulary()[predicted_id])
+    result.append(tokenizer[predicted_id])
 
     if predicted_id == word_to_index("<end>"):
         return img, result