Dekode committed on
Commit
78127df
·
verified ·
1 Parent(s): 5ab3219

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -2
app.py CHANGED
@@ -82,7 +82,7 @@ def initiate_model(config, device):
82
  model = build_transformer(tokenizer_src.get_vocab_size(), tokenizer_tgt.get_vocab_size(), config["seq_len"], config['seq_len'], d_model=config['d_model']).to(device)
83
 
84
  model_filename = latest_weights_file_path(config)
85
- state = torch.load(model_filename, map_location=torch.device('cpu'))
86
  model.load_state_dict(state['model_state_dict'])
87
  return model, tokenizer_src, tokenizer_tgt
88
 
@@ -151,7 +151,12 @@ def main():
151
  st.write('Output:', ' '.join(decoder_input_tokens))
152
  st.write('Translated:', output)
153
  st.write('Attention Visualization')
154
- st.write(get_all_attention_maps(attn_type, layers, heads, row_tokens, col_tokens, max_sentence_len, model))
 
 
 
 
 
155
  else:
156
  st.write('Enter a sentence to visualize the attention of the model')
157
 
 
82
  model = build_transformer(tokenizer_src.get_vocab_size(), tokenizer_tgt.get_vocab_size(), config["seq_len"], config['seq_len'], d_model=config['d_model']).to(device)
83
 
84
  model_filename = latest_weights_file_path(config)
85
+ state = torch.load(model_filename)
86
  model.load_state_dict(state['model_state_dict'])
87
  return model, tokenizer_src, tokenizer_tgt
88
 
 
151
  st.write('Output:', ' '.join(decoder_input_tokens))
152
  st.write('Translated:', output)
153
  st.write('Attention Visualization')
154
+ if attn_type == 'encoder':
155
+ st.write(get_all_attention_maps(attn_type, layers, heads, row_tokens, row_tokens, max_sentence_len, model))
156
+ elif attn_type == 'decoder':
157
+ st.write(get_all_attention_maps(attn_type, layers, heads, col_tokens, col_tokens, max_sentence_len, model))
158
+ elif attn_type == 'encoder-decoder':
159
+ st.write(get_all_attention_maps(attn_type, layers, heads, row_tokens, col_tokens, max_sentence_len, model))
160
  else:
161
  st.write('Enter a sentence to visualize the attention of the model')
162