Spaces:

AI4PD
/

hexviz

Sleeping

aksell committed on May 19, 2023

Commit

db42d48

1 Parent(s): 53a7dc6

Calculate pct of total attention

Files changed (2) hide show

hexviz/attention.py CHANGED Viewed

@@ -299,6 +299,7 @@ def get_attention_pairs(
         top_n_values, top_n_indexes = torch.topk(attention_into_res, top_n)
         for res, attn_sum in zip(top_n_indexes, top_n_values):
-            top_residues.append((attn_sum.item(), chain_ids[i], res.item()))
     return attention_pairs, top_residues

         top_n_values, top_n_indexes = torch.topk(attention_into_res, top_n)
         for res, attn_sum in zip(top_n_indexes, top_n_values):
+            fraction_of_total_attention = attn_sum.item() / len(sequence)
+            top_residues.append((fraction_of_total_attention, chain_ids[i], res.item()))
     return attention_pairs, top_residues

hexviz/🧬Attention_Visualization.py CHANGED Viewed

@@ -264,15 +264,19 @@ Pick a PDB ID, layer and head to visualize attention from the selected protein l
 chain_dict = {f"{chain.id}": list(chain.get_residues()) for chain in list(structure.get_chains())}
 data = []
-for att_weight, chain, resi in top_residues:
     try:
         res = chain_dict[chain][resi]
     except KeyError:
         continue
-    el = (att_weight, f"{res.resname:3}{res.id[1]}({chain})")
     data.append(el)
-df = pd.DataFrame(data, columns=["Total attention to", "Residue"])
 st.markdown(
     f"The {n_highest_resis} residues (per chain) with the highest attention to them are labeled in the visualization and listed here:"
 )

 chain_dict = {f"{chain.id}": list(chain.get_residues()) for chain in list(structure.get_chains())}
 data = []
+for fraction_of_total_attention, chain, resi in top_residues:
     try:
         res = chain_dict[chain][resi]
     except KeyError:
         continue
+    pct_of_total_attention = round(fraction_of_total_attention * 100, 3)
+    el = (pct_of_total_attention, f"{res.resname:3}{res.id[1]}({chain})")
     data.append(el)
+df = pd.DataFrame(data, columns=["% of total attention", "Residue"])
+df = df.style.format(
+    {"% of total attention": "{:.3f}"}  # Set 3 decimal places for "% of total attention"
+)
 st.markdown(
     f"The {n_highest_resis} residues (per chain) with the highest attention to them are labeled in the visualization and listed here:"
 )