aiqcamp commited on
Commit
25d992f
ยท
verified ยท
1 Parent(s): 1b8d3ac

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +193 -0
app.py CHANGED
@@ -66,6 +66,9 @@ client = OpenAI(
66
  ds = load_dataset("lamm-mit/protein_secondary_structure_from_PDB",
67
  token=ACCESS_TOKEN)
68
 
 
 
 
69
  def respond(
70
  message,
71
  history,
@@ -796,6 +799,157 @@ def combined_generation(name, strength, flexibility, speed, defense, size, abili
796
  None
797
  )
798
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
799
  with gr.Blocks(theme='ParityError/Interstellar') as demo:
800
  with gr.Row():
801
  with gr.Column(scale=1):
@@ -1172,7 +1326,46 @@ with gr.Blocks(theme='ParityError/Interstellar') as demo:
1172
  ]
1173
  )
1174
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1175
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1176
  # ์ฑ—๋ด‡ ์‘๋‹ต์— ๋”ฐ๋ฅธ ๊ฒฐ๊ณผ ์—…๋ฐ์ดํŠธ
1177
  msg.submit(
1178
  update_protein_display,
 
66
  ds = load_dataset("lamm-mit/protein_secondary_structure_from_PDB",
67
  token=ACCESS_TOKEN)
68
 
69
+ current_protein_result = None
70
+
71
+
72
  def respond(
73
  message,
74
  history,
 
799
  None
800
  )
801
 
802
+
803
+ def process_chat_and_generate(message, history):
804
+ try:
805
+ # 1. ํ”„๋กฌํ”„ํŠธ ๋ถ„์„ ๋ฐ ํŒŒ๋ผ๋ฏธํ„ฐ ์„ค์ •
806
+ analysis = analyze_prompt(message)
807
+ similar_structures = search_protein_data(analysis, ds)
808
+ params = extract_parameters(analysis, similar_structures)
809
+
810
+ # 2. ๋‹จ๋ฐฑ์งˆ ์ƒ์„ฑ
811
+ generator = protein_diffusion_model(
812
+ sequence=None,
813
+ seq_len=params['sequence_length'],
814
+ helix_bias=params['helix_bias'],
815
+ strand_bias=params['strand_bias'],
816
+ loop_bias=params['loop_bias'],
817
+ secondary_structure=None,
818
+ aa_bias=None,
819
+ aa_bias_potential=None,
820
+ num_steps="25",
821
+ noise="normal",
822
+ hydrophobic_target_score=str(params['hydrophobic_target_score']),
823
+ hydrophobic_potential="2",
824
+ contigs=None,
825
+ pssm=None,
826
+ seq_mask=None,
827
+ str_mask=None,
828
+ rewrite_pdb=None
829
+ )
830
+
831
+ # 3. ์ƒ์„ฑ ๊ฒฐ๊ณผ ๊ฐ€์ ธ์˜ค๊ธฐ
832
+ output_seq, output_pdb, structure_view, plddt_plot = next(generator)
833
+
834
+ # 4. ์„ค๋ช… ์ƒ์„ฑ
835
+ explanation = f"""
836
+ ์š”์ฒญํ•˜์‹  ๊ธฐ๋Šฅ์— ๋งž๋Š” ๋‹จ๋ฐฑ์งˆ์„ ์ƒ์„ฑํ–ˆ์Šต๋‹ˆ๋‹ค:
837
+
838
+ ๋ถ„์„๋œ ์š”๊ตฌ์‚ฌํ•ญ:
839
+ {analysis}
840
+
841
+ ์„ค๊ณ„๋œ ๊ตฌ์กฐ์  ํŠน์ง•:
842
+ - ๊ธธ์ด: {params['sequence_length']} ์•„๋ฏธ๋…ธ์‚ฐ
843
+ - ์•ŒํŒŒ ํ—ฌ๋ฆญ์Šค ๋น„์œจ: {params['helix_bias']*100:.1f}%
844
+ - ๋ฒ ํƒ€ ์‹œํŠธ ๋น„์œจ: {params['strand_bias']*100:.1f}%
845
+ - ๋ฃจํ”„ ๊ตฌ์กฐ ๋น„์œจ: {params['loop_bias']*100:.1f}%
846
+ - ์†Œ์ˆ˜์„ฑ ์ ์ˆ˜: {params['hydrophobic_target_score']}
847
+ """
848
+
849
+ # 5. ์ฑ—๋ด‡ ํžˆ์Šคํ† ๋ฆฌ ์—…๋ฐ์ดํŠธ
850
+ new_history = history + [
851
+ {"role": "user", "content": message},
852
+ {"role": "assistant", "content": explanation}
853
+ ]
854
+
855
+ # 6. ๋ชจ๋“  ๊ฒฐ๊ณผ ๋ฐ˜ํ™˜
856
+ return (
857
+ new_history, # ์ฑ—๋ด‡ ํžˆ์Šคํ† ๋ฆฌ
858
+ create_radar_chart(calculate_hero_stats(params)), # ๋Šฅ๋ ฅ์น˜ ์ฐจํŠธ
859
+ explanation, # ์„ค๋ช…
860
+ output_seq, # ๋‹จ๋ฐฑ์งˆ ์„œ์—ด
861
+ output_pdb, # PDB ํŒŒ์ผ
862
+ structure_view, # 3D ๊ตฌ์กฐ
863
+ plddt_plot # ์‹ ๋ขฐ๋„ ํ”Œ๋กฏ
864
+ )
865
+
866
+ except Exception as e:
867
+ print(f"Error in process_chat_and_generate: {str(e)}")
868
+ return (
869
+ history + [
870
+ {"role": "user", "content": message},
871
+ {"role": "assistant", "content": f"์˜ค๋ฅ˜๊ฐ€ ๋ฐœ์ƒํ–ˆ์Šต๋‹ˆ๋‹ค: {str(e)}"}
872
+ ],
873
+ None, None, None, None, None, None
874
+ )
875
+
876
+ def extract_keywords(analysis):
877
+ """๋ถ„์„ ํ…์ŠคํŠธ์—์„œ ํ‚ค์›Œ๋“œ ์ถ”์ถœ"""
878
+ try:
879
+ # ๊ธฐ๋ณธ ํ‚ค์›Œ๋“œ ์ถ”์ถœ
880
+ keywords = []
881
+ # ์ฃผ์š” ๊ธฐ๋Šฅ ํ‚ค์›Œ๋“œ
882
+ if "์น˜๋ฃŒ" in analysis: keywords.extend(["therapeutic", "binding"])
883
+ if "๊ฒฐํ•ฉ" in analysis: keywords.extend(["binding", "interaction"])
884
+ if "์ด‰๋งค" in analysis: keywords.extend(["enzyme", "catalytic"])
885
+
886
+ # ํ™˜๊ฒฝ ํ‚ค์›Œ๋“œ
887
+ if "๋ง‰" in analysis: keywords.extend(["membrane", "transmembrane"])
888
+ if "์ˆ˜์šฉ์„ฑ" in analysis: keywords.extend(["soluble", "hydrophilic"])
889
+ if "์†Œ์ˆ˜์„ฑ" in analysis: keywords.extend(["hydrophobic"])
890
+
891
+ # ๊ตฌ์กฐ ํ‚ค์›Œ๋“œ
892
+ if "์•ŒํŒŒ" in analysis or "๋‚˜์„ " in analysis: keywords.append("helix")
893
+ if "๋ฒ ํƒ€" in analysis or "์‹œํŠธ" in analysis: keywords.append("sheet")
894
+ if "๋ฃจํ”„" in analysis: keywords.append("loop")
895
+
896
+ return list(set(keywords)) # ์ค‘๋ณต ์ œ๊ฑฐ
897
+ except Exception as e:
898
+ print(f"ํ‚ค์›Œ๋“œ ์ถ”์ถœ ์ค‘ ์˜ค๋ฅ˜: {str(e)}")
899
+ return []
900
+
901
+ def calculate_similarity(keywords, entry):
902
+ """ํ‚ค์›Œ๋“œ์™€ ๋ฐ์ดํ„ฐ์…‹ ํ•ญ๋ชฉ ๊ฐ„์˜ ์œ ์‚ฌ๋„ ๊ณ„์‚ฐ"""
903
+ try:
904
+ score = 0
905
+ # ์‹œํ€€์Šค ํŠน์„ฑ ๊ฒ€์‚ฌ
906
+ sequence = entry['sequence'].lower()
907
+ for keyword in keywords:
908
+ if keyword in entry.get('description', '').lower():
909
+ score += 2
910
+ if keyword in sequence:
911
+ score += 1
912
+ if 'secondary_structure' in entry:
913
+ if keyword in ['helix'] and 'H' in entry['secondary_structure']:
914
+ score += 1
915
+ if keyword in ['sheet'] and 'E' in entry['secondary_structure']:
916
+ score += 1
917
+ if keyword in ['loop'] and 'L' in entry['secondary_structure']:
918
+ score += 1
919
+ return score
920
+ except Exception as e:
921
+ print(f"์œ ์‚ฌ๋„ ๊ณ„์‚ฐ ์ค‘ ์˜ค๋ฅ˜: {str(e)}")
922
+ return 0
923
+
924
+ def extract_parameters_from_chat(chat_response):
925
+ """์ฑ—๋ด‡ ์‘๋‹ต์—์„œ ํŒŒ๋ผ๋ฏธํ„ฐ ์ถ”์ถœ"""
926
+ try:
927
+ params = {
928
+ 'sequence_length': 100,
929
+ 'helix_bias': 0.02,
930
+ 'strand_bias': 0.02,
931
+ 'loop_bias': 0.1,
932
+ 'hydrophobic_target_score': 0
933
+ }
934
+
935
+ # ์‘๋‹ต ํ…์ŠคํŠธ์—์„œ ๊ฐ’ ์ถ”์ถœ
936
+ if "๊ธธ์ด:" in chat_response:
937
+ length_match = re.search(r'๊ธธ์ด: (\d+)', chat_response)
938
+ if length_match:
939
+ params['sequence_length'] = int(length_match.group(1))
940
+
941
+ if "์•ŒํŒŒ ํ—ฌ๋ฆญ์Šค ๋น„์œจ:" in chat_response:
942
+ helix_match = re.search(r'์•ŒํŒŒ ํ—ฌ๋ฆญ์Šค ๋น„์œจ: ([\d.]+)', chat_response)
943
+ if helix_match:
944
+ params['helix_bias'] = float(helix_match.group(1)) / 100
945
+
946
+ # ๋‚˜๋จธ์ง€ ํŒŒ๋ผ๋ฏธํ„ฐ๋„ ์œ ์‚ฌํ•˜๊ฒŒ ์ถ”์ถœ
947
+
948
+ return params
949
+ except Exception as e:
950
+ print(f"ํŒŒ๋ผ๋ฏธํ„ฐ ์ถ”์ถœ ์ค‘ ์˜ค๋ฅ˜: {str(e)}")
951
+ return None
952
+
953
  with gr.Blocks(theme='ParityError/Interstellar') as demo:
954
  with gr.Row():
955
  with gr.Column(scale=1):
 
1326
  ]
1327
  )
1328
 
1329
+ # ์ด๋ฒคํŠธ ํ•ธ๋“ค๋Ÿฌ ์—ฐ๊ฒฐ
1330
+ msg.submit(
1331
+ fn=process_chat_and_generate,
1332
+ inputs=[msg, chatbot],
1333
+ outputs=[
1334
+ chatbot,
1335
+ hero_stats,
1336
+ hero_description,
1337
+ output_seq,
1338
+ output_pdb,
1339
+ output_viewer,
1340
+ plddt_plot
1341
+ ]
1342
+ )
1343
 
1344
+ submit_btn.click(
1345
+ fn=process_chat_and_generate,
1346
+ inputs=[msg, chatbot],
1347
+ outputs=[
1348
+ chatbot,
1349
+ hero_stats,
1350
+ hero_description,
1351
+ output_seq,
1352
+ output_pdb,
1353
+ output_viewer,
1354
+ plddt_plot
1355
+ ]
1356
+ )
1357
+
1358
+ # ์ฑ„ํŒ… ๋‚ด์šฉ ์ง€์šฐ๊ธฐ
1359
+ clear.click(
1360
+ lambda: (None, None, None, None, None, None, None),
1361
+ None,
1362
+ [chatbot, hero_stats, hero_description, output_seq, output_pdb, output_viewer, plddt_plot],
1363
+ queue=False
1364
+ )
1365
+
1366
+
1367
+
1368
+
1369
  # ์ฑ—๋ด‡ ์‘๋‹ต์— ๋”ฐ๋ฅธ ๊ฒฐ๊ณผ ์—…๋ฐ์ดํŠธ
1370
  msg.submit(
1371
  update_protein_display,