fatmacankara commited on
Commit
0b6d591
·
1 Parent(s): 4c168c7

Update code/pdb_featureVector.py

Browse files
Files changed (1) hide show
  1. code/pdb_featureVector.py +8 -2
code/pdb_featureVector.py CHANGED
@@ -244,6 +244,9 @@ def pdb(input_set, mode, impute):
244
  pdb_data_list = [i for i in pdb_data_list if i.startswith('DBREF')]
245
  pdb_data_list = [[list(filter(None,i.split(' '))) for j in i.split(' ') if j == 'UNP'] for i in pdb_data_list]
246
  pdb_data_list = [i for i in pdb_data_list if i != []]
 
 
 
247
  #pdb_data_list = [[list(filter(None,j)) for j in i] for i in pdb_data_list]
248
  pdb_data_list = [[j[2] for j in i] for i in pdb_data_list]
249
  pdb_data_list = [i[0] for i in pdb_data_list]
@@ -251,7 +254,7 @@ def pdb(input_set, mode, impute):
251
  for pp in ppb.build_peptides(model):
252
  sequence = pp.get_sequence()
253
  st.write(sequence)
254
- for chain in model:
255
  chain_id = chain.get_id()
256
  # Extract UniProt ID if available in the chain's annotations
257
  uniprot_ids = fetch_uniprot_ids(search)
@@ -270,7 +273,7 @@ def pdb(input_set, mode, impute):
270
  pdb_fasta.at[index, 'pdbID'] = search
271
  pdb_fasta.at[index, 'chain'] = chain_id
272
  pdb_fasta.at[index, 'pdbSequence'] = str(sequence)
273
- pdb_info.at[index, 'uniprotID'] = ', '.join(uniprot_ids)
274
  pdb_info.at[index, 'pdbID'] = search
275
  pdb_info.at[index, 'chain'] = chain_id
276
  pdb_info.at[index, 'resolution'] = resolution
@@ -278,7 +281,10 @@ def pdb(input_set, mode, impute):
278
 
279
  print()
280
  st.write()
 
281
  st.write(pdb_info)
 
 
282
  print('PDB file processing finished..')
283
  for filename in list(Path(path_to_output_files / 'pdb_structures').glob("*")):
284
  try:
 
244
  pdb_data_list = [i for i in pdb_data_list if i.startswith('DBREF')]
245
  pdb_data_list = [[list(filter(None,i.split(' '))) for j in i.split(' ') if j == 'UNP'] for i in pdb_data_list]
246
  pdb_data_list = [i for i in pdb_data_list if i != []]
247
+ pdb_data_list_uniprot = [[j[6] for j in i] for i in pdb_data_list]
248
+
249
+
250
  #pdb_data_list = [[list(filter(None,j)) for j in i] for i in pdb_data_list]
251
  pdb_data_list = [[j[2] for j in i] for i in pdb_data_list]
252
  pdb_data_list = [i[0] for i in pdb_data_list]
 
254
  for pp in ppb.build_peptides(model):
255
  sequence = pp.get_sequence()
256
  st.write(sequence)
257
+ for chain, up in zip(model,pdb_data_list_uniprot ):
258
  chain_id = chain.get_id()
259
  # Extract UniProt ID if available in the chain's annotations
260
  uniprot_ids = fetch_uniprot_ids(search)
 
273
  pdb_fasta.at[index, 'pdbID'] = search
274
  pdb_fasta.at[index, 'chain'] = chain_id
275
  pdb_fasta.at[index, 'pdbSequence'] = str(sequence)
276
+ pdb_info.at[index, 'uniprotID'] = ', '.join(up)
277
  pdb_info.at[index, 'pdbID'] = search
278
  pdb_info.at[index, 'chain'] = chain_id
279
  pdb_info.at[index, 'resolution'] = resolution
 
281
 
282
  print()
283
  st.write()
284
+ st.write('pdb_info')
285
  st.write(pdb_info)
286
+ st.write('pdb_fasta')
287
+ st.write(pdb_fasta)
288
  print('PDB file processing finished..')
289
  for filename in list(Path(path_to_output_files / 'pdb_structures').glob("*")):
290
  try: