fatmacankara committed on
Commit
29503f2
·
1 Parent(s): 0b6d591

Update code/pdb_featureVector.py

Browse files
Files changed (1) hide show
  1. code/pdb_featureVector.py +12 -1
code/pdb_featureVector.py CHANGED
@@ -241,6 +241,17 @@ def pdb(input_set, mode, impute):
241
  structure = pdb_parser.get_structure(search, pdb_file_content)
242
  ppb = PPBuilder()
243
  pdb_data_list = pdb_data.split('\n')
 
 
 
 
 
 
 
 
 
 
 
244
  pdb_data_list = [i for i in pdb_data_list if i.startswith('DBREF')]
245
  pdb_data_list = [[list(filter(None,i.split(' '))) for j in i.split(' ') if j == 'UNP'] for i in pdb_data_list]
246
  pdb_data_list = [i for i in pdb_data_list if i != []]
@@ -272,7 +283,7 @@ def pdb(input_set, mode, impute):
272
  st.write(f"Sequence: {sequence}")
273
  pdb_fasta.at[index, 'pdbID'] = search
274
  pdb_fasta.at[index, 'chain'] = chain_id
275
- pdb_fasta.at[index, 'pdbSequence'] = str(sequence)
276
  pdb_info.at[index, 'uniprotID'] = ', '.join(up)
277
  pdb_info.at[index, 'pdbID'] = search
278
  pdb_info.at[index, 'chain'] = chain_id
 
241
  structure = pdb_parser.get_structure(search, pdb_file_content)
242
  ppb = PPBuilder()
243
  pdb_data_list = pdb_data.split('\n')
244
+ pdb_data_list_sequence = [i for i in pdb_data_list if i.startswith('SEQRES')]
245
+ pdb_data_list_sequence = [ list(filter(None,i.split(' '))) for i in pdb_data_list_sequence]
246
+ seqs = {}
247
+ for i in pdb_data_list_sequence:
248
+ if i[2] in seqs.keys():
249
+ seqs[i[2]] += i[4:]
250
+ else:
251
+ seqs[i[2]] = i[4:]
252
+ from Bio.PDB.Polypeptide import *
253
+ for key, val in seqs.items():
254
+ seqs[key] = ''.join([threeToOne(i) for i in val])
255
  pdb_data_list = [i for i in pdb_data_list if i.startswith('DBREF')]
256
  pdb_data_list = [[list(filter(None,i.split(' '))) for j in i.split(' ') if j == 'UNP'] for i in pdb_data_list]
257
  pdb_data_list = [i for i in pdb_data_list if i != []]
 
283
  st.write(f"Sequence: {sequence}")
284
  pdb_fasta.at[index, 'pdbID'] = search
285
  pdb_fasta.at[index, 'chain'] = chain_id
286
+ pdb_fasta.at[index, 'pdbSequence'] = str(seq[chain_id])
287
  pdb_info.at[index, 'uniprotID'] = ', '.join(up)
288
  pdb_info.at[index, 'pdbID'] = search
289
  pdb_info.at[index, 'chain'] = chain_id