Spaces:
Sleeping
Sleeping
Commit
·
0b6d591
1
Parent(s):
4c168c7
Update code/pdb_featureVector.py
Browse files
code/pdb_featureVector.py
CHANGED
|
@@ -244,6 +244,9 @@ def pdb(input_set, mode, impute):
|
|
| 244 |
pdb_data_list = [i for i in pdb_data_list if i.startswith('DBREF')]
|
| 245 |
pdb_data_list = [[list(filter(None,i.split(' '))) for j in i.split(' ') if j == 'UNP'] for i in pdb_data_list]
|
| 246 |
pdb_data_list = [i for i in pdb_data_list if i != []]
|
|
|
|
|
|
|
|
|
|
| 247 |
#pdb_data_list = [[list(filter(None,j)) for j in i] for i in pdb_data_list]
|
| 248 |
pdb_data_list = [[j[2] for j in i] for i in pdb_data_list]
|
| 249 |
pdb_data_list = [i[0] for i in pdb_data_list]
|
|
@@ -251,7 +254,7 @@ def pdb(input_set, mode, impute):
|
|
| 251 |
for pp in ppb.build_peptides(model):
|
| 252 |
sequence = pp.get_sequence()
|
| 253 |
st.write(sequence)
|
| 254 |
-
for chain in model:
|
| 255 |
chain_id = chain.get_id()
|
| 256 |
# Extract UniProt ID if available in the chain's annotations
|
| 257 |
uniprot_ids = fetch_uniprot_ids(search)
|
|
@@ -270,7 +273,7 @@ def pdb(input_set, mode, impute):
|
|
| 270 |
pdb_fasta.at[index, 'pdbID'] = search
|
| 271 |
pdb_fasta.at[index, 'chain'] = chain_id
|
| 272 |
pdb_fasta.at[index, 'pdbSequence'] = str(sequence)
|
| 273 |
-
pdb_info.at[index, 'uniprotID'] = ', '.join(
|
| 274 |
pdb_info.at[index, 'pdbID'] = search
|
| 275 |
pdb_info.at[index, 'chain'] = chain_id
|
| 276 |
pdb_info.at[index, 'resolution'] = resolution
|
|
@@ -278,7 +281,10 @@ def pdb(input_set, mode, impute):
|
|
| 278 |
|
| 279 |
print()
|
| 280 |
st.write()
|
|
|
|
| 281 |
st.write(pdb_info)
|
|
|
|
|
|
|
| 282 |
print('PDB file processing finished..')
|
| 283 |
for filename in list(Path(path_to_output_files / 'pdb_structures').glob("*")):
|
| 284 |
try:
|
|
|
|
| 244 |
pdb_data_list = [i for i in pdb_data_list if i.startswith('DBREF')]
|
| 245 |
pdb_data_list = [[list(filter(None,i.split(' '))) for j in i.split(' ') if j == 'UNP'] for i in pdb_data_list]
|
| 246 |
pdb_data_list = [i for i in pdb_data_list if i != []]
|
| 247 |
+
pdb_data_list_uniprot = [[j[6] for j in i] for i in pdb_data_list]
|
| 248 |
+
|
| 249 |
+
|
| 250 |
#pdb_data_list = [[list(filter(None,j)) for j in i] for i in pdb_data_list]
|
| 251 |
pdb_data_list = [[j[2] for j in i] for i in pdb_data_list]
|
| 252 |
pdb_data_list = [i[0] for i in pdb_data_list]
|
|
|
|
| 254 |
for pp in ppb.build_peptides(model):
|
| 255 |
sequence = pp.get_sequence()
|
| 256 |
st.write(sequence)
|
| 257 |
+
for chain, up in zip(model,pdb_data_list_uniprot ):
|
| 258 |
chain_id = chain.get_id()
|
| 259 |
# Extract UniProt ID if available in the chain's annotations
|
| 260 |
uniprot_ids = fetch_uniprot_ids(search)
|
|
|
|
| 273 |
pdb_fasta.at[index, 'pdbID'] = search
|
| 274 |
pdb_fasta.at[index, 'chain'] = chain_id
|
| 275 |
pdb_fasta.at[index, 'pdbSequence'] = str(sequence)
|
| 276 |
+
pdb_info.at[index, 'uniprotID'] = ', '.join(up)
|
| 277 |
pdb_info.at[index, 'pdbID'] = search
|
| 278 |
pdb_info.at[index, 'chain'] = chain_id
|
| 279 |
pdb_info.at[index, 'resolution'] = resolution
|
|
|
|
| 281 |
|
| 282 |
print()
|
| 283 |
st.write()
|
| 284 |
+
st.write('pdb_info')
|
| 285 |
st.write(pdb_info)
|
| 286 |
+
st.write('pdb_fasta')
|
| 287 |
+
st.write(pdb_fasta)
|
| 288 |
print('PDB file processing finished..')
|
| 289 |
for filename in list(Path(path_to_output_files / 'pdb_structures').glob("*")):
|
| 290 |
try:
|