Spaces:
Sleeping
Sleeping
Commit
·
a83bdd0
1
Parent(s):
a5eb586
Update code/process_input.py
Browse files
- code/process_input.py (+4 -0)
code/process_input.py
CHANGED
|
@@ -5,11 +5,13 @@ def clean_data(input_set):
|
|
| 5 |
try:
|
| 6 |
if ',' in input_set:
|
| 7 |
input_set = [i.strip() for i in input_set.split(',')]
|
|
|
|
| 8 |
for i in input_set:
|
| 9 |
data = data.append(pd.Series([j.strip() for j in i.split('-')]), ignore_index=True)
|
| 10 |
data.columns = ['uniprotID', 'wt', 'pos', 'mut']
|
| 11 |
elif '\t' in input_set:
|
| 12 |
input_set = [i.strip() for i in input_set.split('\t')]
|
|
|
|
| 13 |
for i in input_set:
|
| 14 |
data = data.append(pd.Series([j.strip() for j in i.split('-')]), ignore_index=True)
|
| 15 |
data.columns = ['uniprotID', 'wt', 'pos', 'mut']
|
|
@@ -36,6 +38,8 @@ def clean_data(input_set):
|
|
| 36 |
data.at[i, 'datapoint'] = data.at[i, 'uniprotID'] + data.at[i, 'wt'] + str(data.at[i, 'pos']) + data.at[i, 'mut']
|
| 37 |
|
| 38 |
data = data.astype(str)
|
|
|
|
|
|
|
| 39 |
return data
|
| 40 |
except ValueError:
|
| 41 |
st.write('Your input is in the wrong format. Please see the example.')
|
|
|
|
| 5 |
try:
|
| 6 |
if ',' in input_set:
|
| 7 |
input_set = [i.strip() for i in input_set.split(',')]
|
| 8 |
+
initial_len = len(input_set)
|
| 9 |
for i in input_set:
|
| 10 |
data = data.append(pd.Series([j.strip() for j in i.split('-')]), ignore_index=True)
|
| 11 |
data.columns = ['uniprotID', 'wt', 'pos', 'mut']
|
| 12 |
elif '\t' in input_set:
|
| 13 |
input_set = [i.strip() for i in input_set.split('\t')]
|
| 14 |
+
initial_len = len(input_set)
|
| 15 |
for i in input_set:
|
| 16 |
data = data.append(pd.Series([j.strip() for j in i.split('-')]), ignore_index=True)
|
| 17 |
data.columns = ['uniprotID', 'wt', 'pos', 'mut']
|
|
|
|
| 38 |
data.at[i, 'datapoint'] = data.at[i, 'uniprotID'] + data.at[i, 'wt'] + str(data.at[i, 'pos']) + data.at[i, 'mut']
|
| 39 |
|
| 40 |
data = data.astype(str)
|
| 41 |
+
if initial_len != len(data):
|
| 42 |
+
print(f'{initial_len- len(data)} of {initial_len} datapoints is omitted. Check your input.')
|
| 43 |
return data
|
| 44 |
except ValueError:
|
| 45 |
st.write('Your input is in the wrong format. Please see the example.')
|