clsi_profile: clsi_profile.py comparison

comparison clsi_profile.py @ 5:3c27e5c2a8e9 draft

"planemo upload for repository https://github.com/rakesh4osdd/asist/tree/master commit d4b81c15919b4b87d215eaf1b792c8f251665647"

author	rakesh4osdd
date	Tue, 29 Jun 2021 12:58:49 +0000
parents	2a5861818faf
children

comparison

equal deleted inserted replaced

-:2a5861818faf
+:3c27e5c2a8e9
 #!/usr/bin/env python
 # coding: utf-8
-# In[115]:
+# In[7]:
 # ASIST module2 | map AST result to the CLSI breakpoints with combination antibiotics
 # By rakesh4osdd@gmail.com, 06-Jun-2021
 import pandas as pd
 import re
 import sys
-# In[116]:
+# In[8]:
 #print(pd.__version__, re.__version__)
-# In[117]:
+# In[9]:
 # compare two MIC value strings
 def check_mic(mic1,mic2,mic_type):
 #print(mic1,mic2,mic_type)
 return(m_type)
 #check_mic('65','32-64','i')
-# In[118]:
+# In[10]:
 # compare MIC value in pandas list
 def sus_res_int(mic):
 #print(mic)
 #mic=['128','16/4','128/4','32/4-64/4']
 #sus_res_int(mic)
-# In[119]:
+# In[11]:
 # for input argument
 input_user = sys.argv[1]
 input_clsi = sys.argv[2]
 output_table = sys.argv[3]
-# In[3]:
+# In[49]:
-"""#input_user='~/Jupyterlab_notebook/ASIST_module/strain_profiles_16k.csv.csv'
+"""input_user='~/Jupyterlab_notebook/ASIST_module/strain_profiles_16k.csv.csv'
-input_user='test-data/input2.csv'
+#input_user='test-data/input2.csv'
 input_clsi='test-data/clsi.csv'
 output_profile='test-data/input2_profile.csv'
-output_table='test-data/input2_table.csv'
+#output_table='test-data/input2_table.csv'
-#output_table='/home/rakesh/Jupyterlab_notebook/ASIST_module/strain_profiles_16k_table.csv'"""
+output_table='/home/rakesh/Jupyterlab_notebook/ASIST_module/strain_profiles_16k_table.csv'"""
-# In[146]:
+# In[60]:
 # read user AST data with selected 3 columns
 strain_mic=pd.read_csv(input_user, sep=',', usecols =['Strain name', 'Antibiotics', 'MIC'],na_filter=False)
 #strain_mic
-# In[147]:
+# In[61]:
 clsi_bp=pd.read_csv(input_clsi,sep=',')
 #clsi_bp[clsi_bp[['Antibiotics', 'Susceptible']].duplicated()].shape
-# In[148]:
+# In[62]:
 #clsi_bp
 #strain_mic
-# In[149]:
+# In[64]:
+# warn user about duplicate 'Strain name'/'Antibiotics' rows in the input file
 input_dups=strain_mic[strain_mic[['Strain name','Antibiotics']].duplicated()]
 if (input_dups.shape[0] == 0):
 #print( "No duplicates")
 pass
 else:
-input_dups.to_csv(output_table,na_rep='NA')
+with open(output_table, "w") as file_object:
-with open(output_table, "a") as file_object:
 # Write the duplicate-input error message to the output file
-file_object.write('Input File Error: Please remove duplicate/mutiple MIC values for same combination of Strain name and Antibiotics from input file')
+file_object.write('S.No.,Strain name,Antibiotics,MIC\nInput File Error: Please remove duplicate/mutiple MIC values for same combination of Strain name and Antibiotics from input file\n')
+input_dups.to_csv(output_table,na_rep='NA', mode='a')
 exit()
-#input_dups.head()
+# In[17]:
-# In[125]:
 # convert MIC to numbers sMIC, rMIC
 clsi_bp['s_mic'] =clsi_bp[['Susceptible']].applymap(lambda x: (re.sub(r'[^0-9.\/-]', '', x)))
 clsi_bp['r_mic'] =clsi_bp[['Resistant']].applymap(lambda x: (re.sub(r'[^0-9.\/-]', '', x)))
 clsi_bp['i_mic'] = clsi_bp[['Intermediate']].applymap(lambda x: (re.sub(r'[^0-9.\/-]', '', x)))
-# In[126]:
+# In[18]:
 #clsi_bp['i_mic'] = clsi_bp[['Intermediate']].applymap(lambda x: (re.sub(r'[^0-9.\/-]', '', x)))
-# In[127]:
+# In[19]:
 # Read only numbers in MIC values
 #try:
 strain_mic['o_mic']=strain_mic[['MIC']].applymap(lambda x: (re.sub(r'[^0-9.\/]','', x)))
 #except TypeError:
 #    print('Waring: Error in MIC value')
-# In[128]:
+# In[20]:
 #strain_mic
-# In[129]:
+# In[21]:
 # capitalize each strain name and antibiotic name and remove spaces, for comparison
 strain_mic['Strain name']=strain_mic['Strain name'].str.capitalize().str.replace(" ","")
 strain_mic['Antibiotics']=strain_mic['Antibiotics'].str.capitalize().str.replace(" ","")
 clsi_bp['Antibiotics']=clsi_bp['Antibiotics'].str.capitalize().str.replace(" ","")
-# In[130]:
+# In[22]:
 #find duplicate values in input files
 dups=strain_mic[strain_mic[['Strain name', 'Antibiotics']].duplicated(keep=False)]
 if dups.shape[0] != 0:
 result=pd.merge(strain_mic, clsi_bp, on='Antibiotics',how='inner')[['Strain name','Antibiotics', 'MIC', 'o_mic', 's_mic', 'r_mic','i_mic']]
 except KeyError:
 print('Waring: Error in input Values')
-# In[131]:
+# In[23]:
-#result
+dups.head()
 # In[132]:

Mercurial > repos > rakesh4osdd > clsi_profile

comparison clsi_profile.py @ 5:3c27e5c2a8e9 draft