Mercurial > repos > jay > padaug_peptide_sequence_analysis
annotate PDAUG_AddClassLabel/PDAUG_AddClassLabel.py @ 1:aa0416e63597 draft default tip
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit 60abdf7f6fdc87e5be4ffb7fa5c9c8a458383047"
| author | jay | 
|---|---|
| date | Tue, 17 Nov 2020 23:11:37 +0000 | 
| parents | 5d01ab729b2b | 
| children | 
| rev | line source | 
|---|---|
# Append a constant class-label column to a tab-separated table.
#
# Command-line usage:
#   PDAUG_AddClassLabel.py -I in.tsv [-C LABEL] [-t TITLE] [-O out.tsv]

import argparse

import pandas as pd


def add_class_label(frame, label, title):
    """Return a copy of *frame* with one extra column filled with *label*.

    Args:
        frame: Input ``pandas.DataFrame``; it is not modified.
        label: Value written to every row of the new column.
        title: Header of the new column.

    Returns:
        A new ``pandas.DataFrame`` holding the columns of *frame* followed by
        the label column, with the same rows and the same index as *frame*.
    """
    # Build the label column on the frame's own index: concat(axis=1) aligns
    # on index labels, so a column carrying a fresh 0..n-1 index would be
    # misaligned (NaN-padded extra rows) whenever the input index differs.
    label_column = pd.Series(label, index=frame.index, name=title)
    return pd.concat([frame, label_column], axis=1)


def main(argv=None):
    """Parse the command line, label the input table and write the result.

    Args:
        argv: Argument list to parse; ``None`` makes argparse read
            ``sys.argv[1:]``.
    """
    parser = argparse.ArgumentParser()

    parser.add_argument("-I", "--InFile", required=True, default=None, help="Input data file")
    parser.add_argument("-C", "--ClassLabel", required=False, default=0, help="Class Label 0 or 1")
    parser.add_argument("-t", "--ClassLabelTitle", required=False, default='Class_label', help="Title to use for class label column (Class_label)")
    parser.add_argument("-O", "--OutFile", required=False, default='OutFile.tsv', help="Output file name")

    args = parser.parse_args(argv)

    table = pd.read_csv(args.InFile, sep="\t")
    labelled = add_class_label(table, args.ClassLabel, args.ClassLabelTitle)
    labelled.to_csv(args.OutFile, sep="\t", index=False)


if __name__ == "__main__":
    main()
