# HG changeset patch # User chrisb # Date 1462536348 14400 # Node ID 0a5e0df170546447aa4845a476d1ce5ee66df1cd # Parent 89592faa287574c7608d1636b91c39592f73c6db Uploaded diff -r 89592faa2875 -r 0a5e0df17054 get_data/cfg_array/.README_CFG_array.md.swp Binary file get_data/cfg_array/.README_CFG_array.md.swp has changed diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/.idea/kegg_glycan.iml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/.idea/kegg_glycan.iml Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,12 @@ + + + + + + + + + + \ No newline at end of file diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/.idea/misc.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/.idea/misc.xml Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,14 @@ + + + + + + + + + + + + + + \ No newline at end of file diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/.idea/modules.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/.idea/modules.xml Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,8 @@ + + + + + + + + \ No newline at end of file diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/.idea/workspace.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/.idea/workspace.xml Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,477 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + true + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 1462439789911 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/2 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/2 Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,54 @@ + +from KEGG searches as follows should work + + +/find/genes/shiga+toxin for keywords "shiga" and "toxin" +/find/genes/"shiga toxin" for keywords "shiga toxin" + +these do not function on all databases esp. enzyme + +http://rest.kegg.jp/find/enzyme/deoxy+1.1.1 AND works +http://rest.kegg.jp/find/enzyme/"deoxy%201.1.1" OR does not work +http://rest.kegg.jp/find/enzyme/"deoxy 1.1.1" OR does not work + +0 +http://rest.kegg.jp/find/enzyme/ec:2.4.99.1+ec:2.4.99.6 AND works but return nothing as no overlap +http://rest.kegg.jp/find/enzyme/"ec:2.4.99.1 ec:2.4.99.6" OR doesn't work +http://rest.kegg.jp/find/enzyme/ec:2.4.99. works + + ../../../virtualpy/bin/python findKEGG.py -d enzyme -q 2.4.99.1+2.4.99.6 . works but return None in python. which breaks file writing. rather fix this. + + + + + +# updated notes on KEGG behaviour + +True for release Release 78.0+/05-05, May 16 (see http://rest.kegg.jp/info/genes) + +multiple complex queries are not recommended. + +Using the shiga toxin example from http://www.genome.jp/kegg/rest/keggapi.html +/find/genes/shiga+toxin for keywords "shiga" and "toxin" +/find/genes/"shiga toxin" for keywords "shiga toxin" + +## AND example +/find/genes/shiga+toxin for keywords "shiga" and "toxin" +http://rest.kegg.jp/find/genes/shiga+toxin + +## OR example +/find/genes/"shiga toxin" for keywords "shiga toxin" +http://rest.kegg.jp/find/genes/"shiga%20toxin" + +## BROKEN AND +http://rest.kegg.jp/find/genes/"shiga+toxin" +If query is in put in quotes. + this result is the same as OR. + +## BROKEN OR +http://rest.kegg.jp/find/genes/shiga%20toxin +If query is not placed in quotations. + this result is the same as AND. + +# Recommendation +Do not combine AND with OR queries diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/KEGGnotes.md --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/KEGGnotes.md Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,51 @@ + +# notes on KEGG behaviour + +Tested with Release 78.0+/05-05, May 16 (see http://rest.kegg.jp/info/genes) + +*Recommendation 1 - Do not combine AND with OR queries* +multiple complex queries are not recommended. + +*OR's on certain db's e.g. glycan, enzyme do not always return correctly* + +## Shiga toxin behaviour test +Using the shiga toxin example from http://www.genome.jp/kegg/rest/keggapi.html +/find/genes/shiga+toxin for keywords "shiga" and "toxin" +/find/genes/"shiga toxin" for keywords "shiga toxin" + +results in test-data + - test-data/shiga-toxin-example-AND + - test-data/shiga-toxin-example-AND-broken + - test-data/shiga-toxin-example-OR + - test-data/shiga-toxin-example-OR-broken + + +### AND example +/find/genes/shiga+toxin for keywords "shiga" and "toxin" +http://rest.kegg.jp/find/genes/shiga+toxin + +### OR example +/find/genes/"shiga toxin" for keywords "shiga toxin" +http://rest.kegg.jp/find/genes/"shiga%20toxin" + +### BROKEN AND +http://rest.kegg.jp/find/genes/"shiga+toxin" +If query is in put in quotes. + this result is the same as OR. + +### BROKEN OR +http://rest.kegg.jp/find/genes/shiga%20toxin +If query is not placed in quotations. + this result is the same as AND. + +## Enzyme tests + +http://rest.kegg.jp/find/enzyme/deoxy+1.1.1 AND works +http://rest.kegg.jp/find/enzyme/"deoxy%201.1.1" OR does not work +http://rest.kegg.jp/find/enzyme/"deoxy 1.1.1" OR does not work + +0 +http://rest.kegg.jp/find/enzyme/ec:2.4.99.1+ec:2.4.99.6 AND works but return nothing as no overlap +http://rest.kegg.jp/find/enzyme/"ec:2.4.99.1 ec:2.4.99.6" OR doesn't work +http://rest.kegg.jp/find/enzyme/ec:2.4.99. works + diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/README_KEGG.md --- a/get_data/kegg_glycan/README_KEGG.md Wed Mar 23 14:35:56 2016 -0400 +++ b/get_data/kegg_glycan/README_KEGG.md Fri May 06 08:05:48 2016 -0400 @@ -20,6 +20,9 @@ findKEGG.py -d $dbname -q $searchpattern -o $output ``` +## Known Issues +Yes, the and/or functionality of the KEGG rest API (Release 78.0+/05-05, May 16 ) does not always function as expected. This has been resolved in the code. More details, [KEGGnotes.md ](KEGGnotes.md) + ## Help ``` ../../virtualpy/bin/activate @@ -31,7 +34,7 @@ ``` ../../virtualpy/bin/activate -python test_findKEGG.py +nosetests test_findKEGG.py ``` # 2. getkcfKEGG,py @@ -67,7 +70,7 @@ ``` ../../virtualpy/bin/activate -python test_getkcfKEGG.py +nosetests test_getkcfKEGG.py ``` # 3. linkKEGG.py @@ -101,6 +104,6 @@ ``` ../../virtualpy/bin/activate -python test_linkKEGG.py +nosetests test_linkKEGG.py ``` diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/db.output --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/db.output Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,83 @@ +ENTRY G10495 Glycan +NAME 1,4-alpha-D-Glucan; + 1,4-alpha-Glucan; + Amylose; + Maltodextrin +COMPOSITION (Glc)1 (*)2 +CLASS Polysaccharide +REMARK Same as: C00718 C01935 D02329 +REACTION R06049 R06050 R06051 R06052 R06069 R06158 R06159 R06160 + R06184 R06185 R06186 R06243 +ENZYME 2.4.1.1 2.4.1.2 2.4.1.4 2.4.1.11 + 2.4.1.18 2.4.1.21 2.4.1.25 3.2.1.2 + 3.2.1.33 3.2.1.54 5.4.99.15 +DBLINKS GlycomeDB: 12100 +NODE 3 + 1 * 8 0 + 2 Glc 0 0 + 3 * -8 0 +EDGE 2 + 1 2:a1 1 + 2 3 2:4 +BRACKET 1 -4.0 2.0 -4.0 -2.0 + 1 5.0 -2.0 5.0 2.0 + 1 n +/// +ENTRY G10608 Glycan +NAME UDP-D-glucose; + UDP-glucose; + Uridine diphosphate glucose +COMPOSITION (UDP-Glc)1 +REMARK Same as: C00029 +REACTION R06020 R06023 R06036 R06043 R06045 R06051 R06062 R06073 + R06181 R06226 R06275 R09315 R09316 +ENZYME 2.4.1.11 2.4.1.12 2.4.1.13 2.4.1.14 + 2.4.1.15 2.4.1.34 2.4.1.53 2.4.1.80 + 2.4.1.183 2.4.1.188 2.4.1.- +NODE 1 + 1 UDP-Glc -0.3 0 +EDGE 0 +/// +ENTRY G10619 Glycan +NAME UDP; + Uridine 5'-diphosphate +COMPOSITION (UDP)1 +REMARK Same as: C00015 +REACTION R05901 R05902 R05903 R05907 R05908 R05909 R05910 R05912 + R05915 R05916 R05925 R05926 R05927 R05928 R05929 R05930 + R05931 R05932 R05933 R05934 R05935 R05936 R05938 R05939 + R05941 R05946 R05948 R05952 R05953 R05956 R05960 R05962 + R05964 R05965 R05970 R05971 R05974 R05975 R05977 R05978 + R05983 R05985 R05986 R05987 R05989 R05991 R05992 R06006 + R06011 R06013 R06014 R06016 R06020 R06021 R06023 R06028 + R06029 R06033 R06036 R06043 R06045 R06051 R06055 R06062 + R06067 R06068 R06072 R06073 R06083 R06097 R06129 R06130 + R06145 R06167 R06168 R06169 R06172 R06173 R06174 R06181 + R06182 R06187 R06189 R06190 R06191 R06192 R06193 R06197 + R06198 R06210 R06214 R06226 R06234 R06275 R06276 R06277 + R06278 R07131 R07609 R07610 R07611 R07614 R07615 R07616 + R07617 R07619 R07621 R07622 R07623 R07624 R07625 R07628 + R09290 R09296 R09299 R09304 R09315 R09316 R09320 R10138 + R10139 +ENZYME 2.4.1.11 2.4.1.12 2.4.1.13 2.4.1.14 + 2.4.1.15 2.4.1.16 2.4.1.22 2.4.1.34 + 2.4.1.37 2.4.1.38 2.4.1.40 2.4.1.41 + 2.4.1.43 2.4.1.45 2.4.1.47 2.4.1.53 + 2.4.1.62 2.4.1.70 2.4.1.79 2.4.1.80 + 2.4.1.86 2.4.1.87 2.4.1.88 2.4.1.90 + 2.4.1.92 2.4.1.101 2.4.1.102 2.4.1.122 + 2.4.1.123 2.4.1.133 2.4.1.134 2.4.1.135 + 2.4.1.138 2.4.1.141 2.4.1.143 2.4.1.144 + 2.4.1.145 2.4.1.146 2.4.1.147 2.4.1.148 + 2.4.1.149 2.4.1.150 2.4.1.155 2.4.1.163 + 2.4.1.164 2.4.1.165 2.4.1.167 2.4.1.174 + 2.4.1.175 2.4.1.183 2.4.1.187 2.4.1.188 + 2.4.1.198 2.4.1.201 2.4.1.206 2.4.1.212 + 2.4.1.222 2.4.1.223 2.4.1.224 2.4.1.225 + 2.4.1.226 2.4.1.227 2.4.1.228 2.4.1.244 + 2.4.1.255 2.4.1.274 2.4.1.275 2.4.1.- + 2.4.2.24 2.4.2.26 2.4.2.38 2.4.2.- +NODE 1 + 1 UDP -0.4 0.3 +EDGE 0 +/// diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/findKEGG.py --- a/get_data/kegg_glycan/findKEGG.py Wed Mar 23 14:35:56 2016 -0400 +++ b/get_data/kegg_glycan/findKEGG.py Fri May 06 08:05:48 2016 -0400 @@ -1,6 +1,6 @@ __author__ = 'cbarnett' __license__ = "MIT" -__version__ = "0.3" +__version__ = "0.4" # http://www.kegg.jp/kegg/rest/keggapi.html @@ -16,8 +16,18 @@ raise IOError("no db given") if query == [] or query == "" or query is None: raise IOError("no query given") - query = query.replace('\n', ' ') # in case of new lines - query = query.replace('\r', ' ') # in case of new lines + query = query.replace('\n', '+') # in case of new lines, assume this means the user want to "AND" + query = query.replace('\r', '+') # in case of new lines, assume this means the user want to "AND" + query = query.replace('ec: ', 'ec:') # in case of ec: spaces - e.g. issue "ec: 2.4.99.1" spaces are ok usually as allows for combination searching "2.4.99.1 2.4.99.6" + + import re + p = re.compile(' *\+ *') # ensure no unneccesary space in an AND query, otherwise incorrect behaviour from KEGG + queryfix = p.subn('+', query) + query=queryfix[0] + + if ' ' in query: + query='"'+query+'"' # if spaces, query must be placed in quotes, otherwise incorrect behaviour from KEGG + query = query.replace(' ', '%20') # previous behaviour was ignoring text after a space, rather convert to '%20' and pass on to KEGG REST service uri = 'http://rest.kegg.jp/find/' fulluri = uri + db + "/" + query try: @@ -25,7 +35,7 @@ except Exception as e: raise urllib2.HTTPError(e.url, e.code, e.msg, e.hdrs, e.fp) if str(response.strip()) == "": - return None + return "" # change return from None to "" for easily writing to file return response diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/findKEGG.pyc Binary file get_data/kegg_glycan/findKEGG.pyc has changed diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/findKEGG.xml --- a/get_data/kegg_glycan/findKEGG.xml Wed Mar 23 14:35:56 2016 -0400 +++ b/get_data/kegg_glycan/findKEGG.xml Fri May 06 08:05:48 2016 -0400 @@ -1,4 +1,4 @@ - + using the KEGG database python_for_glycan_tools diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/found_entries.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/found_entries.txt Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,19 @@ +ec:1.1.1.133 dTDP-4-dehydrorhamnose reductase; dTDP-4-keto-L-rhamnose reductase; dTDP-4-ketorhamnose reductase; TDP-4-keto-rhamnose reductase; thymidine diphospho-4-ketorhamnose reductase; dTDP-6-deoxy-L-mannose:NADP+ 4-oxidoreductase; dTDP-6-deoxy-beta-L-mannose:NADP+ 4-oxidoreductase +ec:1.1.1.340 1-deoxy-11beta-hydroxypentalenate dehydrogenase; 1-deoxy-11beta-hydroxypentalenic acid dehydrogenase; ptlF (gene name); penF (gene name) +ec:1.14.11.35 1-deoxypentalenic acid 11beta-hydroxylase; ptlH (gene name); sav2991 (gene name); pntH (gene name) +ec:2.3.1.202 UDP-4-amino-4,6-dideoxy-N-acetyl-beta-L-altrosamine N-acetyltransferase; PseH +ec:2.4.1.27 DNA beta-glucosyltransferase; T4-HMC-beta-glucosyl transferase; T4-beta-glucosyl transferase; T4 phage beta-glucosyltransferase; UDP glucose-DNA beta-glucosyltransferase; uridine diphosphoglucose-deoxyribonucleate beta-glucosyltransferase +ec:2.4.1.28 glucosyl-DNA beta-glucosyltransferase; T6-glucosyl-HMC-beta-glucosyl transferase; T6-beta-glucosyl transferase; uridine diphosphoglucose-glucosyldeoxyribonucleate beta-glucosyltransferase +ec:2.4.1.335 dolichyl N-acetyl-alpha-D-glucosaminyl phosphate 3-beta-D-2,3-diacetamido-2,3-dideoxy-beta-D-glucuronosyltransferase; AglC; UDP-Glc-2,3-diNAcA glycosyltransferase +ec:2.6.1.87 UDP-4-amino-4-deoxy-L-arabinose aminotransferase; UDP-(beta-L-threo-pentapyranosyl-4''-ulose diphosphate) aminotransferase; UDP-4-amino-4-deoxy-L-arabinose---oxoglutarate aminotransferase; UDP-Ara4O aminotransferase; UDP-L-Ara4N transaminase +ec:2.6.1.92 UDP-4-amino-4,6-dideoxy-N-acetyl-beta-L-altrosamine transaminase; PseC +ec:2.7.7.7 DNA-directed DNA polymerase; DNA polymerase I; DNA polymerase II; DNA polymerase III; DNA polymerase alpha; DNA polymerase beta; DNA polymerase gamma; DNA nucleotidyltransferase (DNA-directed); DNA nucleotidyltransferase (DNA-directed); deoxyribonucleate nucleotidyltransferase; deoxynucleate polymerase; deoxyribonucleic acid duplicase; deoxyribonucleic acid polymerase; deoxyribonucleic duplicase; deoxyribonucleic polymerase; deoxyribonucleic polymerase I; DNA duplicase; DNA nucleotidyltransferase; DNA polymerase; DNA replicase; DNA-dependent DNA polymerase; duplicase; Klenow fragment; sequenase; Taq DNA polymerase; Taq Pol I; Tca DNA polymerase +ec:3.1.6.9 chondro-4-sulfatase; chondroitin-4-sulfatase; 4-deoxy-beta-D-gluc-4-enuronosyl-(1,3)-N-acetyl-D-galactosamine-4-sulfate 4-sulfohydrolase +ec:3.1.6.10 chondro-6-sulfatase; 4-deoxy-beta-D-gluc-4-enuronosyl-(1,3)-N-acetyl-D-galactosamine-6-sulfate 6-sulfohydrolase +ec:3.2.1.52 beta-N-acetylhexosaminidase; hexosaminidase; beta-acetylaminodeoxyhexosidase; N-acetyl-beta-D-hexosaminidase; N-acetyl-beta-hexosaminidase; beta-hexosaminidase; beta-acetylhexosaminidinase; beta-D-N-acetylhexosaminidase; beta-N-acetyl-D-hexosaminidase; beta-N-acetylglucosaminidase; hexosaminidase A; N-acetylhexosaminidase; beta-D-hexosaminidase +ec:3.2.1.92 peptidoglycan beta-N-acetylmuramidase; exo-beta-N-acetylmuramidase; exo-beta-acetylmuramidase; beta-2-acetamido-3-O-(D-1-carboxyethyl)-2-deoxy-D-glucoside acetamidodeoxyglucohydrolase +ec:3.2.1.96 mannosyl-glycoprotein endo-beta-N-acetylglucosaminidase; N,N'-diacetylchitobiosyl beta-N-acetylglucosaminidase; endo-beta-N-acetylglucosaminidase; mannosyl-glycoprotein endo-beta-N-acetylglucosamidase; di-N-acetylchitobiosyl beta-N-acetylglucosaminidase; endo-beta-acetylglucosaminidase; endo-beta-(1->4)-N-acetylglucosaminidase; mannosyl-glycoprotein 1,4-N-acetamidodeoxy-beta-D-glycohydrolase; endoglycosidase S; endo-N-acetyl-beta-D-glucosaminidase; endo-N-acetyl-beta-glucosaminidase; endo-beta-N-acetylglucosaminidase D; endo-beta-N-acetylglucosaminidase F; endo-beta-N-acetylglucosaminidase H; endo-beta-N-acetylglucosaminidase L; glycopeptide-D-mannosyl-4-N-(N-acetyl-D-glucosaminyl)2-asparagine 1,4-N-acetyl-beta-glucosaminohydrolase; endoglycosidase H +ec:3.5.1.105 chitin disaccharide deacetylase; chitobiose amidohydolase; COD; chitin oligosaccharide deacetylase; chitin oligosaccharide amidohydolase; 2-(acetylamino)-4-O-[2-(acetylamino)-2-deoxy-beta-D-glucopyranosyl]-2-deoxy-D-glucopyranose acetylhydrolase +ec:3.6.1.57 UDP-2,4-diacetamido-2,4,6-trideoxy-beta-L-altropyranose hydrolase; PseG; UDP-6-deoxy-AltdiNAc hydrolase; Cj1312; UDP-2,4-bis(acetamido)-2,4,6-trideoxy-beta-L-altropyranose hydrolase +ec:4.1.2.20 2-dehydro-3-deoxyglucarate aldolase; 2-keto-3-deoxyglucarate aldolase; alpha-keto-beta-deoxy-D-glucarate aldolase; 2-dehydro-3-deoxy-D-glucarate tartronate-semialdehyde-lyase; 2-dehydro-3-deoxy-D-glucarate tartronate-semialdehyde-lyase (pyruvate-forming) +ec:4.2.1.115 UDP-N-acetylglucosamine 4,6-dehydratase (configuration-inverting); FlaA1; UDP-N-acetylglucosamine 5-inverting 4,6-dehydratase; PseB; UDP-N-acetylglucosamine hydro-lyase (inverting; UDP-2-acetamido-2,6-dideoxy-beta-L-arabino-hex-4-ulose-forming) diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/getkcfKEGG.pyc Binary file get_data/kegg_glycan/getkcfKEGG.pyc has changed diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/kcf.output --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/kcf.output Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,22 @@ +ENTRY G10495 Glycan +NODE 3 + 1 * 8 0 + 2 Glc 0 0 + 3 * -8 0 +EDGE 2 + 1 2:a1 1 + 2 3 2:4 +BRACKET 1 -4.0 2.0 -4.0 -2.0 + 1 5.0 -2.0 5.0 2.0 + 1 n +/// +ENTRY G10608 Glycan +NODE 1 + 1 UDP-Glc -0.3 0 +EDGE 0 +/// +ENTRY G10619 Glycan +NODE 1 + 1 UDP -0.4 0.3 +EDGE 0 +/// diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/linkKEGG.py --- a/get_data/kegg_glycan/linkKEGG.py Wed Mar 23 14:35:56 2016 -0400 +++ b/get_data/kegg_glycan/linkKEGG.py Fri May 06 08:05:48 2016 -0400 @@ -1,6 +1,6 @@ __author__ = 'cbarnett' __license__ = "MIT" -__version = "0.3" +__version = "0.3.1" # http://www.kegg.jp/kegg/rest/keggapi.html @@ -13,6 +13,15 @@ import urllib2 uri = 'http://rest.kegg.jp/link/' + + import re + p = re.compile(' *\+ *') # ensure no unneccessary space in an AND query + sdbfix = p.subn('+', sourcedb) + sourcedb=sdbfix[0] + + if ' ' in sourcedb: + sourcedb = sourcedb.replace(' ', '%20') # previous behaviour was ignoring text after a space, rather convert to '%20' and pass on to KEGG REST service + fulluri = uri + targetdb + "/" + sourcedb try: response = urllib2.urlopen(fulluri).read() diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/linkKEGG.pyc Binary file get_data/kegg_glycan/linkKEGG.pyc has changed diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/linkKEGG.xml --- a/get_data/kegg_glycan/linkKEGG.xml Wed Mar 23 14:35:56 2016 -0400 +++ b/get_data/kegg_glycan/linkKEGG.xml Fri May 06 08:05:48 2016 -0400 @@ -1,4 +1,4 @@ - + searches KEGG for related database entries python_for_glycan_tools @@ -34,7 +34,7 @@ - + diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/linked_entries.txt diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/plus --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/plus Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,21 @@ +ec:1.1.1.125 2-deoxy-D-gluconate 3-dehydrogenase; 2-deoxygluconate dehydrogenase +ec:1.1.1.126 2-dehydro-3-deoxy-D-gluconate 6-dehydrogenase; 2-keto-3-deoxy-D-gluconate dehydrogenase; 2-keto-3-deoxygluconate dehydrogenase +ec:1.1.1.127 2-dehydro-3-deoxy-D-gluconate 5-dehydrogenase; 2-keto-3-deoxygluconate 5-dehydrogenase; 2-keto-3-deoxy-D-gluconate dehydrogenase; 2-keto-3-deoxygluconate (nicotinamide adenine dinucleotide (phosphate)) dehydrogenase; 2-keto-3-deoxy-D-gluconate (3-deoxy-D-glycero-2,5-hexodiulosonic acid) dehydrogenase +ec:1.1.1.133 dTDP-4-dehydrorhamnose reductase; dTDP-4-keto-L-rhamnose reductase; dTDP-4-ketorhamnose reductase; TDP-4-keto-rhamnose reductase; thymidine diphospho-4-ketorhamnose reductase; dTDP-6-deoxy-L-mannose:NADP+ 4-oxidoreductase; dTDP-6-deoxy-beta-L-mannose:NADP+ 4-oxidoreductase +ec:1.1.1.134 dTDP-6-deoxy-L-talose 4-dehydrogenase (NADP+); thymidine diphospho-6-deoxy-L-talose dehydrogenase; TDP-6-deoxy-L-talose dehydrogenase; dTDP-6-deoxy-L-talose dehydrogenase (4-reductase); dTDP-6-deoxy-L-talose:NADP+ 4-oxidoreductase +ec:1.1.1.135 GDP-6-deoxy-D-talose 4-dehydrogenase; guanosine diphospho-6-deoxy-D-talose dehydrogenase; GDP-6-deoxy-D-talose:NAD(P)+ 4-oxidoreductase +ec:1.1.1.136 UDP-N-acetylglucosamine 6-dehydrogenase; uridine diphosphoacetylglucosamine dehydrogenase; UDP-acetylglucosamine dehydrogenase; UDP-2-acetamido-2-deoxy-D-glucose:NAD oxidoreductase; UDP-GlcNAc dehydrogenase; WbpA; WbpO +ec:1.1.1.187 GDP-4-dehydro-D-rhamnose reductase; GDP-4-keto-6-deoxy-D-mannose reductase; GDP-4-keto-D-rhamnose reductase; guanosine diphosphate-4-keto-D-rhamnose reductase; GDP-6-deoxy-D-mannose:NAD(P)+ 4-oxidoreductase; GDP-6-deoxy-alpha-D-mannose:NAD(P)+ 4-oxidoreductase +ec:1.1.1.235 8-oxocoformycin reductase; 8-ketodeoxycoformycin reductase +ec:1.1.1.266 dTDP-4-dehydro-6-deoxyglucose reductase; dTDP-4-keto-6-deoxyglucose reductase; dTDP-D-fucose:NADP+ oxidoreductase; Fcf1; dTDP-6-deoxy-D-xylo-hex-4-ulopyranose reductase +ec:1.1.1.267 1-deoxy-D-xylulose-5-phosphate reductoisomerase; DXP-reductoisomerase; 1-deoxy-D-xylulose-5-phosphate isomeroreductase; 2-C-methyl-D-erythritol 4-phosphate (MEP) synthase +ec:1.1.1.271 GDP-L-fucose synthase; GDP-4-keto-6-deoxy-D-mannose-3,5-epimerase-4-reductase; GDP-L-fucose:NADP+ 4-oxidoreductase (3,5-epimerizing) +ec:1.1.1.281 GDP-4-dehydro-6-deoxy-D-mannose reductase; GDP-4-keto-6-deoxy-D-mannose reductase [ambiguous]; GDP-6-deoxy-D-lyxo-4-hexulose reductase; Rmd; GDP-6-deoxy-D-mannose:NAD(P)+ 4-oxidoreductase (D-rhamnose-forming); GDP-6-deoxy-alpha-D-mannose:NAD(P)+ 4-oxidoreductase (D-rhamnose-forming) +ec:1.1.1.329 2-deoxy-scyllo-inosamine dehydrogenase; neoA (gene name); kanK (gene name, ambiguous); kanE (gene name, ambiguous) +ec:1.1.1.335 UDP-N-acetyl-2-amino-2-deoxyglucuronate dehydrogenase; WlbA; WbpB +ec:1.1.1.339 dTDP-6-deoxy-L-talose 4-dehydrogenase (NAD+); tll (gene name) +ec:1.1.1.340 1-deoxy-11beta-hydroxypentalenate dehydrogenase; 1-deoxy-11beta-hydroxypentalenic acid dehydrogenase; ptlF (gene name); penF (gene name) +ec:1.1.1.344 dTDP-6-deoxy-L-talose 4-dehydrogenase [NAD(P)+]; tal (gene name) +ec:1.1.1.364 dTDP-4-dehydro-6-deoxy-alpha-D-gulose 4-ketoreductase; dTDP-4-dehydro-6-deoxygulose reductase; tylD (gene name); gerKI (gene name); chmD (gene name); mydI (gene name) +ec:1.1.1.384 dTDP-3,4-didehydro-2,6-dideoxy-alpha-D-glucose 3-reductase; KijD10; dTDP-4-keto-2,6-dideoxy-D-glucose 3-oxidoreductase; dTDP-4-dehydro-2,6-dideoxy-alpha-D-glucose 3-oxidoreductase +ec:1.1.1.389 2-dehydro-3-deoxy-L-galactonate 5-dehydrogenase diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/test-data/shiga-toxin-example-AND --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/test-data/shiga-toxin-example-AND Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,103 @@ +ece:Z1464 stx2A; shiga-like toxin II A subunit encoded by bacteriophage BP-933W; K11006 shiga toxin subunit A +ece:Z1465 stx2B; shiga-like toxin II B subunit encoded by bacteriophage BP-933W; K11007 shiga toxin subunit B +ece:Z3343 stx1B; shiga-like toxin 1 subunit B encoded within prophage CP-933V; K11007 shiga toxin subunit B +ece:Z3344 stx1A; shiga-like toxin 1 subunit A encoded within prophage CP-933V; K11006 shiga toxin subunit A +ecs:ECs1205 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +ecs:ECs1206 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +ecs:ECs2973 Shiga toxin I subunit B; K11007 shiga toxin subunit B +ecs:ECs2974 Shiga toxin I subunit A; K11006 shiga toxin subunit A +ecf:ECH74115_2905 shigatoxin 2, subunit B; K11007 shiga toxin subunit B +ecf:ECH74115_2906 shiga toxin subunit A; K11006 shiga toxin subunit A +ecf:ECH74115_3532 shiga toxin 2 B subunit; K11007 shiga toxin subunit B +ecf:ECH74115_3533 shiga toxin subunit A; K11006 shiga toxin subunit A +etw:ECSP_2722 stx2cB; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +etw:ECSP_2723 stx2A1; Shiga-like toxin II subunit A precursor; K11006 shiga toxin subunit A +etw:ECSP_3252 stx2B; shiga toxin II subunit B; K11007 shiga toxin subunit B +etw:ECSP_3253 stx2A2; shiga toxin II subunit A; K11006 shiga toxin subunit A +elx:CDCO157_1154 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +elx:CDCO157_1155 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +elx:CDCO157_2738 Shiga toxin I subunit B precursor; K11007 shiga toxin subunit B +elx:CDCO157_2739 Shiga toxin I subunit A precursor; K11006 shiga toxin subunit A +eoj:ECO26_1599 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoj:ECO26_1600 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eoi:ECO111_2429 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eoi:ECO111_2430 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +eoi:ECO111_3361 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoi:ECO111_3362 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eoh:ECO103_2844 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eoh:ECO103_2845 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +eoh:ECO103_5197 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoh:ECO103_5198 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eso:O3O_09170 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eso:O3O_09165 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +esm:O3M_16105 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +esm:O3M_16110 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +esl:O3K_16130 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +esl:O3K_16135 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +ecoo:ECRM13514_3144 stx2B; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +ecoo:ECRM13514_3145 stx2A; Shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +ecoh:ECRM13516_2315 stx2B; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +ecoh:ECRM13516_2316 stx2A; Shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +stm:STM0284 shiga-like toxin A subunit +seo:STM14_0332 putative Shiga-like toxin A subunit +sev:STMMW_02891 putative shiga-like toxin A subunit +sem:STMDT12_C02790 putative Shiga-like toxin A subunit +sej:STMUK_0287 putative Shiga-like toxin A subunit +setu:STU288_13325 putative shiga-like toxin A subunit +setc:CFSAN001921_15985 Shiga toxin A subunit +send:DT104_02831 sciR; shiga-like toxin a subunit, type VI secretion system SciR protein flags: precursor +seni:CY43_01420 Shiga toxin A subunit +seen:SE451236_07435 Shiga toxin A subunit +spt:SPA2480 putative shiga-like toxin A subunit +sek:SSPA2315 shiga-like toxin A subunit +sei:SPC_0292 putative shiga-like toxin A subunit +sec:SCH_0277 putative shiga-like toxin A subunit +shb:SU5_0926 SciR Shiga-like toxin A subunit +senh:CFSAN002069_07720 Shiga toxin A subunit +seeh:SEEH1578_10515 putative shiga-like toxin A subunit +seec:CFSAN002050_07960 Shiga toxin A subunit +sene:IA1_01505 Shiga toxin A subunit +senc:SEET0819_08350 Shiga toxin A subunit +sdy:SDY_1389 stxA; Shiga toxin subunit A; K11006 shiga toxin subunit A +sdy:SDY_1390 stxB; Shiga toxin subunit B; K11007 shiga toxin subunit B +sdz:Asd1617_01826 Shiga toxin subunit A (EC:3.2.2.22); K11006 shiga toxin subunit A +ebi:EbC_13780 Putative shiga-like toxin A subunit +psos:POS17_2009 P9; putative Shiga-like toxin alpha subunit +ssab:SSABA_v1c03870 hypothetical protein; K11006 shiga toxin subunit A +ssab:SSABA_v1c09020 hypothetical protein; K11006 shiga toxin subunit A +calt:Cal6303_2132 ribosome-inactivating protein; K11006 shiga toxin subunit A +vg:22277199 PI30_gp34; Shigella phage POCJ13; shiga toxin A-chain precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:22277200 PI30_gp35; Shigella phage POCJ13; shiga toxin I subunit B precursor; K11007 shiga toxin subunit B +vg:1262301 APSE-1_07; Endosymbiont phage APSE-1; P7; K11007 shiga toxin subunit B +vg:1481747 stx1A, Stx1_p142; Escherichia Stx1 converting phage; Shiga toxin1 subunit A; K11006 shiga toxin subunit A +vg:1481748 stx1B, Stx1_p143; Escherichia Stx1 converting phage; Shiga toxin1 subunit B; K11007 shiga toxin subunit B +vg:1481767 stx2A, Stx2II_p143; Stx2 converting phage II; Shiga toxin2 subunit A; K11006 shiga toxin subunit A +vg:1481768 stx2B, Stx2II_p144; Stx2 converting phage II; Shiga toxin2 subunit B; K11007 shiga toxin subunit B +vg:26228052 AS349_gp84; Escherichia phage PA2; shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:26228100 AS349_gp83; Escherichia phage PA2; shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +vg:26516496 stx2A, AU085_gp42; Enterobacteria phage VT2phi_272; Shiga toxin 2 A subunit; K11006 shiga toxin subunit A +vg:26516448 stx2B, AU085_gp41; Enterobacteria phage VT2phi_272; Shiga toxin 2 B subunit; K11007 shiga toxin subunit B +vg:26516283 stxB, phi191_00011, AU083_gp11; Escherichia phage phi191; shiga toxin subunit B precursor; K11007 shiga toxin subunit B +vg:26516284 stxA, phi191_00012, AU083_gp12; Escherichia phage phi191; shiga toxin subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:26519429 AU154_gp39; Shigella phage Ss-VASD; Stx1 A subunit; K11006 shiga toxin subunit A +vg:26519430 AU154_gp40; Shigella phage Ss-VASD; Stx1 B subunit; K11007 shiga toxin subunit B +vg:1261950 stxA2, L0103, sltIIA, stx2A, 933Wp40; Enterobacteria phage 933W; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:1262010 stxB2, L0104, sltIIB, stx2B, 933Wp41; Enterobacteria phage 933W; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:2641645 stxA1, phi4795p38, PBV4795_ORF40; Enterobacteria phage BP-4795; Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +vg:2641657 stxB1, phi4795p39, PBV4795_ORF41; Enterobacteria phage BP-4795; Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +vg:929695 stxA2e, P27p25; Enterobacteria phage phiP27; shiga toxin 2e A-subunit; K11006 shiga toxin subunit A +vg:929727 stxB2e, P27p26; Enterobacteria phage phiP27; shiga toxin 2e B-subunit; K11007 shiga toxin subunit B +vg:4397483 stx2A, Stx2-86_gp01; Stx2-converting phage 86; shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:4397484 stx2B, Stx2-86_gp02; Stx2-converting phage 86; shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:6159405 stx2A, pMIN27_41; Enterobacteria phage Min27; ORF44; K11006 shiga toxin subunit A +vg:6159351 stx2B, pMIN27_42; Enterobacteria phage Min27; ORF45; K11007 shiga toxin subunit B +vg:6973138 Stx2-1717_gp41; Stx2-converting phage 1717; verocytotoxin 2 variant 2c subunit A; K11006 shiga toxin subunit A +vg:6972909 stx2cB, Stx2-1717_gp42; Stx2-converting phage 1717; verocytotoxin 2 variant 2c subunit B; K11007 shiga toxin subunit B +vg:6973079 YYZ_gp39; Enterobacteria phage YYZ-2008; Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +vg:6973080 YYZ_gp40; Enterobacteria phage YYZ-2008; Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +vg:13828571 stx2A, D300_gp43; Escherichia phage P13374; shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:13828535 stx2B, D300_gp42; Escherichia phage P13374; shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:14005228 F366_gp36; Escherichia phage TL-2011c; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:14005229 F366_gp37; Escherichia phage TL-2011c; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:1262249 stx2A, VT2-Sap42; Enterobacteria phage VT2-Sakai; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:1262250 stx2B, VT2-Sap43; Enterobacteria phage VT2-Sakai; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/test-data/shiga-toxin-example-AND-broken --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/test-data/shiga-toxin-example-AND-broken Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,88 @@ +ece:Z1464 stx2A; shiga-like toxin II A subunit encoded by bacteriophage BP-933W; K11006 shiga toxin subunit A +ece:Z1465 stx2B; shiga-like toxin II B subunit encoded by bacteriophage BP-933W; K11007 shiga toxin subunit B +ece:Z3343 stx1B; shiga-like toxin 1 subunit B encoded within prophage CP-933V; K11007 shiga toxin subunit B +ece:Z3344 stx1A; shiga-like toxin 1 subunit A encoded within prophage CP-933V; K11006 shiga toxin subunit A +ecs:ECs1205 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +ecs:ECs1206 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +ecs:ECs2973 Shiga toxin I subunit B; K11007 shiga toxin subunit B +ecs:ECs2974 Shiga toxin I subunit A; K11006 shiga toxin subunit A +ecf:ECH74115_2905 shigatoxin 2, subunit B; K11007 shiga toxin subunit B +ecf:ECH74115_2906 shiga toxin subunit A; K11006 shiga toxin subunit A +ecf:ECH74115_3532 shiga toxin 2 B subunit; K11007 shiga toxin subunit B +ecf:ECH74115_3533 shiga toxin subunit A; K11006 shiga toxin subunit A +etw:ECSP_2722 stx2cB; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +etw:ECSP_2723 stx2A1; Shiga-like toxin II subunit A precursor; K11006 shiga toxin subunit A +etw:ECSP_3252 stx2B; shiga toxin II subunit B; K11007 shiga toxin subunit B +etw:ECSP_3253 stx2A2; shiga toxin II subunit A; K11006 shiga toxin subunit A +elx:CDCO157_1154 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +elx:CDCO157_1155 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +elx:CDCO157_2738 Shiga toxin I subunit B precursor; K11007 shiga toxin subunit B +elx:CDCO157_2739 Shiga toxin I subunit A precursor; K11006 shiga toxin subunit A +eoj:ECO26_1599 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoj:ECO26_1600 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eoi:ECO111_2429 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eoi:ECO111_2430 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +eoi:ECO111_3361 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoi:ECO111_3362 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eoh:ECO103_2844 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eoh:ECO103_2845 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +eoh:ECO103_5197 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoh:ECO103_5198 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eso:O3O_09170 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eso:O3O_09165 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +esm:O3M_16105 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +esm:O3M_16110 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +esl:O3K_16130 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +esl:O3K_16135 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +ecoo:ECRM13514_3144 stx2B; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +ecoo:ECRM13514_3145 stx2A; Shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +ecoh:ECRM13516_2315 stx2B; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +ecoh:ECRM13516_2316 stx2A; Shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +setc:CFSAN001921_15985 Shiga toxin A subunit +seni:CY43_01420 Shiga toxin A subunit +seen:SE451236_07435 Shiga toxin A subunit +senh:CFSAN002069_07720 Shiga toxin A subunit +seec:CFSAN002050_07960 Shiga toxin A subunit +sene:IA1_01505 Shiga toxin A subunit +senc:SEET0819_08350 Shiga toxin A subunit +sdy:SDY_1389 stxA; Shiga toxin subunit A; K11006 shiga toxin subunit A +sdy:SDY_1390 stxB; Shiga toxin subunit B; K11007 shiga toxin subunit B +sdz:Asd1617_01826 Shiga toxin subunit A (EC:3.2.2.22); K11006 shiga toxin subunit A +ssab:SSABA_v1c03870 hypothetical protein; K11006 shiga toxin subunit A +ssab:SSABA_v1c09020 hypothetical protein; K11006 shiga toxin subunit A +calt:Cal6303_2132 ribosome-inactivating protein; K11006 shiga toxin subunit A +vg:22277199 PI30_gp34; Shigella phage POCJ13; shiga toxin A-chain precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:22277200 PI30_gp35; Shigella phage POCJ13; shiga toxin I subunit B precursor; K11007 shiga toxin subunit B +vg:1262301 APSE-1_07; Endosymbiont phage APSE-1; P7; K11007 shiga toxin subunit B +vg:1481747 stx1A, Stx1_p142; Escherichia Stx1 converting phage; Shiga toxin1 subunit A; K11006 shiga toxin subunit A +vg:1481748 stx1B, Stx1_p143; Escherichia Stx1 converting phage; Shiga toxin1 subunit B; K11007 shiga toxin subunit B +vg:1481767 stx2A, Stx2II_p143; Stx2 converting phage II; Shiga toxin2 subunit A; K11006 shiga toxin subunit A +vg:1481768 stx2B, Stx2II_p144; Stx2 converting phage II; Shiga toxin2 subunit B; K11007 shiga toxin subunit B +vg:26228052 AS349_gp84; Escherichia phage PA2; shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:26228100 AS349_gp83; Escherichia phage PA2; shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +vg:26516496 stx2A, AU085_gp42; Enterobacteria phage VT2phi_272; Shiga toxin 2 A subunit; K11006 shiga toxin subunit A +vg:26516448 stx2B, AU085_gp41; Enterobacteria phage VT2phi_272; Shiga toxin 2 B subunit; K11007 shiga toxin subunit B +vg:26516283 stxB, phi191_00011, AU083_gp11; Escherichia phage phi191; shiga toxin subunit B precursor; K11007 shiga toxin subunit B +vg:26516284 stxA, phi191_00012, AU083_gp12; Escherichia phage phi191; shiga toxin subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:26519429 AU154_gp39; Shigella phage Ss-VASD; Stx1 A subunit; K11006 shiga toxin subunit A +vg:26519430 AU154_gp40; Shigella phage Ss-VASD; Stx1 B subunit; K11007 shiga toxin subunit B +vg:1261950 stxA2, L0103, sltIIA, stx2A, 933Wp40; Enterobacteria phage 933W; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:1262010 stxB2, L0104, sltIIB, stx2B, 933Wp41; Enterobacteria phage 933W; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:2641645 stxA1, phi4795p38, PBV4795_ORF40; Enterobacteria phage BP-4795; Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +vg:2641657 stxB1, phi4795p39, PBV4795_ORF41; Enterobacteria phage BP-4795; Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +vg:929695 stxA2e, P27p25; Enterobacteria phage phiP27; shiga toxin 2e A-subunit; K11006 shiga toxin subunit A +vg:929727 stxB2e, P27p26; Enterobacteria phage phiP27; shiga toxin 2e B-subunit; K11007 shiga toxin subunit B +vg:4397483 stx2A, Stx2-86_gp01; Stx2-converting phage 86; shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:4397484 stx2B, Stx2-86_gp02; Stx2-converting phage 86; shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:6159405 stx2A, pMIN27_41; Enterobacteria phage Min27; ORF44; K11006 shiga toxin subunit A +vg:6159351 stx2B, pMIN27_42; Enterobacteria phage Min27; ORF45; K11007 shiga toxin subunit B +vg:6973138 Stx2-1717_gp41; Stx2-converting phage 1717; verocytotoxin 2 variant 2c subunit A; K11006 shiga toxin subunit A +vg:6972909 stx2cB, Stx2-1717_gp42; Stx2-converting phage 1717; verocytotoxin 2 variant 2c subunit B; K11007 shiga toxin subunit B +vg:6973079 YYZ_gp39; Enterobacteria phage YYZ-2008; Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +vg:6973080 YYZ_gp40; Enterobacteria phage YYZ-2008; Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +vg:13828571 stx2A, D300_gp43; Escherichia phage P13374; shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:13828535 stx2B, D300_gp42; Escherichia phage P13374; shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:14005228 F366_gp36; Escherichia phage TL-2011c; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:14005229 F366_gp37; Escherichia phage TL-2011c; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:1262249 stx2A, VT2-Sap42; Enterobacteria phage VT2-Sakai; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:1262250 stx2B, VT2-Sap43; Enterobacteria phage VT2-Sakai; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/test-data/shiga-toxin-example-OR --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/test-data/shiga-toxin-example-OR Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,88 @@ +ece:Z1464 stx2A; shiga-like toxin II A subunit encoded by bacteriophage BP-933W; K11006 shiga toxin subunit A +ece:Z1465 stx2B; shiga-like toxin II B subunit encoded by bacteriophage BP-933W; K11007 shiga toxin subunit B +ece:Z3343 stx1B; shiga-like toxin 1 subunit B encoded within prophage CP-933V; K11007 shiga toxin subunit B +ece:Z3344 stx1A; shiga-like toxin 1 subunit A encoded within prophage CP-933V; K11006 shiga toxin subunit A +ecs:ECs1205 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +ecs:ECs1206 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +ecs:ECs2973 Shiga toxin I subunit B; K11007 shiga toxin subunit B +ecs:ECs2974 Shiga toxin I subunit A; K11006 shiga toxin subunit A +ecf:ECH74115_2905 shigatoxin 2, subunit B; K11007 shiga toxin subunit B +ecf:ECH74115_2906 shiga toxin subunit A; K11006 shiga toxin subunit A +ecf:ECH74115_3532 shiga toxin 2 B subunit; K11007 shiga toxin subunit B +ecf:ECH74115_3533 shiga toxin subunit A; K11006 shiga toxin subunit A +etw:ECSP_2722 stx2cB; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +etw:ECSP_2723 stx2A1; Shiga-like toxin II subunit A precursor; K11006 shiga toxin subunit A +etw:ECSP_3252 stx2B; shiga toxin II subunit B; K11007 shiga toxin subunit B +etw:ECSP_3253 stx2A2; shiga toxin II subunit A; K11006 shiga toxin subunit A +elx:CDCO157_1154 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +elx:CDCO157_1155 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +elx:CDCO157_2738 Shiga toxin I subunit B precursor; K11007 shiga toxin subunit B +elx:CDCO157_2739 Shiga toxin I subunit A precursor; K11006 shiga toxin subunit A +eoj:ECO26_1599 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoj:ECO26_1600 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eoi:ECO111_2429 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eoi:ECO111_2430 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +eoi:ECO111_3361 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoi:ECO111_3362 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eoh:ECO103_2844 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eoh:ECO103_2845 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +eoh:ECO103_5197 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoh:ECO103_5198 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eso:O3O_09170 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eso:O3O_09165 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +esm:O3M_16105 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +esm:O3M_16110 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +esl:O3K_16130 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +esl:O3K_16135 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +ecoo:ECRM13514_3144 stx2B; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +ecoo:ECRM13514_3145 stx2A; Shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +ecoh:ECRM13516_2315 stx2B; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +ecoh:ECRM13516_2316 stx2A; Shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +setc:CFSAN001921_15985 Shiga toxin A subunit +seni:CY43_01420 Shiga toxin A subunit +seen:SE451236_07435 Shiga toxin A subunit +senh:CFSAN002069_07720 Shiga toxin A subunit +seec:CFSAN002050_07960 Shiga toxin A subunit +sene:IA1_01505 Shiga toxin A subunit +senc:SEET0819_08350 Shiga toxin A subunit +sdy:SDY_1389 stxA; Shiga toxin subunit A; K11006 shiga toxin subunit A +sdy:SDY_1390 stxB; Shiga toxin subunit B; K11007 shiga toxin subunit B +sdz:Asd1617_01826 Shiga toxin subunit A (EC:3.2.2.22); K11006 shiga toxin subunit A +ssab:SSABA_v1c03870 hypothetical protein; K11006 shiga toxin subunit A +ssab:SSABA_v1c09020 hypothetical protein; K11006 shiga toxin subunit A +calt:Cal6303_2132 ribosome-inactivating protein; K11006 shiga toxin subunit A +vg:22277199 PI30_gp34; Shigella phage POCJ13; shiga toxin A-chain precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:22277200 PI30_gp35; Shigella phage POCJ13; shiga toxin I subunit B precursor; K11007 shiga toxin subunit B +vg:1262301 APSE-1_07; Endosymbiont phage APSE-1; P7; K11007 shiga toxin subunit B +vg:1481747 stx1A, Stx1_p142; Escherichia Stx1 converting phage; Shiga toxin1 subunit A; K11006 shiga toxin subunit A +vg:1481748 stx1B, Stx1_p143; Escherichia Stx1 converting phage; Shiga toxin1 subunit B; K11007 shiga toxin subunit B +vg:1481767 stx2A, Stx2II_p143; Stx2 converting phage II; Shiga toxin2 subunit A; K11006 shiga toxin subunit A +vg:1481768 stx2B, Stx2II_p144; Stx2 converting phage II; Shiga toxin2 subunit B; K11007 shiga toxin subunit B +vg:26228052 AS349_gp84; Escherichia phage PA2; shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:26228100 AS349_gp83; Escherichia phage PA2; shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +vg:26516496 stx2A, AU085_gp42; Enterobacteria phage VT2phi_272; Shiga toxin 2 A subunit; K11006 shiga toxin subunit A +vg:26516448 stx2B, AU085_gp41; Enterobacteria phage VT2phi_272; Shiga toxin 2 B subunit; K11007 shiga toxin subunit B +vg:26516283 stxB, phi191_00011, AU083_gp11; Escherichia phage phi191; shiga toxin subunit B precursor; K11007 shiga toxin subunit B +vg:26516284 stxA, phi191_00012, AU083_gp12; Escherichia phage phi191; shiga toxin subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:26519429 AU154_gp39; Shigella phage Ss-VASD; Stx1 A subunit; K11006 shiga toxin subunit A +vg:26519430 AU154_gp40; Shigella phage Ss-VASD; Stx1 B subunit; K11007 shiga toxin subunit B +vg:1261950 stxA2, L0103, sltIIA, stx2A, 933Wp40; Enterobacteria phage 933W; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:1262010 stxB2, L0104, sltIIB, stx2B, 933Wp41; Enterobacteria phage 933W; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:2641645 stxA1, phi4795p38, PBV4795_ORF40; Enterobacteria phage BP-4795; Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +vg:2641657 stxB1, phi4795p39, PBV4795_ORF41; Enterobacteria phage BP-4795; Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +vg:929695 stxA2e, P27p25; Enterobacteria phage phiP27; shiga toxin 2e A-subunit; K11006 shiga toxin subunit A +vg:929727 stxB2e, P27p26; Enterobacteria phage phiP27; shiga toxin 2e B-subunit; K11007 shiga toxin subunit B +vg:4397483 stx2A, Stx2-86_gp01; Stx2-converting phage 86; shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:4397484 stx2B, Stx2-86_gp02; Stx2-converting phage 86; shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:6159405 stx2A, pMIN27_41; Enterobacteria phage Min27; ORF44; K11006 shiga toxin subunit A +vg:6159351 stx2B, pMIN27_42; Enterobacteria phage Min27; ORF45; K11007 shiga toxin subunit B +vg:6973138 Stx2-1717_gp41; Stx2-converting phage 1717; verocytotoxin 2 variant 2c subunit A; K11006 shiga toxin subunit A +vg:6972909 stx2cB, Stx2-1717_gp42; Stx2-converting phage 1717; verocytotoxin 2 variant 2c subunit B; K11007 shiga toxin subunit B +vg:6973079 YYZ_gp39; Enterobacteria phage YYZ-2008; Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +vg:6973080 YYZ_gp40; Enterobacteria phage YYZ-2008; Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +vg:13828571 stx2A, D300_gp43; Escherichia phage P13374; shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:13828535 stx2B, D300_gp42; Escherichia phage P13374; shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:14005228 F366_gp36; Escherichia phage TL-2011c; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:14005229 F366_gp37; Escherichia phage TL-2011c; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:1262249 stx2A, VT2-Sap42; Enterobacteria phage VT2-Sakai; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:1262250 stx2B, VT2-Sap43; Enterobacteria phage VT2-Sakai; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/test-data/shiga-toxin-example-OR-broken --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/get_data/kegg_glycan/test-data/shiga-toxin-example-OR-broken Fri May 06 08:05:48 2016 -0400 @@ -0,0 +1,103 @@ +ece:Z1464 stx2A; shiga-like toxin II A subunit encoded by bacteriophage BP-933W; K11006 shiga toxin subunit A +ece:Z1465 stx2B; shiga-like toxin II B subunit encoded by bacteriophage BP-933W; K11007 shiga toxin subunit B +ece:Z3343 stx1B; shiga-like toxin 1 subunit B encoded within prophage CP-933V; K11007 shiga toxin subunit B +ece:Z3344 stx1A; shiga-like toxin 1 subunit A encoded within prophage CP-933V; K11006 shiga toxin subunit A +ecs:ECs1205 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +ecs:ECs1206 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +ecs:ECs2973 Shiga toxin I subunit B; K11007 shiga toxin subunit B +ecs:ECs2974 Shiga toxin I subunit A; K11006 shiga toxin subunit A +ecf:ECH74115_2905 shigatoxin 2, subunit B; K11007 shiga toxin subunit B +ecf:ECH74115_2906 shiga toxin subunit A; K11006 shiga toxin subunit A +ecf:ECH74115_3532 shiga toxin 2 B subunit; K11007 shiga toxin subunit B +ecf:ECH74115_3533 shiga toxin subunit A; K11006 shiga toxin subunit A +etw:ECSP_2722 stx2cB; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +etw:ECSP_2723 stx2A1; Shiga-like toxin II subunit A precursor; K11006 shiga toxin subunit A +etw:ECSP_3252 stx2B; shiga toxin II subunit B; K11007 shiga toxin subunit B +etw:ECSP_3253 stx2A2; shiga toxin II subunit A; K11006 shiga toxin subunit A +elx:CDCO157_1154 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +elx:CDCO157_1155 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +elx:CDCO157_2738 Shiga toxin I subunit B precursor; K11007 shiga toxin subunit B +elx:CDCO157_2739 Shiga toxin I subunit A precursor; K11006 shiga toxin subunit A +eoj:ECO26_1599 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoj:ECO26_1600 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eoi:ECO111_2429 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eoi:ECO111_2430 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +eoi:ECO111_3361 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoi:ECO111_3362 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eoh:ECO103_2844 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eoh:ECO103_2845 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +eoh:ECO103_5197 Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +eoh:ECO103_5198 Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +eso:O3O_09170 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +eso:O3O_09165 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +esm:O3M_16105 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +esm:O3M_16110 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +esl:O3K_16130 Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +esl:O3K_16135 Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +ecoo:ECRM13514_3144 stx2B; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +ecoo:ECRM13514_3145 stx2A; Shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +ecoh:ECRM13516_2315 stx2B; Shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +ecoh:ECRM13516_2316 stx2A; Shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +stm:STM0284 shiga-like toxin A subunit +seo:STM14_0332 putative Shiga-like toxin A subunit +sev:STMMW_02891 putative shiga-like toxin A subunit +sem:STMDT12_C02790 putative Shiga-like toxin A subunit +sej:STMUK_0287 putative Shiga-like toxin A subunit +setu:STU288_13325 putative shiga-like toxin A subunit +setc:CFSAN001921_15985 Shiga toxin A subunit +send:DT104_02831 sciR; shiga-like toxin a subunit, type VI secretion system SciR protein flags: precursor +seni:CY43_01420 Shiga toxin A subunit +seen:SE451236_07435 Shiga toxin A subunit +spt:SPA2480 putative shiga-like toxin A subunit +sek:SSPA2315 shiga-like toxin A subunit +sei:SPC_0292 putative shiga-like toxin A subunit +sec:SCH_0277 putative shiga-like toxin A subunit +shb:SU5_0926 SciR Shiga-like toxin A subunit +senh:CFSAN002069_07720 Shiga toxin A subunit +seeh:SEEH1578_10515 putative shiga-like toxin A subunit +seec:CFSAN002050_07960 Shiga toxin A subunit +sene:IA1_01505 Shiga toxin A subunit +senc:SEET0819_08350 Shiga toxin A subunit +sdy:SDY_1389 stxA; Shiga toxin subunit A; K11006 shiga toxin subunit A +sdy:SDY_1390 stxB; Shiga toxin subunit B; K11007 shiga toxin subunit B +sdz:Asd1617_01826 Shiga toxin subunit A (EC:3.2.2.22); K11006 shiga toxin subunit A +ebi:EbC_13780 Putative shiga-like toxin A subunit +psos:POS17_2009 P9; putative Shiga-like toxin alpha subunit +ssab:SSABA_v1c03870 hypothetical protein; K11006 shiga toxin subunit A +ssab:SSABA_v1c09020 hypothetical protein; K11006 shiga toxin subunit A +calt:Cal6303_2132 ribosome-inactivating protein; K11006 shiga toxin subunit A +vg:22277199 PI30_gp34; Shigella phage POCJ13; shiga toxin A-chain precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:22277200 PI30_gp35; Shigella phage POCJ13; shiga toxin I subunit B precursor; K11007 shiga toxin subunit B +vg:1262301 APSE-1_07; Endosymbiont phage APSE-1; P7; K11007 shiga toxin subunit B +vg:1481747 stx1A, Stx1_p142; Escherichia Stx1 converting phage; Shiga toxin1 subunit A; K11006 shiga toxin subunit A +vg:1481748 stx1B, Stx1_p143; Escherichia Stx1 converting phage; Shiga toxin1 subunit B; K11007 shiga toxin subunit B +vg:1481767 stx2A, Stx2II_p143; Stx2 converting phage II; Shiga toxin2 subunit A; K11006 shiga toxin subunit A +vg:1481768 stx2B, Stx2II_p144; Stx2 converting phage II; Shiga toxin2 subunit B; K11007 shiga toxin subunit B +vg:26228052 AS349_gp84; Escherichia phage PA2; shiga-like toxin II subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:26228100 AS349_gp83; Escherichia phage PA2; shiga-like toxin II subunit B precursor; K11007 shiga toxin subunit B +vg:26516496 stx2A, AU085_gp42; Enterobacteria phage VT2phi_272; Shiga toxin 2 A subunit; K11006 shiga toxin subunit A +vg:26516448 stx2B, AU085_gp41; Enterobacteria phage VT2phi_272; Shiga toxin 2 B subunit; K11007 shiga toxin subunit B +vg:26516283 stxB, phi191_00011, AU083_gp11; Escherichia phage phi191; shiga toxin subunit B precursor; K11007 shiga toxin subunit B +vg:26516284 stxA, phi191_00012, AU083_gp12; Escherichia phage phi191; shiga toxin subunit A precursor (EC:3.2.2.22); K11006 shiga toxin subunit A +vg:26519429 AU154_gp39; Shigella phage Ss-VASD; Stx1 A subunit; K11006 shiga toxin subunit A +vg:26519430 AU154_gp40; Shigella phage Ss-VASD; Stx1 B subunit; K11007 shiga toxin subunit B +vg:1261950 stxA2, L0103, sltIIA, stx2A, 933Wp40; Enterobacteria phage 933W; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:1262010 stxB2, L0104, sltIIB, stx2B, 933Wp41; Enterobacteria phage 933W; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:2641645 stxA1, phi4795p38, PBV4795_ORF40; Enterobacteria phage BP-4795; Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +vg:2641657 stxB1, phi4795p39, PBV4795_ORF41; Enterobacteria phage BP-4795; Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +vg:929695 stxA2e, P27p25; Enterobacteria phage phiP27; shiga toxin 2e A-subunit; K11006 shiga toxin subunit A +vg:929727 stxB2e, P27p26; Enterobacteria phage phiP27; shiga toxin 2e B-subunit; K11007 shiga toxin subunit B +vg:4397483 stx2A, Stx2-86_gp01; Stx2-converting phage 86; shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:4397484 stx2B, Stx2-86_gp02; Stx2-converting phage 86; shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:6159405 stx2A, pMIN27_41; Enterobacteria phage Min27; ORF44; K11006 shiga toxin subunit A +vg:6159351 stx2B, pMIN27_42; Enterobacteria phage Min27; ORF45; K11007 shiga toxin subunit B +vg:6973138 Stx2-1717_gp41; Stx2-converting phage 1717; verocytotoxin 2 variant 2c subunit A; K11006 shiga toxin subunit A +vg:6972909 stx2cB, Stx2-1717_gp42; Stx2-converting phage 1717; verocytotoxin 2 variant 2c subunit B; K11007 shiga toxin subunit B +vg:6973079 YYZ_gp39; Enterobacteria phage YYZ-2008; Shiga toxin 1 subunit A; K11006 shiga toxin subunit A +vg:6973080 YYZ_gp40; Enterobacteria phage YYZ-2008; Shiga toxin 1 subunit B; K11007 shiga toxin subunit B +vg:13828571 stx2A, D300_gp43; Escherichia phage P13374; shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:13828535 stx2B, D300_gp42; Escherichia phage P13374; shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:14005228 F366_gp36; Escherichia phage TL-2011c; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:14005229 F366_gp37; Escherichia phage TL-2011c; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B +vg:1262249 stx2A, VT2-Sap42; Enterobacteria phage VT2-Sakai; Shiga toxin 2 subunit A; K11006 shiga toxin subunit A +vg:1262250 stx2B, VT2-Sap43; Enterobacteria phage VT2-Sakai; Shiga toxin 2 subunit B; K11007 shiga toxin subunit B diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/test_findKEGG.py --- a/get_data/kegg_glycan/test_findKEGG.py Wed Mar 23 14:35:56 2016 -0400 +++ b/get_data/kegg_glycan/test_findKEGG.py Fri May 06 08:05:48 2016 -0400 @@ -41,9 +41,10 @@ m = fk.find_entries_in_KEGG("john", "glucose") def test_unfindable_entry(self): - """should return None""" + """should return an empty string""" m = fk.find_entries_in_KEGG("glycan", "sally") - self.assertIsNone(m) + emptystring="" + self.assertItemsEqual(m,emptystring,"Expected Empty String for non-existent entry") def test_find_example(self): m = fk.find_entries_in_KEGG("glycan", "glucose") @@ -52,9 +53,123 @@ def test_query_has_newlines(self): """ - should be fine and return entries + Assume a new line query is an AND query. + """ + m = fk.find_entries_in_KEGG("glycan", "glucose\nUDP") + self.assertIsNotNone(m) + print m + self.assertIn("UDP-D-glucose", m) + + def test_query_has_newlines_and_a_space(self): + """ + glucose\\n UDP. OR's should pass """ m = fk.find_entries_in_KEGG("glycan", "glucose\n UDP") self.assertIsNotNone(m) self.assertIn("UDP-D-glucose", m) + def test_gene_specific_or(self): + """ + test "shiga toxin" returns. + /find/genes/"shiga toxin" for keywords "shiga toxin" + """ + m = fk.find_entries_in_KEGG("genes","shiga toxin") + self.assertIsNotNone(m) + #. not matching to all entries - that is silly, the db get updated! + self.assertIn("shiga", m) + self.assertIn("toxin", m) + self.assertNotIn("stm:STM0284",m) # should not be found in the OR query + + def test_gene_specific_and(self): + """ + test "shiga+toxin" returns. it should + /find/genes/shiga+toxin for keywords "shiga" and "toxin" + """ + m = fk.find_entries_in_KEGG("genes","shiga+toxin") + self.assertIsNotNone(m) + #. not matching to all entries - that is silly, the db get updated! + self.assertIn("shiga", m) + self.assertIn("toxin", m) + self.assertIn("stm:STM0284",m) # should be found in the AND query + + def test_enzyme_specific_1(self): + """ + test 2.4.99.1 returns + """ + m = fk.find_entries_in_KEGG("enzyme","2.4.99.1") + self.assertIsNotNone(m) + #. not matching to all entries - that is silly, the db get updated! + self.assertIn("2.4.99.1", m) + + def test_enzyme_specific_2(self): + """ + test 2.4.99.6 returns + """ + m = fk.find_entries_in_KEGG("enzyme","2.4.99.6") + self.assertIsNotNone(m) + #. not matching to all entries - that is silly, the db get updated! + self.assertIn("2.4.99.6", m) + + def test_enzyme_specific_3(self): + """ + test ec: 2.4.99.6 with space (tests stripping space functionality) + """ + m = fk.find_entries_in_KEGG("enzyme","ec: 2.4.99.6") + self.assertIsNotNone(m) + #. not matching to all entries - that is silly, the db get updated! + self.assertIn("2.4.99.6", m) + + def test_enzyme_specific_4(self): + """ + test ec: 2.4.99. , should return 2.4.99.* + """ + m = fk.find_entries_in_KEGG("enzyme","ec: 2.4.99.") + self.assertIsNotNone(m) + #. not matching to all entries - that is silly, the db get updated! + self.assertIn("2.4.99.1", m) + self.assertIn("2.4.99.6", m) + self.assertIn("2.4.99.11", m) + + def test_enzyme_specific_5(self): + """ + test ec: 2.4.99.1+2.4.99.6 . AND function, so returns nothing here. Do not expect an enzyme to be doubly classified. + """ + m = fk.find_entries_in_KEGG("enzyme","2.4.99.1+2.4.99.6") + self.assertIsNotNone(m) + emptystring="" + self.assertItemsEqual(m,emptystring,"Expected Empty String for non-existent entry") + + def test_enzyme_specific_6(self): + """ + test ec: 2.4.99.1 2.4.99.6 . OR function, should return something but does not (KEGG FAILURE?). + note that trying this without "" will return the AND function result which is incorrect. + """ + m = fk.find_entries_in_KEGG("enzyme","2.4.99.1 2.4.99.6") + self.assertIsNotNone(m) + #self.assertIn("2.4.99.1", m) + emptystring="" + print m + self.assertItemsEqual(m,emptystring,"Expected Empty String for non-existent entry") + + + def test_enzyme_specific_7(self): + """ + test deoxy+1.1.1. . AND function, that should return something + """ + m = fk.find_entries_in_KEGG("enzyme","deoxy+1.1.1") + self.assertIsNotNone(m) + print m + self.assertIn("deoxy", m) + self.assertIn("1.1.1", m) + + def test_enzyme_specific_8(self): + """ + test deoxy 1.1.1. . OR function. should return deoxy or 1.1.1. but does not (KEGG FAILURE?). i + note that trying this without "" will return the AND function result which is incorrect. + """ + m = fk.find_entries_in_KEGG("enzyme","deoxy 1.1.1") + self.assertIsNotNone(m) + emptystring="" + print m + self.assertItemsEqual(m,emptystring,"Expected Empty String for non-existent entry") + diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/test_findKEGG.pyc Binary file get_data/kegg_glycan/test_findKEGG.pyc has changed diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/test_getkcfKEGG.pyc Binary file get_data/kegg_glycan/test_getkcfKEGG.pyc has changed diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/test_linkKEGG.py --- a/get_data/kegg_glycan/test_linkKEGG.py Wed Mar 23 14:35:56 2016 -0400 +++ b/get_data/kegg_glycan/test_linkKEGG.py Fri May 06 08:05:48 2016 -0400 @@ -40,3 +40,76 @@ m = lk.linked_entries_from_kegg("br", "gl:G10496") self.assertEquals(m,"") + def test_enzyme_glycan_search_1(self): + """ + test "2.4.99.1 ec: " returns + """ + m = lk.linked_entries_from_kegg("glycan", "2.4.99.1 ec:") + self.assertIn("2.4.99.1", m) + + + def test_enzyme_glycan_search_2(self): + """ + test "2.4.99.1 ec: 2.4.99.6" returns + """ + m = lk.linked_entries_from_kegg("glycan", "2.4.99.1 ec: 2.4.99.6" ) + self.assertIn("2.4.99.1", m) + self.assertIn("2.4.99.6", m) + + def test_enzyme_glycan_search_3(self): + """ + test "2.4.99.1 ec:2.4.99.6" returns + """ + m = lk.linked_entries_from_kegg("glycan", "2.4.99.1 ec:2.4.99.6" ) + self.assertIn("2.4.99.1", m) + self.assertIn("2.4.99.6", m) + + def test_enzyme_glycan_search_4(self): + """ + test "2.4.99.1+2.4.99.6" returns. This time '+' is or. + """ + m = lk.linked_entries_from_kegg("glycan", "2.4.99.1+2.4.99.6" ) + self.assertIn("2.4.99.1", m) + self.assertIn("2.4.99.6", m) + + def test_enzyme_glycan_search_4b(self): + """ + test "2.4.99.1+ 2.4.99.6" returns. This time '+' is or. + """ + m = lk.linked_entries_from_kegg("glycan", "2.4.99.1+ 2.4.99.6" ) + self.assertIn("2.4.99.1", m) + self.assertIn("2.4.99.6", m) + + def test_enzyme_glycan_search_5(self): + """ + test "2.4.99.1 2.4.99.6" returns. Space also means or for the link db. + """ + m = lk.linked_entries_from_kegg("glycan", "2.4.99.1 2.4.99.6" ) + self.assertIn("2.4.99.1", m) + self.assertIn("2.4.99.6", m) + + + def test_enzyme_glycan_search_6(self): + """ + test "2.4.99.1+nana+2.4.99.6" returns. strangely when inserting junk it still works. + """ + m = lk.linked_entries_from_kegg("glycan", "2.4.99.1+nana+2.4.99.6" ) + self.assertIn("2.4.99.1", m) + self.assertIn("2.4.99.6", m) + + def test_enzyme_glycan_search_6b(self): + """ + test "2.4.99.1 nana 2.4.99.6" returns. strangely when inserting junk it still works. + """ + m = lk.linked_entries_from_kegg("glycan", "2.4.99.1+nana+2.4.99.6" ) + self.assertIn("2.4.99.1", m) + self.assertIn("2.4.99.6", m) + + def test_enzyme_glycan_search_7(self): + """ + test "\"2.4.99.1\"" is a bad request as it includes quotes. + """ + from urllib2 import HTTPError + with self.assertRaises(HTTPError): + m = lk.linked_entries_from_kegg("glycan", "\"2.4.99.1\"" ) + diff -r 89592faa2875 -r 0a5e0df17054 get_data/kegg_glycan/test_linkKEGG.pyc Binary file get_data/kegg_glycan/test_linkKEGG.pyc has changed