diff test-data/dup_check.txt @ 0:fd5c0b39569a draft

"planemo upload for repository https://github.com/computational-metabolomics/metfrag-galaxy commit e20ce56f23d9fe30df64542ece2295d654ca142d"
author computational-metabolomics
date Wed, 05 Feb 2020 12:30:06 -0500
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/dup_check.txt	Wed Feb 05 12:30:06 2020 -0500
@@ -0,0 +1,149 @@
+ACCESSION: FU000001
+RECORD_TITLE: 1111111111111111
+DATE: 2016.01.19 (Created 2009.02.18, modified 2011.05.06)
+AUTHORS: Matsuura F, Ohta M, Kittaka M, Faculty of Life Science and Biotechnology, Fukuyama University
+LICENSE: CC BY-SA
+CH$NAME: 3-Man2GlcNAc
+CH$NAME: Man-alpha-1-3Man-beta-1-4GlcNac
+CH$COMPOUND_CLASS: Natural Product; Oligosaccharide; N-linked glycan; High-mannose type
+CH$FORMULA: C20H35NO16
+CH$EXACT_MASS: 545.19558
+CH$SMILES: CC(=O)NC(C(O)1)C(O)C(OC(O2)C(O)C(OC(O3)C(O)C(O)C(O)C(CO)3)C(O)C(CO)2)C(CO)O1
+CH$IUPAC: InChI=1/C20H35NO16/c1-5(25)21-9-12(28)16(8(4-24)33-18(9)32)36-20-15(31)17(11(27)7(3-23)35-20)37-19-14(30)13(29)10(26)6(2-22)34-19/h6-20,22-24,26-32H,2-4H2,1H3,(H,21,25)/t6-,7-,8-,9-,10-,11-,12-,13+,14-,15+,16-,17+,18+,19-,20+/m1/s1/f/h21H
+CH$LINK: CHEMSPIDER 24606097
+CH$LINK: KEGG G00319
+AC$INSTRUMENT: 2695 HPLC Quadro Micro API, Waters
+AC$INSTRUMENT_TYPE: LC-ESI-QQ
+AC$MASS_SPECTROMETRY: MS_TYPE MS2
+AC$MASS_SPECTROMETRY: ION_MODE POSITIVE
+AC$MASS_SPECTROMETRY: COLLISION_ENERGY 15.0 V
+AC$MASS_SPECTROMETRY: DATAFORMAT Centroid
+AC$MASS_SPECTROMETRY: DESOLVATION_GAS_FLOW 897 L/Hr
+AC$MASS_SPECTROMETRY: DESOLVATION_TEMPERATURE 399 C
+AC$MASS_SPECTROMETRY: FRAGMENTATION_METHOD LOW-ENERGY CID
+AC$MASS_SPECTROMETRY: IONIZATION ESI
+AC$MASS_SPECTROMETRY: SCANNING 1 amu/sec (m/z = 20-2040)
+AC$MASS_SPECTROMETRY: SOURCE_TEMPERATURE 100C
+AC$CHROMATOGRAPHY: COLUMN_NAME TSK-GEL Amide-80 2.0 mm X 250 mm (TOSOH)
+AC$CHROMATOGRAPHY: COLUMN_TEMPERATURE 40 C
+AC$CHROMATOGRAPHY: FLOW_GRADIENT 74/26 at 0 min, 50/50 at 60 min.
+AC$CHROMATOGRAPHY: FLOW_RATE 0.2 ml/min
+AC$CHROMATOGRAPHY: RETENTION_TIME 7.080 min
+AC$CHROMATOGRAPHY: SAMPLING_CONE 43.10 V
+AC$CHROMATOGRAPHY: SOLVENT CH3CN/H2O
+MS$FOCUSED_ION: DERIVATIVE_FORM C29H46N2O17
+MS$FOCUSED_ION: DERIVATIVE_MASS 694.27965
+MS$FOCUSED_ION: DERIVATIVE_TYPE ABEE (p-Aminobenzoic acid ethyl ester)
+MS$FOCUSED_ION: PRECURSOR_M/Z 695.00
+MS$FOCUSED_ION: PRECURSOR_TYPE [M+H]+
+PK$SPLASH: splash10-0006-0002029000-bfe86aa7211a87812a06
+PK$NUM_PEAK: 8
+PK$PEAK: m/z int. rel.int.
+  370.8 3.277e5 366
+  371.4 3.036e4 34
+  532.0 5.812e4 65
+  532.6 2.982e5 333
+  533.3 5.196e4 58
+  694.1 4.564e5 510
+  694.8 8.939e5 999
+  695.4 5.537e4 62
+
+ACCESSION: FU000001
+RECORD_TITLE: 222222222222222222
+DATE: 2016.01.19 (Created 2009.02.18, modified 2011.05.06)
+AUTHORS: Matsuura F, Ohta M, Kittaka M, Faculty of Life Science and Biotechnology, Fukuyama University
+LICENSE: CC BY-SA
+CH$NAME: 3-Man2GlcNAc
+CH$NAME: Man-alpha-1-3Man-beta-1-4GlcNac
+CH$COMPOUND_CLASS: Natural Product; Oligosaccharide; N-linked glycan; High-mannose type
+CH$FORMULA: C20H35NO16
+CH$EXACT_MASS: 545.19558
+CH$SMILES: CC(=O)NC(C(O)1)C(O)C(OC(O2)C(O)C(OC(O3)C(O)C(O)C(O)C(CO)3)C(O)C(CO)2)C(CO)O1
+CH$IUPAC: InChI=1/C20H35NO16/c1-5(25)21-9-12(28)16(8(4-24)33-18(9)32)36-20-15(31)17(11(27)7(3-23)35-20)37-19-14(30)13(29)10(26)6(2-22)34-19/h6-20,22-24,26-32H,2-4H2,1H3,(H,21,25)/t6-,7-,8-,9-,10-,11-,12-,13+,14-,15+,16-,17+,18+,19-,20+/m1/s1/f/h21H
+CH$LINK: CHEMSPIDER 24606097
+CH$LINK: KEGG G00319
+AC$INSTRUMENT: 2695 HPLC Quadro Micro API, Waters
+AC$INSTRUMENT_TYPE: LC-ESI-QQ
+AC$MASS_SPECTROMETRY: MS_TYPE MS2
+AC$MASS_SPECTROMETRY: ION_MODE POSITIVE
+AC$MASS_SPECTROMETRY: COLLISION_ENERGY 15.0 V
+AC$MASS_SPECTROMETRY: DATAFORMAT Centroid
+AC$MASS_SPECTROMETRY: DESOLVATION_GAS_FLOW 897 L/Hr
+AC$MASS_SPECTROMETRY: DESOLVATION_TEMPERATURE 399 C
+AC$MASS_SPECTROMETRY: FRAGMENTATION_METHOD LOW-ENERGY CID
+AC$MASS_SPECTROMETRY: IONIZATION ESI
+AC$MASS_SPECTROMETRY: SCANNING 1 amu/sec (m/z = 20-2040)
+AC$MASS_SPECTROMETRY: SOURCE_TEMPERATURE 100C
+AC$CHROMATOGRAPHY: COLUMN_NAME TSK-GEL Amide-80 2.0 mm X 250 mm (TOSOH)
+AC$CHROMATOGRAPHY: COLUMN_TEMPERATURE 40 C
+AC$CHROMATOGRAPHY: FLOW_GRADIENT 74/26 at 0 min, 50/50 at 60 min.
+AC$CHROMATOGRAPHY: FLOW_RATE 0.2 ml/min
+AC$CHROMATOGRAPHY: RETENTION_TIME 7.080 min
+AC$CHROMATOGRAPHY: SAMPLING_CONE 43.10 V
+AC$CHROMATOGRAPHY: SOLVENT CH3CN/H2O
+MS$FOCUSED_ION: DERIVATIVE_FORM C29H46N2O17
+MS$FOCUSED_ION: DERIVATIVE_MASS 694.27965
+MS$FOCUSED_ION: DERIVATIVE_TYPE ABEE (p-Aminobenzoic acid ethyl ester)
+MS$FOCUSED_ION: PRECURSOR_M/Z 695.00
+MS$FOCUSED_ION: PRECURSOR_TYPE [M+H]+
+PK$SPLASH: splash10-0006-0002029000-bfe86aa7211a87812a06
+PK$NUM_PEAK: 8
+PK$PEAK: m/z int. rel.int.
+  370.8 3.277e5 366
+  371.4 3.036e4 34
+  532.0 5.812e4 65
+  532.6 2.982e5 333
+  533.3 5.196e4 58
+  694.1 4.564e5 510
+  694.8 8.939e5 999
+  695.4 5.537e4 62
+
+ACCESSION: FU000001
+RECORD_TITLE: 33333333333333333
+DATE: 2016.01.19 (Created 2009.02.18, modified 2011.05.06)
+AUTHORS: Matsuura F, Ohta M, Kittaka M, Faculty of Life Science and Biotechnology, Fukuyama University
+LICENSE: CC BY-SA
+CH$NAME: 3-Man2GlcNAc
+CH$NAME: Man-alpha-1-3Man-beta-1-4GlcNac
+CH$COMPOUND_CLASS: Natural Product; Oligosaccharide; N-linked glycan; High-mannose type
+CH$FORMULA: C20H35NO16
+CH$EXACT_MASS: 545.19558
+CH$SMILES: CC(=O)NC(C(O)1)C(O)C(OC(O2)C(O)C(OC(O3)C(O)C(O)C(O)C(CO)3)C(O)C(CO)2)C(CO)O1
+CH$IUPAC: InChI=1/C20H35NO16/c1-5(25)21-9-12(28)16(8(4-24)33-18(9)32)36-20-15(31)17(11(27)7(3-23)35-20)37-19-14(30)13(29)10(26)6(2-22)34-19/h6-20,22-24,26-32H,2-4H2,1H3,(H,21,25)/t6-,7-,8-,9-,10-,11-,12-,13+,14-,15+,16-,17+,18+,19-,20+/m1/s1/f/h21H
+CH$LINK: CHEMSPIDER 24606097
+CH$LINK: KEGG G00319
+AC$INSTRUMENT: 2695 HPLC Quadro Micro API, Waters
+AC$INSTRUMENT_TYPE: LC-ESI-QQ
+AC$MASS_SPECTROMETRY: MS_TYPE MS2
+AC$MASS_SPECTROMETRY: ION_MODE POSITIVE
+AC$MASS_SPECTROMETRY: COLLISION_ENERGY 15.0 V
+AC$MASS_SPECTROMETRY: DATAFORMAT Centroid
+AC$MASS_SPECTROMETRY: DESOLVATION_GAS_FLOW 897 L/Hr
+AC$MASS_SPECTROMETRY: DESOLVATION_TEMPERATURE 399 C
+AC$MASS_SPECTROMETRY: FRAGMENTATION_METHOD LOW-ENERGY CID
+AC$MASS_SPECTROMETRY: IONIZATION ESI
+AC$MASS_SPECTROMETRY: SCANNING 1 amu/sec (m/z = 20-2040)
+AC$MASS_SPECTROMETRY: SOURCE_TEMPERATURE 100C
+AC$CHROMATOGRAPHY: COLUMN_NAME TSK-GEL Amide-80 2.0 mm X 250 mm (TOSOH)
+AC$CHROMATOGRAPHY: COLUMN_TEMPERATURE 40 C
+AC$CHROMATOGRAPHY: FLOW_GRADIENT 74/26 at 0 min, 50/50 at 60 min.
+AC$CHROMATOGRAPHY: FLOW_RATE 0.2 ml/min
+AC$CHROMATOGRAPHY: RETENTION_TIME 7.080 min
+AC$CHROMATOGRAPHY: SAMPLING_CONE 43.10 V
+AC$CHROMATOGRAPHY: SOLVENT CH3CN/H2O
+MS$FOCUSED_ION: DERIVATIVE_FORM C29H46N2O17
+MS$FOCUSED_ION: DERIVATIVE_MASS 694.27965
+MS$FOCUSED_ION: DERIVATIVE_TYPE ABEE (p-Aminobenzoic acid ethyl ester)
+MS$FOCUSED_ION: PRECURSOR_M/Z 695.00
+MS$FOCUSED_ION: PRECURSOR_TYPE [M+H]+
+PK$SPLASH: splash10-0006-0002029000-bfe86aa7211a87812a06
+PK$NUM_PEAK: 8
+PK$PEAK: m/z int. rel.int.
+  370.8 3.277e5 366
+  371.4 3.036e4 34
+  532.0 5.812e4 65
+  532.6 2.982e5 333
+  533.3 5.196e4 58
+  694.1 4.564e5 510
+  694.8 8.939e5 999
+  695.4 5.537e4 62