view PDAUG_Peptide_Ngrams/test-data/test1.fasta @ 5:f93187136dfb draft

"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit edb37634e419f75dd66292e712de51278746d883"
author jay
date Wed, 30 Dec 2020 02:42:16 +0000
parents c3f0b3a6339e
children
line wrap: on
line source

>ACP0
GLWSKIKEVGKEAAKAAAKAAGKAALGAVSEAV
>ACP2
GLFDIIKKIAESI
>ACP4
GLLDIVKKVVGAFGSL
>ACP6
GLFDIVKKVVGALGSL
>ACP8
GLFDIVKKVVGTLAGL
>ACP10
GLFDIAKKVIGVIGSL
>ACP12
GLFDIVKKIAGHIAGSI
>ACP14
GLFDIVKKIAGHIVSSI
>ACP16
AACARFIDDFCDTLTPNIYRPRDNGQRCYAVNGHRCDFTVFNTNNGGNPIRASTPNCKTVLRTAANRCPTGGRGKINPNAPFLFAIDPNDGDCSTNF
>ACP18
HGVSGHGQHGVHG
>ACP20
FKCRRWQWRMKKLGAPSITCVRRAF
>ACP22
KWKLFKKIKFLHSAKKF
>ACP24
KSSAYSLQMGATAIKQVKKLFKKWGW
>ACP26
GIGTKILGGVKTALKGALKELASTYAN
>ACP28
GIGGKILSGLKTALKGAAKELASTYLH
>ACP30
GIGGVLLSAGKAALKGLAKVLAEKYAN
>ACP32
SIGAKILGGVKTFFKGALKELASTYLQ
>ACP34
FLPLLAGLAANFLPTIICKISYKC
>ACP36
FVQWFSKFLGRIL
>ACP38
KWKIFKKIEKVGRNIRNGIIKAGPAVAVLGEAKAL
>ACP40
GWLKKIGKKIERVGQHTRDATIQTIGVAQQAANVAATLK
>ACP42
KWKLFKKIEKVGQNIRDGIIKAGPAVAVVGQATQIAK
>ACP44
SQLGDLGSGAGQGGGGGGSIRAAGGAFGKLEAAREEEFFYKKQKEQLERLKNDQIHQAEFHHQQIKEHEEAIQRHKDFLNNLHK
>ACP46
GIGKFLHSAKKFGKAFVGEIMNS
>ACP48
GIGAVLKVLTTGLPALISWIKRKRQQ
>ACP50
ALWKNMLKGIGKLAGQAALGAVKTLVGAE
>ACP52
ACYCRIPACIAGERRYGTCIYQGRLWAFCC
>ACP54
ECRRLCYKQRCVTYCRGR
>ACP56
LKLKSIVSWAKKVL
>ACP58
KWCFRVCYRGICYRRCR
>ACP60
KSCCRNTWARNCYNVCRLPGTISREICAKKCDCKIISGTTCPSDYPK
>ACP62
GLLSVLGSVAKHVLPHVVPVIAEHL
>ACP64
GLLSVLGSVVKHVIPHVVPVIAEHL
>ACP66
GLFKVLGSVAKHLLPHVAPVIAEK
>ACP68
GLFGVLGSIAKHVLPHVVPVIAEK
>ACP70
GLFVGVLAKVAAHVVPAIAEHF
>ACP72
GLFVGLAKVAAHNNPAIAEHFQA
>ACP74
GFVDFLKKVAGTIANVVT
>ACP76
GLLQTIKEKLESLESLAKGIVSGIQA
>ACP78
TRSSRAGLQFPVGRVHRLLRK
>ACP80
FFGWLIKGAIHAGKAIHGLIHRRRH
>ACP82
GLFDVIKKVASVIGGL
>ACP84
GLFDIIKKVASVVGGL
>ACP86
GRFKRFRKKFKKLFKKLSPVIPLLHLG
>ACP88
GGLRSLGRKILRAWKKYGPIIVPIIRIG
>ACP90
RRRPRPPYLPRPRPPPFFPPRLPPRIPPGFPPRFPPRFP
>ACP92
GLLGPLLKIAAKVGSNLL
>ACP94
GLICESCRKIIQKLEDMVGPQPNEDTVTQAASQVCDKLKILRGLCKKIMRSFLRRISWDILTGKKPQAICVDIKICKEKTGLI
>ACP96
DHYNCVSSGGQCLYSACPIFTKIQGTCYRGKAKCCK
>ACP98
FFHHIFRGIVHVGKTIHRLVTG
>ACP100
KLAKLAKKLAKLAK
>ACP102
KTCENLADTFRGPCFATSNC
>ACP104
IDWKKLLDAAKQIL
>ACP106
FLIGMTQGLICLITRKC
>ACP108
ILPILSLIGGLLGK
>ACP110
GLLGLLGSVVSHVVPAIVGHF
>ACP112
GLLGLLGSVVSHVLPAITQHL
>ACP114
GIKCRFCCGCCTPGICGVCCRF
>ACP116
QSHLSLCRWCCNCCRSNKGC
>ACP118
ILGPVISTIGGVLGGLLKNL
>ACP120
FLPILASLAAKFGPKLFCLVTKKC
>ACP122
GLWSKIKEAAKAAGKAALNAVTGLVNQGDQPS
>ACP124
LLGMIPLAISAISALSKL
>ACP126
GLPVCGETCVGGTCNTPGCSCSWPVCTRN
>ACP128
GVPICGETCTLGTCYTAGCSCSWPVCTRN
>ACP130
GIPCGESCVWIPCISSAIGCSCKSKVCYRN
>ACP132
GIPCAESCVWIPCTVTALIGCGCSNKVCYN
>ACP134
GTFPCGESCVFIPCLTSAIGCSCKSKVCYKN
>ACP136
GLLPCAESCVYIPCLTTVIGCSCKSKVCYKN
>ACP138
GRDYRTCLTIVQKLKKMVDKPTQRSVSNAATRVCRTGRSRWRDVCRNFMRRYQSRVTQGLVAGETAQQICEDLRLCIPSTGPL
>ACP140
GETDPNTQLLNDLGNNMAWGAALGAPGGLGSAALGAAGGALQTVGQGLIDHGPVNVFIPVLIGPSWNGSGSGYNSATSSSGSGS
>ACP142
GFKDLLKGAAKALVKTVLF
>ACP144
KSCCPNTTGRNIYNACRLTGAPRPTCAKLSGCKIISGSTCPSDYPK
>ACP146
KSCCPNTTGRNIYNTCRFGGGSREVCARISGCKIISASTCPSDYPK
>ACP148
KSCCPNTTGRNIYNTCRLTGSSRETCAKLSGCKIISASTCPSNYPK
>ACP150
MRKEFHNVLSSGQLLADKRPARDYNRK
>ACP152
KSCCKNTTGRNIYNTCRFAGGSRERCAKLSGCKIISASTCPSDYPK
>ACP154
FIFHIIKGLFHAGKMIHGLVTRRRH
>ACP156
FLPAIVGAAAKFLPKIFCAISKKC
>ACP158
FLPIIAGVAAKVLPKIFCAISKKC
>ACP160
FLPIIAGIAAKFLPKIFCTISKKC
>ACP162
FLPVIAGVAANFLPKLFCAISKKC
>ACP164
FLPIIAGAAAKVVQKIFCAISKKC
>ACP166
GLMDTIKGVAKTVAASWLDKLKCKITGC
>ACP168
VNWKKVLGKIIKVAK
>ACP170
VNWKKILGKIIKVAK
>ACP172
FFSLLPSLIGGLVSAIK
>ACP174
RFRLPFRRPPIRIHPPPFYPPFRRFL
>ACP176
KWKLFKKIPKFLHLAKKF
>ACP178
YKQCHKKGGHCFPKEKICLPPSSDFGKMDCRWRWKCCKKGSG
>ACP180
GIPCGESCVFIPCITGAIGCSCKSKVCYRN
>ACP182
GEFLKCGESCVQGECYTPGCSCDWPICKKN
>ACP184
GLPTCGETCTLGTCYVPDCSCSWPICMKN
>ACP186
GLPVCGETCFGGTCNTPGCTCDPWPVCTRN
>ACP188
FVDLKKIANIINSIFGK
>ACP190
GSIPCGESCVFIPCISSVIGCACKSKVCYKN
>ACP192
GIPCGESCVFIPCISSVIGCSCSSKVCYRN
>ACP194
GSIPCGESCVFIPCISAVIGCSCSNKVCYKN
>ACP196
GSIPCEGSCVFIPCISAIIGCSCSNKVCYKN
>ACP198
GIPCGESCVFIPCLTSAIDCSCKSKVCYRN
>ACP200
GMWSKILGHLIR
>ACP202
GKWMSLLKHILK
>ACP204
GFGMALKLLKKVL
>ACP206
GTGLPMSERRKIMLMMR
>ACP208
GIACGESCVFLGCFIPGCSCKSKVCYFN
>ACP210
GVIPCGESCVFIPCISSVLGCSCKNKVCYRD
>ACP212
KLCGETCFKFKCYTPGCSCSYPFCK
>ACP214
GDACGETCFTGICFTAGCSCNPWPTCTRN
>ACP216
GIPCAESCVWIPPCTITALMGCSCKNNVCYNN
>ACP218
IPCGESCVWIPCITAIAGCSCKNKVCYT
>ACP220
AIPCGESCVWIPCISTVIGCSCSNKVCYR
>ACP222
GEYCGESCYLIPCFTPGCYCVSRQCVNKN
>ACP224
IPCGESCVWIPCISGMFGCSCKDKVCYS
>ACP226
FLGWLFKWASK
>ACP228
FLKWLFKWAKK
>ACP230
KWKSFLKTFKSAKKTVLHTALKAISS
>ACP232
KWKSFLKTFKSLKKTVLHTLLKAISS
>ACP234
MPFLFCNVNDVCNFASRNDYSCNYYSNSYSFWLASLNPER
>ACP236
KWKLFKKIGAVLKVL
>ACP238
GACFSIAHECGA
>ACP240
TCCATGACGTTCCTGACGTT
>ACP242
KRFKQDGGASHASPASS
>ACP244
KRAKAAGGWSHWSPWSSC
>ACP246
LLGDFFRKSKEKIGKEFKRIVQRIKDFLRNLVPRTES
>ACP248
FLGALFKVASKVLPSVKCAITKKC
>ACP250
GIGKFLKKAKKFGKAFVKILKK
>ACP252
GIGKFLKKAKKGIGAVLKVLTTGL
>ACP254
VECYGPNRPQF
>ACP256
KRFKQDGGWSHWSPWSSC
>ACP258
RQVFQVAYIIIKA
>ACP260
KAFDITYVRLKF
>ACP262
DFKLFAVTIKYR
>ACP264
DFKLFAVYIKYR
>ACP266
WHSDMEWWYLLG
>ACP268
HTMYYHHYQHHL
>ACP270
RLVSYNGIIFFLK
>ACP272
GRENYHGCTTHWGFTLC
>ACP274
ASSSYPLIHWRPWAR