Mercurial > repos > iuc > icescreen
changeset 9:cca2a89210ae draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/icescreen commit c45c31257dbfd6991c86cee56bb8961e4c5cbe47
author | iuc |
---|---|
date | Sun, 23 Feb 2025 16:52:34 +0000 |
parents | 130a217f8d3f |
children | |
files | icescreen.xml macros.xml test-data/NC_004668_137848_164286_detected_SP_withMEIds.tsv test-data/NC_004668_137848_164286_icescreen.embl test-data/NC_004668_137848_164286_icescreen.gb test-data/NC_004668_137848_164286_icescreen.gff |
diffstat | 6 files changed, 83 insertions(+), 1252 deletions(-) [+] |
line wrap: on
line diff
--- a/icescreen.xml Fri Feb 09 21:26:42 2024 +0000 +++ b/icescreen.xml Sun Feb 23 16:52:34 2025 +0000 @@ -1,16 +1,12 @@ <tool id="icescreen" name="ICEscreen" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="20.09"> - <description>detects and annotates ICEs (Integrative and Conjugative Elements) and IMEs (Integrative and Mobilizable Elements) in Bacillota genomes.</description> + <description>annotates ICEs and IMEs in Bacillota genomes</description> + <macros> - <token name="@TOOL_VERSION@">1.3.1</token> - <token name="@VERSION_SUFFIX@">0</token> + <import>macros.xml</import> </macros> - <xrefs> - <xref type="bio.tools">icescreen</xref> - </xrefs> - <requirements> - <requirement type="package" version="@TOOL_VERSION@">icescreen</requirement> - <requirement type="package" version="3.0">zip</requirement> - </requirements> + <expand macro="xrefs"/> + <expand macro="requirements"/> + <version_command><![CDATA[ icescreen --version ]]> @@ -18,37 +14,23 @@ <command detect_errors="aggressive"><![CDATA[ #set $gbname = 'galaxy_genbank' mkdir -p ./tmp_icescreen/source_genbank + && mkdir -p ./tmp_icescreen/icescreen_result && ln -s '${genome}' ./tmp_icescreen/source_genbank/${gbname}.gb && icescreen --galaxy --gbdir ./tmp_icescreen/source_genbank - --outdir ./tmp_icescreen + --outdir ./tmp_icescreen/icescreen_result --phylum '${taxonomy.phylum}' --jobs "\${GALAXY_SLOTS:-4}" > ./tmp_icescreen/ICEscreen_log.txt 2>&1 - - && cat ./tmp_icescreen/ICEscreen_results/results/${gbname}/icescreen_detection_ME/${gbname}_detected_ME.summary > '${summary}' - && cat ./tmp_icescreen/ICEscreen_results/results/${gbname}/icescreen_detection_ME/${gbname}_detected_SP_withMEIds.tsv > '${detected_sp}' - && cat ./tmp_icescreen/ICEscreen_results/results/${gbname}/icescreen_detection_ME/${gbname}_detected_ME.tsv > '${detected_me}' + + && cat ./tmp_icescreen/icescreen_result/ICEscreen_results/${gbname}/detected_mobile_elements/${gbname}_detected_ME.summary > '${summary}' + && cat ./tmp_icescreen/icescreen_result/ICEscreen_results/${gbname}/detected_mobile_elements/${gbname}_detected_SP_withMEIds.tsv > '${detected_sp}' + && cat ./tmp_icescreen/icescreen_result/ICEscreen_results/${gbname}/detected_mobile_elements/${gbname}_detected_ME.tsv > '${detected_me}' - #if "output_annotation_genbank" in $additional_output.optional_files: - && mv ./tmp_icescreen/ICEscreen_results/results/${gbname}/visualization_files/${gbname}_icescreen.gb '${gbout}' - #end if - #if "output_annotation_gff" in $additional_output.optional_files: - && mv ./tmp_icescreen/ICEscreen_results/results/${gbname}/visualization_files/${gbname}_icescreen.gff '${gffout}' - #end if - #if "output_annotation_embl" in $additional_output.optional_files: - && mv ./tmp_icescreen/ICEscreen_results/results/${gbname}/visualization_files/${gbname}_icescreen.embl '${emblout}' - #end if - #if "output_log" in $additional_output.optional_files: - && mv ./tmp_icescreen/ICEscreen_log.txt '${log}' - #end if - #if "output_zip_all_files" in $additional_output.optional_files: - && cd ./tmp_icescreen/ICEscreen_results/results/${gbname} && zip --quiet -r - -- . > '${outzip}' - #end if ]]> </command> <inputs> - <param name="genome" type="data" format="genbank" label="Input genomes to analyze in Genbank format" help="Multi-genbank files (i.e. gbff) are supported. Each record must include the ORIGIN nucleotide sequence at the end."/> + <param name="genome" type="data" format="genbank" label="Input genomes to analyze in Genbank format" help="Multi-genbank files (i.e. gbff) are supported. Each record must include the nucleotide sequence."/> <section name="taxonomy" title="Phylum of the genomes to analyse" expanded="True"> <param name="phylum" type="select" label="Bacillota is the defaut parameter"> <option value="bacillota" selected="true">Bacillota</option> @@ -56,11 +38,12 @@ </section> <section name="additional_output" title="Additional output files" expanded="False"> <param name="optional_files" type="select" label="Make the following optional files available in the Galaxy history" multiple="true" optional="true" display="checkboxes" > - <option value="output_annotation_genbank">Genome annotation in genbank format</option> - <option value="output_annotation_gff">Genome annotation in gff format</option> - <option value="output_annotation_embl">Genome annotation in embl format</option> - <option value="output_zip_all_files">Zip of all final and intermediate results</option> - <option value="output_log">ICEscreen log</option> + <option value="output_annotation_genbank" selected="false">Annotation in genbank format (full)</option> + <option value="output_annotation_gff" selected="false">Annotation in gff format (ICEs and IMEs only)</option> + <option value="output_annotation_embl" selected="false">Annotation in embl format (ICEs and IMEs only)</option> + <option value="output_tar_gz_intermediate_files" selected="false">Archive of intermediate files</option> + <option value="output_log" selected="false">Log file</option> + <option value="output_param_conf" selected="false">Param conf file</option> </param> </section> </inputs> @@ -68,20 +51,23 @@ <data format="tabular" name="detected_sp" label="${tool.name} on ${on_string}: Signature Proteins table" /> <data format="tabular" name="detected_me" label="${tool.name} on ${on_string}: ICEs/IMEs table" /> <data format="txt" name="summary" label="${tool.name} on ${on_string}: results summary" /> - <data format="genbank" name="gbout" label="${tool.name} on ${on_string}: annotated genbank" > + <data format="genbank.gz" name="gbout" from_work_dir="./tmp_icescreen/icescreen_result/ICEscreen_results/galaxy_genbank/detected_mobile_elements/standard_genome_annotation_formats/galaxy_genbank_icescreen.gb.gz" label="${tool.name} on ${on_string}: genbank annotation (full)" > <filter>additional_output['optional_files'] and "output_annotation_genbank" in additional_output['optional_files']</filter> </data> - <data format="gff3" name="gffout" label="${tool.name} on ${on_string}: annotated GFF3" > + <data format="gff3.gz" name="gffout" from_work_dir="./tmp_icescreen/icescreen_result/ICEscreen_results/galaxy_genbank/detected_mobile_elements/standard_genome_annotation_formats/galaxy_genbank_icescreen.gff.gz" label="${tool.name} on ${on_string}: GFF3 annotation (ICEs and IMEs only)" > <filter>additional_output['optional_files'] and "output_annotation_gff" in additional_output['optional_files']</filter> </data> - <data format="embl" name="emblout" label="${tool.name} on ${on_string}: annotated EMBL" > - <filter>additional_output['optional_files'] and "output_annotation_embl" in additional_output['optional_files']</filter> + <data format="embl.gz" name="emblout" from_work_dir="./tmp_icescreen/icescreen_result/ICEscreen_results/galaxy_genbank/detected_mobile_elements/standard_genome_annotation_formats/galaxy_genbank_icescreen.embl.gz" label="${tool.name} on ${on_string}: EMBL annotation (ICEs and IMEs only)" > + <filter>additional_output['optional_files'] and "output_annotation_embl" in additional_output['optional_files']</filter> + </data> + <data format="tar.gz" name="intermediate_tar_gz" from_work_dir="./tmp_icescreen/icescreen_result/ICEscreen_results/galaxy_genbank/tmp_intermediate_files.tar.gz" label="${tool.name} on ${on_string}: intermediate files archive"> + <filter>additional_output['optional_files'] and "output_tar_gz_intermediate_files" in additional_output['optional_files']</filter> </data> - <data format="zip" name="outzip" label="${tool.name} on ${on_string}: all results zipped"> - <filter>additional_output['optional_files'] and "output_zip_all_files" in additional_output['optional_files']</filter> + <data format="txt" name="log" from_work_dir="./tmp_icescreen/ICEscreen_log.txt" label="${tool.name} on ${on_string}: log file" > + <filter>additional_output['optional_files'] and "output_log" in additional_output['optional_files']</filter> </data> - <data format="txt" name="log" label="${tool.name} on ${on_string}: log file" > - <filter>additional_output['optional_files'] and "output_log" in additional_output['optional_files']</filter> + <data format="gz" name="param_conf" from_work_dir="./tmp_icescreen/icescreen_result/ICEscreen_results/galaxy_genbank/param.conf.gz" label="${tool.name} on ${on_string}: param conf file" > + <filter>additional_output['optional_files'] and "output_param_conf" in additional_output['optional_files']</filter> </data> </outputs> <tests> @@ -102,24 +88,36 @@ <test expect_num_outputs="4"> <param name="genome" value="genbank/NC_004668_137848_164286.gb" ftype="genbank" /> <param name="optional_files" value="output_annotation_genbank" /> - <output name="gbout" file="NC_004668_137848_164286_icescreen.gb" ftype="genbank" /> + <output name="gbout" ftype="genbank.gz"> + <assert_contents> + <has_size value="19794" delta="100"/> + </assert_contents> + </output> </test> <test expect_num_outputs="4"> <param name="genome" value="genbank/NC_004668_137848_164286.gb" ftype="genbank" /> <param name="optional_files" value="output_annotation_gff" /> - <output name="gffout" file="NC_004668_137848_164286_icescreen.gff" ftype="gff3" /> + <output name="gffout" ftype="gff3.gz"> + <assert_contents> + <has_size value="794" delta="100"/> + </assert_contents> + </output> </test> <test expect_num_outputs="4"> <param name="genome" value="genbank/NC_004668_137848_164286.gb" ftype="genbank" /> <param name="optional_files" value="output_annotation_embl" /> - <output name="emblout" file="NC_004668_137848_164286_icescreen.embl" ftype="embl" /> + <output name="emblout" ftype="embl.gz"> + <assert_contents> + <has_size value="1002" delta="100"/> + </assert_contents> + </output> </test> <test expect_num_outputs="4"> <param name="genome" value="genbank/NC_004668_137848_164286.gb" ftype="genbank" /> - <param name="optional_files" value="output_zip_all_files" /> - <output name="outzip" > + <param name="optional_files" value="output_tar_gz_intermediate_files" /> + <output name="intermediate_tar_gz" > <assert_contents> - <has_archive_member path=".*/*_detected_SP_withMEIds.tsv"><has_text text="ICE_IME_id" /></has_archive_member> + <has_archive_member path=".*/*_detected_SP.tsv"><has_text text="Is_hit_blast" /></has_archive_member> </assert_contents> </output> </test> @@ -146,10 +144,10 @@ </assert_contents> </output> </test> - <test expect_num_outputs="5"> + <test expect_num_outputs="6"> <param name="genome" value="genbank/NC_004668_137848_164286.gb" ftype="genbank" /> <param name="phylum" value="bacillota" /> - <param name="optional_files" value="output_zip_all_files,output_log" /> + <param name="optional_files" value="output_tar_gz_intermediate_files,output_log,output_param_conf" /> <output name="log" > <assert_contents> <has_text text="bacillota" /> @@ -173,7 +171,7 @@ <help><![CDATA[ .. class:: warningmark - ICEscreen requires input files in genbank format. Multigenbank files (i.e. gbff files featuring multiple genome records back to back) are supported. Each Genbank record must include the ORIGIN nucleotide sequence. + ICEscreen requires input files in genbank format. Multigenbank files (i.e. gbff files featuring multiple genome records back to back) are supported. Each Genbank record must include the nucleotide sequence. ----- @@ -198,18 +196,16 @@ Other optional and additional output files generated by ICEscreen: - - Annotated Genbank, EMBL, and GFF3 files: tose files contains the annotations of the original Genbank file in addition to annotations added by ICEscreen such as ICEscreen signature proteins and mobile elements. - - All results zipped file: You can download this file locally and unzip it to have the complete output folder generated by the tool, including intermediate processing files. See https://icescreen.migale.inrae.fr for details. - - Log file (`*_detected_ME.log`): this file contains the detailed internal details used by ICEscreen to generate the results and logs of each step of the ICEscreen tool pipeline. + - Genbank annotation file (full): annotations of the original Genbank file as well as annotations of ICEscreen on ICEs, IMEs, and the detected signature proteins. + - EMBL and GFF3 annotation files (ICEs and IMEs only): annotations of ICEscreen on ICEs, IMEs, and the detected signature proteins. + - Intermediate files (tar.gz): You can download this file locally and uncompress it to have the intermediate files generated by the tool. See https://icescreen.migale.inrae.fr for details. + - Log file (`*_detected_ME.log`): this file contains the log of each step of the ICEscreen pipeline. + - Param conf file (`param.conf.gz`): this file contains the configuration parameters related to the ICEscreen run. ]]> </help> - <citations> - <citation type="bibtex">@UNPUBLISHED{Kim07aninterior-point, - author = {Julie Lao and Thomas Lacroix and Gérard Guédon and Charles Coluzzi and Nathalie Leblond-Bourget and Hélène Chiapello}, - title = {"See our latest publication at https://icescreen.migale.inrae.fr."} - } - </citation> - </citations> + + <expand macro="citation"/> + </tool>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/macros.xml Sun Feb 23 16:52:34 2025 +0000 @@ -0,0 +1,19 @@ +<macros> + <token name="@TOOL_VERSION@">1.3.3</token> + <token name="@VERSION_SUFFIX@">0</token> + <xml name="citation"> + <citations> + <citation type="doi">10.1093/nargab/lqac079</citation> + </citations> + </xml> + <xml name="requirements"> + <requirements> + <requirement type="package" version="@TOOL_VERSION@">icescreen</requirement> + </requirements> + </xml> + <xml name="xrefs"> + <xrefs> + <xref type="bio.tools">icescreen</xref> + </xrefs> + </xml> +</macros>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/NC_004668_137848_164286_detected_SP_withMEIds.tsv Sun Feb 23 16:52:34 2025 +0000 @@ -0,0 +1,5 @@ +ICE_IME_id ICE_IME_id_need_manual_curation Segment_number Comments_ICE_IME_structure Is_hit_blast Is_hit_HMM CDS_num Genome_accession Genome_accession_rank CDS_locus_tag CDS_protein_id CDS_strand CDS_start CDS_end CDS_length Is_pseudo CDS_Protein_type CDS_Protein_type_blast Description_of_blast_most_similar_ref_SP Id_of_blast_most_similar_ref_SP Length_of_blast_most_similar_ref_SP Blast_ali_length Blast_ali_start_CDS Blast_ali_end_CDS Blast_ali_start_Query_blast Blast_ali_end_Query_blast Blast_ali_identity_perc Blast_ali_E-value Blast_ali_bitscore CDS_coverage_blast Blast_ali_coverage_most_similar_ref_SP Protein_type_of_blast_most_similar_ref_SP Associated_element_type_of_blast_most_similar_ref_SP ICE_superfamily_of_most_similar_ref_SP ICE_family_of_most_similar_ref_SP IME_superfamily_of_most_similar_ref_SP Relaxase_family_domain_of_most_similar_ref_SP Relaxase_family_MOB_of_most_similar_ref_SP Coupling_type_of_most_similar_ref_SP False_positives SP_blast_validation Use_annotation Protein_type_of_matching_HMM_profile Description_of_matching_HMM_profile Profile_name Length_of_matching_HMM_profile HMM_ali_i-Evalue HMM_ali_E-value HMM_ali_Score HMM_ali_Bias HMM_ali_Global_score HMM_ali_Global_bias HMM_coverage CDS_coverage_hmm +ID_1 1 1 1 1 NC_004668.1 1 EF_RS00630 WP_002359295.1 + 1 1512 503 - Coupling protein Coupling protein Coupling protein TcpA AAO80014 503 503 1 503 1 503 100.0 0 1031.0 100.0 100.0 Coupling protein ICE Tn916 ICESt3 - - - TcpA - validated yes Coupling protein TcpA tcpA 464 8.8e-94 7e-94 301.2 5.6 301.5 5.6 96.98 90.06 +ID_1 1 1 1 5 NC_004668.1 1 EF_RS00650 WP_002359299.1 + 3098 4381 427 - Relaxase Relaxase Relaxase MOBT (PF02486) AAO80018 447 427 1 427 21 447 99.77 0 862.0 100.0 95.53 Relaxase ICE Tn916 ICESt3 - PF02486 MOBT - - validated yes Relaxase MOBT T4SS_MOBT 366 3.4000000000000003e-128 3e-128 413.4 10.4 413.6 10.4 99.45 88.99 +ID_1 1 1 1 19 NC_004668.1 1 EF_RS00720 WP_002359320.1 + 17920 20427 835 - VirB4 VirB4 VirB4 CAE52368 834 836 1 833 3 834 41.15 0 655.0 99.76 99.76 VirB4 ICE Tn916 ICESt3 - - - - - validated yes VirB4 VirB4 T4SS_virb4 943 2.4e-28 1.8000000000000002e-28 84.9 6.4 85.3 6.4 69.35 88.98 +ID_1 1 Downstream integrase EF_RS00760 has been associated to the structure ID_1 pre-merging because it is adjacent to the conj module and there is no upstream/downstream ambiguity. 1 1 27 NC_004668.1 1 EF_RS00760 WP_002392915.1 + 25273 26439 388 - Tyrosine integrase Tyrosine integrase Tyrosine integrase AAO80040 388 388 1 388 1 388 100.0 0 804.0 100.0 100.0 Integrase ICE - - - - - - - validated yes Tyrosine integrase Tyrosine integrase Phage_integrase 172 9.7e-29 4.4e-29 86.5 0.6 87.6 0.6 88.37 42.53
--- a/test-data/NC_004668_137848_164286_icescreen.embl Fri Feb 09 21:26:42 2024 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,73 +0,0 @@ -ID NC_004668; SV 1; ; DNA; ; UNC; 0 BP. -XX -AC NC_004668; -XX -PR Project:PRJNA224116; -XX -DE Enterococcus faecalis V583, complete sequence -XX -OS . -OC . -XX -FH Key Location/Qualifiers -FH -FT CDS 1..1512 -FT /origid="EF_RS00630" -FT /function="Coupling Protein" -FT /protein_id="WP_002359295.1" -FT /locus_tag="EF_RS00630" -FT /codon_start=1 -FT /color=6 -FT /note="ICEscreen prediction: Coupling protein; BlastP -FT result (Annotation confidence: HIGH): Coupling protein TcpA -FT [Hit with AAO80014; Identity:100.00%; E-value:0.00e+00; -FT Query coverage:100.00%]; Hmmscan result: TcpA [Hit with -FT tcpA HMM profile; E-value:7.00e-94; i-Evalue:8.80e-94]" -FT CDS 3098..4381 -FT /origid="EF_RS00650" -FT /function="Relaxase" -FT /protein_id="WP_002359299.1" -FT /locus_tag="EF_RS00650" -FT /codon_start=1 -FT /color=7 -FT /note="ICEscreen prediction: Relaxase; BlastP result -FT (Annotation confidence: HIGH): Relaxase MOBT (PF02486) [Hit -FT with AAO80018; Identity:99.77%; E-value:0.00e+00; Query -FT coverage:95.53%]; Hmmscan result: MOBT [Hit with T4SS_MOBT -FT HMM profile; E-value:3.00e-128; i-Evalue:3.40e-128]" -FT CDS 17920..20427 -FT /origid="EF_RS00720" -FT /function="VirB4" -FT /protein_id="WP_002359320.1" -FT /locus_tag="EF_RS00720" -FT /codon_start=1 -FT /color="184 134 11" -FT /note="ICEscreen prediction: VirB4; BlastP result -FT (Annotation confidence: HIGH): VirB4 [Hit with CAE52368; -FT Identity:41.15%; E-value:0.00e+00; Query coverage:99.76%]; -FT Hmmscan result: VirB4 [Hit with T4SS_virb4 HMM profile; -FT E-value:1.80e-28; i-Evalue:2.40e-28]" -FT CDS 25273..26439 -FT /origid="EF_RS00760" -FT /function="Tyrosine Integrase" -FT /protein_id="WP_002392915.1" -FT /locus_tag="EF_RS00760" -FT /codon_start=1 -FT /color=8 -FT /note="ICEscreen prediction: Tyrosine integrase; BlastP -FT result (Annotation confidence: HIGH): Tyrosine integrase -FT [Hit with AAO80040; Identity:100.00%; E-value:0.00e+00; -FT Query coverage:100.00%]; Hmmscan result: Tyrosine integrase -FT [Hit with Phage_integrase HMM profile; E-value:4.40e-29; -FT i-Evalue:9.70e-29]" -FT mobile_element 1..26439 -FT /mobile_element_type="other: integrative and conjugative -FT element" -FT /note="ICEscreen prediction: Putative ICE (one integrase -FT Tyr) [Element structure: Single; ICE superfamily: Tn916; -FT ICE family: ICESt3; Relaxase family: - (MOBT); Coupling -FT protein family: TcpA] (ICEscreen ID: ID_1)" -FT /color=15 -XX -SQ Sequence 0 BP; 0 A; 0 C; 0 G; 0 T; 0 other; -//
--- a/test-data/NC_004668_137848_164286_icescreen.gb Fri Feb 09 21:26:42 2024 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,1109 +0,0 @@ -LOCUS NC_004668 26439 bp DNA UNK 01-JAN-1980 -DEFINITION Enterococcus faecalis V583, complete sequence. -ACCESSION NC_004668 -VERSION NC_004668.1 -DBLINK BioProject: PRJNA224116 - BioSample: SAMN02603978 - Assembly: GCF_000007785.1 -KEYWORDS . -SOURCE . - ORGANISM . - . -FEATURES Location/Qualifiers - source 1..26439 - /organism="Enterococcus faecalis V583" - /mol_type="genomic DNA" - /strain="V583" - /db_xref="taxon:226185" - gene 1..1512 - /locus_tag="EF_RS00630" - /old_locus_tag="EF0139" - /old_locus_tag="EF_0139" - CDS 1..1512 - /locus_tag="EF_RS00630" - /old_locus_tag="EF0139" - /old_locus_tag="EF_0139" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002359295.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="cell division protein FtsK" - /protein_id="WP_002359295.1" - /translation="MLKKLFRYRGRRIRYSSRNLLALYRVLFFMPILACLGYFVGYKWI - YPLYLSNPPDWKIYIVPALIIVGISIGAIVLITLLIKASIINSGYFSKVEQRQVLAHMI - IDNGYYTKKQVKSSDGKTKEKIKFPKIYYKSAKNSIFVSFETAGNKFQEKFETIGGFLE - TTFHADNLNKIDEKGFVTYELATDVYNKRIWIKDMQADEGKVQLMKGLYWHFDKDPHLL - LGGGTGGGKTFTILSLIYALCRVGEVEICDPKNSDLMALGKLPLFAGKVHTGKKDITQC - LENTVELMETRFKTMNNSSRYKMGKNYAYYGLKPKFVFIDEFAAFKAELANDYSTDGEV - DEYLTQLILKARQAGIFFIVAMQRPDGEFLKTALRDQFMFRMSVGRLSETGILMIFGDE - NKNKKFKYVEKIDGQKVYGRGYVAQGGGTAREFYSPQVPQDFDFIEEFIKISKELGYED - VPKEVQEEVSQKISKHIDKEALAEIDEEFQAEKNQLSELSEKYSA" - gene 1552..2085 - /locus_tag="EF_RS00635" - /old_locus_tag="EF0140" - /old_locus_tag="EF_0140" - CDS 1552..2085 - /locus_tag="EF_RS00635" - /old_locus_tag="EF0140" - /old_locus_tag="EF_0140" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002359296.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002359296.1" - /translation="MDSNEIIKRVRERVYREVKKKYTRDDLDTRIQDVLYYRSETYMKL - VSFANGKRIKKLADPRKFEKFMDTKGVKIVAEVLDGLNNQPKMQAMEYEQKVLTKVRQW - YQKKNHPELVDLEEEAFEQLVEKNIIYKKMKKRLYEEQDNQGFVYSDNFDMQLIRDSCD - IEEALYLDITLGDY" - gene 2106..2393 - /locus_tag="EF_RS00640" - /old_locus_tag="EF0141" - /old_locus_tag="EF_0141" - CDS 2106..2393 - /locus_tag="EF_RS00640" - /old_locus_tag="EF0141" - /old_locus_tag="EF_0141" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002359297.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002359297.1" - /translation="MKFKSRVQMLNYVIGKKPDIMKTVDRRAEKEGVTDDNRLLDYKLL - VISVLDAEAVYDEDRPIEEKKFSTSQEVDKYLETRFKEHMDSAWKEMFNK" - gene 2403..2807 - /locus_tag="EF_RS00645" - /old_locus_tag="EF0142" - /old_locus_tag="EF_0142" - CDS 2403..2807 - /locus_tag="EF_RS00645" - /old_locus_tag="EF0142" - /old_locus_tag="EF_0142" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002414864.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002414864.1" - /translation="MYSFDQVILELDNAIALKTLKNWANRIEKMTDTRFERRYAKNSAG - HSYSYKVFSIKDIENFQELLRLRENNVPLNEAINEVFMSDENKATHINKQEIEDLKRDM - RQLLKVSQSILAENASLKERIGALERGTAE" - gene 3098..4381 - /locus_tag="EF_RS00650" - /old_locus_tag="EF0143" - /old_locus_tag="EF_0143" - CDS 3098..4381 - /locus_tag="EF_RS00650" - /old_locus_tag="EF0143" - /old_locus_tag="EF_0143" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_016627242.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="replication initiation factor domain-containing - protein" - /protein_id="WP_002359299.1" - /translation="MRGVDLKRYRKELKLKQQELASKLGIERSLISKIESGKRVISKEL - EQKIINVLNLDGGHASVEAKIDFLRIRFKTLDVRTVIEKLLHMDMNWFTHESRGFYHYT - ETFSYSSIRIFRNPENVNMGIMLDLSGEGCRQLEEIFEEDNNRSWTEFFRSLYDDDIFG - QGILVDTKITRIDIALDELIVKGQENFDLYVLKEKMEQGLVDTTFKNFDFSGGFVYENK - KMVNKGLSLYFGSRQSPLYFNFYQKDYELARKESMSVEEAREKHEIKNRYEIRLSDEKA - FLFVEYFLSSGESLDWLVKEIINQSLTVYDIEDDMKVYCKSWHDVVDKLEGLKLSVQGE - KPSIEKTLRWLSNYLAPSLKMIKEIDNLLGTNELMERIDLAELKEKHEEIIEMVSVDAK - DLLFTNRDNKSVRSYMEREFELEEMYPF" - gene 4399..5013 - /locus_tag="EF_RS00655" - /old_locus_tag="EF0144" - /old_locus_tag="EF_0144" - CDS 4399..5013 - /locus_tag="EF_RS00655" - /old_locus_tag="EF0144" - /old_locus_tag="EF_0144" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002393276.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002393276.1" - /translation="MDKELIKKNIKLMDATIEKMIHVMSSIHKLQLSVKELEDSNELTV - SYVKRECTKLEERVKELRPSISRCVFMYREYVEEFETKLRDRIVTEKFFRIKRFYGKEV - LAFKEFQEKYQNYIPKDIIDIKKQVRQKLEEVGYEIDGAFEGDFTSWVGVYARPKDKPT - YLDPANAEEVVLQEKYSVNGFKQDFSEWFEFEIKDNVVYGI" - gene 5111..5416 - /locus_tag="EF_RS00660" - /old_locus_tag="EF0145" - /old_locus_tag="EF_0145" - CDS 5111..5416 - /locus_tag="EF_RS00660" - /old_locus_tag="EF0145" - /old_locus_tag="EF_0145" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002365956.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_010782977.1" - /translation="MTKKLIKIWRKEMLALMNEDADWYRNEDTERFKRIQELARKIETA - NTRQFSSHISKERFEAYQKMGLQFKEIAEEFHITTTALQQWRKDNGYPIYNKNNRK" - gene 5427..8132 - /gene="sea1" - /locus_tag="EF_RS00665" - /old_locus_tag="EF0146" - /old_locus_tag="EF_0146" - /gene_synonym="prgA" - CDS 5427..8132 - /gene="sea1" - /locus_tag="EF_RS00665" - /old_locus_tag="EF0146" - /old_locus_tag="EF_0146" - /gene_synonym="prgA" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_011109619.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="surface exclusion protein SEA1/PrgA" - /protein_id="WP_010784266.1" - /translation="MKKIASAGLSILVATGVAGIGGNEVQAAEQAQPKTPENSSTEQPA - VKATETTEQAITEKQQQVTEKQAIVDQKQQVADTAKKEKDTIDQSVKDQQAVVDQNKGA - LDQSQQAVTDQQAVVDEAKKVVDEATPSAIEKAKNQVATDTQAVDDQQKVVDQAQADVN - QQQAVVEEKAKETNAAKVQNDKDQQAVTAAKQEQAKLEELAKNAEVEKAKAEKEQAAKE - AELANKQKEEAKAKDQKTKDDQAVADQQTVVTTSQEKVADAKADTAAKQADLTAKENAL - KDKQTATKQVQNTLDKSKEELKGHKGINLPANFTPDYYKKLSEQEKQAMEKEALALNKV - FPENQADVAKATEMINVKNPTGKQKQQMSDYVVGLINDVREKLGLQKLKISNQAMRFAW - DVAKYDNPKEFDHDVNAINRAAKENGFKEYPGQNFYENLSMGYFETINGTISQLEFEKA - ARKTIADMLFDDESSAYSHIDSLLKGDTTNMAVSISGDLNDISAKIHIISYNQSKLVEA - NTYEEGTAPVFKSKETLQKEVATNQEKLATAQQAESDAQQAKSASQQVLNTAKTTQATA - EKELSVHKATLASLQAVATKSTTNYEEKVRQTATAEKSLQQTKDQLATINELIQNRAAV - LEKAKTNVSEAQAIEQTSAKVLKEKQAAQKAEENTLNSLKEVLNLAKENLNQKQVAFKT - STRSLSRLENAQPTYEKALNELNKAEAAAVQAQEAYENSLKSLEELKEQQAVATLAYTQ - AQEDLSNAKLELQQYQGVLRELEAQQAEQQRQEALQEQVAKEQQRLEREAKQSQTLVAS - ATSADKTPGLQQLSFSKQKEQPKAQALTHSESRKTKQVAKAPDSLPHTGEKNNKWLAIA - GLIFALLGAAGIISFISRNEKKVKNIFKIK" - gene 8603..12520 - /locus_tag="EF_RS00670" - /old_locus_tag="EF0149" - /old_locus_tag="EF_0149" - CDS 8603..12520 - /locus_tag="EF_RS00670" - /old_locus_tag="EF0149" - /old_locus_tag="EF_0149" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002395058.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="LPXTG-anchored aggregation substance" - /protein_id="WP_011109430.1" - /translation="MNQQTEVKKRFKMYKAKKHWIVAPILFLGVLGAVGLATDNVQAAE - LDTQPGTTTVQPDNPNPQSRNETLKTAVSEEAALQKDTTSQPTTAEEVVPKGIAAEQSS - ATSNDTTNVQQPTAEAEKSAQEQPVVSPETTIEPLGQPTEVAPAENDANKSTSIPKEFE - TPDVDKAVDEAKKDPNITVVEKPTEDLGNVSSKDLAAKEKEVDQLQKEQAQKIAQQAAE - LKAKNEKIAKENAEIAAKNKAEKERYEKEVAEYNKHKNDKGYVNEAISKDLVFDSSIVT - KDTKIDKITGGKFIKASDFNKVNQGQSKDIFTKLSKDMNGKATGNFQSSKVAAVEFGPK - GGYAVLLEKNKPVNVTYTGLNASYLDRKITKAEFIYELQSAPSQSGTLNAVFSNDPIIT - AFVGTKNANGKDVKVRLTIKLYDANGKEVLPDKDHAFAYALSSLNSSLGTNYSVEHAEF - VSDFGSKNEFKYINGSYVKKQADGKFYSTEDLDYGTGPSGLKNSDWDAVGHKNAYYGSG - VGLAREGGRISFSFGMTTKGKVNLSGAQWFAFSTNLNAKSIRPYQKKGNPKEPEKATIE - FNRYKANVVPVLVPNKEVTDGQKNINDLNVKRGDSLQYIVTGDTTELAKVDPKTVTKQG - IRDTFDAEKVTIDLSKVKVYQADASLNEKDLKAVAAAINSGKAIDVTASYVLNLDQNTV - TAMMKTNADGSVVLAMGYKYLLVLPFVVKNVEGDFENTAVQLTNDGETVTNTVINHVPV - SNPSKDVKADKNGTVGSVSLHDKDIPLQTKIYYEVKSSERPANYGGITEEWGMNDVLDT - THDRFTGKWHAITNYDLKVGDKTLKAGTDISAYILLENKDNKDLTFTMNQALLAALNEG - SNKVGKQAWSVYLEVERIKTGDVENTQTENYNKELVRSNTVVTHTPDDPKPTKAVHNKK - GEDINHGKVARGDVLSYEMTWDLKGYDKDFAFDTVDLATGVSFFDDYDETKVTPIKDLL - RVKDSKGADITNQFTISWDDAKGTVTISAKDPQAFILAYGGQELRVTLPTKVKANVSGD - VYNSAEQNTFGQRIKTNTVVNHIPKVNPKKDVVIKVGDKQSQNGATIKLGEKFFYEFTS - SDIPAEYAGVVEEWSISDKLDVKHDKFSGQWSVFANSNFVLADGTKVNKGDDISKLFTM - TFEQGVVKITASQAFLDAMNLKENKHVAHSWKAFIGVERIAAGDVYNTIEESFNNEKIK - TNTVVTHTPEKPQTPPEKTVIVPPTPKTPQAPVEPLVVEKASVAPELPHTGEKENTLLS - VLGAGMLVGLAWFGLKKREVK" - gene complement(12713..13570) - /locus_tag="EF_RS00675" - /old_locus_tag="EF0150" - /old_locus_tag="EF_0150" - CDS complement(12713..13570) - /locus_tag="EF_RS00675" - /old_locus_tag="EF0150" - /old_locus_tag="EF_0150" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002359308.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002359308.1" - /translation="MNIDFFNQLIKPVGILLPIVIGFFTIYSSIYGYVISDSFKKNLFS - SPTEIGLYKIFKGFINLISSLLLSSGIFAYALITTDTAFTDFVSDINNLTKEGKAYLTY - FIIYFIVFIFSIAKLPDIYRTLIPSNSRSKHSNFYVLSQELSLNDIPCNTKVFLVSMIN - KDTVLLTYYLNKEFVRLIYSLNEIQKIKIFYHKQLSFFQKIKEFNESITKETYYFAFLP - TIFIMLPSIIMSFISKSMTNIYFGATIAAISELIILSPSLIKYIKIAYKKIYLTIKNQN - KPKK" - gene 13629..14183 - /locus_tag="EF_RS00680" - /old_locus_tag="EF0151" - /old_locus_tag="EF_0151" - CDS 13629..14183 - /locus_tag="EF_RS00680" - /old_locus_tag="EF0151" - /old_locus_tag="EF_0151" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002359309.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002359309.1" - /translation="MLIKLGTELTKEEYVTRYMRNFQKLLLLGDRPKVLTNREEQLLQY - EKELCVLFYEQFIKKHHRAPDEATLDDQVKANFIERSKIFARSPLVMDEGNFTQAHIGQ - LKRLRELRMEDYLPDNYTHILQREEELARNYFRKHDDYPFGYECLCISRSREVVNQGLE - KLLEGFYDSYQVYYRRYRKNG" - gene 14226..14669 - /locus_tag="EF_RS00685" - /old_locus_tag="EF0152" - /old_locus_tag="EF_0152" - CDS 14226..14669 - /locus_tag="EF_RS00685" - /old_locus_tag="EF0152" - /old_locus_tag="EF_0152" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002359311.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002359311.1" - /translation="MAEESKYPPVKEKSVFYQRYSRVSTISMLMDLGFSVSEAQIDNED - IVYMEQYKEFLLNKGIVEEKVPFKREFVAEYPLSKMRRLFVEGYYLRKPSGEKMYGSYY - YDFYFKEYSGMGIYCTKATKSLFLHVFEQRIRKIKKLKHRLEE" - gene 14672..15520 - /locus_tag="EF_RS00690" - /old_locus_tag="EF0153" - /old_locus_tag="EF_0153" - CDS 14672..15520 - /locus_tag="EF_RS00690" - /old_locus_tag="EF0153" - /old_locus_tag="EF_0153" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_011109431.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="LPXTG cell wall anchor domain-containing protein" - /protein_id="WP_011109431.1" - /translation="MKKMIIIALFSTSLLAGGSSVSAYAQESEGNLGETTGSVLPDEPN - VPTDPITPSEPEQPTEPSTPEQPSEPSTPTEPSEPSKPTDPSLPDEPSVPTEPTTPSKP - EQPTEPTTPSVPEQPTEPSVPEKPVEPNKPTEPEKPVPVVPEKPVVPQQPEQPTDVVVK - PNGEIATGESTQQPTVPIETNNLSEVTHVPTVTTPIETASGEAIVAVDKGVPLTQTADG - LKPIKSEYKVLPSGNVQVKSADGKMKVLPYTGEKMGIIGSIAGVCLTVLSGILIYKKRK - V" - gene 15531..16520 - /locus_tag="EF_RS00695" - /old_locus_tag="EF0154" - /old_locus_tag="EF_0154" - CDS 15531..16520 - /locus_tag="EF_RS00695" - /old_locus_tag="EF0154" - /old_locus_tag="EF_0154" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002370321.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="conjugal transfer protein" - /protein_id="WP_002359315.1" - /translation="MKFLKKIQTKEKSKKSPRVRLLSQKKANRLVLIVGCALFGLSLIG - AIRANVMAGNVIRLSQQLETINKDVKKIKEKKRVYDSSALSFYVRNFVNEYINFNGKAT - DEEKKARDEKLASYFSGDLALDKGTDNAAKDLIRKLLQVSVTRVEESEELLLVHASISY - KVQQKGQDLLDTQEIVLPIQEKNGLFSIVGRPYFLAMNVPKGKQEPLQSVKEPLDVEKK - ERQGIEKFLQLFFEKYAKGNTEELSVLMKEPVKTSGQATVSSIEEKELRFFETKQKGVT - GVQVSVNFKDKAINFLYTEDFSLWLTKTENSYFVQELKHYYTEKAGDK" - gene 16520..16744 - /locus_tag="EF_RS00700" - /old_locus_tag="EF0155" - /old_locus_tag="EF_0155" - CDS 16520..16744 - /locus_tag="EF_RS00700" - /old_locus_tag="EF0155" - /old_locus_tag="EF_0155" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002370320.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002359317.1" - /translation="MDTSKLSQFMSSGLITLIAFGVIILILKHWKEAAWLKIGSVIVIA - LILNDFATNNGQNIFKVVKWVLGLFGIQL" - gene 16757..17146 - /locus_tag="EF_RS00705" - /old_locus_tag="EF0156" - /old_locus_tag="EF_0156" - CDS 16757..17146 - /locus_tag="EF_RS00705" - /old_locus_tag="EF0156" - /old_locus_tag="EF_0156" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_016626678.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="conjugal transfer protein" - /protein_id="WP_002359318.1" - /translation="MKHFDYSRGLKAPYSLQVIKSPKGKIVWYFAQPLSLAYLVMLFLG - IVLTGIFWKFVPLPLIFGINLNLMIMLYFPNKVARWYTETEFEGKTGLAFLKDGFVYVK - NYVLDNRSIISFERVKEIEEFSFKR" - gene complement(17224..17532) - /locus_tag="EF_RS00710" - CDS complement(17224..17532) - /locus_tag="EF_RS00710" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002386531.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002386531.1" - /translation="MRKESVIKSFLYILIPIIIGTIISLFTSAPIFLIAGIIYIILLLF - LLPTLDFGITDFNAKQINPSYRPERKIDKNESIVTVLLLVIGIIVCAVMLYLKYRNS" - gene complement(17538..17756) - /locus_tag="EF_RS00715" - /old_locus_tag="EF0157" - /old_locus_tag="EF_0157" - CDS complement(17538..17756) - /locus_tag="EF_RS00715" - /old_locus_tag="EF0157" - /old_locus_tag="EF_0157" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002359319.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002359319.1" - /translation="MKKKVCLALTIFAMVTPFIFSSEASAREAEFGSSCPGGFYFKKGG - WSTGGKNMSGGYCVPLGNMGNMNNKIW" - gene 17920..20427 - /locus_tag="EF_RS00720" - /old_locus_tag="EF0158" - /old_locus_tag="EF_0158" - CDS 17920..20427 - /locus_tag="EF_RS00720" - /old_locus_tag="EF0158" - /old_locus_tag="EF_0158" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002359320.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="ATP-binding protein" - /protein_id="WP_002359320.1" - /translation="MQLEYPLTNHMKRNMVLTKENQVIAYYRIRSETVGLTDFEKKRKT - KKKVARTLKRLQENEGFEIVLLPVNADIRGKMGGMRQLVDKENHSVAVDKLMKTAQYLE - NEIGMVYEYIWLIGVPLVKKERSIDIKETFSTALNNLSEKVVKGLGLEVGVAEDWEEAY - KDQEQEVYQNLSELLVERLTEDELYYYQAYQFLNNIQHEKKELLTSQNLDNLLANKITP - FRGGLELSNEFGKSYIAHLPLGDCGVTIDGNHLLELVQKMSYPVSVKLQAGFAETKGQL - ALSGRSARARTRTKNIMEEAHLAGSKQKRKIVEGQHSLDDLDQKIDDDIPIIDWKAVLV - ISGNSKKQLRERKKNLMNRLDSLGIPLIRATFDNVYLFQATLLGNFQRFSTSNWQHTST - LETFSELNFFTSLHAGTKTGFYLGRVDATLEEKESRKQIVSGSKNIVYMNLLLANKQNI - EGKKTNNPHWLVSGDTGNGKSVFSKWLFLYSSLLDVKVLYIDPKKEVRQQFMRTINDPE - YQRKYPLDVAFIKTFNFVTLDVRKKENHGVLDPIVLFDETEAIATAKAMLNNINEDKWK - MPHKTAINETVAEVVAERKAGKQVGFWHVIERLISHSEKDVHEMGRFLLSTIKGSILEL - AFSHGEVEGLSFEKKVTILEIEDLDLPTDRHDELDENQRLSVTLMFALGTFCSKFGSRN - RKEETVTFFDEAWIFQSSPEGQKILKSMKRIGRSFNNFMVLITQSVNDVLDNGDGTGFG - TVVCFDEVDNREGILRYLKLPVNEINLKWVSNMIQGQCLMKDMFNQVNRIVIDVIFEEW - LELFETVDDTEASVMENDYVARW" - gene 20434..22398 - /locus_tag="EF_RS00725" - /old_locus_tag="EF0159" - /old_locus_tag="EF_0159" - CDS 20434..22398 - /locus_tag="EF_RS00725" - /old_locus_tag="EF0159" - /old_locus_tag="EF_0159" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002403502.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002359321.1" - /translation="MKYLIDSYTAYMVNGGLLDKGSEVVNWFFIELPFFFLRMGAMIFL - IMENVMNQSDYFVGKQQEAYDYSLDILKGFGGTGIVKGSLLGLAIILSAYYLLYSFFSN - RRNFMKSLLHYFAVFALFICWFGQVKTIDGKTQNGAIFLISSVSEMTKQVQGKFTSNVN - FGGDTSQEVDDGKKKVYQSPMFDATVLQTFNYVNSGSIDGKMANGKKLDYDKLLEKPNL - NDKEKKDFREKRNAYIEQQEKDNPYFSQDTLKTMEKSFAVWTGATNLFILAIPVLYINL - MLSLIQLLVVFLILIFPVVLLASFFPRCQMLLFKFFQGLIGALFTPIIYGIFLSVLFWI - NKLIDGAFLGVAKKVSGSLLELISGSTVYMIVLFVAVVVKIVVLRKVWKNKYAILAYFS - NGQVSQPVFEQKVEQLSERTKEVATGGAQVALGAYTGNLGMVANGAGNILPNQDKAIEM - GQEHFIDDNGSFTGVKAGLQSIFRQPVTEEEQGELNEEQFSEVETESIDHELTDIEEIG - QTELESDSLDNSIIELEPMTSEDLVVDVDNMSSDIDVELASVEEVGEEPPMNAEEYSGY - DNVIVTNFDELAMAREERDYFDGGKEQELVETNGVELVNNIYPFVQTEEYLANLEQTEA - QFFGTDEFEKELEQIEEWA" - gene 22429..23460 - /locus_tag="EF_RS00730" - /old_locus_tag="EF0160" - /old_locus_tag="EF_0160" - CDS 22429..23460 - /locus_tag="EF_RS00730" - /old_locus_tag="EF0160" - /old_locus_tag="EF_0160" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002386530.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="phage tail tip lysozyme" - /protein_id="WP_010775499.1" - /translation="MKKIFLGILGLFSFLFLLPFLLFLGTMSTEIGNNTQFQATTPQEK - VALEVSNFVTKNGGSLQFASAWLGNMEHESGLNPARIQSDLTFNSAWAFNPSTNGYALG - LAMMDGERRVNLLNFAKEQKKDWQAVPVQLEYMWNHDGSDSALLKRMSKSSDVNQLAVD - ILVHWERAGTKNDPNEQIKRKTSANNWYKRLSTGSMGAGSANIGGGKIDVLEQMLGQTV - NGGQCYGGTSYYVEKMGFQSLMNTGHMFASEIGNDYAWEQSGWQVIKNPNYSDVKAGDV - INFAMGGYATSVYGHTGIVASVEGNGKLVLYEQNAEKGQIIAKYFRQWGAEYPNVTSIV - RKK" - gene 23475..23765 - /locus_tag="EF_RS00735" - /old_locus_tag="EF0161" - /old_locus_tag="EF_0161" - CDS 23475..23765 - /locus_tag="EF_RS00735" - /old_locus_tag="EF0161" - /old_locus_tag="EF_0161" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002359323.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_002359323.1" - /translation="MKKEEMDVVSLRIIKLYFLGIRELNFPDYNKRFQQKDMELFIQLA - DMMENLPNLDEQLIYELEELKDYLFYVKTEKYSLTVHDMFLEMKSELEKII" - gene 23807..24022 - /locus_tag="EF_RS00740" - /old_locus_tag="EF0162" - /old_locus_tag="EF_0162" - CDS 23807..24022 - /locus_tag="EF_RS00740" - /old_locus_tag="EF0162" - /old_locus_tag="EF_0162" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002393223.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="hypothetical protein" - /protein_id="WP_025186164.1" - /translation="MFRKKNGLTNRQVLAICTKFQCKKNEFVAHRLSDGYLVAVNNKEY - RVKFSEGFFSKIVYAKEVQRKGARKS" - gene 24019..24537 - /locus_tag="EF_RS00745" - /old_locus_tag="EF0163" - /old_locus_tag="EF_0163" - CDS 24019..24537 - /locus_tag="EF_RS00745" - /old_locus_tag="EF0163" - /old_locus_tag="EF_0163" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002370311.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="lipoprotein" - /protein_id="WP_002359325.1" - /translation="MNKLPLLILLLGGVLLVSGCQSHKEENKSSKVSTEETTVIETVAR - EQSKESFTSEATKKQTETTKLEEPDHVKLLEAYGNAYANFTSINDRNEKLKPLMTEKCI - KKNGIDVKTGVALVSVGKVTTIYKNDQHEYALLLDCEQNGTQTRVLLLAKVKNNKISEM - TYNSVKQEY" - gene 24611..24985 - /locus_tag="EF_RS00750" - /old_locus_tag="EF0164" - /old_locus_tag="EF_0164" - CDS 24611..24985 - /locus_tag="EF_RS00750" - /old_locus_tag="EF0164" - /old_locus_tag="EF_0164" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002359326.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="lipoprotein" - /protein_id="WP_002359326.1" - /translation="MKKSIVTMLFLMLGIVVFTSCGSKMDKTAEEFKNKIISHVGDLYD - EKYQEKEFSFLIYKDKDTNEYLAKALVPYEGEPNSVESKYFYNVNKELETIEPFSGGRT - FDYAKSHGNYEVIYKSGKFK" - gene 25068..25280 - /locus_tag="EF_RS00755" - /old_locus_tag="EF0165" - /old_locus_tag="EF_0165" - CDS 25068..25280 - /locus_tag="EF_RS00755" - /old_locus_tag="EF0165" - /old_locus_tag="EF_0165" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_016623907.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="DUF3173 domain-containing protein" - /protein_id="WP_002359328.1" - /translation="MLIVTKEDLMNLGYGKYQAEDIIRKAKAVMVSKGYAYYLNKRLGR - VPVGAVESVLGIELESIAKEVETVG" - gene 25273..26439 - /locus_tag="EF_RS00760" - /old_locus_tag="EF0166" - /old_locus_tag="EF_0166" - CDS 25273..26439 - /locus_tag="EF_RS00760" - /old_locus_tag="EF0166" - /old_locus_tag="EF_0166" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_002392915.1" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /codon_start=1 - /transl_table=11 - /product="site-specific integrase" - /protein_id="WP_002392915.1" - /translation="MVKFKKDKRGKYYFTASLGFDEVTGKRVQKMRSGFSTIKEAREAY - AEIINNFGKEAYSSNSTMLYEEFFYTIFLPYYKGRVKERTYNNRLSMIKNTFAYFFKMK - LKSIAPVHIQKWQNELLEQYENTYVRNIYGLFQMSLDRAVVLGMISSNPAKIVGNVKKS - KKEIDFWTKEEFEKVVKTFYVEDYYQNFSFICIWLLFMTGMRIGEATALTWKDVNLDRR - YLTVKKSLYYKNAQTYELVSPKTRASIRTIYLDEDTVHYLRDWKKRQDDVGGIEFILSY - NSVPTQKHTVRHIIKRHAKLAEVHDIRIHALRHSHASLLISMGTNALLIKERLGHEDVQ - TTLGTYGHLYPSSSTEIANELKGIVNVEFTNQNMASEVTNQFTKGVKK" - CDS 1..1512 - /origid="EF_RS00630" - /function="Coupling Protein" - /protein_id="WP_002359295.1" - /locus_tag="EF_RS00630" - /codon_start=1 - /color=6 - /note="ICEscreen prediction: Coupling protein; BlastP - result (Annotation confidence: HIGH): Coupling protein TcpA - [Hit with AAO80014; Identity:100.00%; E-value:0.00e+00; - Query coverage:100.00%]; Hmmscan result: TcpA [Hit with - tcpA HMM profile; E-value:7.00e-94; i-Evalue:8.80e-94]" - CDS 3098..4381 - /origid="EF_RS00650" - /function="Relaxase" - /protein_id="WP_002359299.1" - /locus_tag="EF_RS00650" - /codon_start=1 - /color=7 - /note="ICEscreen prediction: Relaxase; BlastP result - (Annotation confidence: HIGH): Relaxase MOBT (PF02486) [Hit - with AAO80018; Identity:99.77%; E-value:0.00e+00; Query - coverage:95.53%]; Hmmscan result: MOBT [Hit with T4SS_MOBT - HMM profile; E-value:3.00e-128; i-Evalue:3.40e-128]" - CDS 17920..20427 - /origid="EF_RS00720" - /function="VirB4" - /protein_id="WP_002359320.1" - /locus_tag="EF_RS00720" - /codon_start=1 - /color="184 134 11" - /note="ICEscreen prediction: VirB4; BlastP result - (Annotation confidence: HIGH): VirB4 [Hit with CAE52368; - Identity:41.15%; E-value:0.00e+00; Query coverage:99.76%]; - Hmmscan result: VirB4 [Hit with T4SS_virb4 HMM profile; - E-value:1.80e-28; i-Evalue:2.40e-28]" - CDS 25273..26439 - /origid="EF_RS00760" - /function="Tyrosine Integrase" - /protein_id="WP_002392915.1" - /locus_tag="EF_RS00760" - /codon_start=1 - /color=8 - /note="ICEscreen prediction: Tyrosine integrase; BlastP - result (Annotation confidence: HIGH): Tyrosine integrase - [Hit with AAO80040; Identity:100.00%; E-value:0.00e+00; - Query coverage:100.00%]; Hmmscan result: Tyrosine integrase - [Hit with Phage_integrase HMM profile; E-value:4.40e-29; - i-Evalue:9.70e-29]" - mobile_element 1..26439 - /mobile_element_type="other: integrative and conjugative - element" - /note="ICEscreen prediction: Putative ICE (one integrase - Tyr) [Element structure: Single; ICE superfamily: Tn916; - ICE family: ICESt3; Relaxase family: - (MOBT); Coupling - protein family: TcpA] (ICEscreen ID: ID_1)" - /color=15 -ORIGIN - 1 atgttaaaaa aattatttag atatagagga aggcgtattc gttattcttc aagaaacctg - 61 ttggcactct atcgagtgtt attttttatg ccaattttag cttgtttagg gtattttgtt - 121 ggctataaat ggatttatcc tttatatctt tcaaatccgc ctgattggaa aatatacatt - 181 gtgccagcgt tgataattgt aggtatttct ataggtgcaa ttgtgctaat tacattgctt - 241 attaaagctt caattattaa ttcggggtat ttttctaaag tggaacaacg tcaagtatta - 301 gcacatatga ttattgacaa cgggtattac acaaaaaaac aagtgaaaag tagtgacggc - 361 aaaacaaaag aaaaaatcaa gtttccaaaa atttattata agtctgcaaa aaatagtatt - 421 tttgtttcat ttgaaacagc gggtaataaa tttcaggaaa aatttgaaac cattggtggt - 481 tttttggaaa caacgtttca tgcagataat ttaaataaga ttgatgaaaa aggttttgtt - 541 acctatgaat tagcaacaga tgtgtacaat aagcgtattt ggattaagga tatgcaagca - 601 gacgaaggca aagttcagtt gatgaaaggg ttgtattggc actttgataa agatccacat - 661 ttgttattag gtggaggcac tggtggaggt aaaactttta caattttgtc tctgatctat - 721 gcgctttgtc gagtgggtga ggtggaaatc tgtgacccga aaaattctga cttgatggct - 781 ttaggcaagt taccgctatt tgcaggaaaa gttcatactg gaaaaaaaga tattactcaa - 841 tgcttggaaa atacagtgga gttaatggaa acacgtttta aaacgatgaa taatagttca - 901 cgttacaaga tggggaaaaa ctatgcgtat tatggattaa aaccaaaatt tgtttttata - 961 gatgaatttg cggcctttaa agctgaattg gcaaatgatt attcaacaga cggagaagta - 1021 gatgagtatc ttacgcaact tattttgaaa gctcgtcaag caggtatttt ctttattgtt - 1081 gcaatgcaac gtccagatgg agaattttta aaaacagcat tacgtgacca atttatgttt - 1141 cgcatgtctg ttggacgtct atctgaaaca ggtattttga tgattttcgg tgatgaaaat - 1201 aaaaataaaa agtttaaata tgttgaaaaa attgacggtc agaaagtcta tggtcgtgga - 1261 tatgtggctc aaggaggagg aactgcacgt gaattttata gtcctcaagt accacaagac - 1321 tttgacttca ttgaagaatt tatcaaaatt tctaaagagt taggttatga agatgttcca - 1381 aaagaagtac aagaagaagt atctcaaaaa atatctaaac atattgataa agaagcactg - 1441 gcagaaattg atgaagaatt tcaagcagaa aaaaatcagt tatcagagtt aagtgagaaa - 1501 tattctgctt aaaaagaagt cacataaatt agttggaaaa ggaaggtttt tatggattct - 1561 aatgaaataa ttaaacgtgt cagagaacga gtatatagag aagtaaagaa aaaatatact - 1621 agagacgatt tggatactcg tattcaagat gtattatatt atcgttcaga aacatatatg - 1681 aaattagtta gctttgcaaa tggtaaaaga attaagaagt tagctgatcc tagaaaattt - 1741 gaaaagttta tggatacaaa aggagtaaag attgttgcag aagtacttga tggattgaat - 1801 aatcaaccaa aaatgcaagc tatggaatac gaacaaaagg tacttactaa agtacgtcaa - 1861 tggtatcaga aaaagaatca ccctgagctt gtagatttgg aagaagaagc atttgaacaa - 1921 cttgtagaaa aaaatatcat ctataaaaaa atgaagaaaa ggttgtatga agaacaggat - 1981 aatcaaggtt ttgtttattc ggataatttt gatatgcaat tgattcgtga ttcatgtgat - 2041 attgaagagg ctctatactt agatatcacg ttgggggatt actaagtgaa aggagtaaaa - 2101 agaaagtgaa atttaaatct cgagtacaaa tgttaaacta tgtgattggg aagaaaccag - 2161 acatcatgaa aacagttgat cggagagcag aaaaagaggg ggttacagat gataatagat - 2221 tacttgatta taaattatta gtaatttctg ttttagatgc agaagctgtt tacgatgaag - 2281 atagaccaat tgaggaaaag aaattttcaa catcacaaga agttgataag tatttagaaa - 2341 caagatttaa ggagcatatg gattctgctt ggaaagaaat gtttaataag taggtgtgga - 2401 aaatgtattc atttgatcaa gtaattttag agctagacaa tgctattgct ttgaaaacac - 2461 tgaaaaattg ggcaaatagg attgaaaaaa tgactgatac acgttttgaa cgccgatatg - 2521 caaagaatag tgcaggtcat agttatagct ataaggtttt ttctattaaa gatatagaaa - 2581 attttcaaga gttgctacgt ttgcgtgaaa ataatgttcc gcttaatgag gcaataaatg - 2641 aagtatttat gtctgatgag aataaagcta cacatattaa taaacaagaa attgaggatt - 2701 tgaaaagaga tatgaggcaa cttttaaagg tgtctcaatc tattcttgcg gagaatgcaa - 2761 gcttaaaaga gagaattggt gcattagaac gaggaacagc tgaataacgg ctgtttattt - 2821 gaaggattgt tgctagtaat aagtatacgt gggcgaagca gagcgaaagc ccacgtatac - 2881 ttttagcaac ggaaaatcct tttaaaatga acagacgtaa ggtgggcgaa tgcccacctt - 2941 acgtcaaaaa ccccctattt ataacatggg ggtagaattt aatataccgt ataaaaaagt - 3001 tgcttaaaag ctatgtccta caagggattg agcgattatg attttgtcac atttttcgac - 3061 taaagttgtc acattttttg gaagtaggtt taaagcagtg agaggtgttg atttaaagcg - 3121 atatagaaaa gaactaaaat taaaacagca agaattggca agtaaattag gaatcgagcg - 3181 ttcgttaatt tcaaaaatag aatctggaaa acgtgttatt tctaaagagt tagaacaaaa - 3241 gattattaat gtgttgaact tagatggtgg gcacgcttcg gtagaagcaa aaattgactt - 3301 tttaagaata cgatttaaaa cattagatgt tcggacagtt attgaaaagt tgttgcacat - 3361 ggatatgaac tggtttactc atgaatctag agggttttat cattacacgg aaacattttc - 3421 atatagctct attcggattt ttcggaatcc ggaaaatgtc aatatgggaa ttatgttgga - 3481 cttgtctggc gaaggctgtc gtcaattaga agaaatcttt gaggaagata acaaccgatc - 3541 gtggacagaa ttttttcgct ctctttatga tgacgatatt ttcggtcaag gcattttagt - 3601 agatacaaaa atcactcgaa ttgatattgc tcttgatgaa ttgattgtga aggggcaaga - 3661 aaattttgat ttgtatgttt taaaagaaaa aatggagcag gggcttgttg acaccacatt - 3721 taaaaatttt gattttagcg gtggatttgt ttacgaaaat aaaaaaatgg tgaataaagg - 3781 tttatccctt tattttggta gtcgtcaatc gccactgtat tttaactttt accaaaaaga - 3841 ttacgagtta gcaagaaaag aaagtatgag tgttgaagaa gcaagagaaa aacatgaaat - 3901 taaaaatcga tacgaaattc gcctttctga tgaaaaggcg tttttgtttg tagaatattt - 3961 tctatcaagc ggtgagtcgc tagattggtt agtgaaagaa attattaatc aatctttgac - 4021 tgtctatgac attgaagatg atatgaaagt ttattgtaaa tcttggcatg atgttgttga - 4081 taaattggaa ggcttaaaat tgtctgtgca aggtgaaaaa ccgtctattg aaaagacgct - 4141 tcgatggcta tcaaattatt tagccccttc attaaagatg attaaagaga ttgataatct - 4201 gttaggaaca aatgaattga tggaacgcat tgatttagca gaattaaaag aaaagcatga - 4261 agagattatt gaaatggtga gtgttgatgc aaaagacttg ttgtttacca atagagataa - 4321 taaaagtgtt cggtcctata tggaacgaga gttcgaatta gaagaaatgt acccgtttta - 4381 gaaaggtgga ttgatagaat ggataaagaa ttaatcaaaa aaaatataaa acttatggat - 4441 gccactattg agaaaatgat tcatgtgatg agttctattc ataaacttca attgagtgta - 4501 aaagaacttg aagacagtaa cgaattaact gtttcttatg taaaaagaga atgtacaaaa - 4561 ttggaagaga gggttaagga acttagaccg agtatttcaa gatgtgtttt tatgtatcga - 4621 gaatatgtag aagaatttga aacaaaactt agagatagaa tagttacaga aaagtttttt - 4681 cgaataaaaa ggttctatgg taaagaagta ttagctttta aggaatttca agaaaagtat - 4741 caaaattata ttcctaaaga tattattgat ataaagaaac aagttcgtca gaagctagaa - 4801 gaagttggtt atgaaattga tggtgctttt gagggggatt ttacaagttg ggtaggtgtt - 4861 tatgcgcgtc caaaagataa accgacctat ttagaccctg cgaatgcgga agaagtagtt - 4921 ttacaagaaa aatatagcgt caatggattt aaacaagatt tttcagaatg gtttgaattt - 4981 gaaattaaag ataatgttgt ttatggcatt taataattgt catgtaaaag acatttttta - 5041 ttttctctaa aaggttacta ttttcataat aaatattatt ttgttattgt taatttgagg - 5101 tgaaaggggt atgactaaaa aattaataaa aatatggcgt aaagaaatgt tggcattaat - 5161 gaatgaagac gcagactggt ataggaatga agataccgag cgttttaaac gaatacaaga - 5221 acttgcaaga aagatagaaa cagcaaacac cagacaattt tcttcgcata ttagcaagga - 5281 aagatttgaa gcctatcaaa aaatgggctt acagtttaaa gaaatagcgg aagagttcca - 5341 tataacaact acagcgttac aacaatggcg taaagacaat gggtatccca tttacaacaa - 5401 aaataatcgg aagtgaggaa aataaaatga aaaagatcgc aagtgcaggg ttaagtattt - 5461 tagtcgcaac gggggtagca ggtattgggg gaaatgaagt acaggcagca gaacaagcgc - 5521 aaccaaaaac acctgaaaac agttctacag aacaaccagc agtgaaagct acagaaacaa - 5581 cggagcaagc cattactgaa aaacagcaac aagtaacaga gaaacaagca attgtcgatc - 5641 aaaaacaaca agttgctgac actgcgaaaa aagaaaaaga caccattgat caatctgtta - 5701 aagaccaaca agcagtggtc gatcaaaaca aaggtgcatt ggatcaaagt caacaagcag - 5761 tgactgacca acaagcggtc gtagacgaag caaaaaaagt tgtggatgaa gcaacacctt - 5821 cagccattga aaaagccaaa aaccaagtgg ctacggatac acaagctgtt gatgaccaac - 5881 aaaaagtagt ggatcaagct caagcagacg ttaaccaaca acaagcagtt gtcgaagaaa - 5941 aagcaaaaga aacgaatgct gctaaagtgc aaaatgataa agatcaacaa gcagtaacag - 6001 ctgcgaaaca agaacaagcc aagcttgaag aattagcgaa aaatgcggaa gtggaaaaag - 6061 caaaggctga aaaagaacaa gcagcaaaag aagctgaact ggctaacaaa cagaaagaag - 6121 aagccaaagc taaagatcaa aaaacgaagg acgatcaagc agtcgcagac caacaaactg - 6181 ttgtgacaac tagtcaagag aaagtagcag acgcaaaagc agatacagct gcgaaacagg - 6241 cagacttaac agcgaaagag aatgctttga aagacaagca aacagcaaca aagcaagtgc - 6301 agaatacttt agataaatca aaagaagagc taaaaggaca taaaggaatt aacttgcctg - 6361 ctaacttcac acctgattat tacaaaaaat tatctgaaca agaaaagcaa gcaatggaaa - 6421 aagaagcatt agcattaaat aaagtttttc ctgaaaatca agcagatgtg gcaaaagcaa - 6481 cggaaatgat caatgtcaaa aatcctaccg gaaaacaaaa gcaacaaatg agcgattacg - 6541 ttgtaggact tatcaatgat gttcgcgaaa agcttgggtt acaaaagttg aagatttcta - 6601 accaagctat gagatttgct tgggatgtag caaaatatga taatcccaaa gagtttgatc - 6661 atgacgtaaa tgcaattaat cgtgcagcaa aagaaaatgg ttttaaagag tatccagggc - 6721 aaaactttta tgaaaatcta agtatgggct attttgaaac gattaatggc actatttctc - 6781 aactagagtt tgaaaaagct gctcgaaaaa caattgctga tatgctcttt gacgatgaaa - 6841 gttcagcgta ttctcatata gattcattgc taaaagggga cacaacaaac atggcagttt - 6901 ctatttcagg agatttaaat gatatttcgg caaaaatcca tatcattagc tataatcaat - 6961 caaaattagt tgaagcaaat acctatgaag aaggcactgc tccagtcttt aagagtaaag - 7021 aaacccttca aaaagaagta gcaaccaatc aagaaaaatt agctactgca caacaagcag - 7081 aatcagacgc tcaacaagca aaaagtgcaa gtcagcaagt cttaaataca gccaaaacaa - 7141 cacaagcaac agcagaaaaa gaactatctg ttcataaagc gacattggct agtcttcaag - 7201 cagttgcgac taaaagtacg acaaattatg aagaaaaagt acgacaaact gcaacggcag - 7261 aaaaaagcct tcaacaaaca aaagatcaat tggcaacaat caatgagtta attcagaatc - 7321 gagctgctgt tttagaaaaa gcgaaaacaa acgtttcgga agcacaagca attgaacaaa - 7381 cgtctgctaa agtgctgaaa gaaaaacaag cagcccaaaa agcagaagaa aacacattga - 7441 atagcttgaa ggaagtattg aatttagcaa aagaaaattt aaatcaaaaa caagttgcat - 7501 ttaaaacaag tacacgttca ttgtctcgtt tagaaaatgc tcaaccaaca tacgaaaaag - 7561 cattaaacga gttaaacaaa gcagaagcag cagcggtcca agcacaagaa gcctatgaaa - 7621 attctctgaa atcattggag gaacttaaag aacaacaagc cgttgctaca cttgcttata - 7681 cacaagcaca agaagacctt tctaacgcga agttagagct acagcagtac cagggcgtat - 7741 taagagaatt agaagcacaa caagccgaac agcagcgaca agaagcgttg caagaacaag - 7801 tagcaaaaga acaacaacgc cttgaacgag aagcaaaaca aagccaaacg ttagtagcaa - 7861 gtgctacttc agcagacaaa acacctggtc tccaacagtt atctttttct aaacaaaaag - 7921 aacagccaaa agcacaagca ttaacacatt cagaatctcg taagacgaaa caagtagcaa - 7981 aagccccaga ttctttacca catacaggag aaaaaaataa taaatggtta gctatagctg - 8041 gtctgatatt tgctttgtta ggagctgcgg gtattataag ttttattagt agaaacgaga - 8101 agaaagtaaa aaatatcttt aaaattaaat aataaagtca aaggagcgac atatttcgct - 8161 cctttttatt gtaatcattg gaataaattg aaaaataaaa aaatagccaa ccaaaatggt - 8221 tggctgattg tattaaaggc agaagaatct accaaattta ggagccaacc agtttccgct - 8281 ggtcaacaaa aaataaatgg attgtctcgg atggagacac ttaaatagta cctgacaata - 8341 aaattttagg caacaaaaaa gtcagccgtt ttccgccgac tgactaaacg aataagattt - 8401 gtaaagaagt gatttgtact ttttacacaa ttatgatagc acgttaaatg tttttaacgc - 8461 aaaaaaaagc taagggaatc gaaaaacttt cggttctctt tttgtgagga ggaatggaaa - 8521 taatgatgaa aaagcaacga gctccttgtg ttgcgtgaac tatttttaca aacaaaaaat - 8581 aaaaaatcga ggagaatgat acatgaatca acagactgaa gtaaaaaaac gttttaaaat - 8641 gtataaggca aagaaacact ggattgtagc ccctattctt tttttaggtg tattaggagc - 8701 tgtaggatta gctacagata atgtacaagc cgcggaatta gatacgcaac caggaacaac - 8761 gacggtgcaa cccgataatc ccaacccgca gtcacgaaat gaaacactta aaacggcagt - 8821 atctgaagaa gcagcattac aaaaagacac tacttctcaa ccaaccacag cagaagaagt - 8881 agtgccgaaa ggaattgctg ctgaacaaag ttcagctacc tcaaatgata ccacaaacgt - 8941 ccaacaacca acagcagaag cagaaaaatc agcacaagaa caaccagtag tcagccctga - 9001 aacaaccatt gaacctctag ggcagccaac agaagttgca ccagcagaaa atgacgctaa - 9061 taaatcaacg tcaattccta aagaatttga aacaccagac gttgacaaag cagttgatga - 9121 agcgaaaaaa gatccaaaca ttaccgtcgt ggaaaaacca actgaagact taggaaatgt - 9181 ttcttctaaa gatttagctg caaaagaaaa agaagtagac caactacaaa aagaacaagc - 9241 ccaaaagatt gcccaacaag cagctgaatt aaaagccaaa aatgaaaaaa ttgccaaaga - 9301 aaatgcagaa attgcggcaa aaaataaagc ggaaaaagag cgctacgaaa aagaagtggc - 9361 ggaatacaac aaacacaaaa atgacaaagg ctatgtgaat gaagcaatca gcaaagactt - 9421 agtttttgat tcaagcattg tgactaagga tactaaaata gacaagatta caggtggcaa - 9481 gtttattaaa gcttccgatt ttaacaaagt aaaccaagga caatccaaag atatttttac - 9541 aaaattaagt aaggatatga atggaaaagc aacaggcaac ttccaaagct caaaagtggc - 9601 tgctgttgaa tttggcccta aaggaggata cgcggttctt ttagaaaaaa acaaaccggt - 9661 caatgtcacg tatacaggat taaatgctag ttatttagac cgaaaaatca caaaagcaga - 9721 gttcatttat gaacttcaat ctgcaccaag tcaaagcggc accttaaatg cagtattttc - 9781 gaatgatcct attattacag catttgttgg tactaaaaat gccaatggga aggacgtaaa - 9841 agttcgctta accattaaat tatatgatgc taatggcaaa gaagttttac cagataaaga - 9901 ccatgccttt gcctatgcgt tatcgtcatt aaactctagt ctaggaacaa attatagtgt - 9961 agaacatgcg gaatttgttt cagactttgg ctcaaaaaat gagttcaagt atattaatgg - 10021 ttcctacgta aagaaacaag cggatgggaa attctactca accgaagacc ttgattatgg - 10081 gacaggtcct tcaggactaa aaaatagtga ttgggacgct gtaggtcata aaaatgcgta - 10141 ctatggttct ggtgtaggtc tagctagaga gggtggacgt atttctttct cttttggtat - 10201 gacaaccaaa ggaaaagtca acctatctgg tgcgcaatgg tttgccttta gtaccaattt - 10261 aaatgcgaaa tcaattagac cataccaaaa gaaagggaat ccaaaagaac cagaaaaagc - 10321 aacaattgaa ttcaatcgat acaaagccaa tgtcgttcct gttcttgtgc cgaataaaga - 10381 agtcactgat ggtcagaaaa atatcaatga tttaaatgtg aaacgaggcg attctttaca - 10441 atacattgtg acaggggata cgacagaact tgccaaagta gatccgaaaa cagtgacaaa - 10501 acaagggatt cgggatacct ttgatgcaga aaaagtgacg attgatttat ccaaagtgaa - 10561 ggtttatcaa gcagatgcaa gtctaaacga gaaagactta aaagctgttg ctgcagcgat - 10621 taattcagga aaagctatag acgtgactgc ttcttatgtt cttaatttag atcaaaacac - 10681 cgtcacagca atgatgaaaa ccaacgcaga cggttccgtt gttttagcaa tggggtataa - 10741 atatttactt gtcttgccgt ttgtagtgaa aaatgtagaa ggcgattttg aaaatacagc - 10801 tgttcagctg acaaatgatg gcgaaacggt aacaaataca gtgattaacc atgtgccggt - 10861 tagtaatcct tccaaagatg taaaagcaga taaaaacggt acagttggca gtgtttctct - 10921 acatgataaa gatattccgt tacaaacaaa aatttattat gaagtgaaat cttccgaacg - 10981 tccagctaac tatggcggaa ttaccgaaga atggggcatg aatgatgtct tggacacgac - 11041 ccatgatcgt ttcacaggta aatggcacgc tattacaaac tatgacctta aagtagggga - 11101 caaaacgtta aaagcaggaa cagatatttc tgcctacatt cttttagaaa acaaagacaa - 11161 taaagacttg acgtttacaa tgaatcaagc attattagca gcgttaaatg aaggaagcaa - 11221 taaagtaggc aaacaagctt ggtctgtata tctggaagtc gaacggatca aaacaggtga - 11281 cgtagaaaat acgcaaacag aaaactacaa caaagaactt gttcgttcta atacggtggt - 11341 gacgcataca cctgatgatc caaaaccaac caaagccgtt cacaacaaga aaggggaaga - 11401 tattaaccat ggaaaagttg ctcgtggtga tgttctttct tatgaaatga cgtgggactt - 11461 aaaagggtac gataaagact ttgcttttga cacagtcgat cttgcgacag gagtttcttt - 11521 cttcgatgat tacgacgaaa cgaaagtgac accaatcaaa gacttacttc gtgtcaaaga - 11581 ttctaaaggg gcagacatta cgaaccagtt cacgatctct tgggacgatg ccaaaggcac - 11641 ggtgacaatc tctgccaaag acccacaagc ctttattcta gcgtatggtg ggcaagaatt - 11701 gcgtgtaacg ctccctacaa aagtcaaagc caatgtttct ggtgatgttt ataattcagc - 11761 ggaacaaaat acatttggtc aacgaattaa aacaaatacc gttgtcaacc atattccaaa - 11821 agtgaaccct aaaaaagacg tggttattaa agttggtgac aaacaaagtc aaaatggcgc - 11881 cacaatcaaa ttaggggaga aattcttcta tgaatttaca agtagtgaca ttcctgcaga - 11941 atacgctggt gttgtggaag aatggtcgat tagcgataaa ctagacgtaa aacatgacaa - 12001 atttagtggc caatggtctg tgtttgccaa ttctaatttt gttttagcag acggaaccaa - 12061 agtgaataaa ggggacgaca tttcgaaact attcacgatg acctttgaac aaggggtagt - 12121 taaaatcacg gccagtcaag cgtttttgga tgcgatgaat ctaaaagaaa acaaacacgt - 12181 tgcgcactca tggaaagcgt tcattggtgt agaacgaatt gcggcaggag acgtttacaa - 12241 cacaatcgaa gaatctttca acaatgagaa gattaaaact aatacggtag tgacacatac - 12301 gccagaaaaa ccacaaacac caccagaaaa aacagtgatt gtaccaccaa caccaaaaac - 12361 accacaagca ccagtagagc cattagtggt agaaaaagca agtgtggcac ccgaactacc - 12421 tcatacaggt gaaaaagaaa acaccctatt atctgtacta ggtgccggaa tgctagttgg - 12481 tctggcttgg tttggtttga aaaaacgtga agtgaaataa tgagtaaaaa gaaaaagcac - 12541 tgtgaaaaat cagtgctttt tgtttatttt agaaaaagtg tggtgttgtc aagtgtggat - 12601 aataattttt gcgttaagtt gtatcgtagt atctataata attggagcat ttgtcagtgc - 12661 aacggtcgat gaacgattgg gagacaatat ttttttgcta cttctagtta ttttattttt - 12721 ttggtttatt ttgattttta attgttaagt atattttttt atatgctatt ttaatatatt - 12781 taataagact aggtgaaagt attattaatt cagagatagc tgctattgta gctccgaaat - 12841 aaatattggt catacttttt gaaataaacg acattattat agaaggtagc attataaata - 12901 ttgttggcaa aaaggcaaaa taataagttt ctttggtgat agattcgtta aattctttga - 12961 ttttttgaaa gaaagatagt tgtttatgat agaatatctt aattttctgt atctcgttta - 13021 aagaataaat taagcgcaca aattctttat ttaggtaata agttagaaga acggtatctt - 13081 tgttaatcat tgaaactaag aaaacttttg tattacatgg gatatcattt aaagaaagtt - 13141 cttgggacag tacgtaaaag ttactatgct tacttcttga attagaaggt attaaggttc - 13201 tataaatatc agggagcttt gctattgaga aaataaatac aataaaataa atgataaagt - 13261 aagttaagta agctttaccc tctttagtaa ggttatttat atctgaaaca aaatcggtga - 13321 atgctgtgtc tgtagttatt aatgcataag caaaaatacc agatgaaagt agtaaagagg - 13381 atattagatt aataaaacct ttaaagattt tatataatcc gatttcagtg ggagaggaaa - 13441 aaaggttttt tttaaatgaa tcacttatta cgtatccata gatggaggaa taaattgtga - 13501 aaaagcctat aactataggt aaaagtatac ccactggttt tattaattgg ttaaaaaaat - 13561 caatgttcat ataaataatt actccttata aactttttat aataattata tcaaaaggac - 13621 gtgaatatat gttaataaaa ttaggtacag aattgacgaa agaagaatat gttacaaggt - 13681 atatgcgaaa ctttcagaaa ttattgttgc tcggcgatcg gccaaaagta ttaacgaatc - 13741 gtgaagaaca actcttgcag tatgaaaaag aattatgtgt gctgttttat gaacaattta - 13801 taaagaaaca tcatagagcg cctgatgaag ccacgctaga cgatcaagtt aaagcgaatt - 13861 tcatagagcg ctctaaaatt ttcgctcgat ctcccttagt aatggacgaa ggaaatttta - 13921 cgcaagcaca tattggtcaa ctaaaacggt tgcgtgaatt gcgcatggaa gactatttgc - 13981 cagacaatta tacgcatatt ttacaacgag aagaagaatt ggcacgtaac tattttcgaa - 14041 aacatgatga ttatccattt gggtatgagt gtttatgtat tagtcggtca cgagaagtgg - 14101 tgaaccaagg gctagaaaag ctcttagagg ggttttatga cagttatcag gtttattatc - 14161 gtcggtatcg taaaaatggt tagaaatgga agtaggaata aaaagcgcag gaggtgtagc - 14221 gagcaatggc agaagaatcc aaatatccgc cagtgaaaga aaaatctgtg ttttatcagc - 14281 gttatagtcg tgtttcgacg atttctatgt tgatggattt aggttttagt gtgagtgaag - 14341 cccagattga taatgaagat attgtttata tggaacagta taaagagttt ttattaaata - 14401 aaggaattgt ggaagaaaaa gttcctttta aacgagaatt tgtagcggag tatccattaa - 14461 gcaaaatgcg acgacttttt gtagaaggct attatttacg aaaaccgagt ggtgaaaaaa - 14521 tgtatggtag ctactattac gatttttatt ttaaagagta ttcaggaatg gggatttatt - 14581 gtacgaaagc aacaaaatct ctttttttac atgtttttga acaaagaatt agaaaaataa - 14641 aaaaattaaa acatagattg gaagaatgaa aatgaaaaaa atgattatta ttgccttatt - 14701 cagtacaagc cttttagcag ggggaagcag tgtttctgct tatgcgcaag aatcagaagg - 14761 aaatcttggt gaaacaacag ggagtgtttt accagatgaa ccgaatgtac caactgaccc - 14821 aataacgcca agtgagccag agcaaccaac agagccaagt acaccagagc aaccatcgga - 14881 accgtcaaca ccaaccgaac ctagtgagcc ttcaaaaccg acggatcctt cgttaccaga - 14941 cgaaccgagc gtaccaacag agccaacaac gccaagtaag ccagagcaac caacagagcc - 15001 aacaacgcca agtgtaccag agcaaccaac agagccaagt gtaccagaaa aaccagtaga - 15061 accaaataaa ccaaccgagc cagaaaagcc tgtgccagtt gttcctgaaa aaccagttgt - 15121 accacaacaa ccagagcaac caacagatgt ggtggtaaag ccaaatggag aaattgcaac - 15181 aggagaatct acacaacagc caactgttcc aattgaaacg aataaccttt cagaagtaac - 15241 acatgtccca actgtgacga caccgattga aacagcaagc ggagaagcaa ttgtcgcagt - 15301 ggataagggc gttcctttaa cacaaacggc tgatggatta aaaccgatta aaagtgaata - 15361 taaagtatta ccaagtggca atgtacaagt gaaaagtgct gacggaaaaa tgaaagtact - 15421 tccttacact ggtgaaaaaa tgggcataat tgggtcaatc gctggtgtat gtttgactgt - 15481 tttatcagga atcttaattt ataaaaaacg taaagtgtag tgagtgatgt atgaaatttt - 15541 taaaaaaaat tcaaacaaag gaaaaaagca aaaagagccc aagagttcgt ttactatcac - 15601 aaaaaaaagc gaatcgatta gtattaattg tggggtgtgc tctttttgga ttgtcattga - 15661 ttggtgctat tcgagcaaat gtgatggcag gcaacgtgat ccgcctcagt caacaattag - 15721 aaacaataaa taaagatgtc aaaaaaataa aagaaaaaaa gagagtgtat gattcgtcgg - 15781 cactctcttt ttatgtcaga aattttgtga atgagtatat caattttaat ggaaaagcaa - 15841 cagatgaaga gaaaaaagca cgtgatgaga aattagcgag ttatttttca ggagatttag - 15901 cgttagataa aggaacagac aatgctgcaa aagacttaat tcgtaaatta ttacaagtct - 15961 ctgttactcg tgtagaagaa tctgaagagc tattacttgt gcatgcgagt atatcttata - 16021 aagtgcaaca aaaagggcag gatttactag atacacaaga aattgtttta cctattcaag - 16081 aaaaaaatgg gttgttttct attgttggtc gtccctattt tttagcaatg aatgttccga - 16141 aaggaaaaca ggaaccattg caatcagtga aagaaccgct tgatgttgaa aaaaaagaac - 16201 gacaagggat tgaaaaattt ttacaattat tttttgaaaa atatgcgaag gggaatacag - 16261 aagaattgtc tgttttaatg aaagaaccag ttaaaacaag tggtcaagca actgtgtcgt - 16321 ctattgaaga aaaagaacta cgtttttttg aaacgaaaca aaaaggtgtt acaggcgttc - 16381 aggtgtcagt gaactttaaa gacaaagcaa taaatttcct ttacacggaa gatttttcgt - 16441 tgtggttaac gaaaacagaa aattcgtatt ttgtacaaga gttaaaacat tattatacag - 16501 aaaaggcagg agataaatag tggatacaag taaattaagt caatttatga gtagtggatt - 16561 gattacactt attgcgtttg gtgtgatcat tttaatttta aagcattgga aagaagctgc - 16621 gtggttaaag attggttcag ttattgtcat tgcattgatt ttaaatgact ttgcgacaaa - 16681 taatgggcag aacattttca aagttgtgaa gtgggtctta ggattatttg ggattcagct - 16741 gtagaggaga gaaataatga aacattttga ttattcgagg ggcttaaaag ccccttactc - 16801 attacaagtt attaagtccc caaaagggaa aattgtttgg tattttgcac aacccttaag - 16861 tttagcttat ttagtgatgt tatttttagg gattgtacta acaggcattt tttggaagtt - 16921 tgtaccattg ccgttaattt ttggtattaa tcttaaccta atgattatgt tgtattttcc - 16981 aaataaagtg gctcgatggt atacagaaac agagtttgaa gggaaaacag gattagcttt - 17041 tttaaaagat ggttttgttt atgtaaaaaa ttatgtgtta gacaatagat caattatatc - 17101 ctttgaacga gtaaaggaaa tagaagaatt ttcatttaaa cgttagtaat aagaaagagt - 17161 gtattatggt gaaaacatga aaaaaagaag tgtgttgtaa taacttcttt tttcatgttt - 17221 aaattatgaa tttctatatt ttaaataaag cataactgca cagactatta ttccaataac - 17281 taaaagtagc acagtaacaa tactttcatt tttatctatt tttctttcag gtctatagct - 17341 aggattaatt tgtttggcgt taaaatcagt aattccaaag tctaaagtag gaagtaaaaa - 17401 gagtaataaa ataatatata taattcccgc tataaggaaa ataggggcgc tagtgaaaag - 17461 tgaaataatg gtacctatga ttataggaat taaaatgtat aaaaaggatt tgataacaga - 17521 ttcttttctc attttaatta ccaaattttg ttattcatgt ttcccatatt tcctaaagga - 17581 acacaataac caccgctcat atttttccca cctgtagacc agccaccttt tttaaaataa - 17641 aaacctccag gacaagagct accaaattca gcttctcttg cactagcttc tgagctaaaa - 17701 ataaaaggtg ttaccatcgc gaaaatagtt aaagctaaac aaactttttt cttcatatac - 17761 gttccttctt tccaattatt atttaaaagc tatattgaat atagctttta aataataata - 17821 actgaatgaa aaaaaactgt ccaataatat atagaaattt ctgaaaaatc atttttaatg - 17881 taaattattt taataaaatt aataagaaag gaaaaaaata tgcaactaga atatccatta - 17941 acgaatcata tgaaaagaaa catggtttta actaaagaaa atcaagtgat tgcgtattat - 18001 cgtattcggt cagaaacagt tggcttaaca gattttgaga aaaaaaggaa aacaaagaaa - 18061 aaagtagctc gaacgttgaa acgtttacaa gagaatgagg gttttgaaat tgttctttta - 18121 cctgtgaatg cggatattcg agggaaaatg ggaggtatgc gccaattagt ggacaaagaa - 18181 aatcatagtg tagcggtgga taagttgatg aaaactgctc agtatcttga aaatgaaatt - 18241 ggcatggtct atgagtatat ttggttaatt ggcgtgcctt tagtaaagaa agagcggtca - 18301 attgatatta aagaaacatt ttctacggcg ttaaataatc tatctgaaaa agtggttaaa - 18361 ggacttggtt tagaagtagg agtagcggag gattgggaag aagcttataa agaccaagaa - 18421 caagaagtat atcagaattt gtcagaattg ttagtggaac gattgacaga agacgagttg - 18481 tattactacc aagcctatca atttttaaat aatattcaac atgagaaaaa agaacttttg - 18541 actagtcaga acttagataa tttactagcg aacaaaatca ctccttttcg aggtgggtta - 18601 gaattgtcta atgagtttgg gaaaagttat attgctcatt taccattggg ggattgtggg - 18661 gtcacgattg atggtaatca cttgctagaa ctggttcaaa aaatgtctta tcctgtttct - 18721 gtgaagttac aggctggttt tgctgaaaca aaaggccaat tagcgttatc aggacgttct - 18781 gctcgtgcga gaacacgaac aaagaatatc atggaagaag cacatttagc aggttcaaaa - 18841 caaaaaagaa aaattgttga ggggcaacat tcacttgatg atttagatca aaaaattgat - 18901 gatgatattc cgattattga ttggaaagca gtattagtga ttagtgggaa ttcaaaaaaa - 18961 caattacgtg agcgaaagaa aaatttgatg aatcgactag atagcttagg aattccgtta - 19021 atccgtgcaa cgtttgataa tgtctatctt tttcaagcaa cgttattagg caactttcaa - 19081 cgtttttcaa ccagtaattg gcaacatacg tcgacgttag aaacattttc agagttgaat - 19141 ttctttactt cgttacacgc aggtacaaag acagggtttt atttgggacg tgtggacgcc - 19201 acgttagaag aaaaagaaag tcggaaacaa attgtttctg gctctaaaaa tattgtctat - 19261 atgaatctat tgcttgcaaa caaacagaat attgaaggaa agaaaacaaa taatccccat - 19321 tggttggtat cgggagatac aggtaacggg aaatcagtat tttctaaatg gttatttttg - 19381 tattcttctc tattagatgt gaaagtgtta tacattgatc caaaaaaaga agttcgccaa - 19441 cagtttatgc gaacgattaa tgatccagaa tatcaaagaa aatacccact tgatgtggca - 19501 tttattaaga cgtttaattt tgtgacactt gatgttcgta aaaaagaaaa ccatggggta - 19561 cttgatccaa ttgtattatt tgatgaaaca gaagcaatcg caacggcaaa agctatgtta - 19621 aataatatta acgaggataa gtggaaaatg ccacataaga cggcgattaa tgaaacagta - 19681 gcagaagtgg tggctgaacg gaaagcaggc aaacaagttg gattttggca tgtaattgaa - 19741 cgtttaatta gtcattcaga gaaagacgtt catgaaatgg gtcgtttttt attatctacg - 19801 attaaaggat cgattttaga gttagccttt tctcatggtg aagtagaagg actttctttt - 19861 gagaagaaag tgaccatttt agaaattgaa gatttagatt tacccacaga tcggcacgat - 19921 gaattagacg agaatcaacg gttatctgtg actttaatgt ttgcattagg cacgttttgt - 19981 tcaaaatttg ggtcacgcaa tcggaaagaa gaaacagtca ctttctttga tgaagcgtgg - 20041 atttttcaat cgtcaccaga aggacaaaag attctaaaat cgatgaaacg gatcggacgt - 20101 tcgtttaata attttatggt attaattacg caatcggtca acgatgtgtt agataatggc - 20161 gatggtacag gctttggaac ggtggtttgt ttcgatgaag tggataatcg agaagggatt - 20221 ttacgttatt taaaattacc agtcaatgag attaatttaa aatgggtatc gaatatgatt - 20281 caaggacaat gtctcatgaa agatatgttt aaccaagtga atcgaatcgt gatagacgtt - 20341 atttttgaag aatggttaga actctttgaa acagttgatg atacagaagc gtccgttatg - 20401 gaaaacgatt atgtggcgag gtggtgagaa agtatgaaat atctcattga tagttataca - 20461 gcctatatgg tgaatggtgg tttattagat aaaggatcag aagtcgtcaa ttggttcttt - 20521 attgaattgc cttttttctt tttgcgtatg ggggcaatga ttttcttaat tatggagaat - 20581 gtcatgaatc agtcagatta ttttgttggt aaacaacaag aagcatacga ttattctttg - 20641 gatattttaa aaggatttgg tggaactggg attgtcaaag ggagtttgct tggattggca - 20701 attatcctaa gtgcctatta tctattgtat agcttttttt ctaatcggcg taatttcatg - 20761 aaaagtttgt tgcattattt tgcggtgttt gccttgttta tttgttggtt tggacaagta - 20821 aaaacaattg atggtaaaac gcaaaatggg gcaatttttt tgattagttc ggttagtgag - 20881 atgacaaaac aagtacaagg caagtttact tctaatgtaa actttggagg ggatacaagc - 20941 caagaagtag acgatggaaa gaaaaaagtg tatcaaagcc caatgtttga cgcaacggtt - 21001 ttacagacgt ttaactatgt caatagtggc tcgattgatg gcaaaatggc aaatgggaag - 21061 aagcttgatt atgataaact attagaaaag cctaacctga atgataaaga gaaaaaggat - 21121 tttagagaaa aaagaaatgc ttatattgaa cagcaggaga aagacaatcc ttatttttcg - 21181 caagatacct taaaaactat ggaaaaaagt tttgcggtat ggacgggtgc aacaaattta - 21241 tttattctag caattcctgt gttatatatt aatttaatgt tgtcgttgat acagctgtta - 21301 gttgtctttt taattcttat atttccagtt gttttgttgg cttccttttt tccacggtgt - 21361 caaatgttac tattcaagtt ctttcaaggt ttaattggtg cgttattcac gccaattatt - 21421 tatggtattt ttttatcggt gctgttttgg attaacaaac tgattgatgg ggcattttta - 21481 ggtgtcgcaa aaaaagtcag tggcagcttg cttgaattga tttcaggtag tacggtttat - 21541 atgatcgttt tatttgtagc agtggtagtg aagattgtag ttttacgaaa agtttggaaa - 21601 aataaatatg ccattcttgc ttacttttca aatgggcaag tgtcacagcc tgtgtttgaa - 21661 caaaaagtgg aacagttgtc tgaacgaacg aaagaagtag caactggtgg agcgcaagtt - 21721 gccctaggtg cttatacagg caatctgggc atggtcgcaa acggtgcagg taatattcta - 21781 ccgaatcaag ataaagccat tgaaatgggc caagaacatt ttattgatga taatggttca - 21841 tttactgggg taaaagcggg tttacagtct atttttaggc aaccagtgac agaagaagaa - 21901 caaggggagc tgaacgagga acagttttca gaagtggaaa cggaatcgat agatcatgag - 21961 ttaacagata ttgaagaaat aggacagaca gagttagaat ctgatagttt agataactct - 22021 attattgaat tagagcctat gacgagtgaa gatttagtag tggatgtcga taatatgagt - 22081 tctgatatag atgtggagct agcatcagta gaagaagttg gggaagagcc accaatgaac - 22141 gcagaggaat attcaggtta tgataatgtg attgtgacca actttgatga attggctatg - 22201 gcaagagaag aacgtgatta ttttgacggt ggcaaagaac aagagctagt cgagacaaat - 22261 ggagttgaat tggttaataa tatttatccg tttgttcaaa cagaagagta tctagctaat - 22321 cttgaacaga cagaagccca gttttttgga acagatgagt ttgagaaaga attagaacag - 22381 atagaggagt gggcataacc acttctcttt ttatgttagg tggtgcaaat gaaaaaaatc - 22441 tttttaggaa tccttggctt gtttagcttt ttgtttttat tgcctttttt gttatttttg - 22501 ggcaccatgt caacagaaat tggaaacaat acacaatttc aagcaacaac gccacaagaa - 22561 aaagtagcgc tagaggtatc caattttgtt accaaaaatg gtggatcgtt acaatttgcc - 22621 tctgcatggc taggaaatat ggaacatgag agcggattaa atcctgctag aatacaaagt - 22681 gatttaacgt ttaattcagc gtgggcgttt aatccttcga ccaatggtta tgcgttaggt - 22741 ttagcaatga tggacggtga gcgccgtgta aacttgttaa attttgccaa agaacaaaag - 22801 aaagattggc aggctgtccc agtacaactc gagtatatgt ggaatcatga cggctcagac - 22861 agtgccttgc tgaaacgtat gtcgaaaagc tctgatgtga atcaattagc tgtagatatt - 22921 ttggtacatt gggaacgtgc aggcactaaa aatgatccca acgaacaaat caaacgaaaa - 22981 acaagtgcga ataattggta taagagactg tctacaggtt ctatgggggc aggttcagcc - 23041 aatattggtg gtggcaaaat tgatgtgtta gaacaaatgt tagggcaaac agtcaatgga - 23101 ggtcagtgtt atggggggac ttcttattat gttgaaaaga tgggctttca atctttaatg - 23161 aatacagggc atatgtttgc cagtgaaatt ggcaatgatt atgcgtggga acaatctggc - 23221 tggcaggtaa tcaaaaatcc aaactattct gatgtcaaag caggtgatgt gattaatttc - 23281 gcaatgggcg gttatgcgac cagcgtttac ggtcatactg gaattgtagc tagtgttgaa - 23341 ggtaatggaa agcttgtttt atatgaacag aacgctgaaa aaggacaaat aattgctaaa - 23401 tattttcgac aatggggagc agaatatcct aacgtgacaa gtattgtaag gaagaaatag - 23461 aggagagatt tttgatgaaa aaagaagaaa tggacgttgt ttcattgcgg attataaagc - 23521 tttatttttt aggcattagg gaattaaatt tcccagatta taataaaagg tttcagcaaa - 23581 aagatatgga attgtttatt caactagctg atatgatgga aaatttacca aatcttgatg - 23641 aacaactaat ttatgaatta gaagagttga aagattattt attctatgtc aaaaccgaaa - 23701 agtattcttt aacagttcat gatatgtttt tggaaatgaa atccgagctt gaaaaaataa - 23761 tttagaagaa atgtagtgtc aaaaaagaga gggtgtagtg tcaaaaatgt ttagaaagaa - 23821 aaatggttta acaaatcggc aagtattagc gatttgtaca aaatttcagt gtaaaaagaa - 23881 tgagtttgtc gcccatcgat taagtgatgg gtatttagta gcagtaaata ataaagaata - 23941 ccgagtaaaa ttttcggaag gctttttttc aaaaattgta tatgcaaaag aagtgcaacg - 24001 gaaaggagct cggaaatcgt gaataagcta cctttactta ttttattgtt aggcggagtg - 24061 ttgcttgtta gtggctgtca aagccataag gaagaaaaca agtctagtaa agtatcgaca - 24121 gaagaaacga cagtgattga aacagtagca agggaacaat cgaaggaatc gtttacgagt - 24181 gaagcaacta aaaaacagac agaaacaacg aaattagaag aaccagatca tgtaaaactt - 24241 ctagaagctt atggaaatgc gtatgcgaac tttacaagta ttaatgatcg caatgaaaag - 24301 ctaaagcccc tcatgactga aaaatgtatc aaaaaaaatg gaattgatgt taaaactgga - 24361 gtagcgttag tttccgtagg aaaggttaca acgatttata aaaatgatca acatgaatat - 24421 gctttacttt tggattgtga acaaaatgga acgcagacac gagtgttact tttggctaag - 24481 gtgaagaaca ataaaatttc tgaaatgacc tataattcag ttaagcaaga gtattagaaa - 24541 ctcttgatat taatagattc catgctagat ttatggtaca attacacata ataaataaag - 24601 gagaaaacca atgaaaaaaa gtattgtaac gatgttattt ttgatgttgg ggatagttgt - 24661 atttactagt tgtgggtcta aaatggataa gacagcagaa gagtttaaga ataagattat - 24721 aagtcatgtc ggtgatcttt atgatgaaaa atatcaagaa aaagaattta gctttttaat - 24781 ttacaaagat aaggatacaa atgaatattt agctaaagct ttggttcctt atgaaggtga - 24841 gcctaatagt gtagaatcta agtattttta taatgtaaat aaagaattag aaactattga - 24901 accatttagt ggaggtagaa cgtttgatta tgctaagtct catggtaact atgaggtaat - 24961 atataaatca ggaaaattta aatagaattt gaacttaaga taaattaaat ttatgtttga - 25021 gagcagtgct tagagcattg ctcttttttg ttttaggagg gaaaacaatg ttaattgtaa - 25081 caaaagaaga cctaatgaat ttaggatatg gaaaatatca agcggaagat ataattagga - 25141 aagcaaaggc agtaatggtg tctaagggat acgcatatta cctaaataaa cgattaggaa - 25201 gagttcctgt tggagctgtc gaaagtgtat taggaataga actagaatct atagcaaaag - 25261 aggttgaaac ggttggttaa gtttaaaaaa gataagagag gaaagtatta ttttactgct - 25321 agtttgggtt ttgatgaagt aactggtaag agggttcaaa aaatgcgttc agggttttcc - 25381 acgattaaag aagcaaggga agcttatgcg gaaataatta ataatttcgg taaagaagca - 25441 tattcttcaa atagcacaat gctgtatgaa gaattttttt atactatttt tttgccatat - 25501 tataagggac gggttaaaga aagaacttat aataatagac ttagtatgat aaaaaatact - 25561 tttgcctatt tttttaaaat gaaattgaaa agtatagctc ctgttcatat acagaagtgg - 25621 cagaatgagc tgttggaaca gtatgaaaac acgtatgtaa gaaatattta tggactgttt - 25681 cagatgtctt tagatcgagc tgttgtgtta ggaatgattt cttcaaatcc agcaaagatc - 25741 gttggtaatg tgaaaaaaag taagaaagaa attgattttt ggacaaaaga agaatttgaa - 25801 aaagttgtta agacttttta tgtagaagat tattaccaaa atttttcttt tatttgtatc - 25861 tggttattat ttatgacagg catgagaata ggtgaggcta ctgctttaac ttggaaagat - 25921 gtgaatttag atagaagata tttaacagta aaaaaatcac tatattataa aaatgcgcaa - 25981 acttatgaat tagtgtctcc aaagactaga gccagtatta ggacgattta tttagatgaa - 26041 gatacagttc actatttaag agattggaaa aaaaggcaag atgatgttgg aggaattgaa - 26101 tttattttat cttataattc agttcctact caaaaacata cagtaagaca tattattaaa - 26161 cgtcatgcaa aattggcaga ggtacatgat attaggattc atgctttaag acattctcat - 26221 gcttctttat taataagtat gggtactaat gctttgttga taaaagaacg attgggtcat - 26281 gaagatgtgc aaacaacttt aggtacttat ggacacttat atccaagtag ctccactgaa - 26341 atagctaatg aattgaaggg aatagttaat gttgagttta ctaatcaaaa tatggcttcg - 26401 gaggttacta atcaatttac taaaggagta aaaaaataa -//
--- a/test-data/NC_004668_137848_164286_icescreen.gff Fri Feb 09 21:26:42 2024 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,7 +0,0 @@ -##gff-version 3 -##sequence-region NC_004668.1 1 0 -NC_004668.1 ICEscreen CDS 1 1512 .+ 1 origid=EF_RS00630;function=Coupling Protein;protein_id=WP_002359295.1;locus_tag=EF_RS00630;codon_start=1;color=6;Note=ICEscreen prediction%3A Coupling protein%3B BlastP result %28Annotation confidence%3A HIGH%29%3A Coupling protein TcpA %5BHit with AAO80014%3B Identity%3A100.00%25%3B E-value%3A0.00e%2B00%3B Query coverage%3A100.00%25%5D%3B Hmmscan result%3A TcpA %5BHit with tcpA HMM profile%3B E-value%3A7.00e-94%3B i-Evalue%3A8.80e-94%5D -NC_004668.1 ICEscreen CDS 3098 4381 .+ 1 origid=EF_RS00650;function=Relaxase;protein_id=WP_002359299.1;locus_tag=EF_RS00650;codon_start=1;color=7;Note=ICEscreen prediction%3A Relaxase%3B BlastP result %28Annotation confidence%3A HIGH%29%3A Relaxase MOBT %28PF02486%29 %5BHit with AAO80018%3B Identity%3A99.77%25%3B E-value%3A0.00e%2B00%3B Query coverage%3A95.53%25%5D%3B Hmmscan result%3A MOBT %5BHit with T4SS_MOBT HMM profile%3B E-value%3A3.00e-128%3B i-Evalue%3A3.40e-128%5D -NC_004668.1 ICEscreen CDS 17920 20427 .+ 1 origid=EF_RS00720;function=VirB4;protein_id=WP_002359320.1;locus_tag=EF_RS00720;codon_start=1;color=184 134 11;Note=ICEscreen prediction%3A VirB4%3B BlastP result %28Annotation confidence%3A HIGH%29%3A VirB4 %5BHit with CAE52368%3B Identity%3A41.15%25%3B E-value%3A0.00e%2B00%3B Query coverage%3A99.76%25%5D%3B Hmmscan result%3A VirB4 %5BHit with T4SS_virb4 HMM profile%3B E-value%3A1.80e-28%3B i-Evalue%3A2.40e-28%5D -NC_004668.1 ICEscreen CDS 25273 26439 .+ 1 origid=EF_RS00760;function=Tyrosine Integrase;protein_id=WP_002392915.1;locus_tag=EF_RS00760;codon_start=1;color=8;Note=ICEscreen prediction%3A Tyrosine integrase%3B BlastP result %28Annotation confidence%3A HIGH%29%3A Tyrosine integrase %5BHit with AAO80040%3B Identity%3A100.00%25%3B E-value%3A0.00e%2B00%3B Query coverage%3A100.00%25%5D%3B Hmmscan result%3A Tyrosine integrase %5BHit with Phage_integrase HMM profile%3B E-value%3A4.40e-29%3B i-Evalue%3A9.70e-29%5D -NC_004668.1 ICEscreen mobile_element 1 26439 .+ . mobile_element_type=other%3A integrative and conjugative element;Note=ICEscreen prediction%3A Putative ICE %28one integrase Tyr%29 %5BElement structure%3A Single%3B ICE superfamily%3A Tn916%3B ICE family%3A ICESt3%3B Relaxase family%3A - %28MOBT%29%3B Coupling protein family%3A TcpA%5D %28ICEscreen ID%3A ID_1%29;color=15