Mercurial > repos > iuc > icescreen
changeset 3:0d38ba6112be draft
planemo upload for repository https://forgemia.inra.fr/ices_imes_analysis/icescreen commit a9bc15365abc70c0367d732b790763d8fa53b220
| author | iuc |
|---|---|
| date | Tue, 28 Feb 2023 14:10:26 +0000 |
| parents | 411d99e24c62 |
| children | 49bf81065a47 |
| files | icescreen.xml test-data/NC_004668_137848_164286_detected_ME.summary test-data/NC_004668_137848_164286_detected_ME.tsv test-data/NC_004668_137848_164286_icescreen.embl test-data/NC_004668_137848_164286_icescreen.gb test-data/NC_004668_137848_164286_icescreen.gff test-data/NC_013798_298468_322494_NC_020450_643089_661957_detected_ME.summary test-data/NC_013798_298468_322494_NC_020450_643089_661957_detected_ME.tsv test-data/genbank/NC_013798_298468_322494_NC_020450_643089_661957.gb |
| diffstat | 9 files changed, 1928 insertions(+), 94 deletions(-) [+] |
line wrap: on
line diff
--- a/icescreen.xml Sat Apr 02 21:04:43 2022 +0000 +++ b/icescreen.xml Tue Feb 28 14:10:26 2023 +0000 @@ -1,7 +1,7 @@ <tool id="icescreen" name="ICEscreen" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="20.09"> <description>detects and annotates ICEs (Integrative and Conjugative Elements) and IMEs (Integrative and Mobilizable Elements) in Firmicutes genomes.</description> <macros> - <token name="@TOOL_VERSION@">1.0.4</token> + <token name="@TOOL_VERSION@">1.1.1</token> <token name="@VERSION_SUFFIX@">0</token> </macros> <requirements> @@ -45,7 +45,7 @@ ]]> </command> <inputs> - <param name="genome" type="data" format="genbank" label="Input genomes to analyze in Genbank format" help=""/> + <param name="genome" type="data" format="genbank" label="Input genomes to analyze in Genbank format" help="Multi-genbank files (i.e. gbff) are supported. Each record must include the ORIGIN nucleotide sequence at the end."/> <section name="taxonomy" title="Taxonomy of the genomes to analyse" expanded="False"> <param name="mode" type="select" label="Firmicutes is the defaut parameter" help="Streptomyces is EXPERIMENTAL and is NOT recommended."> <option value="firmicutes" selected="true">Firmicutes</option> @@ -89,10 +89,10 @@ <output name="detected_me" file="NC_004668_137848_164286_detected_ME.tsv" ftype="tabular" /> <output name="detected_sp" > <assert_contents> - <has_text text="ICE IME Number" /> + <has_text text="ICE_IME_id" /> <has_text text="WP_002359295" /> <has_text text="VirB4" /> - <has_n_columns n="47" /> + <has_n_columns n="54" /> <has_n_lines n="5" /> </assert_contents> </output> @@ -115,10 +115,9 @@ <test expect_num_outputs="4"> <param name="genome" value="genbank/NC_004668_137848_164286.gb" ftype="genbank" /> <param name="optional_files" value="output_zip_all_files" /> - <output name="outzip" > <assert_contents> - <has_archive_member path=".*/*_detected_SP_withMEIds.tsv"><has_text text="ICE IME Number" /></has_archive_member> + <has_archive_member path=".*/*_detected_SP_withMEIds.tsv"><has_text text="ICE_IME_id" /></has_archive_member> </assert_contents> </output> </test> @@ -156,11 +155,23 @@ </assert_contents> </output> </test> + <test expect_num_outputs="3"> + <param name="genome" value="genbank/NC_013798_298468_322494_NC_020450_643089_661957.gb" ftype="genbank" /> + <output name="summary" file="NC_013798_298468_322494_NC_020450_643089_661957_detected_ME.summary" ftype="txt" /> + <output name="detected_me" file="NC_013798_298468_322494_NC_020450_643089_661957_detected_ME.tsv" ftype="tabular" /> + <output name="detected_sp" > + <assert_contents> + <has_text text="ICE_IME_id" /> + <has_text text="WP_044555479.1" /> + <has_text text="WP_015426013.1" /> + </assert_contents> + </output> + </test> </tests> <help><![CDATA[ .. class:: warningmark - This tool requires *genbank* format. + ICEscreen requires input files in genbank format. Multigenbank files (i.e. gbff files featuring multiple genome records back to back) are supported. Each Genbank record must include the ORIGIN nucleotide sequence. ----- @@ -170,7 +181,7 @@ **Main features of ICEscreen** - - Detection of signature proteins (SPs) of ICEs/IMEs by using blastP on a curated resource. BlastP allows for an accurate assignment of hits to a given ICE/IME superfamily or family. The curated resource was derived from an analysis of over 120 ICEs and IMEs in Streptococcus genomes by the DINAMIC lab. + - Detection of signature proteins (SPs) of ICEs/IMEs by using blastP on a curated resource. BlastP allows for an accurate assignment of hits to a given ICE/IME superfamily or family. The curated resource was derived from an analysis of over 120 ICEs and IMEs in Streptococcus genomes by the DINAMIC lab. - Detection of distant homologs of SPs by using HMM profiles of ICEs/IMEs protein families. The HMM profiles have been either imported from trusted resources or created and curated when needed. - Detection of the ICE/IME structures: ICEScreen groups together SPs that belong to the same ICE/IME structures to the best of its ability. - Delimitation of the elements at the gene or nucleotide level is not yet implemented and still needs manual curation.
--- a/test-data/NC_004668_137848_164286_detected_ME.summary Sat Apr 02 21:04:43 2022 +0000 +++ b/test-data/NC_004668_137848_164286_detected_ME.summary Tue Feb 28 14:10:26 2023 +0000 @@ -1,44 +1,44 @@ -##################### Mobile elements detection statistics ##################### -# Number of complete elements -Complete ICE (4 types of SP): 1 -Complete IME (R+I, R+C+I): 0 - -# Number of complete modules -Conjugation module (R+C+V): 0 -Mobilizable element (R+C with size <= 10 CDS): 0 -# Number of partial elements -Partial ICE (at least V): 0 -Other partial element (R+C, R+V, V+C with size > 10 CDS): 0 +##################### Main parameters of the ICEscreen analysis ##################### +Maximum distance in CDS between consecutive SPs within a segments: 100 +Maximum distance in CDS between consecutive SPs within an IME element: 14 -# Composite elements -Total nested elements (partial or complete): 0 -Host element: 0 -Guest element: 0 -Element that are both host and guest: 0 + +##################### ICEscreen statistics for genome accession NC_004668.1 ##################### -################### Signature proteins detection statistics #################### -# Total SP detected -Total SP: 4 -Total Integrase: 1 -Total Relaxase: 1 -Total Coupling protein: 1 -Total VirB4: 1 +##### Mobile elements ##### +## Number of complete elements +Complete ICE (4 types of SP): 1 +Complete IME (R+I, R+C+I with distance between consecutive SPs <= 14 CDSs): 0 +## Number of complete modules +Conjugation module (R+C+V): 0 +Mobilizable element (R+C with distance between consecutive SPs <= 14 CDS): 0 +## Number of partial elements +Partial ICE (at least V): 0 +Other partial element (R+C, R+V, V+C with distance between consecutive SPs > 14 CDS): 0 +## Composite elements +Total nested elements (partial or complete): 0 +Host element: 0 +Guest element: 0 +Element that are both host and guest: 0 -# Unassigned SP -Unassigned SP: 0 -Unassigned Integrase: 0 -Unassigned Relaxase: 0 -Unassigned Coupling protein: 0 -Unassigned VirB4: 0 +##### Signature proteins ##### +## Total SPs detected +Total SPs: 4 +Total Integrase: 1 +Total Relaxase: 1 +Total Coupling protein: 1 +Total VirB4: 1 +## Unassigned SPs +Unassigned SPs: 0 +Unassigned Integrase: 0 +Unassigned Relaxase: 0 +Unassigned Coupling protein: 0 +Unassigned VirB4: 0 -############################# Segments statistics ############################## -Number of segments: 1 -Segment with one element: 1 -Segment with several elements: 0 -Segment with nested elements: 0 -Segment with no element: 0 +##### Segments ##### +Number of segments with one element: 1 +Number of segments with several elements: 0 +Number of segments with nested elements: 0 +Number of segments with exclusively isolated SPs to manually verify: 0 -############################### Parameters used ################################ -Maximum CDS numbers in initial segments: 100 -Maximum CDS numbers in an IME element: 10
--- a/test-data/NC_004668_137848_164286_detected_ME.tsv Sat Apr 02 21:04:43 2022 +0000 +++ b/test-data/NC_004668_137848_164286_detected_ME.tsv Tue Feb 28 14:10:26 2023 +0000 @@ -1,2 +1,2 @@ -ICE IME Number segment number category of element category of integrase host ICE / IME guest ICE / IME other ICE / IME colocalized ICEline format ICE SuperFamily From Blast Of SP Conj Module ICE Family From Blast Of SP Conj Module IME Family From Blast Of SP Conj Module family SP conj module HMM integrase upstream integrase downstream relaxase coupling protein VirB4 list ordered SPs SPs conj module to manually review Integrase to manually review comment -2 1 Complete ICE (4 types of SP) one integrase - Tyr C3.R1:V7.I Tn916 ICESt3 C:TcpA, R:MOBT, V:VirB4 WP_002392915.1-25273 WP_002359299.1-3098 WP_002359295.1-1 WP_002359320.1-17920 WP_002359295.1-1, WP_002359299.1-3098, WP_002359320.1-17920, WP_002392915.1-25273 Integrase WP_002392915.1-25273 has been associated to the structure 2 because they are adjacent, this integrase has already be seen rattached to this conjugaison module family, and there is no upstream/downstream ambiguity. +ICE_IME_id Segment_number Genome_accession Category_of_element Category_of_integrase Host_ICE_IME_ids Guest_ICE_IME_ids Colocalized_ICE_IME_ids ICEline_format ICE_consensus_superfamily_SP_conj_module ICE_consensus_family_SP_conj_module IME_relaxase_family_domains_blast HMM_family_SP_conj_module Integrase_upstream Integrase_downstream Relaxase Coupling_protein VirB4 List_SP_ordered_genomic_position Other_potential_SP_conj_module_need_manual_curation_and_review Other_potential_integrase_need_manual_curation_and_review Comments_regarding_structure +ID_1 1 NC_004668.1 Complete ICE (C+R+V+I) one integrase Tyr - - - C3.R1:V7.I Tn916 ICESt3 - C:TcpA, R:MOBT, V:VirB4 - EF_RS00760 EF_RS00650 EF_RS00630 EF_RS00720 EF_RS00630, EF_RS00650, EF_RS00720, EF_RS00760 - - Downstream integrase EF_RS00760 has been associated to the structure ID_1 pre-merging because it is adjacent to the conj module and there is no upstream/downstream ambiguity.
--- a/test-data/NC_004668_137848_164286_icescreen.embl Sat Apr 02 21:04:43 2022 +0000 +++ b/test-data/NC_004668_137848_164286_icescreen.embl Tue Feb 28 14:10:26 2023 +0000 @@ -11,8 +11,8 @@ XX FH Key Location/Qualifiers FH -FT CDS 1..1511 -FT /origid="WP_002359295.1" +FT CDS 1..1512 +FT /origid="EF_RS00630" FT /function="Coupling Protein" FT /protein_id="WP_002359295.1" FT /locus_tag="EF_RS00630" @@ -20,11 +20,11 @@ FT /color=6 FT /note="ICEscreen prediction: Coupling protein; BlastP FT result (Annotation confidence: HIGH): Coupling protein TcpA -FT [Hit with AAO80014; Identity:100.00%; E-value:0; Query -FT coverage:100.00%]; Hmmscan result: TcpA [Hit with tcpA HMM -FT profile; E-value:0; i-Evalue:0]" -FT CDS 3098..4380 -FT /origid="WP_002359299.1" +FT [Hit with AAO80014; Identity:100.00%; E-value:0.00e+00; +FT Query coverage:100.00%]; Hmmscan result: TcpA [Hit with +FT tcpA HMM profile; E-value:7.00e-94; i-Evalue:8.80e-94]" +FT CDS 3098..4381 +FT /origid="EF_RS00650" FT /function="Relaxase" FT /protein_id="WP_002359299.1" FT /locus_tag="EF_RS00650" @@ -32,11 +32,11 @@ FT /color=7 FT /note="ICEscreen prediction: Relaxase; BlastP result FT (Annotation confidence: HIGH): Relaxase MOBT (PF02486) [Hit -FT with AAO80018; Identity:99.77%; E-value:0; Query +FT with AAO80018; Identity:99.77%; E-value:0.00e+00; Query FT coverage:95.53%]; Hmmscan result: MOBT [Hit with T4SS_MOBT -FT HMM profile; E-value:0; i-Evalue:0]" -FT CDS 17920..20426 -FT /origid="WP_002359320.1" +FT HMM profile; E-value:3.00e-128; i-Evalue:3.40e-128]" +FT CDS 17920..20427 +FT /origid="EF_RS00720" FT /function="VirB4" FT /protein_id="WP_002359320.1" FT /locus_tag="EF_RS00720" @@ -44,11 +44,11 @@ FT /color="184 134 11" FT /note="ICEscreen prediction: VirB4; BlastP result FT (Annotation confidence: HIGH): VirB4 [Hit with CAE52368; -FT Identity:41.15%; E-value:0; Query coverage:99.76%]; Hmmscan -FT result: VirB4 [Hit with T4SS_virb4 HMM profile; E-value:0; -FT i-Evalue:0]" -FT CDS 25273..26438 -FT /origid="WP_002392915.1" +FT Identity:41.15%; E-value:0.00e+00; Query coverage:99.76%]; +FT Hmmscan result: VirB4 [Hit with T4SS_virb4 HMM profile; +FT E-value:1.80e-28; i-Evalue:2.40e-28]" +FT CDS 25273..26439 +FT /origid="EF_RS00760" FT /function="Tyrosine Integrase" FT /protein_id="WP_002392915.1" FT /locus_tag="EF_RS00760" @@ -56,16 +56,17 @@ FT /color=8 FT /note="ICEscreen prediction: Tyrosine integrase; BlastP FT result (Annotation confidence: HIGH): Tyrosine integrase -FT [Hit with AAO80040; Identity:100.00%; E-value:0; Query -FT coverage:100.00%]; Hmmscan result: Tyrosine integrase [Hit -FT with Phage_integrase HMM profile; E-value:0; i-Evalue:0]" +FT [Hit with AAO80040; Identity:100.00%; E-value:0.00e+00; +FT Query coverage:100.00%]; Hmmscan result: Tyrosine integrase +FT [Hit with Phage_integrase HMM profile; E-value:4.40e-29; +FT i-Evalue:9.70e-29]" FT mobile_element 1..26439 FT /mobile_element_type="other: integrative and conjugative FT element" -FT /note="ICEscreen prediction: Putative ICE (one integrase - +FT /note="ICEscreen prediction: Putative ICE (one integrase FT Tyr) [Element structure: Single; ICE superfamily: Tn916; -FT ICE family: ICESt3; Relaxase family: MOBT; Coupling protein -FT family: TcpA] (ICEscreen ID: 2)" +FT ICE family: ICESt3; Relaxase family: - (MOBT); Coupling +FT protein family: TcpA] (ICEscreen ID: ID_1)" FT /color=15 XX SQ Sequence 0 BP; 0 A; 0 C; 0 G; 0 T; 0 other;
--- a/test-data/NC_004668_137848_164286_icescreen.gb Sat Apr 02 21:04:43 2022 +0000 +++ b/test-data/NC_004668_137848_164286_icescreen.gb Tue Feb 28 14:10:26 2023 +0000 @@ -607,8 +607,8 @@ YLTVKKSLYYKNAQTYELVSPKTRASIRTIYLDEDTVHYLRDWKKRQDDVGGIEFILSY NSVPTQKHTVRHIIKRHAKLAEVHDIRIHALRHSHASLLISMGTNALLIKERLGHEDVQ TTLGTYGHLYPSSSTEIANELKGIVNVEFTNQNMASEVTNQFTKGVKK" - CDS 1..1511 - /origid="WP_002359295.1" + CDS 1..1512 + /origid="EF_RS00630" /function="Coupling Protein" /protein_id="WP_002359295.1" /locus_tag="EF_RS00630" @@ -616,11 +616,11 @@ /color=6 /note="ICEscreen prediction: Coupling protein; BlastP result (Annotation confidence: HIGH): Coupling protein TcpA - [Hit with AAO80014; Identity:100.00%; E-value:0; Query - coverage:100.00%]; Hmmscan result: TcpA [Hit with tcpA HMM - profile; E-value:0; i-Evalue:0]" - CDS 3098..4380 - /origid="WP_002359299.1" + [Hit with AAO80014; Identity:100.00%; E-value:0.00e+00; + Query coverage:100.00%]; Hmmscan result: TcpA [Hit with + tcpA HMM profile; E-value:7.00e-94; i-Evalue:8.80e-94]" + CDS 3098..4381 + /origid="EF_RS00650" /function="Relaxase" /protein_id="WP_002359299.1" /locus_tag="EF_RS00650" @@ -628,11 +628,11 @@ /color=7 /note="ICEscreen prediction: Relaxase; BlastP result (Annotation confidence: HIGH): Relaxase MOBT (PF02486) [Hit - with AAO80018; Identity:99.77%; E-value:0; Query + with AAO80018; Identity:99.77%; E-value:0.00e+00; Query coverage:95.53%]; Hmmscan result: MOBT [Hit with T4SS_MOBT - HMM profile; E-value:0; i-Evalue:0]" - CDS 17920..20426 - /origid="WP_002359320.1" + HMM profile; E-value:3.00e-128; i-Evalue:3.40e-128]" + CDS 17920..20427 + /origid="EF_RS00720" /function="VirB4" /protein_id="WP_002359320.1" /locus_tag="EF_RS00720" @@ -640,11 +640,11 @@ /color="184 134 11" /note="ICEscreen prediction: VirB4; BlastP result (Annotation confidence: HIGH): VirB4 [Hit with CAE52368; - Identity:41.15%; E-value:0; Query coverage:99.76%]; Hmmscan - result: VirB4 [Hit with T4SS_virb4 HMM profile; E-value:0; - i-Evalue:0]" - CDS 25273..26438 - /origid="WP_002392915.1" + Identity:41.15%; E-value:0.00e+00; Query coverage:99.76%]; + Hmmscan result: VirB4 [Hit with T4SS_virb4 HMM profile; + E-value:1.80e-28; i-Evalue:2.40e-28]" + CDS 25273..26439 + /origid="EF_RS00760" /function="Tyrosine Integrase" /protein_id="WP_002392915.1" /locus_tag="EF_RS00760" @@ -652,16 +652,17 @@ /color=8 /note="ICEscreen prediction: Tyrosine integrase; BlastP result (Annotation confidence: HIGH): Tyrosine integrase - [Hit with AAO80040; Identity:100.00%; E-value:0; Query - coverage:100.00%]; Hmmscan result: Tyrosine integrase [Hit - with Phage_integrase HMM profile; E-value:0; i-Evalue:0]" + [Hit with AAO80040; Identity:100.00%; E-value:0.00e+00; + Query coverage:100.00%]; Hmmscan result: Tyrosine integrase + [Hit with Phage_integrase HMM profile; E-value:4.40e-29; + i-Evalue:9.70e-29]" mobile_element 1..26439 /mobile_element_type="other: integrative and conjugative element" - /note="ICEscreen prediction: Putative ICE (one integrase - + /note="ICEscreen prediction: Putative ICE (one integrase Tyr) [Element structure: Single; ICE superfamily: Tn916; - ICE family: ICESt3; Relaxase family: MOBT; Coupling protein - family: TcpA] (ICEscreen ID: 2)" + ICE family: ICESt3; Relaxase family: - (MOBT); Coupling + protein family: TcpA] (ICEscreen ID: ID_1)" /color=15 ORIGIN 1 atgttaaaaa aattatttag atatagagga aggcgtattc gttattcttc aagaaacctg
--- a/test-data/NC_004668_137848_164286_icescreen.gff Sat Apr 02 21:04:43 2022 +0000 +++ b/test-data/NC_004668_137848_164286_icescreen.gff Tue Feb 28 14:10:26 2023 +0000 @@ -1,3 +1,7 @@ ##gff-version 3 -##sequence-region NC_004668.1 1 26439 -NC_004668.1 ICEscreen CDS 1 1511 .+ 1 origid=WP_002359295.1;function=Coupling Protein;protein_id=WP_002359295.1;locus_tag=EF_RS00630;codon_start=1;color=6;Note=ICEscreen prediction%3A Coupling protein%3B BlastP result %28Annotation confidence%3A HIGH%29%3A Coupling protein TcpA %5BHit with AAO80014%3B Identity%3A100.00%25%3B E-value%3A0%3B Query coverage%3A100.00%25%5D%3B Hmmscan result%3A TcpA %5BHit with tcpA HMM profile%3B E-value%3A0%3B i-Evalue%3A0%5DNC_004668.1 ICEscreen CDS 3098 4380 .+ 1 origid=WP_002359299.1;function=Relaxase;protein_id=WP_002359299.1;locus_tag=EF_RS00650;codon_start=1;color=7;Note=ICEscreen prediction%3A Relaxase%3B BlastP result %28Annotation confidence%3A HIGH%29%3A Relaxase MOBT %28PF02486%29 %5BHit with AAO80018%3B Identity%3A99.77%25%3B E-value%3A0%3B Query coverage%3A95.53%25%5D%3B Hmmscan result%3A MOBT %5BHit with T4SS_MOBT HMM profile%3B E-value%3A0%3B i-Evalue%3A0%5DNC_004668.1 ICEscreen CDS 17920 20426 .+ 1 origid=WP_002359320.1;function=VirB4;protein_id=WP_002359320.1;locus_tag=EF_RS00720;codon_start=1;color=184 134 11;Note=ICEscreen prediction%3A VirB4%3B BlastP result %28Annotation confidence%3A HIGH%29%3A VirB4 %5BHit with CAE52368%3B Identity%3A41.15%25%3B E-value%3A0%3B Query coverage%3A99.76%25%5D%3B Hmmscan result%3A VirB4 %5BHit with T4SS_virb4 HMM profile%3B E-value%3A0%3B i-Evalue%3A0%5DNC_004668.1 ICEscreen CDS 25273 26438 .+ 1 origid=WP_002392915.1;function=Tyrosine Integrase;protein_id=WP_002392915.1;locus_tag=EF_RS00760;codon_start=1;color=8;Note=ICEscreen prediction%3A Tyrosine integrase%3B BlastP result %28Annotation confidence%3A HIGH%29%3A Tyrosine integrase %5BHit with AAO80040%3B Identity%3A100.00%25%3B E-value%3A0%3B Query coverage%3A100.00%25%5D%3B Hmmscan result%3A Tyrosine integrase %5BHit with Phage_integrase HMM profile%3B E-value%3A0%3B i-Evalue%3A0%5DNC_004668.1 ICEscreen mobile_element 1 26439 .+ . mobile_element_type=other%3A integrative and conjugative element;Note=ICEscreen prediction%3A Putative ICE %28one integrase - Tyr%29 %5BElement structure%3A Single%3B ICE superfamily%3A Tn916%3B ICE family%3A ICESt3%3B Relaxase family%3A MOBT%3B Coupling protein family%3A TcpA%5D %28ICEscreen ID%3A 2%29;color=15 \ No newline at end of file +##sequence-region NC_004668.1 1 0 +NC_004668.1 ICEscreen CDS 1 1512 .+ 1 origid=EF_RS00630;function=Coupling Protein;protein_id=WP_002359295.1;locus_tag=EF_RS00630;codon_start=1;color=6;Note=ICEscreen prediction%3A Coupling protein%3B BlastP result %28Annotation confidence%3A HIGH%29%3A Coupling protein TcpA %5BHit with AAO80014%3B Identity%3A100.00%25%3B E-value%3A0.00e%2B00%3B Query coverage%3A100.00%25%5D%3B Hmmscan result%3A TcpA %5BHit with tcpA HMM profile%3B E-value%3A7.00e-94%3B i-Evalue%3A8.80e-94%5D +NC_004668.1 ICEscreen CDS 3098 4381 .+ 1 origid=EF_RS00650;function=Relaxase;protein_id=WP_002359299.1;locus_tag=EF_RS00650;codon_start=1;color=7;Note=ICEscreen prediction%3A Relaxase%3B BlastP result %28Annotation confidence%3A HIGH%29%3A Relaxase MOBT %28PF02486%29 %5BHit with AAO80018%3B Identity%3A99.77%25%3B E-value%3A0.00e%2B00%3B Query coverage%3A95.53%25%5D%3B Hmmscan result%3A MOBT %5BHit with T4SS_MOBT HMM profile%3B E-value%3A3.00e-128%3B i-Evalue%3A3.40e-128%5D +NC_004668.1 ICEscreen CDS 17920 20427 .+ 1 origid=EF_RS00720;function=VirB4;protein_id=WP_002359320.1;locus_tag=EF_RS00720;codon_start=1;color=184 134 11;Note=ICEscreen prediction%3A VirB4%3B BlastP result %28Annotation confidence%3A HIGH%29%3A VirB4 %5BHit with CAE52368%3B Identity%3A41.15%25%3B E-value%3A0.00e%2B00%3B Query coverage%3A99.76%25%5D%3B Hmmscan result%3A VirB4 %5BHit with T4SS_virb4 HMM profile%3B E-value%3A1.80e-28%3B i-Evalue%3A2.40e-28%5D +NC_004668.1 ICEscreen CDS 25273 26439 .+ 1 origid=EF_RS00760;function=Tyrosine Integrase;protein_id=WP_002392915.1;locus_tag=EF_RS00760;codon_start=1;color=8;Note=ICEscreen prediction%3A Tyrosine integrase%3B BlastP result %28Annotation confidence%3A HIGH%29%3A Tyrosine integrase %5BHit with AAO80040%3B Identity%3A100.00%25%3B E-value%3A0.00e%2B00%3B Query coverage%3A100.00%25%5D%3B Hmmscan result%3A Tyrosine integrase %5BHit with Phage_integrase HMM profile%3B E-value%3A4.40e-29%3B i-Evalue%3A9.70e-29%5D +NC_004668.1 ICEscreen mobile_element 1 26439 .+ . mobile_element_type=other%3A integrative and conjugative element;Note=ICEscreen prediction%3A Putative ICE %28one integrase Tyr%29 %5BElement structure%3A Single%3B ICE superfamily%3A Tn916%3B ICE family%3A ICESt3%3B Relaxase family%3A - %28MOBT%29%3B Coupling protein family%3A TcpA%5D %28ICEscreen ID%3A ID_1%29;color=15
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/NC_013798_298468_322494_NC_020450_643089_661957_detected_ME.summary Tue Feb 28 14:10:26 2023 +0000 @@ -0,0 +1,82 @@ + +##################### Main parameters of the ICEscreen analysis ##################### +Maximum distance in CDS between consecutive SPs within a segments: 100 +Maximum distance in CDS between consecutive SPs within an IME element: 14 + + +##################### ICEscreen statistics for genome accession NC_013798.1 ##################### + +##### Mobile elements ##### +## Number of complete elements +Complete ICE (4 types of SP): 1 +Complete IME (R+I, R+C+I with distance between consecutive SPs <= 14 CDSs): 0 +## Number of complete modules +Conjugation module (R+C+V): 0 +Mobilizable element (R+C with distance between consecutive SPs <= 14 CDS): 0 +## Number of partial elements +Partial ICE (at least V): 0 +Other partial element (R+C, R+V, V+C with distance between consecutive SPs > 14 CDS): 0 +## Composite elements +Total nested elements (partial or complete): 0 +Host element: 0 +Guest element: 0 +Element that are both host and guest: 0 + +##### Signature proteins ##### +## Total SPs detected +Total SPs: 4 +Total Integrase: 1 +Total Relaxase: 1 +Total Coupling protein: 1 +Total VirB4: 1 +## Unassigned SPs +Unassigned SPs: 0 +Unassigned Integrase: 0 +Unassigned Relaxase: 0 +Unassigned Coupling protein: 0 +Unassigned VirB4: 0 + +##### Segments ##### +Number of segments with one element: 1 +Number of segments with several elements: 0 +Number of segments with nested elements: 0 +Number of segments with exclusively isolated SPs to manually verify: 0 + +##################### ICEscreen statistics for genome accession NC_020450.1 ##################### + +##### Mobile elements ##### +## Number of complete elements +Complete ICE (4 types of SP): 1 +Complete IME (R+I, R+C+I with distance between consecutive SPs <= 14 CDSs): 0 +## Number of complete modules +Conjugation module (R+C+V): 0 +Mobilizable element (R+C with distance between consecutive SPs <= 14 CDS): 0 +## Number of partial elements +Partial ICE (at least V): 0 +Other partial element (R+C, R+V, V+C with distance between consecutive SPs > 14 CDS): 0 +## Composite elements +Total nested elements (partial or complete): 0 +Host element: 0 +Guest element: 0 +Element that are both host and guest: 0 + +##### Signature proteins ##### +## Total SPs detected +Total SPs: 4 +Total Integrase: 1 +Total Relaxase: 1 +Total Coupling protein: 1 +Total VirB4: 1 +## Unassigned SPs +Unassigned SPs: 0 +Unassigned Integrase: 0 +Unassigned Relaxase: 0 +Unassigned Coupling protein: 0 +Unassigned VirB4: 0 + +##### Segments ##### +Number of segments with one element: 1 +Number of segments with several elements: 0 +Number of segments with nested elements: 0 +Number of segments with exclusively isolated SPs to manually verify: 0 +
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/NC_013798_298468_322494_NC_020450_643089_661957_detected_ME.tsv Tue Feb 28 14:10:26 2023 +0000 @@ -0,0 +1,3 @@ +ICE_IME_id Segment_number Genome_accession Category_of_element Category_of_integrase Host_ICE_IME_ids Guest_ICE_IME_ids Colocalized_ICE_IME_ids ICEline_format ICE_consensus_superfamily_SP_conj_module ICE_consensus_family_SP_conj_module IME_relaxase_family_domains_blast HMM_family_SP_conj_module Integrase_upstream Integrase_downstream Relaxase Coupling_protein VirB4 List_SP_ordered_genomic_position Other_potential_SP_conj_module_need_manual_curation_and_review Other_potential_integrase_need_manual_curation_and_review Comments_regarding_structure +ID_1 1 NC_013798.1 Complete ICE (V+C+R+D) one integrase DDE - - - V8.C7.R2.D Tn5252 TnGBS2 - C:VirD4, R:MOBP, V:VirB4 - GALLO_RS01755 GALLO_RS01740 GALLO_RS01695 GALLO_RS01650 GALLO_RS01650, GALLO_RS01695, GALLO_RS01740, GALLO_RS01755 - - Downstream integrase GALLO_RS01755 has been associated to the structure ID_1 pre-merging because it is adjacent to the conj module and there is no upstream/downstream ambiguity. +ID_2 2 NC_020450.1 Complete ICE (C+R+V+I) one integrase Tyr - - - C1.R1:V5.I Tn916 - - C:TcpA, R:MOBT, V:VirB4 - LILO_RS03350 LILO_RS03260 LILO_RS03250 LILO_RS03320 LILO_RS03250, LILO_RS03260, LILO_RS03320, LILO_RS03350 - - Downstream integrase LILO_RS03350 has been associated to the structure ID_2 pre-merging because it is adjacent to the conj module and there is no upstream/downstream ambiguity.
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/genbank/NC_013798_298468_322494_NC_020450_643089_661957.gb Tue Feb 28 14:10:26 2023 +0000 @@ -0,0 +1,1732 @@ +LOCUS NC_013798 24027 bp DNA linear CON 24-DEC-2022 +DEFINITION Streptococcus gallolyticus UCN34, complete sequence. +ACCESSION NC_013798 REGION: 298468..322494 +VERSION NC_013798.1 +DBLINK BioProject: PRJNA224116 + BioSample: SAMEA2272396 + Assembly: GCF_000027185.1 +KEYWORDS RefSeq; complete genome. +SOURCE Streptococcus gallolyticus UCN34 + ORGANISM Streptococcus gallolyticus UCN34 + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 + AUTHORS Rusniok,C., Couve,E., Da Cunha,V., El Gana,R., Zidane,N., + Bouchier,C., Poyart,C., Leclercq,R., Trieu-Cuot,P. and Glaser,P. + TITLE Genome sequence of Streptococcus gallolyticus: insights into its + adaptation to the bovine rumen and its ability to cause + endocarditis + JOURNAL J Bacteriol 192 (8), 2266-2276 (2010) + PUBMED 20139183 +REFERENCE 2 (bases 1 to 24027) + AUTHORS Rusniok,C. + TITLE Direct Submission + JOURNAL Submitted (23-NOV-2009) Rusniok C., Unite de Biologie des Bacteries + Intracellulaires, Institut Pasteur, 25, 28 rue du Docteur Roux, + 75015, FRANCE +COMMENT REFSEQ INFORMATION: The reference sequence is identical to + FN597254.1. + The annotation was added by the NCBI Prokaryotic Genome Annotation + Pipeline (PGAP). Information about PGAP can be found here: + https://www.ncbi.nlm.nih.gov/genome/annotation_prok/ + + ##Genome-Annotation-Data-START## + Annotation Provider :: NCBI RefSeq + Annotation Date :: 12/24/2022 01:57:52 + Annotation Pipeline :: NCBI Prokaryotic Genome + Annotation Pipeline (PGAP) + Annotation Method :: Best-placed reference protein + set; GeneMarkS-2+ + Annotation Software revision :: 6.4 + Features Annotated :: Gene; CDS; rRNA; tRNA; ncRNA + Genes (total) :: 2,343 + CDSs (total) :: 2,250 + Genes (coding) :: 2,234 + CDSs (with protein) :: 2,234 + Genes (RNA) :: 93 + rRNAs :: 6, 6, 6 (5S, 16S, 23S) + complete rRNAs :: 6, 6, 6 (5S, 16S, 23S) + tRNAs :: 71 + ncRNAs :: 4 + Pseudo Genes (total) :: 16 + CDSs (without protein) :: 16 + Pseudo Genes (ambiguous residues) :: 0 of 16 + Pseudo Genes (frameshifted) :: 11 of 16 + Pseudo Genes (incomplete) :: 6 of 16 + Pseudo Genes (internal stop) :: 5 of 16 + Pseudo Genes (multiple problems) :: 5 of 16 + CRISPR Arrays :: 2 + ##Genome-Annotation-Data-END## + COMPLETENESS: full length. +FEATURES Location/Qualifiers + source 1..24027 + /organism="Streptococcus gallolyticus UCN34" + /mol_type="genomic DNA" + /strain="UCN34" + /sub_species="gallolyticus" + /db_xref="taxon:637909" + gene <1..24 + /locus_tag="GALLO_RS01645" + /old_locus_tag="GALLO_0278" + CDS <1..24 + /locus_tag="GALLO_RS01645" + /old_locus_tag="GALLO_0278" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_001037290.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="PrgI family protein" + /protein_id="WP_012961395.1" + /translation="MNKLGSEFFKAIDQFERSIIGGFTWRQIIMMLGIVVGAGLAALI + TMFKLPSILFYLSLTLTIVPSFVYGIKKDEVIKERLLFKFKIQERSYQTEYESEEING + KYIPEKGVHEWNDLD" + gene 2..2362 + /locus_tag="GALLO_RS01650" + /old_locus_tag="GALLO_0279" + CDS 2..2362 + /locus_tag="GALLO_RS01650" + /old_locus_tag="GALLO_0279" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_001014604.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="ATP-binding protein" + /protein_id="WP_044555479.1" + /translation="MSGTTLTKEDKERAKQLKKALKASTQNTIKYTSLFEDGLMHIDG + EEYSKTWELGDANYLTADEEEKLDIIDYYVEALNGLDSDNTYQLLIINRPVPSTLLSQ + ITYEVEGDNRDIFRQEYNDMITARFATDQNNFKVEKFVTVSTQSRDRKQAYRKLNDVD + NHFKKQFQVVDIPFKSLNGTDRLNIFADLLRGNPYLNVDYKDVRISDLTTKSFIAPGR + ILFQEDQFLMDKQYCRVLFARSFPAFLNDRLVKSITDIGIELAITIHAKPYDVAEAVK + KVNTAEAGVKMDMVKSQAAAAEKGISSNLAVSSVAQATAEEAEKWKTEINDNDQKMFS + GVFAVMLKADTPEELADYTSRVKQAGRKHVVEFEEIYYHQEEALNTMLPIGKTYLDVK + RRFMRDLTTTNIATQIPFTNTDLQSNSPLANYYGQNQISNNIITLDRQRDLATASGVI + LGSSGSGKSVFVKTNEVIPAILRFPNDRVIIVDPEEEYVDIGRAFDAQVIDIYPGTKT + HFNLMDIPDQDKLRDEDKDFVGQKSSLIMGLFENILQEVTDDDISLIDRVTRLCYEQI + TDRTPTLKDWHDILLEQPEEEAQSLALKSESYTKGSQDIFAYETNVDLNKQVVIFNLK + KLSGKLKPFALMVIQDYIWQHVVEHKGEFVTRAYFDEMQYQFETEDQATFFTNMYARI + RKYGSIPTGITQSVETLLDRKEGRNLLYNSEFIVLLKQKKTTIPYLLKTINLTDALIR + YVEKPKAKGTGLIIAGEIAVPFENPIPENTELFRLVATDAYRKIEE" + gene 2364..2957 + /locus_tag="GALLO_RS01655" + /old_locus_tag="GALLO_0280" + CDS 2364..2957 + /locus_tag="GALLO_RS01655" + /old_locus_tag="GALLO_0280" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_017794877.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_012961397.1" + /translation="MFEDVTLKLSKKKEKELLAHYNTKIQDAIEKTFEDKEFYKPMVR + MSGLCRWLDVSTTTVVKWQKEGMPHMVIDGVTLYDKRKILKWLNHFERNKIISQENQM + KVLPGYLSIKHVFGTIITYPKEVVLDLIEDLRETDVQDFSYWSPLYFLEYDELGCPVY + LTYLVNEVGIAMHPNRYYYVTLTEEQEKALESLELSI" + gene 2972..3220 + /locus_tag="GALLO_RS01660" + /old_locus_tag="GALLO_0281" + CDS 2972..3220 + /locus_tag="GALLO_RS01660" + /old_locus_tag="GALLO_0281" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_017647992.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_012961398.1" + /translation="MNLKDFETIFQQQTKARNKRILIVLGIFFSVITAKHIFGLIITS + ILSLAFIVDFVWLRYKKRKKWLETDTKAIAAKRRVESE" + gene 3259..5958 + /locus_tag="GALLO_RS01665" + /old_locus_tag="GALLO_0282" + CDS 3259..5958 + /locus_tag="GALLO_RS01665" + /old_locus_tag="GALLO_0282" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_000066069.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="phage tail tip lysozyme" + /protein_id="WP_012961399.1" + /translation="MSDKNDLRKRVVRNRHIKESVQRHNQLSARKAQKAAKAEYQKAK + TNLKKAEEALNKAKEELKTADLSDKEKAEKLKELEANVKKAKAEVKAAKKVKKKVRKT + NPTVGQRARKTGRNIGKTVSREVLTTALTQDDTLSDAVKLKRQARQTAITMKHAGRAT + AKGTKLAYRGAKGTVKLSVKATKYTYKGARKGTQKATQATAKVAAKTAQGFVTVAKSA + ASAATTLLANPITWIVSGVVALVLFLVIIVSSIFSSNVAQQTEFSLNQSWLHISQVDR + KNSSDQVDYYTDIDSILLYMNYRYGGDWEPDAKWDDGTGGKLAGTLGFNHFSDALDDI + WKEENKDIGNLKTMAELYTNGKEWLKLDDDDLAEYKEILESQSETGKYLAYQELSNPF + YAADDDKSETEYLTISKRYGYTDKDTIDPTSTLQASSGQKLYATMDGKVTVTTKDLKG + NETETTNVIITDSDARFIYYNIASIRVKTGDKVEAGTELGIVSGSSQKIAYVKKYGEV + DPKDSQWLQDIKDKDVSYGYTEKTTKNKTNVWVFVNPGFYFPFVKYSQTTVVTKTSSE + MSGRAKQFYDLVKKYYPNATDNGIAAVVGNFAVESSITAKRAEGDYLSPPVGASDGCW + DDETWLNMGGTEIYGGGYPNILHRGLGLGQWTDTSDGGTRHTMLINYANAIGKKWYEL + ETQVRFMLEGDSPYYQNILKSVLTSNADTDSLTKSFLTKWEGINNGTLSQRQSYAKQA + LSWFHQSIAGGGTLASSWDFPEEYRDKIKSMPTTASMTTQAGSGYKVGQCTWYAYNRL + VELGEITDLSGSYGHLGNGQDWVRNLVAKGWHYSTTPSVGAVCSTAGGFDSTYAIYGH + VMIVEAVNDDGSFLVSECNYAGNQSQIHWRVCQNASYYTFATP" + gene 5975..6592 + /locus_tag="GALLO_RS01670" + /old_locus_tag="GALLO_0284" + /pseudo + CDS 5975..6592 + /locus_tag="GALLO_RS01670" + /old_locus_tag="GALLO_0284" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_017794862.1" + /note="internal stop; Derived by automated computational + analysis using gene prediction method: Protein Homology." + /pseudo + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + gene 6576..6788 + /locus_tag="GALLO_RS11895" + /old_locus_tag="GALLO_0285" + CDS 6576..6788 + /locus_tag="GALLO_RS11895" + /old_locus_tag="GALLO_0285" + /inference="COORDINATES: protein motif:HMM:NF012651.2" + /GO_function="GO:0003697 - single-stranded DNA binding + [Evidence IEA]" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="single-stranded DNA-binding protein" + /protein_id="WP_012961400.1" + /translation="MSLTAKGDTLQVTGRLQTRTYKDKKEVTHKVTELQVDKWYLVGV + SQTQGDYPVKEKTIIKDSDNLDKLSL" + gene 6807..7082 + /locus_tag="GALLO_RS01680" + /old_locus_tag="GALLO_0286" + CDS 6807..7082 + /locus_tag="GALLO_RS01680" + /old_locus_tag="GALLO_0286" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_014295369.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_012961401.1" + /translation="MTEETYTTEQQTSKASRRQKSTSERLMAKQNQLAKAKASQAVMQ + KKIKGLEEEIKILENKRQQEILQEYGMSLSDLEAFLANNKDKLGGDA" + gene 7082..7912 + /locus_tag="GALLO_RS01685" + /old_locus_tag="GALLO_0287" + CDS 7082..7912 + /locus_tag="GALLO_RS01685" + /old_locus_tag="GALLO_0287" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_003030379.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_012961402.1" + /translation="MFRIQNLGTGQEQEFPNRAALLLGLEGEENRCLQLNQIATFQVF + HLDKNQEVLESMELTIPSSGSEDVKMLLGDFGLKKEESRAFWKRGRQKPKQEEQSKDR + SHPVKKVIVKEKAPKPSNLSKSQTASTLFGRGLKALVLVITLLLSCVSLWVSLSAREE + KQKSTAKTVQVTIDQKADVFCRYFIGNYFANSSAREDFVSKSLDLDQMTVEKATTLSV + LLESQTAQQTTTTLTYVISCRYDDETTENKRLTLTVKQNKEAKYGYLVTKLPQLTAYP + " + gene 7931..8425 + /locus_tag="GALLO_RS01690" + /old_locus_tag="GALLO_0288" + CDS 7931..8425 + /locus_tag="GALLO_RS01690" + /old_locus_tag="GALLO_0288" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_000371894.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="DUF3801 domain-containing protein" + /protein_id="WP_012961403.1" + /translation="MEQEQILDRGARVTLDTGRQLFQFLAYAAGQLYKVYDERKLTGK + QSYKNFFNQNSLTKDHIDFLEADVNLKKFTKELEKSGVRFAFKDNSDGTKQVWFEAHN + REVIADALRQTLNEIINDPKKAKEKYMKSEKELTPKEQITKIKEATKEKVDTVKAKKK + GKSI" + gene 8425..10455 + /locus_tag="GALLO_RS01695" + /old_locus_tag="GALLO_0289" + CDS 8425..10455 + /locus_tag="GALLO_RS01695" + /old_locus_tag="GALLO_0289" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_013851992.1" + /GO_component="GO:0016020 - membrane [Evidence IEA]" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="type IV secretory system conjugative DNA + transfer family protein" + /protein_id="WP_012961404.1" + /translation="MTYQKKPFIPYLLLSFVLAFCTHRAYVLYSLAPAPDMSDLFGQY + TYVLDHYFDRPIFYLDTSPLALLAALVGFFIGMLFYLKIKPGGTYRHGEEAGSARFAT + AQELSGFKDSEPTNNMIFSKQAQMGLFNKLLPFQWQLNKNVVVVGLPGDGKTFTYVKP + NLMQMNSSFIVTDPKGLLVREVGSMLEKHGYQVKVFDLVNLTNSDMFNPFHYMTSELD + IDRITEAIVEGTKKGDREGEDFWNQAKLLLNRALIGYLYFDSQVRDYTPNLSMVSELL + RNMKRPNEKEPSPVEKMFDELEAAMPGNYACRQWDLFNSNFEAETRTSVLAIVATQYS + IFDHEAVTDLIKADTMEMETWNTEKTAVFVAISETNKAYSFLASTLFTVMFDQLTHTA + DAIIQGQKEGYTTDELIHVQFIFDEFANIGKIPHFNEVLASVRSREMSVKIIIQAISQ + LDTIYGDKARKSIINNCATLLFLGTNDEDTMRYFSMRAGKQTITQNSYSEQRGQRVSG + TTSIQSHQRDLMTPDEIARIGVDEALVFISKQNVFRDKKAMVSDHPMKDELSNHPTDG + KWYAYRRFMVEDPEFFNAVYQGKISAENIWYPDMADYGEFVKENPFVESSQQATEGLV + DEQVPVQMAETTSESQSQTPPTHLRTVDLETGELFELPPEEEDETDDYYGEV" + gene 10865..11608 + /locus_tag="GALLO_RS01700" + /old_locus_tag="GALLO_0290" + CDS 10865..11608 + /locus_tag="GALLO_RS01700" + /old_locus_tag="GALLO_0290" + /inference="COORDINATES: ab initio + prediction:GeneMarkS-2+" + /note="Derived by automated computational analysis using + gene prediction method: GeneMarkS-2+." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_012961405.1" + /translation="MYDYFDFYGLWIEQLTILQKEGLSQWIENDDFFLFDFLYDLDGI + SFDCGNHYNCSLKFELNDKCYRNSQCHGIVLPLPTQPQLMNTAYSSVDDIVRDLKAAY + GQYLPKDFDYKANICHAQASMWEFGPDNDFKKNDEPIKQELPMFVIDGYHAISSKIGL + MIEYPEKILKDIFDLTEEDLSKSTRLSPLYEVSDSSKEKIYQYFLVDNMGLPLSNDSI + YWIKLSDKDDHLLKKVLIDLTSWISFKYS" + gene 11685..12038 + /locus_tag="GALLO_RS01705" + /old_locus_tag="GALLO_0291" + CDS 11685..12038 + /locus_tag="GALLO_RS01705" + /old_locus_tag="GALLO_0291" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_006739176.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_012961406.1" + /translation="MTIYELDPNFFVNLGKTAPYKVTEIIGKDHPDNFLTPGEEKSFL + ILDKEKAWIVHADSLVSVAEELEGYLGMSVDDFIMISLGTQYHKRFCFNDDYEIWERY + FTKLREAYYSDSSSK" + gene 12092..12574 + /locus_tag="GALLO_RS01710" + /old_locus_tag="GALLO_0292" + CDS 12092..12574 + /locus_tag="GALLO_RS01710" + /old_locus_tag="GALLO_0292" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_001202059.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_012961407.1" + /translation="MTKVLKKLIEENLSPLGIVELIDERYDKFGGYYLLYSLSLTAIT + PEFSESGTVDIEVSFSDYQELTYELGKYSIPFYVNSKEELKCLLEGIVDLPLPFSVSY + EPIKEVTWDRYIVSIDGVKTTRIIELVTMIKVLEDYLSQIEPLLNQNVLKIMKNRENN + " + gene 12609..14345 + /locus_tag="GALLO_RS01715" + /old_locus_tag="GALLO_0293" + CDS 12609..14345 + /locus_tag="GALLO_RS01715" + /old_locus_tag="GALLO_0293" + /EC_number="5.6.2.-" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_017768605.1" + /GO_function="GO:0003677 - DNA binding [Evidence IEA]; + GO:0003916 - DNA topoisomerase activity [Evidence IEA]" + /GO_process="GO:0006265 - DNA topological change [Evidence + IEA]" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="DNA topoisomerase" + /protein_id="WP_052828722.1" + /translation="MKYLLLAEKPDQAKKYATALGNPKNEKGVWRVQSSVLNAEVIVA + PAVGHLVERINPYTNFENWEMTNLPALPEGFSYEPKKDTIKRFNAIKKAVKEVDAIII + GTDPDREGEAIAYRILELIPEALRKIKYRLWANSLTKRGLEQAFANLRSPTDSINYFH + EADARSDADWLVGFNLSPFVTIKMKEEGYLDKKDHSMSVGRVQTPIVSLIVRNDEAIE + NFKPSPYWRLKLIDSEAEVIFSNDIKYQSQMEAEQVLQQLANTAVVKTVTSEEKAQEA + PKLYNLTNLQSEMSKLYHFDATKTKELVQSLYQKGYLSYPRTDSTLITTNEFSYLVDH + IEEYQKAINKQLETPNRSPRKNYVNDKKVLEHYAIIPTENIPDLSELSDDEKLIYQKA + VFRTLLMFTPDYRYQSTSVILDNHGLEFKATGTVTKDKGWRGYFAVKKEDKELPHYQE + GQEVIVDCNLLEEMTKPPTRITEQILLKKLLPKYHLGTSATRDGMIDLIQDKGYVTKH + KKTGQFFPTERGKLLIHYLDQLEIAYTNPETTGKWEEVLAQIGQGKIQKEAFVNKIKW + AITKQIEKGKQL" + gene 14398..18747 + /locus_tag="GALLO_RS01720" + /old_locus_tag="GALLO_0294" + CDS 14398..18747 + /locus_tag="GALLO_RS01720" + /old_locus_tag="GALLO_0294" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_000002618.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="PBECR4 domain-containing protein" + /protein_id="WP_012961409.1" + /translation="MANMQELLSQRFEAQRQKLVSMDIVAVAESLGMTLKPGSSGTYY + WEEHDSFHIYPNTNTFRWWSRSIGTNTIDLVQVVQEEMTGHKPSFREAAAFLETGHFE + NVTVQPIVKEPFEYYLERYEHPDFNIGRQYLKEERGLSDETIDTFLASGNMATATRKK + GDYFEPVIVFKSCDNDGKMIGASLQGLVENRVQHPERGRLKQIMKNSEGTAGFSLDVG + TPKRLVFAEAPIDLMSYYEVNKDDLQDVKLVAMDGLKKGVISRYVADMLTDGKYSQTM + SAEQIRGALDALNQTTNLLQEHSDMITLAVDNDEAGQNFVKGLQDDGIPVIPDLPPRQ + PAQKKMDWNDYLKQMKKESAQMAETPEVEKQSLSELQESLSNEGDLVSTITSDSSIIY + TNTVSFNQDYNLNLEIHSPNEVDNLSDIQAPWTLEVMKKGQSLGYLAYGEDWGNDFDI + EDELVNLENWVKDNQVTNHLYTQKDINAFLASTQEVEPKMGDFVLKGGGIYDFGKSQL + EGEELRQHAIDAMISDITDAETYYLWHDEELEKLNAPDEAFLNFHYHLQDIQYNQNDI + HLYVSESSTDGVTGYLSLDGNSLDSDSIEEYLADQDWTFNQKVQFLKNLKTAVDDTWN + KVTDHYNEQFNAIVDQYGLSLQKEKTPEVPQEQESANSEQQKKVENPIGDLPEQSQEA + APLPNTHEEYSLNESSPTQTQSQPLLHFNISNPDKSIYKVGYHPVNRKELNKLNRYAA + QIQENATWYKNELADSNVTYFYKNNDNLEALKVTFKAEQYPHLIGFFAIDENQSASKT + LDDLASGKGDYQNIMVANRGATFSKIQVLPDFKAVVDSNSFIFDDLSEVERMNRLDLA + KAIRTEDKDVLIAFRNVDGEYLPASLMKVTNKLESELSIANNKDVLGIVGEKNGEFKV + LSVNEEIIKDGGKKMLSIVKNNQFENLSKAEVTAEDFTKVLDAVYNVGAQVGKDNRAN + IPKELYPAWDKYYEYAERYDNNFDVIVKAARADNLFDENSDFYKDVWLRKIQEENQKV + KDSDGDGLTDDEEIALGTNPYSPDTDGDSVIDSIERGSGTDATNPSDTPDNRQKEQMK + HNLTLSEMIKAKDTVALNQHLQEGIKDYFDSDTYKNYLEGMAHFNHYSARNIQLIKAQ + LPEATMVASFEEWKKRNGHVNKGEKALYVQAPVTVIKKDADGNPVINSETGEKETFTY + FKPVPVFDISQISPQQGKQLNLPKSSEAIPAQLNKDYYQNVYRALRDISQKENGIPIR + FRELEQFDGFYNPKTNDITIKKGMTYEQTLSTLIHEMAHSELHNKKSLTERFEGKLTR + SSKELQAESVAYVVSNHLGFDTSNDSFAYLASWSQEPDGLENLKAQLEIVQEEASSLM + NRIDKQLTKYQTLTVSKDETLTETQKRNLEKSANPFYQSLQKAKAEVNNMKKGDEPNN + EQTVKKDNRPTKC" + gene 18796..19089 + /locus_tag="GALLO_RS01725" + /old_locus_tag="GALLO_0295" + CDS 18796..19089 + /locus_tag="GALLO_RS01725" + /old_locus_tag="GALLO_0295" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_000255675.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_012961410.1" + /translation="MITDEMMTITEMILMSYYFDMSEWLKGNKIINSDIVQKSKDDLL + DVLKTDFEQLTTEDNNDYLDDLSISIGTLEELSEDNYQKLKTAIFSWEPSKKK" + gene 19402..19776 + /locus_tag="GALLO_RS01735" + /old_locus_tag="GALLO_0296" + CDS 19402..19776 + /locus_tag="GALLO_RS01735" + /old_locus_tag="GALLO_0296" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_000436063.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="plasmid mobilization relaxosome protein MobC" + /protein_id="WP_012961411.1" + /translation="MTIKRRKRPIEFKLRTTDEEAFQLRQRITMANKKTFQGYALEML + LKGKIETYDYSELQRLRVEVNHIGQNVNQLVRYVNTFDEIDSELFKALQAEIDEMKVL + LIDEFKTKGRAKLNGGDKSNPD" + gene 19748..21367 + /locus_tag="GALLO_RS01740" + /old_locus_tag="GALLO_0297" + CDS 19748..21367 + /locus_tag="GALLO_RS01740" + /old_locus_tag="GALLO_0297" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_008090066.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="relaxase/mobilization nuclease domain-containing + protein" + /protein_id="WP_012961412.1" + /translation="MVVTKVIQIKSSRNLKRAINYITRDNATLKLDSERLEGDDNYSY + EMVNGQVMKRLVSGHDVTDISDPQTIYDDFVLLKQSVDALYNNDELSDLKNDKRVLAH + HIIQSFSPEDGLTPEEVNEIGRKTALELTGGDYQFVVATHMDKGHLHNHIIFNTTNEV + TLKKFRWQKGTKKSLEHISDKYAELYGAKVLEPRLRNSHTDYSAWRRKNNFRFEIKER + LNFLLKHSLDMTDFLQKAKTLNLQVDTSGKYIKYKLLDQPQERFVRDRTLSKKGKFSL + EKIKEQIATNEVVYDLNVIKEKYDEEQESKQDDFEMQLTIEPWQIEQLTHQSIYVPIT + FGLDRKGTVSIPARMLDQNEDGTFTAYLKKNDFFYFLNTDHSEQNRFIKGVTLIKQLS + AQNGEMILTKNKNITNLDRLVDEFNFLAANNVTNSKQFENLQQQFLEQLDETDKTLAA + LGDKIFYLNKLLGALSDYQNNIVPSEVSLDLLEKGKIDKTMKLDELQKEIKELQIERD + TLKKHRDKIVKDYDFTKEIKQTHEKRTGISL" + gene 21472..21660 + /locus_tag="GALLO_RS01745" + /old_locus_tag="GALLO_0298" + CDS 21472..21660 + /locus_tag="GALLO_RS01745" + /old_locus_tag="GALLO_0298" + /inference="COORDINATES: ab initio + prediction:GeneMarkS-2+" + /note="Derived by automated computational analysis using + gene prediction method: GeneMarkS-2+." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_012961413.1" + /translation="MATNKEQIKNSGKCLFVETTTKLSSDELLKAIADDNMTEEQVEQ + LKIDLDIFLKQRAAAFKE" + gene 21688..22395 + /locus_tag="GALLO_RS01750" + /old_locus_tag="GALLO_0299" + CDS 21688..22395 + /locus_tag="GALLO_RS01750" + /old_locus_tag="GALLO_0299" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_013643517.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="class A sortase" + /protein_id="WP_148211633.1" + /translation="MKLLKGLLLVLLLLIGVALIFNKSIRNTLIAWNTNQYQVSQVSK + QTIEQNKDANVSYDFDSVESISTESVLKAQTNSANLPVIGGVAIPEVGINLPIFKGLG + NTELTYGAGTMKENQVMGSGNYALASHHVFGLTGSSQMLFSPLENVKTGMKIYLTDKE + TVYTYIVTSIESVAPSQVAVIDDTEETEVTLVTCTDAEATSRTIVKGVYDSEVSFDQA + PEDILDAFNTAYNQIAL" + gene 22686..24026 + /locus_tag="GALLO_RS01755" + /old_locus_tag="GALLO_0300" + CDS 22686..24026 + /locus_tag="GALLO_RS01755" + /old_locus_tag="GALLO_0300" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_006531843.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="UPF0236 family protein" + /protein_id="WP_044555481.1" + /translation="MVVMRFDERGFVEELYRQREYEFLKRVAAYDKQIAPTMRANGYK + RVDSSERTVLFTFGAMTFSRSRWRRGTKTRYPVDEWLGLKKYMRCSLELMYHLVRYAS + EMSYRQVCRMIKLSYHLDITKDTVLKAVKLTGQLFSEKSHYRYFVEEEVSEKIKAPVI + YIEGDGVLVKTNTGGDEKHNTDLAHFLVHTGTKIVHGRTVLLNKHEIIHTDYEVARDE + LLDYLYNHFEITNQTILVTNSDNGKGYTRRVFQNIQKALKIKRHEHFWDAHHVKEKIT + SFFKSYPKILKDLMFKAIQTHNRKLLKTVLDTVESLVTDDEEYLVFQKFRKKFLNNFK + DTKPAKLRGLSHKGIGVMESQHCKVTFRMKHRGMYWSIKGACAMARLILLERIDQLEN + LFFGNWRKDYQYYKDNQLGVGYLRESKADHSPTPQRIFKRAGKIMSLDRQKFKY" +ORIGIN + 1 catgagtgga acgaccttga ctaaagaaga caaagagcgg gcaaagcagc tcaaaaaagc + 61 gttaaaggct agcacccaaa atacgattaa atacacctct ttatttgaag atgggctcat + 121 gcatattgac ggggaagagt attctaaaac ttgggaactt ggtgatgcga attacctaac + 181 ggcggacgag gaggaaaaac ttgatattat cgactattat gttgaagctt tgaatggttt + 241 ggatagtgat aatacctatc agctgctgat tattaatcgt cctgtaccct caaccctttt + 301 aagtcaaatt acctatgagg tagaaggcga taatcgtgat atctttcgtc aagaatataa + 361 cgatatgatt accgctcgtt ttgcgacaga tcaaaataat tttaaggttg aaaaatttgt + 421 cacggtctct acacaatcgc gagatcgaaa gcaagcctac cgtaaattaa atgacgttga + 481 caatcacttt aagaaacaat ttcaagtcgt tgacatcccc tttaagtcat taaatggaac + 541 tgaccgctta aatatttttg ctgatttact tcgtgggaat ccttatctga acgttgatta + 601 taaagatgtc cgtattagtg atttaaccac aaaatccttt attgctcctg gacgaatctt + 661 gtttcaagag gatcaatttc tgatggataa acagtattgc agggttcttt ttgctagaag + 721 ttttcctgct tttttaaatg atcgcttagt caagtctatt acagatattg gaattgaact + 781 agccattacg attcatgcga agccttatga tgtcgcagaa gctgttaaaa aagtgaatac + 841 ggctgaagca ggtgtcaaaa tggatatggt taagtcacaa gctgcggcag cggagaaagg + 901 tatctcaagt aatctagctg tttcgagtgt ggctcaagct accgctgaag aagctgaaaa + 961 atggaaaaca gaaatcaatg acaatgacca gaaaatgttc tctggtgtct ttgcagtcat + 1021 gcttaaggcc gatacaccag aagaattagc tgattatacc agtcgtgtca aacaggcagg + 1081 ccgaaaacat gtggttgaat ttgaagaaat ctattatcat caagaagaag ccttaaatac + 1141 catgttaccg attggtaaaa cgtaccttga tgtcaaacgt cgctttatgc gtgatttgac + 1201 cacaacaaat attgcaactc aaatcccatt taccaacacg gacttacaaa gtaacagtcc + 1261 attagctaat tattacggtc agaatcaaat ttcgaataac attatcactc ttgaccgcca + 1321 acgtgattta gcaaccgctt caggagttat tctagggtca tctggctcag gaaagtctgt + 1381 ctttgttaaa acaaatgaag tcattccagc gattttaaga tttcctaatg atcgtgtcat + 1441 catcgttgac cctgaagaag aatatgtcga tatcggtcgt gcctttgatg ctcaagtcat + 1501 tgatatctat ccagggacta aaacgcattt taatctcatg gatattcctg atcaagataa + 1561 actacgcgat gaagacaaag actttgtcgg tcaaaaatca tctctcatca tgggcttatt + 1621 tgaaaatatt cttcaagagg tgaccgacga tgatatctct ctgattgacc gtgtgactcg + 1681 tctttgttat gaacagatta ctgatcgaac accaacccta aaggattggc atgatattct + 1741 tctagagcag cctgaagagg aagctcaaag tcttgcgctt aaatcagaat cgtacaccaa + 1801 aggctcacag gatatttttg cttatgaaac gaatgtcgat ttaaataagc aagttgttat + 1861 tttcaacttg aaaaaattaa gtggtaaatt aaaacctttt gcactgatgg tcattcagga + 1921 ttatatttgg caacatgtgg tagaacacaa aggtgagttc gtcactagag catactttga + 1981 tgagatgcag tatcaatttg aaactgaaga ccaagctact ttctttacga atatgtatgc + 2041 tcgtatccgt aaatatggct ctattccaac aggtatcacc caaagcgttg aaactctact + 2101 agatcgtaaa gaaggtcgaa acttgctcta taatagtgaa tttattgttc tcttaaaaca + 2161 aaagaaaaca acgatacctt atctactaaa gacgatcaat cttaccgacg cccttattcg + 2221 ctatgttgaa aagccaaaag cgaaaggaac tggcttaatt attgcgggtg agatagcagt + 2281 accatttgag aatccaattc ctgagaacac tgaattgttc aggttggttg ctaccgatgc + 2341 ttatagaaag atagaggaat aaaatgtttg aagatgttac tttaaagtta tctaaaaaaa + 2401 aggaaaaaga gttattagct cattataata ctaaaataca ggatgctatt gaaaaaacct + 2461 ttgaagacaa ggaattttat aagccaatgg ttcgcatgtc tggtttatgt cgttggctag + 2521 atgtttcgac aactactgtt gttaaatggc aaaaagaagg tatgccccat atggtcattg + 2581 atggagtaac tttatacgat aaacgaaaaa ttttaaaatg gttaaatcat tttgaaagaa + 2641 ataaaattat ttctcaagaa aatcagatga aagttttacc tggctactta tcaattaagc + 2701 atgtatttgg gacaattatt acttatccta aggaagttgt tcttgattta attgaagatc + 2761 ttagagaaac tgatgttcaa gatttttctt attggtcacc actatatttt ttagaatatg + 2821 atgaactagg atgccctgtt tatttaactt atctagtaaa tgaagttggt attgcgatgc + 2881 atccaaatcg ttattactac gttacattga cagaggaaca agagaaggca ctggaaagtt + 2941 tagaattatc tatttaaaaa gaggtattgt tatgaactta aaagattttg agactatttt + 3001 tcaacaacaa actaaagcta gaaataaaag aattttgata gttttaggta tcttttttag + 3061 tgtcataacc gctaagcata tatttggttt aattattact agcatattgt cactggcatt + 3121 catagttgat tttgtttggc tacgctataa gaagcgtaag aaatggctgg aaacagatac + 3181 taaagcaata gcagcaaaac gtagagttga aagtgaatag aaatgcttaa aagaaatata + 3241 cctgaaaggg ggtgaaccat gtcagataaa aatgatttaa gaaagcgtgt ggtgagaaat + 3301 cgtcacatta aagaaagtgt tcaacgtcac aatcagctat ctgctcgaaa agcccaaaag + 3361 gcagcgaaag cagagtatca aaaagcaaaa acaaatctca aaaaagctga ggaagcttta + 3421 aataaagcta aagaagagtt aaaaacggct gatttgtcag ataaagaaaa agctgaaaag + 3481 ctcaaagagt tagaggctaa tgtcaaaaaa gctaaagctg aagtgaaggc tgctaagaag + 3541 gtcaagaaga aggttcggaa aacaaatcct acagttggtc aaagagctcg aaaaacaggt + 3601 agaaatattg gtaaaacggt tagtcgtgaa gtgttaacaa ccgctctgac acaagatgat + 3661 actctttcgg atgccgttaa gttaaaacgt caagcacgcc aaaccgcaat cacaatgaaa + 3721 cacgcaggcc gagcgactgc taaaggaacg aaattagctt atcgtggtgc caaaggaacg + 3781 gttaagttgt ctgtcaaagc taccaaatac acttacaaag gggctaggaa aggcacgcaa + 3841 aaagcgacgc aagctaccgc aaaagtagcc gctaaaacgg ctcaggggtt tgtgacagtt + 3901 gctaaaagtg cggcaagtgc cgcaacgact ttgctggcaa acccaattac ttggattgtt + 3961 agtggcgttg tagccctggt gcttttttta gttattatcg tttcctcaat cttttcaagt + 4021 aacgttgccc aacaaaccga atttagccta aatcagtcgt ggcttcacat ctctcaagtg + 4081 gatcgaaaga actcttctga ccaagtagac tactacaccg acattgattc cattttactt + 4141 tacatgaact accgttatgg tggtgactgg gaacctgatg caaaatggga tgatggtaca + 4201 ggtggaaaac tagcaggtac tcttggcttc aatcactttt cagatgcttt agatgatatt + 4261 tggaaagaag aaaataagga tattggtaac ctaaaaacca tggcggaact ttacactaat + 4321 ggtaaggagt ggctgaaact agatgacgat gatttagctg aatataagga aattcttgaa + 4381 agtcaatctg aaacaggaaa atatttagct tatcaagaat taagcaatcc tttttacgca + 4441 gctgatgatg acaaaagtga aacggagtat ttaacgattt caaagcgtta tgggtacacg + 4501 gataaggata ctattgatcc tacaagtacc ttacaagctt catcaggaca aaaactttat + 4561 gccactatgg atggaaaggt caccgtcaca acaaaagact taaaaggtaa tgaaacagag + 4621 acgactaatg tgattattac agatagcgat gctcggttta tctattataa tattgctagt + 4681 atccgagtca aaacaggtga taaagtcgaa gcaggaactg aacttggaat tgtttcaggt + 4741 agttctcaaa agatagccta tgttaaaaaa tatggtgagg ttgatcctaa agattctcag + 4801 tggttacaag acatcaagga caaagacgtt tcctatggct acaccgaaaa aacaacaaag + 4861 aataagacta atgtctgggt gttcgttaac ccaggctttt attttccctt tgtaaaatat + 4921 agccaaacca ctgtggtgac caaaacatct tctgaaatga gtggtcgagc gaaacagttt + 4981 tatgatttag tgaaaaaata ttacccaaat gcgacggata acggtattgc ggctgttgtt + 5041 ggtaactttg cggtggagtc ctcaattaca gcgaaacgtg ctgaaggcga ttatttaagt + 5101 ccgcctgttg gtgcatctga tggttgctgg gatgatgaaa cttggttaaa tatgggcggt + 5161 acagaaatct acggtggtgg ctaccctaat attcttcatc gaggacttgg cttaggtcaa + 5221 tggacggaca cctctgacgg tgggactcgt cataccatgt taatcaatta tgcaaatgct + 5281 attggcaaaa aatggtatga attggaaacg caagtccgat tcatgttgga aggtgattca + 5341 ccttattatc aaaatatatt gaagagtgtt ttaacttcta atgctgatac agatagcctt + 5401 accaaaagtt tcttaacgaa atgggaaggg atcaacaatg gtacactttc tcaacggcaa + 5461 agctatgcca aacaagcctt atcttggttc caccaatcaa ttgcaggtgg tgggacatta + 5521 gcttcctctt gggattttcc tgaagaatac cgagataaaa tcaaaagcat gccaaccact + 5581 gcaagcatga ccacacaagc aggtagtggt tataaagtgg ggcaatgcac ctggtatgct + 5641 tataaccgtt tggtagaact cggcgaaatc acagacctat caggaagtta tggtcatcta + 5701 ggaaatggtc aggattgggt gaggaattta gttgcgaaag gttggcatta ttcaacgaca + 5761 ccatctgtag gagccgtttg ctcaaccgct ggtggttttg acagcactta cgctatttac + 5821 ggacatgtca tgattgtcga agcggttaat gatgatggta gcttcttagt ttcggaatgc + 5881 aattatgcag gaaatcaatc ccaaattcac tggcgagttt gtcaaaacgc ttcttactat + 5941 acatttgcga caccatagaa aggaaaagaa atcaatgata gatacgaata aactgacctg + 6001 gtataaacgt ctttttttag tgattggctt tattattgtt tttctcatcg gcttaggatt + 6061 cggtcaaatg gggaaaacga atcaaaaaca agtgacaaca cctaagacaa cgaccaaaaa + 6121 ggtaacagca ggtagttaat tgacggaaaa gtgggtcaaa aagttcttaa ttgcttacta + 6181 taccaaaaaa gatttggaag agaaccgcaa tcgttataaa gaatatatga ctgaaggcat + 6241 gtataatgcg acgatttctg aagaagaaac cgcccaaaac caagcctata aaggctatgt + 6301 ggttaatttt gaatttcagt cagcccaaat ttatatcgat caaaccaatg aaaaagtcat + 6361 ttgctacgtg aattacacga atgaccttct tcaggaaaaa gattccagtg aaggcgcaca + 6421 aacagatgtt agcaacacaa caattatcca actaacctac agtaaagtgg ataaaacgta + 6481 tcttgttaat aatatgagta ctctgttaat cacagattct caagacccaa ccagttcaca + 6541 agaagcttat ggcgatgtga ttgcgagtaa ttttggtgag cctaaccgct aaaggagata + 6601 ccttacaagt cacaggacgc ctacaaacac gaacctataa ggataaaaaa gaagtgactc + 6661 acaaagtgac agaacttcag gttgacaaat ggtaccttgt tggtgttagc caaactcaag + 6721 gtgattatcc tgttaaagaa aaaacgatta tcaaggatag tgataacttg gataagttat + 6781 cactttaaaa cgaaaggaaa cagaatatga ctgaagaaac atatacaact gagcaacaga + 6841 cttcaaaagc ttcacgtcgt caaaaatcaa cgagtgagcg tttaatggct aaacagaacc + 6901 agttagcaaa agcaaaagcc tcacaagctg ttatgcaaaa gaaaattaaa ggcttggaag + 6961 aagagattaa gattctcgaa aataaacggc aacaagaaat tttacaagaa tatgggatga + 7021 gcctttcgga tttggaagct tttctagcta ataacaaaga taaattaggg ggtgatgcgt + 7081 aatgtttcgc atccaaaatt taggaacagg acaagaacaa gaatttccaa accgagcagc + 7141 tcttttattg ggattggaag gtgaagaaaa tcggtgttta cagttaaacc aaattgcaac + 7201 ctttcaagtc tttcaccttg ataaaaatca agaagtatta gagtcaatgg aactgaccat + 7261 tccctcatct ggcagtgagg atgtcaaaat gcttttgggt gattttggac tcaaaaaaga + 7321 ggaaagcagg gccttttgga agcgtggtcg tcagaagcca aaacaagaag aacagtctaa + 7381 agatcgttct catccagtca aaaaggttat tgtaaaagaa aaagccccta agccatctaa + 7441 cttatcaaaa agtcaaacag ctagcacact ttttggaagg ggacttaagg cactcgtatt + 7501 agtgattact ttgttactgt cttgtgtgag cctgtgggtc tctttaagcg caagagaaga + 7561 aaaacaaaag tctacggcca aaacagtgca agtcacgatt gatcagaagg cagatgtgtt + 7621 ttgtcgttat tttattggta actattttgc caattcctca gctcgtgagg atttcgtgtc + 7681 gaaatcactg gatcttgacc aaatgacagt tgagaaagct actacgctta gtgtgttact + 7741 ggaaagccaa accgcacagc aaacgacaac aactttgacg tatgtgattt cgtgtcgcta + 7801 tgatgatgag acgaccgaaa ataaacgctt aacattaacg gttaaacaaa ataaggaagc + 7861 taaatatggt tatctagtga ctaaactacc acagttaacc gcttatcctt aagtaggagg + 7921 aaaaaacgtt atggaacaag aacaaatctt agatagaggc gcccgtgtga cgttagatac + 7981 gggaagacaa ctgtttcaat ttttagctta tgcagcaggt cagttatata aagtttatga + 8041 tgaacgcaaa ttaactggga agcagtccta taaaaacttt ttcaatcaga actcactgac + 8101 gaaagatcat atcgatttct tagaagcaga tgtcaacctt aaaaaattta ccaaagagct + 8161 cgaaaaatca ggggtacgtt ttgcttttaa agataatagt gatggcacga aacaggtttg + 8221 gtttgaagcg cacaatagag aagttatcgc tgatgcgctt cgccaaacgc ttaatgagat + 8281 tatcaatgat cctaaaaaag ctaaagaaaa atacatgaaa tctgaaaagg agttaacacc + 8341 aaaagaacag attaccaaaa tcaaggaagc cactaaggaa aaagtggata cggttaaagc + 8401 gaaaaagaaa ggaaagagta tttgatgacc tatcaaaaga aaccattcat tccttatctt + 8461 cttctcagtt ttgttttagc tttttgtaca cacagggcat atgtcttata tagtttagct + 8521 cctgcccctg acatgtctga tctatttggt caatatacct acgttttaga tcattatttt + 8581 gatcgaccaa ttttttatct tgatacgagt ccactagcgc ttttagcagc tttagtgggc + 8641 ttttttattg gcatgctatt ttatttgaaa attaaaccag gtggtactta tcgccatggt + 8701 gaagaagctg ggtcagctcg ctttgcgact gctcaagaac tttctggttt taaagattcc + 8761 gaaccaacca acaacatgat tttttcaaaa caagcccaga tggggctatt taataagtta + 8821 ttaccctttc aatggcaact gaataaaaat gtcgtcgtgg taggtcttcc tggcgatggg + 8881 aagaccttta cttatgtaaa gcctaatttg atgcaaatga attccagttt tatcgtaact + 8941 gaccctaaag gactcttagt tcgtgaggtt ggaagtatgc ttgaaaaaca tggctatcaa + 9001 gtaaaagtct ttgaccttgt caatctcacc aattcagata tgttcaatcc ttttcattac + 9061 atgacgtctg aactagatat tgatcgtatc acggaagcga ttgttgaagg cactaaaaaa + 9121 ggtgatcgtg aaggcgaaga cttttggaat caagcgaaac tacttcttaa tcgggcttta + 9181 attggttacc tctattttga tagtcaagtt agggattata cccctaactt gtcaatggtt + 9241 tctgagcttc ttcgaaacat gaaacgtcca aatgaaaaag aaccaagtcc agttgaaaag + 9301 atgtttgatg agcttgaagc agccatgcca ggaaattatg cttgtcggca atgggatctg + 9361 tttaacagta actttgaagc agaaacaagg acgagtgttc tagccattgt tgctacccaa + 9421 tactctatct ttgaccatga agctgtcaca gatttgatta aagctgatac gatggagatg + 9481 gaaacatgga acactgaaaa aacagcagtc tttgtggcta tttcagaaac gaataaagct + 9541 tatagctttt tagcctctac tttatttaca gttatgtttg accaactaac acacactgca + 9601 gatgcgatta tccaaggaca aaaagagggg tacacgactg atgagttaat acacgtgcaa + 9661 ttcatttttg atgagtttgc gaacattggt aaaattcctc attttaatga agtcttggct + 9721 tctgttcgta gtcgtgaaat gtcggtcaaa attatcattc aggccattag tcagctagac + 9781 acgatttatg gcgataaggc tcgaaaatcg attatcaaca actgtgcaac cttgttattt + 9841 ttagggacta acgatgaaga tactatgcgg tacttttcaa tgcgtgcagg aaaacaaacg + 9901 attacgcaaa acagttattc tgaacagcga gggcaacgtg tttcaggaac aacaagtatt + 9961 caatctcatc agcgggattt aatgacacct gatgagattg ctcgtattgg ggttgatgag + 10021 gctctggtct ttatttccaa acaaaatgtt tttcgggata aaaaagcaat ggttagcgac + 10081 catcctatga aagatgagtt atctaatcat ccaaccgatg gcaagtggta tgcttatcgt + 10141 cggttcatgg tagaagaccc agaattcttt aatgcggttt atcaagggaa aatctcagct + 10201 gagaatattt ggtatccaga tatggcagat tacggtgagt ttgtgaaaga aaatccgttt + 10261 gttgagagtt ctcagcaagc cacagagggt cttgttgatg aacaagtacc cgttcaaatg + 10321 gctgaaacga cctcagaaag ccaatctcag acaccaccaa ctcacttaag gacagtagat + 10381 cttgaaacag gtgaactctt tgaattacca cctgaagaag aggacgaaac tgatgattat + 10441 tatggtgaag tctaacgtca aatgagttat aataacttag ggaggttaac atgacaagag + 10501 aaaagcaaag caaagctctt tttttaaaat acttggcatt tcagaagacg acttattaag + 10561 ttatctgaag gaacatccta acgaccctct agttagtaaa ctagagcaat tattattaaa + 10621 cttatcagct aaaaaatagg ctacatcgtt aaacggtgta gcttttgttg tatgtatatg + 10681 gaggaaaaat agatggaaca aaaatattat gcggtactaa tgcaaatcaa tattggtaag + 10741 agcgtctggt tagtccctca agaaagtggg aaactagcct ggtcatttaa ttagaaatta + 10801 tttttatgct gcagttaatt ttagcaatta gctgtttttt agttacagaa aggattttat + 10861 tattatgtat gactatttcg atttttatgg cctttggata gaacagctta ctatcctaca + 10921 aaaagaagga ctgtctcaat ggatagaaaa cgatgacttc ttcctttttg actttttata + 10981 cgacttagat ggtatttcgt ttgactgtgg caatcattat aattgttctc tcaaatttga + 11041 actaaacgat aaatgttatc gtaacagtca atgtcatggg attgtattac cattaccaac + 11101 ccaacctcaa ctcatgaata ccgcttattc atccgtggac gatattgtac gagacttaaa + 11161 agcagcatat ggtcaatatt taccgaaaga ttttgattat aaagctaata tttgtcatgc + 11221 acaagcttcg atgtgggagt ttggtcctga taatgatttc aagaagaatg atgagcccat + 11281 taagcaagag ttaccaatgt ttgtaattga cgggtatcat gctatttcct caaaaattgg + 11341 tcttatgata gaatatccag aaaagatttt aaaggatatt tttgatttaa ctgaggaaga + 11401 cttaagcaag tcaacaagac tttctccatt atatgaagta agtgatagta gtaaagaaaa + 11461 gatataccag tattttttgg tagataacat gggtttacct ttaagcaatg atagtattta + 11521 ttggataaaa ttatcagata aagatgacca cttgttgaaa aaagttctga ttgatctgac + 11581 ttcatggatt tcatttaaat atagctagct gctcgttaat ttcagagagc tcactcatca + 11641 agaatgactt gattttgaaa taatcgtaaa ggtgaactaa aaagatgact atttatgaat + 11701 tagatcctaa tttttttgta aacttaggta aaacagcacc ttacaaggtg acagaaataa + 11761 tcgggaaaga tcacccagat aattttttaa ctcctggtga ggaaaaaagt ttccttatat + 11821 tggataaaga aaaagcatgg attgttcatg cagactcctt ggtatccgta gctgaggaat + 11881 tagaaggtta tttaggaatg tctgtagacg attttatcat gatttcactt ggaacacagt + 11941 atcataagcg tttttgcttt aatgacgatt acgagatttg ggagagatac tttacgaaat + 12001 taagagaagc ttattactct gactcatcct caaagtaaaa atttcttaac aagttggaat + 12061 catagagtag acagatgaaa gaagaattga tatgacaaaa gtacttaaaa aattgataga + 12121 agaaaactta tcacctctag gaattgtaga gttgattgat gaacgatatg ataagtttgg + 12181 gggatattat ttattatata gtctctcatt gactgctatc accccagaat tttcagaatc + 12241 aggaactgtc gatattgaag ttagttttag cgattatcag gagctgactt acgagttggg + 12301 caaatattct atcccctttt atgttaacag taaagaagaa ctgaagtgct tattggaggg + 12361 aatagtagat cttccactcc ctttttcagt tagttatgaa ccaattaagg aggtaacatg + 12421 ggataggtat atagttagta ttgatggggt taaaaccaca cggataattg aacttgttac + 12481 aatgataaaa gtcttagaag attacctcag tcaaattgaa ccgttactga atcaaaatgt + 12541 tttaaagata atgaagaata gggaaaataa ttagctgctt ttcatttaca gagaggatgg + 12601 tgagttcatt gaaataccta ttactggcag aaaagccaga tcaagccaaa aaatatgcga + 12661 ccgctttggg gaatcctaaa aatgagaaag gcgtttggcg tgttcagtcg tctgtattaa + 12721 atgctgaagt cattgttgct ccagctgtcg gtcatttagt tgaacgaatt aatccatata + 12781 ctaactttga aaattgggag atgactaatc ttcctgcttt gccagaaggc ttttcttatg + 12841 agcctaaaaa ggatactatt aaacggttta atgctatcaa aaaagccgtt aaagaagtag + 12901 atgccattat tattggtact gaccctgacc gtgaaggaga agccattgct tatcggattt + 12961 tagaattaat cccagaggca ttaagaaaga ttaagtatcg tttatgggca aattctttaa + 13021 cgaaaagagg attagaacaa gcttttgcta acttaagaag ccctactgac tccattaact + 13081 attttcatga ggcggacgct agaagtgatg cagactggct ggttgggttt aatttgagtc + 13141 cttttgtaac catcaaaatg aaagaagagg gttacctgga taaaaaggat cattctatgt + 13201 cagttggacg tgtacaaaca cctattgtta gtctaattgt tagaaatgat gaagcgattg + 13261 aaaactttaa accaagtcct tattggcggc taaaacttat tgattctgaa gctgaagtta + 13321 tatttagcaa tgatattaag tatcaatccc aaatggaagc tgaacaagtc ctacaacagt + 13381 tggccaatac agctgttgtc aagacggtta cgagtgaaga aaaggcacaa gaagcgccaa + 13441 aactttataa tctaaccaat ttacaatcag aaatgagtaa actatatcat tttgatgcca + 13501 ctaaaaccaa agaattggtt caaagtctgt atcaaaaagg gtatctttct tatccacgta + 13561 ccgattcaac cttgattaca accaatgagt tttcttatct ggttgatcat atcgaagagt + 13621 atcaaaaagc tattaataaa caactagaga cccctaatcg atcaccaagg aaaaactatg + 13681 tgaatgataa gaaagtgcta gaacactatg ctattattcc aactgagaat attcctgatt + 13741 tgagtgaatt aagtgatgat gaaaagctca tttatcaaaa agcggtcttt agaactttgc + 13801 tgatgtttac gcctgattat cgttaccaat caacaagtgt tattctcgat aatcatggac + 13861 ttgaatttaa agcaacaggt accgtaacga aggataaagg ttggcgtggg tatttcgcag + 13921 tcaaaaaaga agacaaagag ttacctcatt accaggaggg gcaagaggtg attgtcgatt + 13981 gtaacctttt agaagaaatg accaagccac caacacgaat caccgagcaa attctactaa + 14041 agaaattatt accaaaatac catttaggga cgtccgcaac tcgtgatggg atgattgatt + 14101 taattcagga taaaggatac gtcactaaac ataaaaaaac agggcaattt ttcccaactg + 14161 aaagaggaaa actattaatc cactatcttg accaactaga gattgcttat actaatcctg + 14221 aaacaacagg aaaatgggaa gaagtcttag ctcaaattgg tcaaggaaaa attcaaaaag + 14281 aagcctttgt caacaaaatc aaatgggcga ttaccaaaca aattgaaaaa ggcaaacaac + 14341 tttaaacgct actatttagt taacatagta gcgctttttt atggaaagga gtaacgaatg + 14401 gcaaatatgc aagaattgct ttcgcaacgg tttgaagctc aaaggcaaaa actcgttagc + 14461 atggatattg tggcagttgc ggaatcttta ggaatgacac taaaaccagg ttccagtggt + 14521 acctattatt gggaagaaca tgatagcttt catatctacc ctaatacgaa tacgttccgc + 14581 tggtggtcaa gaagtattgg cacaaatact attgacctgg ttcaagtggt acaagaagaa + 14641 atgacaggtc ataaaccaag ttttagagaa gcagcagcct ttcttgaaac tggtcacttt + 14701 gagaatgtaa cagtacaacc aattgtgaaa gaaccttttg agtattatct agagcgctat + 14761 gagcaccctg attttaatat tgggagacag tatctgaaag aagaacgtgg tttgtctgat + 14821 gaaacaattg atacgttttt agcgtcaggc aatatggcaa ctgcaacacg taaaaaaggg + 14881 gattattttg aacctgtaat tgtttttaaa agctgtgaca atgacgggaa aatgattggc + 14941 gccagtctgc aagggcttgt tgaaaatcgt gtacagcatc ctgaacgagg acggcttaag + 15001 caaattatga agaattcgga gggaactgca ggctttagtt tagatgttgg aactcctaaa + 15061 cggttagtct ttgcggaagc cccaatcgat ttaatgtcct attatgaggt caacaaagac + 15121 gacttacaag atgttaagct tgtggctatg gatggtctga aaaagggcgt tattagtcgt + 15181 tatgtcgctg atatgctaac ggatggtaaa tactctcaaa ccatgtcagc tgaacaaatt + 15241 agaggtgctt tggatgcgtt aaatcagacc actaatctgt tacaagagca ttcagatatg + 15301 attacgctag cagttgataa tgatgaggca ggtcaaaatt ttgttaaagg cttgcaggat + 15361 gatggtattc ctgtgatacc agatttacca ccacgtcaac cagctcaaaa gaaaatggat + 15421 tggaacgatt atcttaaaca aatgaagaaa gagagcgcac aaatggcaga aacaccagaa + 15481 gtagaaaaac aatcactttc tgagctccaa gaaagcttat caaacgaagg tgatttagtt + 15541 agtaccatta caagtgatag cagtattatt tatacgaata cagtaagttt taaccaagat + 15601 tataacctta atttagagat tcatagtcct aatgaagtag ataatctctc agatattcaa + 15661 gcaccttgga cacttgaagt tatgaagaaa ggtcagtcac ttggctatct tgcttatggt + 15721 gaagattggg gcaatgattt tgatattgaa gatgagttag ttaatcttga aaattgggtt + 15781 aaagacaacc aagttactaa tcatttatat actcaaaaag atattaatgc gtttttagct + 15841 agcacacaag aggttgagcc caaaatgggt gactttgtcc ttaaaggtgg tggtatttat + 15901 gatttcggaa agagtcagct tgaaggagaa gaattacgtc aacatgccat tgatgcaatg + 15961 atttctgata ttacagatgc tgaaacctat tacctttggc acgatgaaga gttagaaaaa + 16021 ctaaatgcac ccgacgaagc tttcttgaat ttccattacc atttacaaga tattcaatac + 16081 aaccaaaatg atattcatct ttatgtgtca gaatcatcaa ctgatggtgt tacaggttat + 16141 ctttcactag acggaaattc tcttgatagt gatagtattg aagagtattt agctgatcaa + 16201 gattggacgt ttaatcaaaa agtacagttt cttaagaatt taaaaactgc agttgatgat + 16261 acctggaata aagttactga ccattataat gaacaattta atgcaatcgt tgaccagtat + 16321 gggttatctt tacaaaaaga aaaaactccc gaagtacctc aagagcaaga aagtgctaat + 16381 tcagagcaac aaaaaaaggt tgagaaccca atcggggatt tacctgagca aagtcaggag + 16441 gcagcacctc tacctaatac tcacgaagag tactctttga atgagtcgtc accgactcaa + 16501 actcagtctc aacctttact tcattttaac atttctaatc cagataagtc aatttataag + 16561 gtcggttatc atccagtcaa tagaaaagag ttaaacaaat taaatcgcta tgcagcccaa + 16621 attcaagaaa atgcaacctg gtataagaac gaattggctg atagtaatgt cacttatttt + 16681 tataaaaata acgataatct agaagcttta aaggttactt ttaaagcaga gcagtaccca + 16741 catctcatag gtttctttgc aattgatgaa aatcaaagcg caagtaaaac cttggatgat + 16801 ttagcatctg ggaaaggaga ttatcaaaat attatggttg ccaaccgagg ggctaccttt + 16861 agtaaaattc aagtattacc tgattttaaa gctgttgttg attcaaatag ctttattttt + 16921 gatgatttat cagaagtaga acgcatgaat cgtcttgact tagcaaaggc tattcgaaca + 16981 gaggataagg atgttttgat tgcttttaga aatgttgatg gtgagtatct tcctgcatct + 17041 cttatgaaag ttactaataa gcttgagtca gagttgtcaa tcgcaaataa taaagacgtt + 17101 ttaggtattg ttggtgagaa aaatggagag tttaaagttc tttcagtcaa tgaagaaatt + 17161 atcaaagatg gtggtaaaaa aatgttatca attgtaaaaa ataaccaatt tgaaaatctt + 17221 tctaaagcag aagtgactgc tgaagacttt actaaagttt tagatgctgt ttacaatgtt + 17281 ggtgctcaag ttggtaaaga taacagagct aatattccca aagaattgta tccagcttgg + 17341 gataaatact atgaatatgc tgaaagatat gataacaatt ttgatgttat tgttaaagca + 17401 gcaagagcag ataatctctt tgatgaaaat tctgattttt ataaagatgt ctggcttcga + 17461 aaaattcaag aagaaaatca gaaagtaaaa gattctgatg gcgatggtct aaccgatgat + 17521 gaagaaatcg cattaggaac aaatccttat agtccagata ctgatggtga cagtgtcata + 17581 gatagtattg aaagaggaag tggaacagat gcgacgaatc cttctgatac accagacaat + 17641 cgacaaaaag aacaaatgaa acacaactta accttgtcgg aaatgattaa agctaaagat + 17701 accgttgctc ttaatcagca cttgcaagaa gggattaaag attactttga tagtgatacc + 17761 tataaaaatt atttggaagg tatggcacac ttcaatcact attctgctcg taacattcaa + 17821 ttgataaaag cacaattgcc agaggcaaca atggtcgctt cttttgaaga atggaaaaag + 17881 agaaatggtc atgttaacaa gggtgaaaaa gctctatatg ttcaagcacc agtaactgtg + 17941 attaaaaaag atgctgacgg taaccctgtc atcaattcag aaactggtga aaaagaaact + 18001 ttcacttact ttaaacccgt tcctgttttt gatattagcc aaatttctcc tcagcaaggc + 18061 aaacagctta acctgcccaa atcatctgaa gcaattcctg cccaacttaa taaagattat + 18121 tatcaaaatg tttatcgagc gctaagagat atctcccaaa aagaaaatgg tattcccatt + 18181 cgttttagag aactagagca attcgatggt ttctacaatc ctaaaacaaa tgatattacg + 18241 atcaaaaaag ggatgaccta tgaacaaacc ctttcaacac taattcatga aatggcacat + 18301 tctgaattac acaacaagaa gagtttgaca gaacgttttg aaggtaaact aacacgttct + 18361 tcaaaagaac tacaagctga atcagtcgct tatgttgtgt caaaccattt agggtttgat + 18421 actagtaacg attcgtttgc ttatcttgct tcttggtcgc aagaaccaga cggattagaa + 18481 aatctaaaag ctcaacttga aattgttcaa gaagaagcta gttcactgat gaaccgcatt + 18541 gataagcagt taactaaata ccaaacgttg acggtttcaa aagatgaaac gttaaccgaa + 18601 actcaaaaac gtaacttaga gaagtcagca aatccctttt atcaaagttt gcaaaaagcc + 18661 aaagccgaag ttaacaacat gaaaaaaggt gatgaaccta acaatgagca aaccgtaaaa + 18721 aaagacaatc gacctacgaa gtgttaacac agcgtaggtc acgtcgaaaa caactaaccc + 18781 cacaaggagg acaatatgat aacagacgaa atgatgacga taactgaaat gatattaatg + 18841 agttattact ttgatatgag cgaatggctc aaaggaaata aaatcattaa tagtgatatc + 18901 gttcaaaaat caaaagatga tttattggat gtgcttaaaa ctgattttga acaactcaca + 18961 accgaagata ataacgatta tcttgatgac ctctcaatca gtattggcac tcttgaagag + 19021 ttgtcagaag ataactacca aaaattaaaa acagctattt tttcttggga gccaagcaag + 19081 aaaaaataaa aatcgtaaaa gaaggtggct gacaattgtt caattgtcag tttttctttt + 19141 gttgcatttt accaaaatgc aagtatcaaa aatggtcatt tttgaaaaat gcacatcgtg + 19201 cgagaaaagg ggtttgggga tttccccaaa atgtaaaaag tcaaaagtcg gtttgtaggg + 19261 tttctgcaaa ctggcttatt gaccttttta ttttcgcaag tggtgcccca cttgctacgc + 19321 ttgccagagt aaaagtaggt ctggcctaag gcttagctga agagctgaca ttataacaaa + 19381 ttgtatagaa tggagagaat aatgacgata aaaagacgca aacgtccaat tgaatttaag + 19441 cttagaacaa ctgatgaaga agcgtttcaa ttacgccaac ggataacaat ggctaataag + 19501 aaaacctttc aaggctatgc gttagagatg ttgttgaaag gcaaaattga aacctatgat + 19561 tattcagaat tacaacggtt gcgagtagaa gttaatcata ttggtcaaaa cgttaaccag + 19621 ttagtgcgtt atgtgaatac gtttgatgag attgatagtg aattgtttaa agctttacaa + 19681 gctgaaattg atgagatgaa agtattgctc attgatgaat ttaaaacgaa aggtcgggca + 19741 aaattaaatg gtggtgacaa aagtaatcca gattaaaagc agtcgtaact taaaacgggc + 19801 aattaattat attacacgtg ataatgcaac attgaaatta gatagcgaac gtttagaagg + 19861 tgatgacaat tattcttatg agatggtcaa tggtcaagtg atgaaacggt tggtatctgg + 19921 tcatgatgtc accgatattt cagatccaca aacaatttat gatgattttg ttttgttaaa + 19981 acaatctgtt gatgctcttt ataataacga tgagctatcc gatttgaaaa atgataaacg + 20041 tgttttagca caccatatca ttcaatcgtt ttcgccagaa gatggcttaa ccccagaaga + 20101 ggttaacgag attggacgaa aaaccgcttt agagttaacg ggaggtgatt atcaatttgt + 20161 cgttgcaaca catatggata aagggcattt gcataatcat attattttta acacaacgaa + 20221 tgaagtgact ctgaaaaagt ttcgttggca aaaaggaacc aaaaagagtt tagaacatat + 20281 ttcagataag tatgctgagc tttatggtgc aaaagtttta gaaccgagac ttagaaattc + 20341 tcacacagat tattcggcat ggcgccgaaa aaataatttt cggtttgaga ttaaagaacg + 20401 attgaatttt ttgttaaagc actctttaga tatgactgac tttttacaaa aagccaaaac + 20461 tttaaattta caagttgata cgagtggtaa atatattaaa tacaaattac ttgaccagcc + 20521 acaagagcgt tttgttcgtg accgtacgtt atcaaaaaaa ggaaagttct cacttgaaaa + 20581 aatcaaagaa caaattgcaa caaacgaagt tgtttatgat ttaaacgtca taaaagaaaa + 20641 atatgatgaa gagcaagaaa gtaaacaaga tgattttgaa atgcagctca ccattgaacc + 20701 atggcaaatt gaacaactca ctcatcagtc aatttatgtt cccattactt ttggtttaga + 20761 tcgaaaagga acggtttcca ttcctgcacg gatgttagac caaaatgaag atggaacgtt + 20821 tacggcttat ctcaagaaaa atgatttctt ttatttttta aatacagatc attcggaaca + 20881 aaatcgtttt attaaaggag tcactttaat caaacagtta tcggctcaaa atggtgaaat + 20941 gattttaaca aaaaataaaa atatcactaa cctagatagg ttagttgatg aatttaactt + 21001 tttagcagca aacaacgtta ccaattcaaa acaatttgaa aatctgcaac aacaattttt + 21061 agagcagctg gatgagacgg ataaaacttt agccgcactg ggtgataaga ttttttatct + 21121 taataaattg ctaggagcat tatctgatta tcaaaataat attgttccat cagaagtgag + 21181 tcttgacctt ttagaaaaag gaaaaattga taagacaatg aaacttgacg agttacaaaa + 21241 agaaattaaa gagcttcaaa ttgaacgtga cacactcaaa aagcatagag ataagattgt + 21301 aaaagattat gactttacta aagagatcaa acaaacgcat gaaaaacgca ctggaatatc + 21361 attgtaagca atttaacaaa agggatagtc tcaaaaagat agtaactaac tttttctata + 21421 gtgcttttta tctgatataa taaactaaat gatacaaaag gaaatgatac tatggcaaca + 21481 aataaagaac agattaaaaa ttcaggaaag tgtctctttg ttgagacgac cacaaaactt + 21541 tcaagtgatg agttattaaa agcaatagct gatgacaaca tgacagaaga gcaagtggaa + 21601 caattaaaaa ttgatctgga tatcttttta aaacaaagag cagctgcttt caaggaatga + 21661 ggtgaggaat tgcaaaaaca taacctaata aaactattaa aggggcttct cttggtgcta + 21721 ttattgctta taggagtagc cttaattttt aacaaatcta tccgaaatac cttaattgcg + 21781 tggaatacta atcagtatca agtctcacag gtttctaaac aaaccattga gcaaaataaa + 21841 gacgctaatg tgagttatga ttttgattcg gtcgaatcca tttcaaccga atctgttcta + 21901 aaagcccaaa ccaatagcgc taatcttcct gttattggtg gggttgctat tccagaggtt + 21961 gggattaatc ttcccatttt taagggactc ggtaatacag aattgactta tggggcagga + 22021 accatgaaag aaaatcaagt catgggaagt ggtaactacg ctcttgccag tcaccatgtg + 22081 tttggcttaa caggttcttc tcaaatgctc ttttcccctt tagaaaatgt taaaacgggg + 22141 atgaagattt acttaacaga taaagaaacg gtgtatactt acattgtcac atcaattgag + 22201 agtgtcgcac ctagtcaagt agcggtgatt gatgatacgg aagagacaga agtgacccta + 22261 gttacgtgta cggatgctga agcaacctca cggacgattg tcaaaggagt ttatgactct + 22321 gaagttagtt ttgaccaagc accggaggac attttagacg cttttaatac agcttataat + 22381 caaattgctt tataaagaca aataaaaaat aggcagtagc tattctaatt agggtagctg + 22441 ctgcctattt ttgtgctttt caagtgttaa aggtacgctt gtgttaattt taagggattg + 22501 aaaagcattt tggctattat aacatagttt cttaaaaggg aaaaggtgat tacaaacttg + 22561 taaccacctt aggagatttt tgaaaagttt ttttgggata ataatagtat agcaattttt + 22621 ctttttataa gctaataatc agcatgttat gtcacaaatt ttcaaaaatt cgttaaaata + 22681 gaactatggt agtaatgaga tttgatgaaa gaggatttgt agaagaactt tatagacaac + 22741 gggagtatga gttcttaaag cgagtcgcag cctatgataa acaaatagct cccactatgc + 22801 gagcaaacgg ttataaaaga gtagatagca gtgagcgaac tgtgttattt acgtttggcg + 22861 caatgacatt ttcaagaagc cgctggcgac gagggacgaa aacccgttat cctgtggatg + 22921 aatggttggg gttgaagaag tatatgcgct gttcgttgga acttatgtat catctggtaa + 22981 gatatgcttc agagatgtct tatcgccaag tttgtcggat gataaagcta tcttaccact + 23041 tagatattac aaaagatacg gtcttaaaag cggtaaaatt aacaggacag ttattctctg + 23101 aaaagagcca ttatcgttac tttgttgagg aagaggtatc agaaaaaatc aaagcaccgg + 23161 ttatttatat tgagggtgat ggtgttctgg taaaaacaaa tacgggtgga gatgagaagc + 23221 acaatacgga tttagcacat tttcttgttc atacgggaac aaaaatagta catggacgaa + 23281 cagtcttgct taataaacat gaaattattc atacagacta tgaagttgcc agagatgaat + 23341 tactagatta tctctataat cattttgaaa tcaccaatca aactattcta gtgactaact + 23401 cagataatgg caagggctat accagacgtg tctttcaaaa tattcaaaag gcgctcaaaa + 23461 ttaaacgtca tgaacacttt tgggacgccc atcatgtcaa ggaaaaaatt acttcatttt + 23521 ttaaaagtta tcctaaaata ctgaaagatt tgatgtttaa agccattcaa acccataatc + 23581 gaaaattatt aaaaactgtt ttggatacag ttgaatcatt ggtcactgac gatgaagagt + 23641 acctagtttt tcaaaagttt aggaagaaat ttttgaataa ttttaaggat acaaaacctg + 23701 ctaaactaag aggtctctcc cataagggaa ttggggtcat ggaaagtcag cactgtaaag + 23761 taacctttcg catgaaacat cgtggcatgt actggtcaat taaaggtgcc tgtgctatgg + 23821 ctagacttat tctgttagaa cggattgatc aattagaaaa cctctttttt ggcaattggc + 23881 gcaaagatta tcagtactat aaagataacc agttaggtgt tggttattta agggagtcga + 23941 aagccgatca ttctcccacg cctcaaagaa tctttaaacg agctggtaaa atcatgtcat + 24001 tagatcgtca aaagtttaaa tattaac +// +LOCUS NC_020450 18869 bp DNA linear CON 24-DEC-2022 +DEFINITION Lactococcus lactis subsp. lactis IO-1, complete sequence. +ACCESSION NC_020450 REGION: 643089..661957 +VERSION NC_020450.1 +DBLINK BioProject: PRJNA224116 + BioSample: SAMD00060995 + Assembly: GCF_000344575.1 +KEYWORDS RefSeq. +SOURCE Lactococcus lactis subsp. lactis IO-1 + ORGANISM Lactococcus lactis subsp. lactis IO-1 + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Lactococcus. +REFERENCE 1 + AUTHORS Kato,H., Shiwa,Y., Oshima,K., Machii,M., Araya-Kojima,T., Zendo,T., + Shimizu-Kadota,M., Hattori,M., Sonomoto,K. and Yoshikawa,H. + TITLE Complete genome sequence of Lactococcus lactis IO-1, a lactic acid + bacterium that utilizes xylose and produces high levels of L-lactic + acid + JOURNAL J Bacteriol 194 (8), 2102-2103 (2012) + PUBMED 22461545 +REFERENCE 2 (bases 1 to 18869) + AUTHORS Shimizu-Kadota,M., Kato,H., Shiwa,Y., Sonomoto,K. and Yoshikawa,H. + TITLE Direct Submission + JOURNAL Submitted (28-SEP-2011) Contact:Hirofumi Yoshikawa Tokyo University + of Agriculture, Department of Bioscience; 1-1-1 Sakuragaoka, + Setagaya-ku, Tokyo 156-8502, Japan URL + :http://nodai.cc-town.net/laboratory/single.php?id=23 +COMMENT REFSEQ INFORMATION: The reference sequence is identical to + AP012281.1. + The annotation was added by the NCBI Prokaryotic Genome Annotation + Pipeline (PGAP). Information about PGAP can be found here: + https://www.ncbi.nlm.nih.gov/genome/annotation_prok/ + + ##Genome-Assembly-Data-START## + Assembly Method :: phrap v.1.080730 + Genome Coverage :: 8.75x + Sequencing Technology :: ABI 3730xl + ##Genome-Assembly-Data-END## + + ##Genome-Annotation-Data-START## + Annotation Provider :: NCBI RefSeq + Annotation Date :: 12/24/2022 01:48:57 + Annotation Pipeline :: NCBI Prokaryotic Genome + Annotation Pipeline (PGAP) + Annotation Method :: Best-placed reference protein + set; GeneMarkS-2+ + Annotation Software revision :: 6.4 + Features Annotated :: Gene; CDS; rRNA; tRNA; ncRNA + Genes (total) :: 2,359 + CDSs (total) :: 2,271 + Genes (coding) :: 2,261 + CDSs (with protein) :: 2,261 + Genes (RNA) :: 88 + rRNAs :: 7, 6, 6 (5S, 16S, 23S) + complete rRNAs :: 7, 6, 6 (5S, 16S, 23S) + tRNAs :: 65 + ncRNAs :: 4 + Pseudo Genes (total) :: 10 + CDSs (without protein) :: 10 + Pseudo Genes (ambiguous residues) :: 0 of 10 + Pseudo Genes (frameshifted) :: 4 of 10 + Pseudo Genes (incomplete) :: 5 of 10 + Pseudo Genes (internal stop) :: 3 of 10 + Pseudo Genes (multiple problems) :: 2 of 10 + ##Genome-Annotation-Data-END## +FEATURES Location/Qualifiers + source 1..18869 + /organism="Lactococcus lactis subsp. lactis IO-1" + /mol_type="genomic DNA" + /strain="IO-1" + /sub_species="lactis" + /db_xref="taxon:1046624" + gene 2..1684 + /locus_tag="LILO_RS03250" + /old_locus_tag="lilo_0603" + CDS 2..1684 + /locus_tag="LILO_RS03250" + /old_locus_tag="lilo_0603" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_015426013.1" + /GO_function="GO:0005524 - ATP binding [Evidence IEA]; + GO:0003677 - DNA binding [Evidence IEA]; GO:0000166 - + nucleotide binding [Evidence IEA]" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="FtsK/SpoIIIE domain-containing protein" + /protein_id="WP_015426013.1" + /translation="MAKRTISKGSRLKLRDKYDREFFVLITGLLFASPVGFFYKNFET + LPPKVLAIYAVDILLIAFSVAFGLLILLYHKFLFFSKNNYKRLLLNYVVKHGLVEKEM + VKDEKGSHEKLKLAPIYLKQPNTYELHTYFPIDGGVHQEKFLDLADGLETTFFADYQE + QNFINESKILSKKAFVEYVFAIDGERNRISVNDVIVDKKLGLKLMNGVYWNYEADPHM + LIAGGTGGGKTVLLMSILSALAKVGHVDICDPKRSDFVGMRDVPVFENRVFFDKESMI + ECLRSKMQFMDERYDYMTNHPDYKAGKRYSDYCLTPEFVLFDEWAAFISSLDFREFDE + VIQILTQIVLKGRQSGVFLILAMQRPDAEYLKSALRDNFMKRLAVGRLTGSGYRMVFG + DENEKKVFKYIKGKIGRGYVANNGELAREFYSPSVPFDKGYDFHEELSKLPVLADTTE + VQLEAPPISNVEQERAESELLEEKFYTITSLSRKLGQPSKTVKTAIERLTSGGYSISE + KSPYNEDDFIALQTVFLTKETEECTLNEAVDTVLADEAEFEKEFVTFDKEVA" + gene 1706..1876 + /locus_tag="LILO_RS12075" + CDS 1706..1876 + /locus_tag="LILO_RS12075" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_003129468.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_012897120.1" + /translation="MAEKSVRVTISKDNKTTELTLRGVAVKDFEKLFFAVQNQMKSCE + KKEDKHHAIGGE" + gene 2314..3468 + /locus_tag="LILO_RS03260" + /old_locus_tag="lilo_0605" + CDS 2314..3468 + /locus_tag="LILO_RS03260" + /old_locus_tag="lilo_0605" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_014570871.1" + /GO_function="GO:0003677 - DNA binding [Evidence IEA]; + GO:0003916 - DNA topoisomerase activity [Evidence IEA]" + /GO_process="GO:0006270 - DNA replication initiation + [Evidence IEA]" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="replication initiation factor domain-containing + protein" + /protein_id="WP_015426015.1" + /translation="MADLLGISLVYYRKMENGDRPLSKQFEEKIRNSFFKKRESSTVF + VGTNDYTNIRFQTLNVREVVSKILGLNVENFQLNEYNRYQYPFYISYGHINVYYHDKD + IKAGVLIEMSGQACREMEYEFEYHQKQRTWYDFFNDCFLYANKKAPENDDFVKITRFD + LALDEQYNPQEGNFDLFKLLTSAREGRWNGRKQNYSAVLGGRRTKEGMINDGLTVYFG + SKQTHLFFRFYEKDYERASQEMTSVEAIREMYGLRNRYEISMRKEISTDFIKRYIEED + FDLADEGVKIINDNLTFYDKEGNLDSEWYDMMGRMDAYHFTVRPEAPDLNRKYTWFER + GGPVSTYLLLKKAEELTGESRLEEIFNEAELTERQEKFLKEFRMIRGANG" + gene 3604..3933 + /locus_tag="LILO_RS03265" + /old_locus_tag="lilo_0606" + CDS 3604..3933 + /locus_tag="LILO_RS03265" + /old_locus_tag="lilo_0606" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_014570869.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_015426016.1" + /translation="MIKPNIEHFQKRMLRVPNNVRMLQYKMSGYEFNLKKFEQGVYDQ + LFFYIPNETEALGLLNEIGLMFPPDSMTRKKYYSLYQEKRIADLPEGYKMAIYFLIDN + DLAQATL" + gene 4020..4331 + /locus_tag="LILO_RS03270" + /old_locus_tag="lilo_0607" + CDS 4020..4331 + /locus_tag="LILO_RS03270" + /old_locus_tag="lilo_0607" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019293439.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_015426017.1" + /translation="MPTLKTGLKQLTTDLNEIEAVINAGNAYQEAVSKLKGQGKALRT + LENDTSISDDTVEVIANRTNDLIRNLLKGSTAYNFTKKSFNELKGKLEEAEAQARSGA + K" + gene 4463..4723 + /locus_tag="LILO_RS03275" + /old_locus_tag="lilo_0608" + CDS 4463..4723 + /locus_tag="LILO_RS03275" + /old_locus_tag="lilo_0608" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_003129681.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_015426018.1" + /translation="MTVTNMSKARPQIDFSLHKAPYKDLYDIQILFPDGTNQFWSGIN + EKKVMWLCEKYNPISTPLSIAIAPRFLPKSNIQKPNWEIRKG" + gene 4829..5038 + /locus_tag="LILO_RS03280" + CDS 4829..5038 + /locus_tag="LILO_RS03280" + /inference="COORDINATES: protein motif:HMM:NF024252.2" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="helix-turn-helix transcriptional regulator" + /protein_id="WP_042230155.1" + /translation="MSVFAERLKELRKEKGLTQSQVGVHLGMSQQNYRRWEVGERSPS + GETLIKLADYFDVSTDYLLGRKSEK" + gene 5035..5331 + /locus_tag="LILO_RS03285" + /old_locus_tag="lilo_0609" + CDS 5035..5331 + /locus_tag="LILO_RS03285" + /old_locus_tag="lilo_0609" + /inference="COORDINATES: ab initio + prediction:GeneMarkS-2+" + /note="Derived by automated computational analysis using + gene prediction method: GeneMarkS-2+." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_015426019.1" + /translation="MNIQQLYLIINKMNKVLKVARLISLIPVTLIGLAFEILTSMFLS + GTICWWLAAFKIISENNKIIFYLFSVIIFLILLVYSLIGILKVLENKLKEKEVK" + gene 5331..5750 + /locus_tag="LILO_RS03290" + /old_locus_tag="lilo_0610" + CDS 5331..5750 + /locus_tag="LILO_RS03290" + /old_locus_tag="lilo_0610" + /inference="COORDINATES: protein motif:HMM:NF024363.2" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="DUF3850 domain-containing protein" + /protein_id="WP_168694145.1" + /translation="MTVHKKKLDFQFHKPVETGEKPFEVRINDCDYQVGDIIELKSYG + KCCNYCDGKSYKKYYSGNCSGWMNCYESEAETIRVKILRVIYPKEINYALTHGVILSS + SFGKINLDDVREVLKEYFNRKTLPKDYVLLEIEVIKK" + gene 5846..8254 + /locus_tag="LILO_RS03295" + /old_locus_tag="lilo_0611" + CDS 5846..8254 + /locus_tag="LILO_RS03295" + /old_locus_tag="lilo_0611" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_017865118.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="SpaA isopeptide-forming pilin-related protein" + /protein_id="WP_015426021.1" + /translation="MSKHKKLLNGLTSEKKVTNWKMHKRKKVFVAFAGVLAVGLGTAG + LVYASAQSTSAKASLPTDTTVNWENNKPLYYEIDQTGKEHPKPMLKLSDGTPAWCLGL + GVPLVNNITQAQLDSSNAILNALSDEQIAVINNVAYLAQKQGTLLAYAQAQHATYLLL + DEAGVSVNQTKDLIVKPNTLLQEPNAIKTGANDLITQAKALRKLPSFHGTTVDVVQGV + EKTVTDSNSVLANFPNFKSNVSGLSESVSGNDLKLKADITAKVGITPKAIQFQNTPLS + IADLPYYVFSTDGDSTGKASQSVIASQDPSKANGYLNVNVIGLGETTLTKVDADTGSG + ETQGAAQLKGAVFGLFNKSDNSPVKWSDGQKGYPITVTAGTKADDTNVSIKLGDDLKA + GLKNLDNSKEYYWKETVAPEGYSLSTEKYEVKFDSSSKFDDKTSNFIDDDKATDKVLD + LNFGFIKAQDVNGSLTGLNGRTFRYTPTGDTKGKPIEVTSGANEDSNGVTNNGQVNFT + KIPFGDGLLEELPQKDDKLQLINPISIVTTTNKDKDENITGYTVTFTDTVTKQVITTL + DVSLDKVTDNSTMFKVNLGTLVDKPVTPVVPTIKTKAHTKDGDQTIQKVEISKTTPLY + DKIMTTNAIKGDQMVATLHRVVTGKDGKVTESKVIRTLNFTVDDETVKAQEKQIESTV + DTTKDADVPETSTVAYVWTEDLFDEGKNPKTDEPKAKHDDLKDQDQTLTVEKVEKPVT + PPSSKPTPPSTTPTETPKVSLPTTGSETGDMIMYGGALAVLIALGTGAVYYMKKKKST + KEEG" + gene 8381..8569 + /locus_tag="LILO_RS03300" + CDS 8381..8569 + /locus_tag="LILO_RS03300" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_014570866.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_042230157.1" + /translation="MYVVKMRGGYLCANGGATKHLKFATTFDTKKKAEEVAEKWLRSD + VSFKAVEKESEEYEQNKN" + gene 8550..9821 + /locus_tag="LILO_RS03305" + /old_locus_tag="lilo_0612" + CDS 8550..9821 + /locus_tag="LILO_RS03305" + /old_locus_tag="lilo_0612" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_014570446.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="translation initiation factor IF-2 N-terminal + domain-containing protein" + /protein_id="WP_042230159.1" + /translation="MSRIKISELADEFKIDRKDVLAKAQEFGVSAKLATKTLSESEEK + QLRTYYQQVPHSMAETSKNQVLENVGQKKLDPKEEVSEKKEEPSKAEQVEKKKSKFSI + LGHKKSEKKKGKLLTRLSNEKPPSKKQFTAKQGGALVVGGVGILILSNMVLFGLMASG + YQPTQKIIHEQVSASQKVSGNGLDLQAKNYLDGFVQTYFTFPENEKDQEQAVKDINGY + FVQQLPVISQGLQRSPSKFEEAVLMNLTDNEATYKVTYGAGAVTKKGKSNVVNYHDVT + TLFTIPYQKVGSSYYVSDEPYFSSVNDLQAKESQVPVKTWSGTDNNSASTKKDLDKFT + KALFTAYTTDSDTLKLISEGLSLNDSETFQSLDQATYEPKGDTYQAIVQVTMKNELGT + HVENYQFTISKQKQSYFATDFKHTLPKGNKE" + gene 9834..10097 + /locus_tag="LILO_RS03310" + /old_locus_tag="lilo_0613" + CDS 9834..10097 + /locus_tag="LILO_RS03310" + /old_locus_tag="lilo_0613" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_003131793.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="TcpD family membrane protein" + /protein_id="WP_015426023.1" + /translation="MKELLNYHIAVVYGDIGLSNFWNTFQTNVKYIIFAGTLWFMIRE + WKNKAVGKMVMTFIVGAILFALTLNPETVLQPIGQKLMQMIGA" + gene 10111..10506 + /locus_tag="LILO_RS03315" + CDS 10111..10506 + /locus_tag="LILO_RS03315" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_003131794.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="TcpE family conjugal transfer membrane protein" + /protein_id="WP_042230162.1" + /translation="MSKENKKGLKYSNKSSLSQPLRIQKLFDGWSLGKAWRLSFFIYF + GLFGFILWKLLFSKLVVFPIGFRLVVESFMCYKSALFLAEIRIDDKSPFIYLKDMISF + IITFGLKGKSIYKGWIYPLRKRKEELKEK" + gene 10503..13112 + /locus_tag="LILO_RS03320" + /old_locus_tag="lilo_0614" + CDS 10503..13112 + /locus_tag="LILO_RS03320" + /old_locus_tag="lilo_0614" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_014570447.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="ATP-binding protein" + /protein_id="WP_042230164.1" + /translation="MKKKATWENHILSVHENLVLKDDGTVFAMFEVPASIISMMDEKG + KKNHKQTTQAVITSLYEHLGFEILMKPITKDLLKAYGYLLEDCDPRTREFGEYLLEQS + YLELENELGKIYNHKFFLTVPLSDFAFSGDLKKMMKEGWQRFRKSVVQLIRRELEFTV + NWYEDYEQTALDLEMNLNLLQARPLKQEETLLYNSLNYLRGIDVNQDELLADVNNAIE + NIDDTTVDVRSDGLLEIHHPQGESLLKFLPLADYPDVVNDIHLIEHIQTLPFPVEFRV + KARFRKNKGALGMEATAERTRDRIGTELSEADEQGNVTKNSSVSAYVILEDIIAGVDG + GEYFLDFLPVFAITGSTPDEINYYKKMLMTAMEGLGIKIVPSQWDQPYLFYKMRSTEE + LTRSDKYWVQNMKVSAFVENLFFVSQKVGSDVGFYFGRVDHTQLNWAGNFEKAIASSP + TPFFWNMFQANKDDIEGKLGDSPHVGIFGDTGSGKSFFAKQGFVNHSILKGLSLYIDP + KDEMKSQFLAVRDKLESYLPEMEEKISELVVLIEDDEILARRIRNLEFSYHKPLIDYI + NHIHFVSLDVKDKKNIGALDPIVFLEGNQATELATQVTKGLIGDKLTEDDRFENCFNQ + KVQEVIEARAKGKTVGLLNVFQLMAKSEEDFIRYRAENILSKISGTMLELVFSEGQNS + SVSMDEHITILGVTGLNLAKSGEVKTAQNEMSDIIMYALGDFCRFFGARDREQETVIW + LDEGWFFNTTDIGKGILMRMKRVGRSENNFLVLISQSVKDGASEEDDTAFGTIFAFKE + TGNTTAALKAIGLPDDVEEIIKWYENMTKGLALLKDPFGRIGRVVIQGQNSALNECFK + TSFSKMKSTKAVA" + gene 13112..15229 + /locus_tag="LILO_RS03325" + /old_locus_tag="lilo_0615" + CDS 13112..15229 + /locus_tag="LILO_RS03325" + /old_locus_tag="lilo_0615" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_003131796.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="metal-dependent phosphohydrolase" + /protein_id="WP_015426025.1" + /translation="MKKKMLLVVGLLAFLGGVALPSQADTAFNVPTTPSFSSAKNPTV + SKAPTSSSSTASSKSSTTSPSYPVNNGFVGGDLGDYSSSNSPSKVMNEVEKKKARENL + DNYTSYMYFDDGKFLTGSMSAGMQTFFVRSQFFVTKTIYRFVNAVNEKLNSDSLITQW + TAQMFATVKKIYNQFSNPQLYPIIAIGVISSLLYYWFKRRFLEGVRKVILVMLLVGLF + INGGQKLTEQINSSLNTATTTLMSTVKVAGVSSRNSNDLKTTMVEVPFLYMNFDNVKI + NADGSSNISEDNIVKLLTSDDDNDKLKTIQSDLKDSHLTSKKMGEKVLTALASIFNAI + LVGFIYLAFAVMAFVMRMFFLILLLLLPFVGILSLFPFFDVVILRWAKATGGALIVSN + VVVIGTALISILDSIVSSAVTSMIGSDYFFITLIKFIVYIILFKKREKILEIFKAGHL + GNSGFAGRMDGLLSNVRRKGSNMIKAPLLAGSSAGLVAGLTAGQMATGKAKEIAKNRL + TNGTGSLWHGGLNKKADRTMNKMDKANPNSKKGQKLQAKEEKIKQRLEKRKQKFENPN + LLKRKVADYRKQYQQRKTMNNPNLAQKMEQKNKEKNASIQALYDKNKTQLQARAIERR + MREAVPDQEKPNLSELAKNKQKALAKEKLDERAMKQSAGRMAERFEKEKVSHSSFKRK + PNYPWDNNDTNQKLNNPFVIDEK" + gene 15239..16279 + /locus_tag="LILO_RS11840" + /old_locus_tag="lilo_0616" + CDS 15239..16279 + /locus_tag="LILO_RS11840" + /old_locus_tag="lilo_0616" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_017371146.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="phage tail tip lysozyme" + /protein_id="WP_080619315.1" + /translation="MKKAIKRKVILVSLPFLLLLLPILAFFSLFVGSNSSSDTDINTN + TPQQQTAKVIWDRVLKEGGTKEGAAALLGNNQAESELQPSIIQSNATYNEAKAMDTTL + GGYAFGLAQWDSGRRVNLLNYAKSQKKSWTDTNLQVEFMFEQDGTDSTLLKQLIKGTN + VKQTTEDIMRKWERAGAVDSLSKRQGFAEYWYTFMTTGGDSGTGGGSGITPDIPSGWT + LDKPINTSGYITSSYEYKQCTWFTWNRAKEFGITFSPFMGNGADWQHQAGYTVTTTPT + LHSAVSFSGGQTVGGQWNADPVYGHVAFVEAIHSDGSVLISQSGTGFSTVYTFQVLTK + AQASQLHYVIGK" + gene 16374..16868 + /locus_tag="LILO_RS03335" + /old_locus_tag="lilo_0617" + CDS 16374..16868 + /locus_tag="LILO_RS03335" + /old_locus_tag="lilo_0617" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_017371147.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_015426027.1" + /translation="MTKLEEVRASGKMSERVLENNFRHFDHRLREIEGELRLYPYATL + SEVIAWAEQLKIAIGKIKAIQESSIIKSKKEWGILEEKMLGYLQIDKAFIHVFSDHVI + FLVQLEQRYRQRLSIFANNLDNSVRYLKRYADDLEKQGFSITGILAESRNLSDMNWLS + ILNY" + gene 16894..17385 + /locus_tag="LILO_RS03340" + /old_locus_tag="lilo_0618" + CDS 16894..17385 + /locus_tag="LILO_RS03340" + /old_locus_tag="lilo_0618" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_017371148.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="antirestriction protein ArdA" + /protein_id="WP_015426028.1" + /translation="METPKIYVVNLNSYNNGRTRGKWYELPVDFSRIKSDLLLDVEHG + EEYAIHDFENFYGYKVGEYSSIQELNEYAEKLEEISDIEHLKDFLEIYSIDDVINNKD + DLDFVEAENDEDLAQELIEQMGGLEVLSVETLQRYFNFGAYGRDLAIGDYSKTSHGYI + RDI" + gene 17440..17646 + /locus_tag="LILO_RS03345" + /old_locus_tag="lilo_0619" + CDS 17440..17646 + /locus_tag="LILO_RS03345" + /old_locus_tag="lilo_0619" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_015426029.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="WP_015426029.1" + /translation="MEENYKDKRGISKLFDVPIKTLNNDLTEMRRTEFNVYILRPSHK + RVYINVQGYKSFLEYKQKIRESTI" + gene 17729..18868 + /locus_tag="LILO_RS03350" + /old_locus_tag="lilo_0620" + CDS 17729..18868 + /locus_tag="LILO_RS03350" + /old_locus_tag="lilo_0620" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_014570452.1" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /codon_start=1 + /transl_table=11 + /product="site-specific integrase" + /protein_id="WP_042230166.1" + /translation="MFYKQLDSGKYRYFEKYFDEKRNKWRQVTVTLKSKSRVAQSEAK + NRLARKIEQSKKVPTAIELQEQIVQNKTIQEIYEEWVVIRKQDVKPASFVAEQISLKG + FIEKFSKYKVSEVTTADIQSYLMELDIANSTRKNRRIYIRILFKYAENIGYINSNPAD + KVVLPKVRLEIETLERANEKFLSKEEMSSVLIFCKSYKKNIRYTLAMEFIFLTGCRFG + EFASIRYQDVDFKNKLLRIDHTLEYRVAKYDDRVIQTPKTVGSIRTISLSNRCLEIID + YFQKNCLDDKFVFVNAVGGIFRQPVFYKFICDNCQKVLGNERKYGIHLLRHSHVSLLV + ELGVPIKAIMERVGHRDESITLRIYSHISGTIKNEISQKLNQINL" +ORIGIN + 1 aatggcaaaa cgtacaataa gtaaaggctc tcgtttaaag cttagagata agtatgaccg + 61 tgaatttttt gtattgatta ctggtttact tttcgctagt cctgtagggt tcttttataa + 121 aaattttgaa accttgccac caaaagtgct agcaatttat gctgtagata ttctgctcat + 181 tgcattttcg gtggcttttg gtttattgat tttgctttat cacaagttcc ttttcttttc + 241 aaaaaacaat tataaaagat tgttactgaa ctatgttgtg aagcatggtt tagttgaaaa + 301 agaaatggtt aaagatgaaa aaggaagtca tgaaaagtta aaactagcgc ctatttatct + 361 gaagcaacct aacacgtatg aattacatac atattttcca attgacggtg gagttcatca + 421 agaaaaattt cttgatttag ctgacggttt agaaacaact ttttttgccg attatcaaga + 481 acaaaatttt attaatgaaa gtaaaattct ttctaaaaaa gcatttgttg agtatgtttt + 541 tgctattgac ggagaacgta atcgtatttc agttaatgat gtcatagtcg ataaaaaatt + 601 aggtttaaaa ttaatgaatg gggtttactg gaattatgaa gctgacccac atatgcttat + 661 tgcaggtggt actgggggtg gcaaaaccgt tcttttgatg tcaattttat cagcccttgc + 721 taaagtagga catgttgata tatgtgaccc taaacgttct gactttgtgg gaatgagaga + 781 tgttccagtt tttgaaaatc gtgtgttctt tgataaagag tctatgattg agtgtttacg + 841 ttcaaaaatg caatttatgg acgaacgcta tgattatatg acaaatcacc ctgattataa + 901 ggcagggaaa cgatattctg attattgttt gacacctgaa tttgtacttt ttgatgaatg + 961 ggctgctttt atttctagtt tagattttag agaatttgat gaagtaattc aaattttaac + 1021 tcaaattgtt ttaaagggtc gtcaatcagg ggtcttctta attcttgcca tgcaacgtcc + 1081 agatgctgaa tatctgaaat cagctttacg tgataacttt atgaaacggt tggcggttgg + 1141 tcgtttgact ggttcaggtt atcgtatggt ctttggtgat gaaaatgaga aaaaagtttt + 1201 caaatacatc aagggtaaaa ttggtcgtgg ttatgttgcc aataatggcg aacttgcacg + 1261 tgaattttat agcccttctg taccatttga taaaggctat gattttcatg aagagctttc + 1321 aaaattacca gttttagctg atactactga agttcagctt gaagctccac caatttctaa + 1381 cgttgaacag gaacgagcag aaagtgagct tttggaagaa aaattttata cgattacctc + 1441 tttatctcgc aagttgggtc aaccgtcaaa aactgtgaaa acagccatag agcgtttaac + 1501 aagtggcgga tattctataa gtgaaaaatc accttacaat gaagatgatt ttattgcttt + 1561 acaaactgtt ttcttaacca aagaaacaga agaatgtact ttgaatgaag ccgttgatac + 1621 tgtcttagct gatgaagcag agtttgaaaa agaatttgtg acttttgaca aagaagttgc + 1681 ctagtttgaa aatgaggtaa aaataatggc agaaaaaagt gttagagtaa ctatttcaaa + 1741 ggataataaa acgacggaat tgacccttag aggggttgct gttaaagact ttgaaaagct + 1801 attctttgct gttcaaaatc aaatgaaatc ttgtgaaaaa aaggaagata aacaccacgc + 1861 aatcggcggt gagtaaatga taggaacttg tttccgtttg tctttagaca acttgccgta + 1921 ggcaagccat tttccacggt cgaattgccc tcgcaaacgg tagtgcgcga cagcggttta + 1981 ttcttgaaag aattggagga aaaactattg ggttttgttt taaggctatt gcgttttaaa + 2041 cgtaatgctt tttttgaaaa agtgcaagaa cgtaagcata gctccgagcg tagcgtaagg + 2101 agtgagcgtg tgattgcacg gctgacggct tgccgtcagc ttggacttga ccccccaaat + 2161 gctaatgagg gggggtacaa gtgatacaag tctaactatc ctagttatat caaggttcta + 2221 ggttgtatca cctgtgactt atgtttagaa agtgaggaac gaacgattga attaaaggat + 2281 atacgctcta gcgcaaatgt tactcaacaa ttcatggctg acttactagg tatatcttta + 2341 gtctattatc gaaaaatgga aaatggagac cgtccactct cgaaacagtt tgaagaaaaa + 2401 attagaaatt cttttttcaa aaaaagagag agttcaacgg tctttgttgg tacaaatgac + 2461 tatacaaata ttcgttttca gactttaaat gttcgtgaag tagtttctaa gattttaggt + 2521 ctaaatgttg agaattttca acttaatgag tataaccgtt atcaataccc tttctatatt + 2581 agttacggtc acatcaatgt ttattatcac gataaagata taaaagcagg tgtgctaatt + 2641 gaaatgagcg gtcaagcgtg ccgtgaaatg gaatatgagt ttgaatatca tcaaaaacag + 2701 cgtacttggt acgatttttt taacgattgt tttctctatg ccaataaaaa agcaccagaa + 2761 aatgatgatt ttgtaaaaat cacacgtttt gatttagcac ttgatgaaca atacaaccca + 2821 caagaaggaa attttgactt gttcaaactt ttaacttctg cccgtgaggg gcggtggaat + 2881 ggtcgtaaac aaaactattc tgcggtactt ggtggaagaa gaacaaaaga gggaatgatt + 2941 aatgacggtc taaccgttta ttttggatct aaacaaactc atttattttt tcggttctac + 3001 gaaaaagatt atgagagagc aagtcaagaa atgacttcgg ttgaagcaat acgtgaaatg + 3061 tatggtttgc gaaatcgtta tgaaatttcc atgcgaaaag aaatatcaac cgactttata + 3121 aaaagatata tcgaggaaga ttttgattta gccgatgaag gggtcaaaat tattaatgat + 3181 aatctgacat tttatgataa ggaaggaaac ttagatagtg aatggtacga tatgatgggt + 3241 agaatggatg cttatcattt tactgttcgt cctgaagcgc ctgatttgaa ccgaaaatat + 3301 acatggtttg aacgtggtgg tcctgtatca acttatctat tgttaaaaaa agctgaagaa + 3361 ctgacaggtg aaagtcgttt ggaagaaatt tttaatgaag ctgaactcac agaaagacaa + 3421 gaaaagttcc tgaaggaatt tagaatgata aggggtgcaa atggatagca tattcaaatt + 3481 agcaggtttt tcagttaatg aaatagttta taaagtgtta tttatcatta ttttatgggc + 3541 tataattggt gcaatacttg gtgaaatttt tcagtgataa ttagataagg aggaaaggga + 3601 gaggtgataa aacctaatat agaacatttt caaaaaagaa tgttgagagt tccaaacaac + 3661 gtccgaatgc tccagtataa aatgagtgga tatgaattta atttgaaaaa atttgagcag + 3721 ggagtttatg accagctctt tttttatatt ccaaatgaaa ctgaagcgtt gggattgctc + 3781 aatgaaatag gcttgatgtt tccacctgat tcaatgacac gaaaaaaata ttattcactc + 3841 tatcaagaaa aaaggattgc ggatttgcct gaaggctata aaatggcaat ttatttttta + 3901 attgataatg atttagcaca agccacttta tgatttttca taaataaaaa caaagttatt + 3961 tttcagataa gggaaggcaa attttgtggt gggaaataaa aaaagaaaag agataaaata + 4021 tgccaacttt aaaaacaggc cttaaacaac ttacaactga tttaaacgaa attgaagctg + 4081 taatcaatgc aggaaatgcc tatcaagaag ccgtttcaaa actcaaagga caaggaaaag + 4141 cacttcgtac acttgaaaat gatacctcaa tttcagatga tacagtcgaa gttattgcca + 4201 atcgtacaaa tgatttgatt agaaatcttc tcaaaggttc aactgcatac aactttacaa + 4261 agaaatcatt taatgaatta aaaggaaaac tggaagaagc agaagcgcaa gcacgtagtg + 4321 gcgctaaata aatagtccac gtaaaacttt aaaataaggg gagggtttgc ctttccttat + 4381 ctgaaaaata acattgtaaa agcctcactc atggtaaggc ataagagaaa ggacacctca + 4441 ccatgagtga gaaataaaaa atatgacagt aacaaatatg agcaaagcac gaccacagat + 4501 tgatttttca cttcataaag caccatataa agatttatat gatattcaaa ttttgtttcc + 4561 tgatggtaca aatcaatttt ggtctggaat taatgaaaaa aaggtcatgt ggctgtgtga + 4621 gaaatacaat cctatctcaa ctccgctgtc aattgcgatt gctcctcgat ttttaccaaa + 4681 atctaatatt caaaaaccta attgggaaat tagaaagggt tagaaaatag atagaaacaa + 4741 atatttaaaa atcgctattt attttgatat tttcttagca atttttggac taacttattt + 4801 attaatgaaa ttctttggag gttgaattat gagtgtattt gctgaaagat taaaagagtt + 4861 gcgaaaagaa aaaggactta cacaaagtca agtaggtgtt catttgggaa tgtcacagca + 4921 aaattatcgt aggtgggaag taggcgaacg ttcacctagt ggtgaaactt tgataaagct + 4981 cgcagattat tttgatgtta gcacagatta tttattggga agaaaaagtg aaaaatgaac + 5041 attcaacaac tctatttaat tattaataaa atgaataaag tgcttaaagt tgctagactt + 5101 atttcgctaa ttccagttac gcttattgga ttagcttttg aaatacttac ctctatgttc + 5161 ttatcaggta caatatgttg gtggctggca gcttttaaaa ttatttcaga aaataataag + 5221 attatatttt atctttttag tgtcattatc ttcctcatat tgctagttta tagtttgatt + 5281 gggattctta aagttttaga aaacaaactt aaagagaaag aagttaaatg atgacagtac + 5341 ataagaaaaa actagatttc caatttcata aacccgttga aacgggggaa aaaccttttg + 5401 aagttcgtat aaatgattgt gattatcaag taggcgatat tattgaacta aagtcttatg + 5461 ggaaatgttg taactattgt gatggaaaat catataaaaa atattattca ggaaattgta + 5521 gcggttggat gaattgctat gaatctgaag ctgaaactat cagagtaaag atattaagag + 5581 ttatttatcc taaagaaatc aattatgctt taacgcatgg ggttatttta tcaagcagtt + 5641 tcggtaaaat aaatcttgat gatgttagag aagtattgaa agaatacttt aacagaaaaa + 5701 cgttacctaa agattatgta cttcttgaaa ttgaggttat taaaaaataa ataaaacttg + 5761 tccgaaacga caaaaaacta gtcgcttaac tgtcagaaat ggcagttttt ttattttagc + 5821 taaattaaaa aaaggagatt tactcatgag taaacacaaa aaattgttaa atggcttaac + 5881 ttctgaaaag aaagttacca attggaaaat gcacaaacgt aaaaaagtat ttgttgcctt + 5941 tgcaggagtt ttggctgtgg gtttgggtac agcaggactt gtatatgcta gtgcacaaag + 6001 tacaagtgcg aaggctagtt taccaacaga tacaacggtt aactgggaaa ataacaagcc + 6061 tttgtattat gaaatcgacc aaacaggaaa agaacaccca aaacctatgc ttaaactatc + 6121 agatggaaca cctgcatggt gtttgggtct tggtgtgcct ttggttaaca acataactca + 6181 agctcaatta gattctagta atgcaatttt aaatgcctta tctgatgaac agattgctgt + 6241 gattaacaat gtggcatatt tagctcaaaa acaaggaacg ttgttggcat atgcacaagc + 6301 tcaacatgcc acataccttt tacttgatga agcaggggta tctgtcaatc agacaaaaga + 6361 tttgattgta aaaccaaaca ctttattaca agaacctaat gccattaaaa caggcgcaaa + 6421 tgacttgatt acacaagcaa aagctcttcg taaattgcca agttttcatg gaacaacggt + 6481 agatgtggtt caaggggtag aaaaaacagt tactgattca aacagtgttc ttgctaattt + 6541 tccaaatttc aaaagtaatg tttctggttt atcagaaagt gtttcaggca atgatttgaa + 6601 actgaaagct gatattacgg caaaagttgg aatcactcca aaagcaattc aattccaaaa + 6661 cacacctctt tcaattgctg atttacctta ttatgtcttt tcgactgatg gagatagtac + 6721 agggaaagca agtcaatctg tgattgcttc acaagaccct tcaaaagcta atggttatct + 6781 aaacgttaat gttattggtc ttggagaaac aacattgaca aaagtggatg ccgatactgg + 6841 cagtggtgaa acacaaggag ctgcacaatt aaaaggggct gtctttggtt tgttcaataa + 6901 atcagacaat tcacctgtga aatggtctga cggtcaaaaa ggatatccta ttacagttac + 6961 tgctggtact aaagcagatg atactaatgt ttccattaag cttggtgatg acttgaaagc + 7021 aggattgaaa aatcttgata actcaaaaga gtattattgg aaagaaaccg ttgctcctga + 7081 aggttatagc ttatcaaccg aaaaatatga agtaaaattt gattcttcaa gtaaatttga + 7141 tgataaaaca tcaaacttta tagatgatga taaggcaact gataaagtcc ttgacttaaa + 7201 ttttggcttt atcaaagcgc aagatgtcaa cggttcattg actggcttaa atggtcgtac + 7261 tttccgatat actcctacag gagatactaa aggaaaacca attgaagtga cttcaggagc + 7321 aaatgaagat tctaacggtg taacgaacaa cggacaagtt aatttcacca aaattccttt + 7381 tggtgatgga cttcttgaag aactcccaca aaaagatgat aaacttcaat taatcaaccc + 7441 tatctctatt gttacgacaa ctaacaagga taaggatgaa aatatcacag gttatacagt + 7501 cacatttact gatactgtta caaaacaagt gattacaacg cttgatgttt cgttggataa + 7561 agtaactgat aattctacaa tgttcaaagt taatcttgga actttggtag ataaaccagt + 7621 tactcctgtc gtgccaacca ttaaaacaaa ggcacatacc aaagatggcg accaaacgat + 7681 tcaaaaagtc gaaatttcca aaacaactcc tctctacgat aaaatcatga caacaaatgc + 7741 tataaaaggc gaccaaatgg tggctacact tcaccgtgtt gtgacgggta aagacggaaa + 7801 agtgacagaa tcaaaagtta tccgtacttt gaatttcacg gttgatgatg aaacggtcaa + 7861 agcacaagaa aaacaaattg aatctactgt tgatacaacg aaagacgctg atgttcctga + 7921 aacttcaact gtagcctatg tttggactga agatttattt gatgaaggaa aaaatcctaa + 7981 aacagatgaa ccaaaagcaa aacatgatga tttgaaagac caagaccaaa cattgaccgt + 8041 cgaaaaagtt gaaaaaccag ttactccacc aagttcaaaa cctactccac caagtaccac + 8101 tcctacagaa actcctaaag tttcattacc aactacagga agtgaaacag gcgatatgat + 8161 tatgtatggt ggtgcattag ccgtcttaat cgctcttggt actggtgctg tttattatat + 8221 gaaaaagaaa aaatcaacta aagaagaagg gtagaaaaga gcagacttga tgtctgcttt + 8281 tattttgaat aaaaatgaaa aatacaaaat ataaatcaag aactccacca aataaatttt + 8341 atgaagtgtt atttcaaatt tataaataag agaggaaaaa atgtacgttg taaaaatgcg + 8401 tggtggctat ctttgtgcca atggtggagc gactaaacac ttaaaatttg ctaccacttt + 8461 tgatactaaa aagaaagctg aagaagtggc tgaaaaatgg ttaagaagtg atgtatcttt + 8521 taaagctgtt gaaaaagaaa gtgaggaata tgagcagaat aaaaattagt gagttggcag + 8581 atgaattcaa aattgacaga aaagatgtgc tggctaaagc gcaggaattt ggggtttcag + 8641 ctaaattggc aacgaaaacc ttgagtgaat cagaagaaaa acagttgaga acatattatc + 8701 aacaggttcc acattcaatg gctgaaacaa gcaaaaatca agttttagaa aatgtaggac + 8761 agaaaaagct tgaccctaaa gaagaagttt cagaaaaaaa agaagaaccc tctaaagcag + 8821 aacaagtgga aaaaaagaaa tcaaaatttt caatattggg tcataaaaag tctgaaaaga + 8881 aaaaggggaa actgctcact cgcctttcaa atgaaaaacc accgtcaaaa aagcagttta + 8941 ctgcaaagca gggtggggca ttagttgtgg gtggggttgg aatcttaata ttatctaaca + 9001 tggtcttgtt tggtttaatg gcaagtggtt atcagccgac acaaaaaatc attcatgaac + 9061 aggtaagtgc cagtcaaaaa gtttcaggaa atggacttga tttacaagcg aaaaattatc + 9121 ttgatggctt tgttcaaacc tactttactt ttcctgaaaa tgaaaaagac caagaacaag + 9181 cggtcaaaga tattaatggt tactttgttc aacaattgcc agtcattagc caagggcttc + 9241 aacgttcacc ttcaaagttt gaagaagcgg tattaatgaa tttaaccgat aatgaagcca + 9301 cttataaagt gacttatggg gcaggggcag tcacgaaaaa gggaaaatca aatgtggtga + 9361 attatcatga tgtcacaact ttatttacta ttccttatca aaaagtaggg tcaagttatt + 9421 atgtttctga tgaaccttac ttttcaagtg ttaatgattt acaagctaaa gaaagtcaag + 9481 tccctgtcaa aacatggtca ggaacagata ataatagcgc ttcgactaag aaagacttag + 9541 ataagttcac aaaagcttta tttacggctt atacaactga tagtgatacc ttaaagctga + 9601 tttcagaagg gttatctttg aatgatagcg aaacgttcca gtctttagac caagccactt + 9661 atgaacctaa aggtgacaca tatcaagcta ttgttcaagt gacaatgaaa aatgagctag + 9721 gtactcatgt agaaaactat caatttacaa tttcaaaaca aaagcagtct tattttgcga + 9781 ctgactttaa gcatactttg ccaaaaggca ataaagaata ggagaaatta aaggtgaaag + 9841 aattattaaa ttatcatatt gccgttgttt atggagatat tggactttct aatttttgga + 9901 atacatttca aaccaatgtg aaatatatta tttttgcagg gactttatgg tttatgataa + 9961 gggaatggaa aaacaaagcg gttggtaaaa tggtaatgac ttttattgtt ggggctattt + 10021 tatttgcatt aacattgaat ccagaaactg tccttcaacc aataggacaa aagttaatgc + 10081 aaatgattgg ggcgtaatta aggagcgaaa atgtcaaaag aaaataaaaa aggactgaaa + 10141 tattcaaata aaagttcact ttcacaaccg ttaagaatcc aaaagctttt tgatggatgg + 10201 tcgctaggca aggcttggcg gttgtccttt tttatttact ttggattgtt tggctttatt + 10261 ttatggaaac ttttattttc aaaattagtg gtttttccta ttggctttcg attggtcgtt + 10321 gagagcttta tgtgttataa aagcgcctta tttttagcgg aaatacggat tgatgataaa + 10381 tcgccgttta tttatctaaa agatatgata agtttcatta taacttttgg cttgaaagga + 10441 aaaagcattt ataaagggtg gatttaccct ttacgcaaga gaaaagagga attaaaagaa + 10501 aaatgaagaa aaaagcgaca tgggaaaatc atattttatc agttcatgaa aatttggttt + 10561 taaaagatga tggcacagtt tttgccatgt ttgaagttcc agcttcaatt atttcaatga + 10621 tggatgaaaa aggaaagaaa aaccataaac aaacaacaca agcggtgatt accagtttgt + 10681 atgaacattt aggctttgaa attttgatga agcctatcac aaaggattta ctcaaagcgt + 10741 acggctattt actggaagat tgtgacccac gaacacgaga gtttggggag tatttattag + 10801 aacaatctta tcttgaatta gaaaatgagt tagggaagat ttacaatcat aaattctttt + 10861 taactgttcc attgagtgac tttgcttttt caggcgattt gaaaaagatg atgaaagaag + 10921 ggtggcaaag atttagaaaa tcagtcgttc aattgattcg ccgtgagctt gaatttacgg + 10981 tcaattggta tgaagattat gaacaaacgg ctttagattt agaaatgaat ttaaatctcc + 11041 ttcaagctcg tccattaaaa caagaagaaa cactgcttta taattcctta aattacttgc + 11101 gtggcattga tgtcaatcaa gatgaacttt tggctgatgt gaacaatgcg attgaaaata + 11161 ttgatgatac aacggttgat gttcgctcag atggtttgct tgaaattcat catccccaag + 11221 gagagagcct gttaaaattt ttgcccctcg ctgattaccc tgatgtggtc aatgatattc + 11281 atttaataga acatattcaa accttgccct ttccagttga atttcgtgtc aaggctcgtt + 11341 ttagaaagaa caaaggggct ttaggaatgg aagcaacagc agaaagaaca cgtgaccgaa + 11401 taggaacgga actttctgaa gcagatgagc aaggcaatgt gactaaaaac tcatctgtga + 11461 gtgcctatgt gattcttgaa gatattattg caggggtgga tggtggggaa tatttcttag + 11521 actttttacc tgtttttgcg attactggtt caacgcctga tgaaattaat tattataaaa + 11581 aaatgttaat gacggcaatg gaaggtttag gaatcaaaat tgttcctagt caatgggatc + 11641 aaccctatct attttataaa atgcgctcaa cggaagagtt gacccgttcg gataagtatt + 11701 gggtgcaaaa tatgaaagtt tcggcatttg ttgaaaattt attctttgtg agccaaaagg + 11761 ttggttcgga tgttgggttt tattttggac gagttgacca tactcaactg aattgggcag + 11821 gaaattttga aaaagccatc gctagctcac ctactccttt tttctggaat atgtttcaag + 11881 ccaataagga cgatattgaa gggaaattgg gagatagtcc tcacgtgggt atttttggtg + 11941 atacaggctc agggaaatct ttttttgcca aacaaggatt tgttaatcat tctatcttaa + 12001 aaggattgag cctttatatt gaccctaaag atgaaatgaa aagtcaattt ttagctgttc + 12061 gagataaatt agaatcttat ctgcctgaaa tggaagaaaa aatttctgaa ttagtggttc + 12121 tcattgaaga tgatgagatt ctagctcgaa gaattaggaa tttagagttt tcttatcata + 12181 aaccactgat tgattatatt aatcatattc attttgtcag cttggatgtc aaagataaga + 12241 aaaacatcgg agcgcttgac cctattgtct ttttagaagg caatcaagcc acagagcttg + 12301 ccacgcaagt cacaaaaggt ttaattggcg ataagttaac agaagatgac cgctttgaga + 12361 attgtttcaa tcaaaaagtt caagaagtga ttgaagccag agccaaagga aaaacggtag + 12421 gacttttaaa tgtttttcaa ctcatggcaa aatcagaaga agattttatc agataccgag + 12481 cagaaaatat tttatctaaa atttcaggta cgatgttaga gctggtcttt tcagaaggtc + 12541 aaaattcctc agtcagtatg gatgaacata ttactatttt aggagtgaca ggcttaaatt + 12601 tagcgaaatc aggggaagtc aaaacagctc aaaatgaaat gtctgatatt atcatgtatg + 12661 ccttaggtga tttttgtcgg ttctttgggg cgagagatag agaacaggaa acggtcattt + 12721 ggttagatga aggttggttt tttaatacaa cagatattgg aaaaggaatt ttaatgcgaa + 12781 tgaaacgtgt cgggcgttca gaaaacaatt ttttagtttt gattagccaa agtgtgaaag + 12841 atggtgcatc agaagaagat gatacggcat ttggtacaat ctttgccttt aaagaaactg + 12901 ggaacacaac ggcagctctt aaagcgattg gactgcctga tgatgtggaa gaaatcatta + 12961 aatggtatga aaatatgaca aaagggctgg cgcttttgaa agacccattt ggtcgaattg + 13021 gtcgtgtggt cattcaaggt caaaattcag cgttgaatga atgctttaaa acctcattta + 13081 gtaaaatgaa atcaacgaag gcggtggcat aatgaaaaag aaaatgttgt tagtggtagg + 13141 gctgttggca tttttaggag gggttgccct acctagtcaa gcggatacgg cttttaacgt + 13201 tccaaccact cctagttttt cgagtgctaa aaatccaaca gtttcaaaag cccctacttc + 13261 atcatcttca acggcttcaa gcaaaagctc aaccacaagt ccttcttatc cagttaacaa + 13321 tgggtttgtt ggtggggatt tgggtgatta ttcttcgtct aactctccaa gtaaagtaat + 13381 gaatgaagta gagaagaaaa aagcgaggga aaatttagat aattatacct cttatatgta + 13441 ttttgatgat ggaaaatttc tcacgggctc aatgagtgct gggatgcaga ccttttttgt + 13501 tcgttctcaa tttttcgtca caaaaaccat ttatcggttt gtgaatgcgg tcaatgaaaa + 13561 actcaatagt gattctttga ttacacaatg gacagcgcaa atgtttgcga cagtaaaaaa + 13621 aatttacaat caattttcta accctcaact ttacccaatc attgccattg gcgttattag + 13681 tagcttattg tattattggt ttaaacgtcg ttttttagaa ggagtgagaa aagtcatact + 13741 ggtcatgtta ttagtggggc tttttatcaa tgggggtcaa aaactaactg aacaaatcaa + 13801 ttcatcattg aatacagcta caactacgtt gatgtcaacg gttaaggtgg caggcgtttc + 13861 ttcaagaaat tcaaatgatt taaaaacaac aatggtcgaa gtcccttttc tttatatgaa + 13921 ttttgataat gtcaaaatca atgcggatgg ttcatcaaat atttctgagg ataatattgt + 13981 aaaacttctc acctctgatg atgacaatga taagttaaaa acgattcaat ctgatttaaa + 14041 agattcacat ttgacctcga aaaaaatggg cgaaaaagta ttaactgctc tagccagtat + 14101 tttcaatgcg atattagttg gttttattta cctagctttt gcggtgatgg cttttgtcat + 14161 gcgaatgttt ttcttaattc tcttactttt actacccttt gtggggattc tttccttatt + 14221 tcctttcttt gatgtagtga ttttaaggtg ggcaaaagca acaggtgggg cgttgattgt + 14281 ttctaatgtg gtcgttattg ggacagcttt aattagtatc ttagatagta ttgtgtcttc + 14341 tgcggtaact tcaatgattg ggagcgatta tttctttatt acactcatca aatttattgt + 14401 ttatattatc ctctttaaaa agcgtgaaaa gattcttgaa atatttaagg caggacatct + 14461 ggggaatagt ggctttgcag ggcgtatgga tggcttactc tcaaatgtgc ggagaaaagg + 14521 ctcaaatatg attaaagctc cacttctagc aggttcttca gcaggactgg tcgcaggttt + 14581 aaccgcaggt caaatggcaa ctggtaaggc gaaagaaatt gctaaaaatc gtttgacaaa + 14641 cggtacaggc agtttatggc atggtggttt gaataaaaaa gcagaccgta ccatgaataa + 14701 aatggataaa gcaaatccta atagtaaaaa aggtcaaaaa ttacaggcta aagaagaaaa + 14761 aatcaaacaa cgtttggaaa aacgcaaaca gaaatttgaa aatcctaatc tgctaaaacg + 14821 aaaagtagct gactatcgca aacagtatca acaacgaaaa actatgaata acccaaatct + 14881 tgctcaaaag atggaacaaa aaaataaaga aaaaaatgct tcgattcaag ctctttatga + 14941 taaaaataaa actcaacttc aagcaagagc aattgagcgt agaatgcgtg aagctgttcc + 15001 tgaccaagaa aaacctaatc tatcagaatt agctaaaaat aagcaaaaag ctttagctaa + 15061 agaaaagtta gatgaaagag caatgaaaca atcagcaggt agaatggctg aaagatttga + 15121 aaaggaaaaa gttagtcata gtagttttaa acgtaaacca aactatcctt gggataataa + 15181 tgataccaat caaaaactta acaatccatt tgtgattgat gaaaaatagg gggtgaaaat + 15241 gaaaaaagca attaagcgga aggttatatt agttagcctt ccttttttgt tgcttttatt + 15301 gccaatatta gctttctttt cattatttgt tggttcaaat tcttcttcag atacagatat + 15361 taataccaat acaccacagc aacaaacagc aaaagtgatt tgggatagag ttctaaaaga + 15421 aggtggaacg aaagaagggg cggctgcttt acttggtaat aatcaagcag aaagtgaact + 15481 tcaaccttca attattcaat ctaatgcaac ttataatgaa gcaaaagcaa tggataccac + 15541 tttaggcggt tatgctttcg gtttggctca atgggatagt ggcaggcgag taaatttgct + 15601 taactatgca aaaagtcaga agaaatcttg gacagatact aatcttcaag tcgagttcat + 15661 gtttgagcaa gacggtacag attctacgtt gcttaaacaa ttaattaaag gaactaatgt + 15721 taagcaaaca actgaagata ttatgcgaaa gtgggaacgt gcaggggcgg ttgatagcct + 15781 ttcaaaacgt caaggttttg cggaatattg gtacacgttc atgacgactg gtggtgatag + 15841 tggaactggt ggcggttcag gtattactcc agatatacct tcaggttgga ctttggataa + 15901 accaattaac acaagcggtt atattacttc aagttatgaa tataaacaat gtacttggtt + 15961 tacgtggaat cgagcgaaag aattcggtat tacttttagt ccatttatgg gaaatggtgc + 16021 tgattggcaa catcaagcag gatatactgt aacgacaact ccaacactcc atagtgcggt + 16081 tagctttagc ggtggtcaaa cagtaggcgg tcaatggaac gcagacccag tttatggtca + 16141 cgtggctttt gtggaagcaa tacattcaga cggttcagtc ttaatttcac agtcaggaac + 16201 tggttttagt acggtttata ctttccaagt gctgacaaaa gcacaagcca gtcaattaca + 16261 ttacgtgata ggaaaataaa aaatagtcga ttaacgttcg gtattagcct agttttcacg + 16321 ttgaaaattc cagggttttg aaagttattt ccgaacaatg gaaaggagag agtatgacta + 16381 aacttgaaga agttagagca agtgggaaaa tgtcagaaag ggtattagag aataatttta + 16441 gacactttga ccacagactg cgagaaatag aaggagaatt aagactttac ccttatgcga + 16501 ctttatctga agttatagca tgggctgaac aactaaaaat agcaattggg aaaattaaag + 16561 caatacaaga aagtagtatt ataaaatcta aaaaagaatg gggaatctta gaagaaaaaa + 16621 tgttgggtta tttgcagata gacaaagcat ttattcatgt attttctgac catgttattt + 16681 tccttgttca attggaacag cggtatcggc aaagattaag tatttttgcg aacaatttag + 16741 ataatagtgt tcgctatcta aaaagatatg cggatgattt agaaaagcaa ggattttcta + 16801 taactggaat acttgctgaa agtagaaatt taagtgatat gaactggttg agtatcttaa + 16861 attattaatt tagaaaatta tgagggtata aaaatggaaa caccaaaaat ttatgttgta + 16921 aatttaaaca gttataacaa tggaagaaca agggggaagt ggtatgaatt acctgttgat + 16981 ttttcaagaa ttaaatcaga tttactttta gatgtagagc atggggaaga atatgcaata + 17041 catgactttg aaaattttta cggttataaa gtaggcgagt attcgtcaat tcaggaactt + 17101 aatgagtatg cggaaaaatt agaagaaatt tctgacatag aacatttaaa agattttctt + 17161 gaaatttata gtattgatga tgttatcaat aataaagatg atttggactt tgtggaagct + 17221 gaaaatgatg aagatttggc acaagaatta attgagcaaa tgggcggttt agaagttcta + 17281 agcgtagaaa cgttacaaag atattttaac tttggtgctt atggtcgaga tttagcaatt + 17341 ggtgattatt caaaaacaag tcatggatat attagagata tttaaaggtt aagtaaaaga + 17401 gcaagaaaaa ccttgctcta ttttttgttg gaggaaaaaa tggaagaaaa ttataaagat + 17461 aaacggggaa tttcaaaatt atttgatgta cctataaaaa cacttaataa tgatttaact + 17521 gaaatgagac gaacagaatt taatgtttat atattacgac caagtcataa acgtgtttat + 17581 ataaatgtcc agggttataa atcttttctt gaatataagc aaaaaataag agaaagtaca + 17641 atttagaaaa aagataaaag taatatacag atatgatata atataagtgc tgtatagctt + 17701 tcttttatct ttggtaaaag gaggaaatat gttttataag caacttgata gtggaaaata + 17761 tagatacttt gaaaaatatt tcgatgaaaa gagaaataaa tggcgacaag taacggtcac + 17821 tttaaaatca aaatcaaggg ttgctcaatc agaagctaaa aatagattag caagaaaaat + 17881 tgaacaatca aaaaaagtac caactgctat cgagcttcag gaacaaatcg ttcaaaataa + 17941 gacgatacaa gaaatttatg aagaatgggt tgtaattaga aaacaagatg ttaagccagc + 18001 aagttttgta gcggagcaaa tttctttaaa aggatttatc gaaaaatttt caaaatataa + 18061 agtctcagaa gtgacgaccg cagatataca aagttattta atggaattag atattgcgaa + 18121 ttcaacaaga aaaaatcgta gaatttacat tagaattttg ttcaaatatg ctgaaaacat + 18181 cgggtatatt aattcaaatc cagctgacaa agtagtatta cctaaagtaa ggttagaaat + 18241 tgaaacatta gaacgagcaa atgaaaaatt tttaagtaaa gaagaaatga gttctgtttt + 18301 gatattttgc aaatcttata aaaaaaatat aagatacact ttagctatgg aatttatttt + 18361 cctaacagga tgtagattcg gtgaatttgc ttctattcgt tatcaagatg ttgatttcaa + 18421 aaataagtta ctaagaattg accacacttt agaatatcgt gttgcaaaat atgatgatcg + 18481 agttattcaa acacctaaaa cggtaggttc gattcgtaca attagtttaa gtaatcgttg + 18541 cttggaaatt attgattatt tccaaaaaaa ctgtttagat gataagtttg tttttgtaaa + 18601 tgcggttggt ggaattttca gacaacctgt attttataag tttatttgtg ataattgtca + 18661 aaaagtatta ggaaatgaaa gaaaatacgg tatacattta ttgagacatt ctcatgtatc + 18721 attacttgtg gaacttggag ttccaattaa agcaattatg gaacgagttg gtcatagaga + 18781 cgagtcaatc actctgagga tttattctca tataagtggt acaattaaaa atgaaattag + 18841 tcaaaagttg aaccaaatta atctctaaa +// +
