Repository 'racon'
hg clone https://eddie.galaxyproject.org/repos/bgruening/racon

Changeset 0:1c2e93f2d7c0 (2018-06-11)
Next changeset 1:059c552c137a (2018-07-19)
Commit message:
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/racon commit f6dd7c41a45584b478b8af48df5294e3c39f5203
added:
macros.xml
racon.xml
test-data/consensus_result2.fasta
test-data/sample_layout.fasta
test-data/sample_overlaps.sam
test-data/sample_reads.fasta
b
diff -r 000000000000 -r 1c2e93f2d7c0 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Mon Jun 11 16:39:36 2018 -0400
b
@@ -0,0 +1,16 @@
+<macros>
+    <!-- Package dependency of the wrapper; children of the expanding element are inserted at <yield/>. -->
+    <xml name="requirements">
+        <requirements>
+            <requirement type="package" version="1.3.1">racon</requirement>
+            <yield/>
+        </requirements>
+    </xml>
+    <!-- Publication to cite for racon; children of the expanding element are inserted at <yield/>. -->
+    <xml name="citations">
+        <citations>
+            <citation type="doi">10.1101/gr.214270.116</citation>
+            <yield/>
+        </citations>
+    </xml>
+</macros>
\ No newline at end of file
b
diff -r 000000000000 -r 1c2e93f2d7c0 racon.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/racon.xml Mon Jun 11 16:39:36 2018 -0400
[
@@ -0,0 +1,105 @@
+<tool id="racon" name="Racon" version="1.3.1">
+    <description>Consensus module for raw de novo DNA assembly of long uncorrected reads.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+    <expand macro="requirements" />
+    <version_command>racon --version</version_command>
+    <command detect_errors="exit_code"><![CDATA[
+        ## racon selects its input parser from the file name suffix, so each input is
+        ## symlinked under a name ending in a generic fasta/fastq(.gz) suffix. Galaxy
+        ## subtypes such as fastqsanger are mapped onto their generic parent suffix.
+        #if $reads.is_of_type('fastq.gz')
+            #set $reads_file = 'reads.fastq.gz'
+        #elif $reads.is_of_type('fastq')
+            #set $reads_file = 'reads.fastq'
+        #elif $reads.is_of_type('fasta.gz')
+            #set $reads_file = 'reads.fasta.gz'
+        #else
+            #set $reads_file = 'reads.fasta'
+        #end if
+        #if $corrected_reads.is_of_type('fastq.gz')
+            #set $targets_file = 'corrected_reads.fastq.gz'
+        #elif $corrected_reads.is_of_type('fastq')
+            #set $targets_file = 'corrected_reads.fastq'
+        #elif $corrected_reads.is_of_type('fasta.gz')
+            #set $targets_file = 'corrected_reads.fasta.gz'
+        #else
+            #set $targets_file = 'corrected_reads.fasta'
+        #end if
+
+        ln -s '$reads' '$reads_file' &&
+        ln -s '$overlaps' 'overlaps.${overlaps.ext}' &&
+        ln -s '$corrected_reads' '$targets_file' &&
+
+        racon
+            '$reads_file'
+            'overlaps.${overlaps.ext}'
+            '$targets_file'
+            -t \${GALAXY_SLOTS:-4}
+            $u
+            $f
+            -w $w
+            -q $q
+            -e $e
+            -m $m
+            -x $x
+            -g $g
+            > racon_polished_consensus.fa
+    ]]></command>
+    <inputs>
+        <!-- The three datasets are passed to racon positionally, in this order. -->
+        <param type="data" name="reads" format="fasta,fasta.gz,fastq,fastq.gz" label="Sequences"/>
+        <param type="data" name="overlaps" format="sam" label="Overlaps"/>
+        <param type="data" name="corrected_reads" format="fasta,fasta.gz,fastq,fastq.gz" label="Target sequences"/>
+
+        <!-- No explicit name is given below: the command and the test refer to each option by its flag letter ($u, $w, ...). -->
+        <param argument="-u" type="boolean" truevalue="-u" falsevalue="" label="output unpolished target sequences" />
+        <param argument="-f" type="boolean" truevalue="-f" falsevalue="" label="perform fragment correction instead of contig polishing" />
+        <param argument="-w" type="integer" value="500" min="1" label="Size of window on which POA is performed" />
+        <param argument="-q" type="float" value="10.0" label="Threshold for average base quality of windows used in poa" />
+        <param argument="-e" type="float" value="0.3" min="0" max="1" label="Maximum allowed error rate used for filtering overlaps" />
+        <param argument="-m" type="integer" value="5" label="Score for matching bases" />
+        <param argument="-x" type="integer" value="-4" label="Score for mismatching bases" />
+        <param argument="-g" type="integer" value="-8" max="0" label="Gap penalty" />
+    </inputs>
+    <outputs>
+        <!-- The command redirects racon's stdout into this working-directory file. -->
+        <data name="consensus" format="fasta" from_work_dir="racon_polished_consensus.fa" />
+    </outputs>
+    <tests>
+        <test>
+            <param name="reads" ftype="fasta" value="sample_reads.fasta"/>
+            <param name="overlaps" ftype="sam" value="sample_overlaps.sam"/>
+            <param name="corrected_reads" ftype="fasta" value="sample_layout.fasta"/>
+            <param name="u" value="true"/>
+            <param name="f" value="true"/>
+            <param name="w" value="800"/>
+            <param name="e" value="0.2"/>
+            <output name="consensus" ftype="fasta" file="consensus_result2.fasta"/>
+        </test>
+    </tests>
+    <help><![CDATA[
+
+**What it does**
+
+Consensus module for raw de novo DNA assembly of long uncorrected reads.
+
+Racon is intended as a standalone consensus module to correct raw contigs generated by rapid assembly methods
+which do not include a consensus step. The goal of Racon is to generate genomic consensus which is of similar
+or better quality compared to the output generated by assembly methods which employ both error correction
+and consensus steps, while providing a speedup of several times compared to those methods.
+It supports data produced by both Pacific Biosciences and Oxford Nanopore Technologies.
+
+Racon can be used as a polishing tool after the assembly with either Illumina data or data
+produced by third generation of sequencing. The type of data input is automatically detected.
+
+Racon takes as input only three files: contigs in FASTA/FASTQ format, reads in FASTA/FASTQ
+format and overlaps/alignments between the reads and the contigs in SAM format. Output is a set of polished contigs in FASTA format printed to stdout.
+
+Racon can also be used as a read error-correction tool. In this scenario, the SAM file needs
+to contain pairwise overlaps between reads including dual overlaps.
+
+    ]]></help>
+    <expand macro="citations" />
+</tool>
b
diff -r 000000000000 -r 1c2e93f2d7c0 test-data/consensus_result2.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/consensus_result2.fasta Mon Jun 11 16:39:36 2018 -0400
b
b'@@ -0,0 +1,2 @@\n+>utg000001lr LN:i:46960 RC:i:200 XC:f:1.000000\n+ATGATTATCATCTACATATCACAACGTGCGTGGAGGCCATCAAACCACGTCAAATAATCAATTATGACGCAGGTATCGTATTAATTGATCTGCATCAACTTAACGTAAAAACAACTTCAGACAATACAAATCAGCGACACTGAATACGGGGCAACCTCATGTCAACGAAGAACAGAACCCGCAGAACAACAACCCGCAACATCCGCTTTTCTAACCAAATGATTGAACAAATTAACATCGCTCTTGAGCAAAGGGGTCGGGAATTTCTCAGCCTGGGTCATTGAAGCCTGCCGTCGGAGACTAACGTCAGAAAGAGAGCATATACATCAATTAAAGTGATGAAGAATGAACATCCCGCGTTCTTCCCTCCGAACAGGACGATATTGTAAATTCACTTAATTACGAGGGCATTGCAGTAATTGAGTTGCAGTTTTACCACTTTCCTGACAGTGACAGACTGCGTGTTGGCTCTGTCACAGACTAAATAGTTTGAATGATTAGCAGTTATGGTGATCAGTCAACCACCAGGGAATAATCCTTCATATTATTATCGTGCTTCACCAACGCTGCCTCAATTGCTCTGAATGCTTCCAGAGACACCTTATGTTCTATACATGCAATTACAACATCAGGGTAACTCATAGAAATGGTGCTATTAAGCATATTTTTACACGAATCAGATCCACGGAGGGATCATCAGCAGATTGTTCTTTATTCATTTTGTCGCTCCATGCGCTTGCTCTTCATCTAGCGGTTAAAATATTACTTCAAATCTTTCTGTATGAAGATTTGAGCACGTTGGCCTTACATACATCTGTCGGTTGTATTTCCCTCCAGAATGCCAGCAGGACCGCACTTTGTTACGCAACCAATACTATTAAGTGAAAACATTCCTAATATTTGACATAAATCATCAACAAAACACAAGGAGGTCAGACCAGATTGAAACGATAAAACGATAATGCAAACTACGCGCCCTCGTATCACATGGAAGGTTTTACCAATGGCTCAGGTTGCCATTTTAAAGAAATATTCGATCAAGTGCGAAAAGATTTAGACTGTGAATTGTTTTATTCTGAACTAAAACGTCACAACGTCTCACATTATATTTACTATCTAGCCACAGATAATATTCACATCGTGTTAGAAAACGATAACACCGTGTTAATAAAAAGGACTTAAAAAGGTTGTAAATGTTAAATTCTCAAGAAACACGCATCTTATAGAAACGTCCTATGATAGGTTGAAATCAAGAGAAATCACATTTCAGCAATACAGGGAAAATCTTGCTAAAGCAGGAGTTTTCCGATGGGGTTACAAATATCCATGAACATAAAGATATTACTATACCTTTGATAATTCATTACTATTTACTGAGAGCATTCAGAACACTACACAAATCTTTCCACGCTAAATCATAACGTCCGGTTTCTTCCGTGTCAGCACCGGGGCGTTGGCATAATGCAATATACGTGTACGCGCTAAACCCTGTGTGCATCGTTTTAATTATTCCCGGACACTCCCGCAGAGAAGTTCCCCGTCAGGGCTGTGGACATAGTTAATCCGGGAATACAATGACGATTCATCGCACCTGACATACATTAATAAATATTAACAATATGAAATTTCAACTCATTGTTTAGGGTTTGTTTAATTTTCTACACATACGATTCTGCGAACTTCAAAGCATCGGGAATAACACCATGAAAAATGCCTACTCGCTACTGCGCTGGCCCTGCTTATTACAGGATGTGCTCAACAGACGTTTACTGTTCAAACAAAACCGGCAGCAGTAGCACCAAAGGAAACCATCACCCATCATTTCTTCGTTTCTGGAATTGGGCAGAAGAAAACTGTCGATGCAGCCAAATTTGTGGCGGCGCAGAAAATGTTGTTAAAACAGAAACCCAGCAAACATTCGTAAATGGATT
GCTCGGTTTTATTACTTTAGGCATTTATACTCCGCTGGAAGCGCGTGTATTGCTCACAATAATTGCATGAGTTGCCCATCGATATGGGCAACTCTATCTGCACTGCTCATTAATATACTTCTGGGTTCCTTCCAGTTGTTTTGCATAGTGATCAGCCTCTCTCTGAGGGTGAAATAATCCCGTTCAGCTCTGTCTGCCAGTCGGGGGAGGCTGCATTATCCACGCCGGAGGCGGTGCTTGGCTTCACGCACTGACTGAGACTGCTTTGATGTGCAACCGACGACGACGACCAGCGGCAACATCATCACGCAGAGCAGAGCATTTTCAGCTTTAGCATCAGCTAACTCCTTCGTGTATTTTGCATCGAGAGCAGCAGCAACATCACGCTGACGCATCTGCATGTCAGTAATTGCCGCGTTCGCCAGCTTCAGTTCTCTGGCATTTTGTCGCGCTGGGCTTTGTAGGTAATGGCGTTATCACGGTAATGATTAACAGCCCATGACAGGCAGACGATGATGCAGATAACCAGAGCGGAGATCGCGGTCGCGGTGACTCTGCTCATACATCAATCTCTCTGACCGTTCCGCCCGCTTCTTTGAATTTGCAATCAGGCTGTCAGCCTTATGCTCGAACTGACCAGACCAGCGCCCGGCAGTGAAGCCCAGATATTGCTGCAACGGTCGATTGCCTGACGGATATCACCACGATCAATCATAGGTAAAGCGCCACGCTCCTTAATCTGCTGCAATGCCACAGCGTCCTGACTTTCGGAGAGAAGTCTTTCAGGCCAAGCTGCTTGCGGTAGGCATCCCACCAACGGGAAAGAAGCTGGTAGCGTCCGGCGCCTGTTGATTTGAGTTTTGGGTTTAGCGTGACAAGTTTGCGAGGGATGATCGGAGTAATCAGTAAATAGCTCTCCGCCTACAATGACGTCATAACCATGATTTCTGGTTTTCTGACGTTATCAGTTCCCTCCGACCACGCCAGCATATCGAGGAACGCCTTACGTTGATTATTGATTTCTACCATCTTCTACTCCGGCTTTTTTAGCAGCGAAGCGTTTGATAAGCGAACCAATCGAGTCAGTACCGATGTAGCCGATAAACACGCTCGTTATAAGCGAGATTGCTACTTAGTCCGGCGAAGTCGAGAAGGTCACGAATGAACTAGGCGATAATGGCGCACATCGTTGCGTCGATTACTGTTTTGTAAACGCACCGCCATTATATCTGCCGCGAAGGTACGCCATTGCAAACGCAAGGATTGCCCCGATGCCTTGTTCCTTTGCCGCGAGAATGGCGGCCAACAGGTCATGTTTTCTGGCATCTTCATGTCTTACCCCCAATAAGGGGATTTGCTCTATTTAATTAGGAATAAGGTCGATTACTGATAGAACAAATCCAGGCTACTGTGTTTAGTAATCAGATTTGTTCGTGACCGATATGCACGGGCAAAACGGCAGGAGGAGTGTTAGCGCGACCTCCTGCCACGCGGATTTCACGAAGGTCATGTGTAAAAGGCCGCAGCGTAACTATTACTAATGAATTCAGGACAGACAGTGGCTACGGCTCAGTTTGGGTTGTGCTGTTGCTGGGCGGCGATGACGCCTGTACGCATTTGGTGATCCGGTTCTGCTTCCGGTATTCGCTTAATTCATTCAGCACAACGGAAAGAGCACGACCTGGCTAACCAGGCTCGCCGACTCTTCACGATTATCGACTCAATGCTCTTACCTGTTGTGCAGATATAAAAATCCCGAAACCGTTATGCAGGCTCTAACTATTACCTGCGAACTGTTTCGGGATTGCATTTTGCAGACCTCTGCCTGCGATGGTTGGAGTTCCAGACGATACGTCGAAGTACCAACTAGGCGGAATCGGTAGTAAGCGCCGCCTCTTTCATCTCACTACACAACGAGCGAATTAACCCATCGTTGAGTCAAATTTACCCAATTTTATTCAATAAGTCAATATCATGCCGTTAATATGTTGCCATCCGTG
GCA'..b'GCCCCATAAATGACGCCCACGACTCGTTCGCACTGGCCCGTGCCGTGGAGTAGCTCATCTGGGCGTAATTCCGGGAAAGCTGCTCATACGAGACACCCAGCCCGGCAGCGATATACCGCAGCAGTGACTGCTCAAACACGGAGTAGCCGTTATCCGTATCCTGAGCCGTCTGCAGGTTCAGTGAGAGTACCGGCATCAGGTGCGGTACTTTTGCGCCTCCAGCCGGACCGGCGCTGCTGCGGCGTAATACGCGGCAATTTCACCAATCCAGCCGGTCAGCCTTTCCCGCTGCTCCTGACTGTTCGCGCCCAGAATAAAATCCATCGCTGACTGCGTATCCAGCTCACTCTCAATGGTGGCGGCATACATCGCCTTCACAATGGCGCTCTGCAGCTGCGTGTTTCTGCAGCGTGTCGAGCATCTTCATCTGCTCCATCACGCTGTAAAAACATTTGCACCGCGAGTCTGCCCGTCCTCCACGGTTCAAAACGTGAATGAACGAGGAGGCGCCCGCCGGGTAACTCACGGGGTATCCATGTCCATTTCTGCGGCATCCAGCCAGGATACCCGTCCTCGCTGACGTAATATCCCAGCGCCGCACCGCTGTCATTAATCTGCACACCGGCACGGCAGTTCCGGCTGTCGCCGGTATTGTTCGGGTTGCTGATGCGCTTCGGGCTGACCATCCGGAAGAACTGTGTTTAGAAAAGCCGCGACGAACTGGTATCCCAGGCCTGAACGAACAGTTCACCGTTAAAGGCGTGCATGGCCACACCTTCCCGAATCATCATGGTAAACGTGCGTTTTCGCTCAACGTCAATGCAGCAGCAGTCATCCTCGGCAAACTCTTTCCATGCCGCTTCAACCTCGCGGGAAAGGCACGGGCTTCTTCCTCCCCGATGCCCAGATAGCGCCAGCTTGGGCGATGACTGAGCCGGAAAAGACCCGACGATATGATCCTGATGCAGCTGGATGGCGTTGGCGGCATAGCCGTTATTGCGTACCAGATCGTCTGCGCGGCATTGCCACGGGTAAAGTTGGGCAACAGGGCTGCATCCACACTTTCACTCGGTGGGTTCCACGACCGCAACTGCCCTCCAAATCCGCTGCCACCGCCGCGTGATAACCGGCATATTCGCGCAGCGATGTCATGCCGTCCGGCCCCAGAAGGGTGGGAATGGTGGGCGTTTTCATACATAAATCCTGCAGGTCTCTCCCTGCGTCGCTGTGTCATGCCGGTCTGCACTTCCAGCTCTGCAATATATTTTCAGGTCAGACACGGAAGTGGCCGTAAACTCCACCCTTCGTCCGTCTTTCTGTACTGTTGCCACCCGTTTACCTGTCATCAGGTCATGCAGTGCCGCACGGGCAGCGGCAAGTTCTTCCTGTCGCGTCATTCATCCTCTCCGGATAAGGCACGGCACGGCGTAATCTGCCAGTGTTTTCTTGTTGGTTGCTGCACCATCCTCTTCCTGCAGGCTCGCCAGCAGCGCACTGAGATCCAGCTGCCAGCGGGAAATACTGATGCGCAGCGCCGCCAGCGCATAAACGAAGCAGTCGAGTGCCTCATTGCGTCGCTTTTGCTGTCCACAGTATTTTCCTGCCATCCACCCATTTTCGACCTGCTCTTCAGCAGTCAGCTGCTGCGCTTCGGGTCAGATCAAAATATCCGGGTTATTCGGGAATGAACGGCACCGGGAAGCGGTTCATCCCCTTCCGGCGTCAGTGTGAAGCGGTTATAAATCTGCTCTCTTCGCGGTATCCGTACCGATTTCGGTAAGGTAAACCCCGTTTTGTTTCGCTTACGTGGCATGCTGGCCACCGGCTTTCCGTAGACGGATGCCCCTTTAATGGGGATCACCCGGAACAGCCCATGTTTTTCGAGCGTTCATACACAATGGTCGGGTCAATCCCGCCAGTATCCCAGCAGATACGGGATATCGACATTTCTGCACCATTCGGCGGGTATAGGTTTATTATTGATGGCCTCAT
CCACGCAGCAGCGTCTGTTCATCGTCGTGGCGGCCCATAATAATCTGCCGGTCAATCAGCCAGCTTTCCTCACCCGGCCCCATCCCCATACGCGCATTTCGTAGCGGTCCAGCTGGGAGTCGATACCGGCGGTCAGGTAAGCCACACGGTCAGGAACGGGCGCTGAATAATGCTCTTCCGCTCTGCCATCACTTCAGCATCCGGACGTTCGCCAATTTTCGCCTCCCACGTCTCACGAGCGTGGTGTTTACGAAGGTTTTACGTTTTCCCGTATCCCTTTCGTTTTCATCCAGTCTTTGACAATCTTGCACCCAGGTGGTGAACGGGCTGTACGCTGTCCAGATGTGAAAGGTCACACTGTCAGGGAGCTCAATCTCTTCACCGGATGACGAAAACCAGAGAATGCCATCACGGGTCCAGATCCCGGTCTTTCGCAGATATAACGGGCATCAGTAAAGTCCAGCTCCTGCTGGCGGATGACGCAGGCATTATGCTCGCAGAGATAAAACACGCTGGAGGGGTCATCCGGCGTCCATTTGAGGCCAAACGGCGTCTCTTTGTCGCCAAATTTAAGATACTGCTCCTCCCCCGCAATGCGGGCAGGCAACATGAAAACGCATAAAATGCGGGGATTCACTGGCTGCACGCTCAATCTGACAGGTGCCTCTCACTTTTGGCGTGGAGCCACGGATGGACTTTGGCCAGACCGAGCCTTCAATACGCTTGTTACCCAGGAACGTCGGAGAGCCTTCCTGTTCAATATCATCATCAAAAGCAGCAAGTTCATCATAACCCGCCACATCCACCGACTTTCACGGTAGTTTTGCCGCTTTACCGCCCAGGCAGCACCAGAAGCCACGCCCATTAGTGAACGCTTCATGGTGAGCGTGTTATCCCGGTGCTTTTGCCATACCACGGGGCCAGCGCCAGCAGCGACGGAATATCACGAATAGTCGGCTCAACGTGGGTTTTCATAAAGTTCTCGGCATCACCATCCGTCGGCAACCAGATAAGGGTGTGCGCTGCTTATGCTCTATAAAGTAGGCATAAACACCCAGCAGCATTTTGGAATAACCGACACGGCAGACTTCACCACATTCACCTCACGGATGTAGTCGCTGCCCATCGCATTCATGATGGCCCGCTGAAAGGGCAGTGTTTCCCAGCGCCCTTCCTGGTATGCGGATTCTTTTCGGGAGATAGTAATTAGCATCCGCCCATTCAACGGCGGTCTGTGGCTCCGGCCTGAACAGGAGCGAAGCCCGGCGCGGACAAAATGCCGCAGCCTGTTAACCTGACTGTTCGATATATTCACTCAGCAACCCCGGTATCAGTTCATCCAGCGCGGCTGCTTTGTTCATGGCTTTGATGATATCCCGTTTCAGGAAATCAACATGTCGGTTTTCCAGTTCCGGAAAACGCCGCTGCACCGACAGGGGAGCCGTCGAGAATACTGGCAATTTCACCTGCGATTGAGCGACAGCACGAAAGTACAGAATGCGGTTTCCACCACTTCAGCGGAGTCTCTGGCATTCTTCAGTTCCTGTGCGTCGGCCGGCGCACGCGTAAGTCGATGGCGTTCGTACTCAATAGTTCCTGGCTGGAGATCTGCCTCGCTGGCTGCTGCCGCAGTTCTTCAACCTCCCGGCGCAGCTTTTCGTTCTCAATTTCAGCATCCCTTCGGCATACCATTTTATGACGGCGCTGCAGAGTCATAAAGCACCTCATTACCCTGCCACCGCCTCGCAGAACGGGCATTCCCTGTTCCTGCCAGTTCTGAATGGTACGGATACTCGCACCGAAAATGTCAGCCAGCTGCTTTTGTTGACTTCCATTGTTCATTCCACGGACAAAACAGAGAAAGGAACGACAGAGGCCAAAAGCTCGCTTTCAGCAGCCCTGTCGTTTCCTTCTTTCAGAGGGTATTTTAAATAAAAACATTAAGTTATGACGAAGAAGAACGGAAACGCCTTAAACCGGAAAATTTTCATAAATAGCGA
AAACCC\n'
b
diff -r 000000000000 -r 1c2e93f2d7c0 test-data/sample_layout.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sample_layout.fasta Mon Jun 11 16:39:36 2018 -0400
b
b'@@ -0,0 +1,2 @@\n+>utg000001l\n+AAAGTGATAATGATTATGATTATCATCTACATATCTACAACGTGCGTGGAGGCCATCAAACCACGTCAAATAATCAATTATGACGCAGGTATCGTATTAATTGATCTGCATCAACTTAACGGTTCAAAACAACTTCAGACAATACAAAGGTCAGCACTGAATACGGGGCAACCTCATGTCAACGAAGAAACCAAAGAACCCGCAGAACAACAACCCGGACCCGCTTTTCCAACCAAATGATTGAACAAATTAACATCGCTGAGCAAAGGGAGTCGGGAATTCTCAGCCTGGGTCATTGAAGCCTGCTGGAGACTAACGTCAGAAAAGAGAGCATATACATCAATTAAAGTGATGAAGAATGAACATCCCGCGTTCTTCCCTCGAGAACAGGACGGTATGTAACCCCACTTAAGTCCCGAAGTCGCAGGAGTGAAGCATCTGAGTTGCAGTTACCACTTTCCTGACAGTGACTTGCGTGTGTGTTGGCTGGTGTCACAGACTAAATAGTTTGAATGATTAGCAGTTATGGTGATCAGTCAACCACTAGGAATAATCCTTCATATTATTATCGTGCTTCACCAACGCTTCCACTTCCTCGCATCCTTCCCCTACACCTTGCTGTTCTACATGCAATTACAACATCAGGGTAACTCATAGAAATGGGTGCTATTAAGCATATTTACACGAATCAGATCACGGAGGAGTAAATCAGCAGATTGTTCTTTATTCATTTTGTCGCTCATGCGCGCTTGCTCTTCATCTAGCGGTTAAAATATTACTTCAAATCTCTTTCTGTATGAAGATTTGAGCACGTTGGCCTTAAGCCATCTGTCGGTTTAGCGTTGTATTTCCCTCCAGAATGCCAGCAGGACGCAATTTTGTTACGCAACCAATACTATTAAGTGAAAACATTCCTAATATTGACATAAATCATCAACAAACACAGGAATAAGACAGATTGAACGATAAAAACGATAATGCAAACTACGTGCCTGCAGTACAGGGGAAGTACCAGCATGGAGCCGAGAGATGCCATTTAAAGAAATATTCCAATCAAGTGCGAAGGATTTAGACTGTGAATTGTTTTTATTCTGAACTAAACGTCACAACGTTCACATTATATTTGTTATCTAGCCCAGACTACTGTCGCCTTCGTGCCACGCTACAGCCGCGTGTTATAACCCGCCAATCTTAAAAAGGTTGTAAATGTTAATTCTCAAGAAACACGCATTATAAGAAACGTCCTATGATAGATTGAAATCAAGAGAAATCACATTTCAGCAATAAGGGAAAAATCTTAAAGCAGGAGTTTTCCGATCGGTTACAAATATCCATGAACATAAAGATATTACTATACCTTTGATAATTCATTACTATTTACTGAGAGCATTCAGAACACTACACAAATCTTTCCACGAAGCTCATAACGTTGCTACGCTTCTTCCGTGCGTGTCAGCACCGGGGCGTTGGCATCAATGCAATACCGTGTACGCGCTAAACCCTGTGTGTGCATCGGTCCTCAATTATTTACGCCGGACACTCCCCGCAGAGAATTCCCGTCAGGGCTGTGGACATAGTTAATCCGGGATCACGACCGATTGCCGCACCGAGAATACAGCAGTAAATATTAAATATGAAATTTCAACTCATTGTTTATAGGGTTTATTAATTTTCTACACATACGATTCTGCGAACTTCAAAAAGCATCGGGAATAACACCATGAAAAATGCCTCGGGCCTCCGCCCCTGCTTATTGGATGTGCTCAACAGACGTTTACTGTTCAAACAAAAGCAGCAGTAGCACCAAGGAAACCATCACCATCATTTCTTCTTTCGTTTCTGGAATTGGGCAGAAGAAAACTGTCGTGATGCAGCCAAATTTGTGGCGGCGCAGAAAATGTTGTCAAACAGAAACCCAGCAAACATTCAAATGGAATTGCTCGGTTTTATTACTTTAGCATTTATA
CTCATGGAAGCGCGTGTGTATTGCTCAATAATTGCATTCATGCATTACAGTCCGATATGGGCAACTCTATCTGCACTGCTCAGGATATATTTCTGGGTTCCTTCCAGTTGTTTAGCAGTGATGATCAGCCTCTCTCTGAGGGTGAAATAATCCCGTTTAAGCTCCGTCTGCCAGTCGGGGGAGGCTGCATTATCCACGGAGGCGGTGGTGGCTGCATTCACGCAGCACGACCCCGTGGAGTGGCAAATGAGCACGACGAGAAGAGCTTAACATCATCACGCAGAGCATCCTTCAGCTTAGCATCAGCCTACTAACTAATTCGTGCCTTTCCCATTTCGGGCTGCCGGCGATAATACAGCCCGCTGACGCATCTGCAGTGTCAGTAATTGCCGCGTTCTCAGCTTCGTTTTCTCTGAGAGCATTTTGTCGCGCTCCGTTGTAGGCATGGCGTTATCACGGTAATGATTAACAGCCCATGAATAAGCAGACGATGAGGATGCAGATAACCAGAGCGGAGATACTAATCGCGGTGACTGCTCATACGTAATCTCTGACCGTTCTCACGCTTCTTGAATTTGCAATCAGGCTGTCAGCCTTATGCTGAACTGACCAGACAGGGGACGGCAGTGAAGCCCCAGATATGCTGCAACGGTCGATTGCCTGACGGATATCACCACAGATCAATCATAGGTAAAGCGCCACGCGGGCTTAATCTTGCTGCATGCCACAGCGTCTGACTTTCGGAGAGAAGTCTTTTCAGCCAAGCTGCTTGCGGGTAGGCATCCCACCAACGGAAAGAAGCTGGCTCAGTCGGCGCCTGTTGATTTGAGTTTTGGGTTTAGCGTGACATTTTGCTCCTGCAGGGAAGCTCCCAGCAGCGCACACCGCCTCCGAGACACAATAGTCCATAACCATGATTTCTGGTTGGTAGTCGTTATCAGTTCCCTCCGACCACGTCAGCATATCGAGGAACGCCTACGTTGATTATTGATTTCTACCATCTTCTACTCCGGCTTTACAACGGCAGCGAAGCGTTTGATAAGCGAACCAATTCGAGTCAGTACCGATGTAGCCGATAAACACGCTCGTTATAAGCCGAGATTGCTACTTAGAGTCCGTGAAGTCGAGAAGTACAGGAGAATGAACTAGCGGCGATAATGGCGCGCGCACATCGTTGCGGTTCGTCGATTACTGTTTTGTAAACGCACCGGGTTTATATCTGCCTCGAAGGTACGCCATTGCAAACGCATTAAAGCAATGCCTTGTTCCGGCTCCTTTGCCGCGAGAAGCGGCCAACAGGTCATGTTTTTCTCGGCATCTTCATGTCTTACCCCAATAAAGGGATTTGCTCTATTTAATTAGGAATAAGTGATTACTGACGCTAAACAAATCCAGGCTGTGTTTATAATCAGATTTGTTCGTGACCGATATGCACGGGCAAAACGGAGATTTGTCCCCTGGCTCCTGCCTCGCCCGCTTCACGAAGGTCATCCCGAGGGAAGGAGCCCGTACACGTCCCAGCATGAATCCCAGAGAAGACAGTGGCTACGGCTCAGTTTGGGTTGTGCTGTTGCCTGGCGGCGATGACGCCTGATGGATTTGTGATCCGGTTCTGCTTCGGTATTCACTCACGGTGATTCACACAACGCGGAAAGAGCAGATCTGGCTAACCAGGCTCGACTCTTCACGATTATCGACTCAATGCTTATTACCTGTTTGTACCACTACAAAAACCCCGAAATCCATTCATGCAGGCTCACTATTACCTGCGAACTGTTTTCGGGATTGCATTTGCAGACCTCTCTGCCATGCGATGGTTGGAGTTCCAGACGATACGTCGAAGTGACCAACTAGGCGGAATCGGTAGTAAGGCCCCCTCTTTTCATCTCACCCACAACGAGCGAATTAACCCATCGTTGAGTCAAATTTACCCAATTTATTCAATAAGTCAATATCATGCCGTTAATATGTTGCCATCCGTGGCAATCATGCTGCTAACG
TGA'..b'TGCCGTGGAGGAGCTCATCTGGGCGTAATTCCGGGAAAGCTGCTCATACGAGACACCCAGCCCGGGCATGCGATATACCGCAGCAGTGACTGCTCAAACACGGAGTAGCCGTTATCCGTATCCTGAGCCGTCTGCAGGTTCAGGTCATCTAGCATCAGGTGCGGTACTTTGCGCCTCCAGCCGGACCGGCGCTGCGATGCGTAATACGGCAATTTCACTCAATCCAGCCGGTCAGCCTTTCCCGCCTGCTCCTGACTGTTCGCGCCCAGAATAAAATCCATCGCTGACTGCGTATCCAGCTCACTCTAATGGTGGCGGCATACATCGCCTTCAATGGCGCTCTGCAGCTGCGTGTTTCTGCCCGTGGTTGCTGAGCATCTTCATCATCTGCTCCATCACGCTGTAAAACATTTGCACCGCGAGTCTGCCCGTCCTCCACGGGGTTCAAACGTGAATGAACGCTGGAGGCGCGCCCTAGTATAACTCACGGGGTATCCATGTCCATTTCTGCGCATCCAGCCAGGATACCCGTCCTCGCTGACGTAATATCCCCAGCGCCGCACCGCTGTCATTAATCTGCACAAGGCACGGCAGTCCCGGCTGTCGCCGGTATTGTTCCTGATGCTGATGCGGTCATGCGTGACCATCCGCCAGAACTGTGTCCGGAAAAGCCGGAGACGAACTGGTATCCCAGGCCTGAACGAACAGTTCACCGTTAAAGGCGTGCAAGGCCACACTTCCCGAATCATCATGGTAAACGTGCGTTAAAACGCTCAACGTCAATGCAGCAGAGCAGTCATCCTCGGCAAACTCTTTCCATGCCGCTTCAACCCGGAAAGCACGGGCTTCTTCCTCCCGATGCCAGATAGCGCCAGCTGCTTGGGCATGACTGAGCCGGAAAAGACCCGACGATGATCCTGATGCAGCTGGATGGCGTTATTGGCGGCATCGTTATTGGGCCAGATCGTCTGCGCCGGCATTGCCACGGGTAAAGTTGGGCAACACAGGGCTGCATCCACTTTCACTCGGTGGGTTCCACGACCGCAACTGCCCTCCAAATCCGCTGCCACCCCGGGTCAACCGGGATATTCATCGATGTCATGCCGTCCGGCCCCAAAGCGGGGAATGGTGGGCGTTTTCATACATAAATCCTGCAGGTCTCCCTGCGTCGCTGTGTCATGCCCCGGTCTGCACTTCCAGCTCTGCAATATGTTTCCAGTACCACGGAAGTGGCCGTCGACTCCACCTTCGTCCGTCTTCTGTACTGTTGCCACCCCGTTTACCTGTCATCAGGTCATGCAGTGCCGCACGGGCAGCGGCAAGTCTTCCTGTCGCGTCATTCATCCTCTCTGGATAAGGCACGGCGTAATCTTGCCAGTGTTTTCTGTGCTTGGTTGCTGGACCCCTTCCTGCAGGCTCGCCAGCAGCGCACTGAGATCCAGCTGCCAGCGGAAATACTGGGTGATGCGCAGCGCCGCCAGCGCATAAACGAAGCAGTCGAGTGCCTCATTGCGTCGCTTTGCTGTCCCACAGTATTTTCCTGCCATCCACCCATTTTTCGACCTGCTCTTCAGCGCAGTCAGCTGCTGCGCTTCGGGTCAGATCAAAATATCCGGGTTATTCGGAAGTGAACGGCACCGGGAAGCGGTTCATCCCCTTCGGGCGTCAGTGTGAAGCCGGTTATATAAATCTGCTCCTTCGCGGTATCCGTACCGATTTCGGTAAGGTAAACCCCGTTTTGTGCTTCGCTTAATGGCGGATGCTGATTCACCGGCTTTCCGGTAGACGCGGGTTGCCCCTTAGCATGGGGATCACCCGGAACAGCCCAGCTTTTCCGGGCGAGTTCATACACAATGGTCCTGGTCAGTCAATCCCGCCAGTATCCCCAGCGCAGGATACGGGATATCGACCTTCTGCTGCACCATTCGGCCGGGTATAGGTATTTTATTGATGGCCTCATCCACGCAGCAGCGTCTGTTCATGGTTTAGTGG
CGGCCCATACGTAATAATCTGCCGGTCAATCAGCCGAGCTGTTCCTCTACCAGCCCCGGTACCGCCATACGCATTTCGGGCTGTCCAGCTGGGAGTCGATACCGGCGGTCAGGTACAGCCAATCGTCACGGAAACGGGCGCTGAAGACGAATAATGCTTCCGCCTTGCCATCATTTCAGCATCCGGACGTTCGCCAATTTTCTCCTCCCACGTACCTGACTACGAGCGTGGTGTTTACGAAGGTTTTACGGTTTTCCCCGTATCCCTTCCACTTCATCCAGTCTTTGACAATCTTAAGAGGTGAGGAACGGGCTGTACGCTGTCCAGATGTGAAAGGTCACACTGTCAGGGCGTCCAATCTGTTCACGGATGACGAAAACCAGAGAATGCCATCACGGGTCCAATCCCGGTCTTTCGCAGATATAACGGGCATCAGTACACTGAAGTCCAGTGCTCCTGCTGGCGGATGACGCAGGCATTATGCTCGCAGAGATAAACACGCTGGAGGCGATTCATCCGTCATTTGAGGCCAAACGGCGTCTCTTTGTCCGCCTAAATTTAAGATACTGCTCTCCCCCGCAATGCGAGCAGGGCAACATGAAAACGCATAAAATGCCGGGATTTCACTGGCTGCACTCAATCTGACAGGTGCCTCTCACTTTGGCGTGGAGCCACGGATGGACTTTACAGACCGAGCCTTCAATACGCTTGTTACCCAGGAACGTCGGAGAGCCTTCCTGTTCAATATCATCATCAAAAGCAGCAAGTTCATCATAACCCGCCATCCACCGCTAATCTTCACGCTTAGTTTTGCCGCTTTACCGCCCAGGCAGCCCAGAAGCCACGCCCATTAGTGAACGCTTCATGGGCCGTGTTATCCCGTGCTTTTGCCATACCACGGGGCCAGCGCCAGCAGCGACGGAATATCACGAATAGTCTATCCAACGTGGGTTTTCATAAAGTTCTCGGCATCACCATCCGTCGGCAACCAGATACCGGTGTTGCGCTGCTTATGCTCTATAAAGTAGGCATAAACACCCAGCAGCATTTTGTAGAATAACCGACACGGCAGACTTCACCACATTCACCTCACGGATGTGGTACCTGCTGCCATCGCATTCATGATGGCCCGCCTGAAAGGCAGTGTTTCCCCAGCGCCCTTCCTGGTATGCGGATTCTTTCGGGAGAGATAGTAATTAGCATCCGCCCATTCAAACGGCGGTTCTGTGGCTCCGGCCTGAACAGGTGGGAAGCCCGGCGCGGACAAATGCCGCAGCCTGTTAACCTGACTGTTCGGTTATATTCTGACTGATGAGCAACCCCGGTATCAGTTCATGCAGCGCGGCTGCTTTGTTTGTCATGGCTTTGATGATATTTCCCGTTTCAGGAAATCAACATGTCGGTTTTCCAGTTCCGGAACGCCGCACCGACGGAGAGCCGTCGAGAATACTGAATTCACCTGCGACGTGTGACAGGCACGAAAGTACGAATGCGGTTTCCACCACTTCAGCGGAGTCTGGCATTCTTCAGGTTCCTGTGCGTCGGCCGGGCACGCGAGTTAGATGGCGTTCGTACTCAATAGTTCCCTGGCGTTCGCGATTCTGCCTCGCTGTGCCTGCTTGCCGCAGTTCTTCAACCTCCCGGCGCAGCTTTTCGTTCCAATTTCAGCATCCCTTCGATACCATTTTACTGACGCTGCAGAGTCATAAAGCACCTCATTACCCTGCCACCGCCTCGCAAGAACGGCATCCCTGTTCCTGCCCAGTTCTGAATGGCGGTAACGGGATACTCGCACCGAAAATGTCGAGCCATAGCTGCTTTGTCTTGACTTCCATTGTTCATTCCACGGACAAACAGGAAAGGAACGACAGAGGCCACAAACCCGCTTTCAGCTACCCTGTCGTTTCCTTCTTTCAGAGGGGTATTTGTAAAGTAAAAACATTAAGTTATGACGAAGAAGAACGGAAACGCCTTAACCGGAAAATTTTCAAATAGCGAAA
ACCCGC\n'
b
diff -r 000000000000 -r 1c2e93f2d7c0 test-data/sample_overlaps.sam
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sample_overlaps.sam Mon Jun 11 16:39:36 2018 -0400
b
b'@@ -0,0 +1,257 @@\n+@PG\tID:minimap2\tPN:minimap2\tVN:2.1.1-r369-dirty\tCL:minimap2 -Qax map-ont sample_layout.fasta sample_reads.fastq\n+@SQ\tSN:utg000001l\tLN:47564\n+1\t0\tutg000001l\t29076\t60\t28S21M1D12M1D15M1I16M3D3M2I10M1D2M3D7M2I2M4I4M1I21M1D6M1D15M2I27M1I15M1D23M1I5M1I2M7I7M3D1M2D5M1I6M6D4M1D9M1I4M2D4M1I1M1I4M1I38M5I2M3D10M1D9M1D3M1I7M5D29M1D2M3I8M4I4M1D2M6D10M4I1M1D16M3D2M6I5M2D2M1I5M4D28M1D13M1D9M2D5M2I8M1I3M3I21M1D4M1D7M2D4M2D9M4I4M1D30M2I3M1I5M2D3M1D10M1I7M2D7M1I12M1D2M1D14M1I6M1D5M1D3M3I7M1D5M1I3M1D3M1D8M2D7M1I24M1D6M3I14M1D13M3D13M2I6M2D5M3I16M1D5M2I11M1I2M1D1M1D4M1D3M1D2M1I18M1D12M1D40M1D6M1D2M2D5M1I6M3D3M1D6M2I1M1D7M2D3M3D11M2I3M1I18M2I6M2D4M1D8M4D6M1D3M1D5M1I9M2I37M1I3M1D1M1D3M2D4M2I25M1I10M1D1M2I18M2I5M1I6M1D6M1D18M2I2M1D1M2D1M1D6M1D6M1I36M1D2M1D9M1I33M1I18M1I17M2I2M1I2M1I5M1D5M1I2M3I3M2I1M2I5M1D2M2D3M1D2M1D4M7I19M1D8M2I20M1I10M1D9M1D3M1D2M1I31M1D8M2I3M2D5M1D6M2I1M1I10M1I7M3I2M1D20M3D20M1I2M2I4M1I4M2I7M1I17M1I15M2D1M1D21M1D20M2I3M1D8M1D3M2D15M1I5M2I5M1D7M1I10M3D32M1I20M2I20M38S\t*\t0\t0\tAGGTAGCCTGTTTTATGAGTGGGGATTACAAAGGATGGTCATCGGTCACGTGACAGTACGGGTACCTGACGGCCGTCACACTGCTTTCACGCTGGCTAGGAAAAGCCGGCCCGCCTTTGTAGGGCCAATGTCCCCGACGATTTTCCGCCCTCAGCGTACCGTTTATCGTACAGTTTCAGCTATCGTCACATTACTGAGCGTCCCGGGGTTCGCATTCACACTGCCACACTGATATCCGCATTTTAGCGGTCATTTCAGTTTGCTGTGTCAGGGAAAGCGGAGGATTGCGCAGGCCTGTAGTAAGCGTGAGCGTCAGGCGGTGCTTCAGGAACACTTCTTCGTTCGCTGAATATCTGGTTGCCCTGCGCCAAACGACCGGCGTTCATTCCCGTTTGCCGTATAATAAATGCATCCCACGATTGGCGGCATGATCCAGAAACTGGGCTCAGTTTGCCTTCCTCCGTGTCCTCCATGCTCAGCGGACCCGCGACATAATGTTTGCCGTCTTTATTCTGCTCAATTTGACGACGCCCGGGCATTCACACTTATCGACTGGCGGCATCCTTCCACTCTGTTCGAAACCCTCCAGTGCTTAGTTATCCTCCGTCATAGCCGGACTTTTCCAGCAGCTCCTGCCGAGGTATGAGGATTGCTTCTTGCCTTTGGAAAATCGAGGTAACCTTCCGCATCATGCCGCCCGACCGACGGCCTCCACGAATGCCGATTTGCCAACGTGTTCCACTGCGAGATAAACATAATCGCTGGCCCGGTTTGATATTGATACTGCGGCTATCCAGTACAGCGCCGTACCAAGATAACGCGTGCTGGTTTCAATGGCTGTCTGATATCCGCAATCTGCTTTTCAGGGGACCAGAACTCAAACTGTACCGTCCGTATAAACGGCAAGATGCGGCGTGGCGGTTATCTGAAGACCCCGGCGTCAGCTCAATCCTCGACGGTGCTGCAGCAATCAGA
ACGGAATACCATAAGGACCCGCTTAATCGCGCGCCCGCATTTACCGCCCGGTGACTGTCGACCTGTAGTTCCCCAGCGCCAGTGCGTGAAGCGGTATGTGGTTTCCGTCGTCCGCTGCCGTGCTGACCAGCCGCTCACTGCCGTCGTCGTCCGTTACGGTCACGGCCAGCAGGAAACTCACGCCGGTCCCTAGGCTTCGGTGTGTCCCATCGCGCCAGCACCTGATATTCCATGTTGTAGCAGTACTTCTGCGGTCAGGTGCAGTGAGGGGCGGGCGGGATCACCATTCACCGTGCCACTCTGTTCGCCGTTACACTGCACCCGTTATCCACGATGGCCTCTTTTCCGGCACATGCTGCACGCGGGGCGATGGCATACGTGCCGTCGTCGTTCTCACGGATACTCACGCAGCGGAACAGTCACCTCTGGCTGGCGCAGCGAGCGGTTCGGCAAGCTTCAGCTCCCATACGGTGGGTCAGCAACACCGTCAGGAACACGGCTCACTTTACCTTCAGCCGTCGGTGACGACTGAACCTCCACGCTGACCGGATTGCCATTTCCGTCAACCCGAGGGATGACGGGGTCAAGGAGGATGGCAGCGTGATTCAATCCGTCGAGCGTCAGCGTCCGGTATTGGCTGTTCACACAGGCACACGACCACCGGTTAACTGATACCGGCATCATAGTCATCATGGCGCAGATTTCAATAACATCGCCCGGTACCATGGGGCAACGGATTCTGCGCCGACGGTATGAAATCCACGTCCGTTTCCAGCAGTTCTTGTTTTAATCATAGCCACATGCCCGGCGCGGTGCCTGCCCCGGCTGGTACAGCCAAAGGCATCCATCTTCGTAACATTACGACCTGTAACGGGCAATGGCCTGCGTATCTTCAACAAGCTCTGTCGCCGTCTCGAGTAGATAC\t*\ttp:A:P\tcm:i:20\ts1:i:190\ts2:i:0\tNM:i:485\tms:i:968\tAS:i:968\tnn:i:0\n+2\t0\tutg000001l\t26590\t60\t49S4M1I21M1D7M2D3M1I25M1I12M2I7M1D6M4D3M1I3M1D3M2I11M1D4M2I12M8I1M2I5M2I8M2I4M1I1M4I27M1I19M2I5M3I17M1I1M2I11M1I1M2D8M11I5M1D15M2D10M2D9M3I1M1I3M1D3M1I6M1I26M2I7M1I15M1I23M3D6M6I9M1I12M1I2M1I3M2I16M2D4M2I13M1I9M1D30M2I16M1D3M1D14M8D15M1D7M1D12M1I7M9I2M2D7M1I15M6I2M1D32M1I6M1D5M1D7M1I1M1I32M1D10M1I6M1I21M1D8M1D2M1I4M2I9M2D3M5D11M3I5M1D10M3I7M2D3M1D2M1D3M1D11M3D10M3I2M1I3M3I2M2I11M1D7M2I7M3I12M1I4M1I4M4I5M3I38M5I3M7I7M3D4M2I11M3D26M4D7M2I11M1D1M1D14M2I9M3I24M3D11M1D41M2I12M1I23M4I3M1D15M2I2M1D9M2D3M1I2M2D15M1I6M2D8M1I12M3D7M2D13M3I9M6D5M1I16M4I46M4D11M2I6M1I10M2I21M1I28M1I2M1I6M3D1M1D11M2I5M1D3M1D19M1I8M2D6M1D10M1I5M1D3M1I12M3I6M2I37M1D6M1I38M3I15M1I24M2I10M1D28M1D11M2I3M2D7M6I5M1I17M1I5M1D11M2I22M2D9M1D1M1D8M3I3M2I8M2D1M2D18M1I6M2I9M5I23M6I15M1D13M1I13M1I23M2D4M2D15M2D7M1I11M1I20M2D3M1D5M1D10M1I6M1D10M1D14M1I16M1I4M1D2M1I5M1D9M1D28M1I9M2I8M2I11M3I8M1I26M1D4M2I5M2I3M1I5M1D5M3I4M1I5M3D5M1I12M1I10M2I8M2I14M2D14M5I6M1D3M1D7M2D3M2I4M1I13M1D6M1D8M2D2M1I29M1D14
M2I3M2D30M2I4M1D4M1I6M1I14M2I2M2D9'..b'AATCAATACATGCTTCCCAAATATTCGCGCATGACTCGAACAAGAGCCGGTATCGAATCTTTTAGCTCGTACCATGTCCTGATACAGGGCTTGATAATCAGGATTTCTGAATACATTTCGCGATACCGTCCCAGCGACATTCTTCCTCGGTACATAATCTCCTTTAGCGTTTCCGATGTCCGTCAAAGGCACATGGGATCCCGTGATGACCTCATTAAAACACGCTGCAATCCAATATTCCCTCATCTTTGCAGGCAAGTCCGATTTGCGTTGATTTTAATGCAGAATATGCAGTTACCGAGATGTTCCGGTATTTGCAGCAAATGAATGGTTGTTGCTTCCACCATGCGAGGATATCTTCCTTCTCAAAGTCTGACAGTTCAGCAAGATATCTGATTCCAGGCTTTGGCTTCGGCCATTCGGTTCATCAGCTCTATCCCAATCTCCACGATCTTAATTCCTCACCCGAAATGGTCATCACAGTATTTGGTGAAGGGAACGAGTTGTCAATCTGTCAGTGCAGAACGCGCCGGACGTATGGAGTGCCATATTTTCTTTACCATATCGATAAATGGCTTCGAACAGGCATTCGCGTCTGAATATCCTTTGGTTCCCATACCGTATACCCATTTGGCTGTCCAAGCTCCGGGTTGATATCATCACTGCAATGATACCGGTGAGCCGGTATCCAGAACTTCACAACTTCCCTGACAAACCGATATGTCATTGGATGTTCACAACCTGTATCCATGAAAACGTAATGCGTCTTTACCTGCCGTCGCTTTGCTCCATTAGCCAGAGCAAATAGTTGCTGACGTCTCATGCCACCGGAGAAACTAACGACATTTATCATGCAGCCTGTCTCTCCCCATCGCTTTCCACTCCGAGCCAGTCTCGCTTCGTCTGACCACCTTAACGCCACGCTCTGTACCCGAATTAATGACTGCCTGTATAAGCTCTAATATGCTCCCAAATTCGCCTACACGCATCCTGCTGGTTGACTGGCATAGATCACACAGCCATTCCCGGCAAGGTTAGAATAACATCCTGCTGCTTTAATGCTGCGGTAAACACACTTCCAGCCAGCTTTCTGCATCCAGCCAGCGACCATGCCATTCAACCTGACGGAGACGTCACCTAAGCAGGCCCATAGCTTCCTGTTTGGTCTAAGCTGCGGTTGCGTTTCCTGAAGAATGGGTTACTACGATTGGTTTGGTTGGGTCTGAGAAGGATTTGCTTACTGTGAATAGCGTTTTGCTGATGTGCTGGAGAGTACCGAATTTCAAAGGTTAGTTTTCATGACTTCCCTCTCCCCCAAATAAAGCGCCTGCGATTACCAGCAAGGCCGTTGATCAGTAATGTAGATGGTCATCTTTTAACTCCATATACCGCCAATACCCCGTTTCATCGCGGCACTCTGGCGACATCTCCTTAAAACCAGGTTCGTGCTCATCTTTCCTTCCCGTTCTTCCCTGGAGCAAACCGGTAATACCACCGTTCAGACCTTACTTCGATAACCAGAAGACCTGCCCGTGCCATTTTAGCCGCGGCCTGATTTATGCTGGTTACTCGGTTGCGCCTGTTAGCGCGGCAACGCTTCTAGGGCGCACAGAATAGATTATGGTCGCGTCTCCCCAGGTAATATGAATAGATTGCCTCCTTTGCCCGTCATACATGTGCTCCTTTCAGTCCGAACTTAGGGTTTGATTTCCTGCGATCTTCACAGCCTGTGCACGATTTAGAGGTCTACGCCCATGACAGGAAGTTGTTTTACTGGTTCTCATAGGGATCGCCTCACCACCACGGTTAATTCTCGCAAGTCATATGGACAAGCTCATCTGCGGCCTTATAAAGCGTAATTCACGAATACGGGCACCGCATGCCGCATGTTCTGATACAGGTCGTGATACCGATAGAGTAGTGCGCGTTTGATTTCACTCGATAAGACTCCGCATTGGATG
GAGCGCTTCCGGCAATACTCGTAAACCATATCAAACCAGCTCGCTGACGTTTGGCAGTCACGGCGGTAACGATGCTTCTTCCCCGGCACCATGCAACAAACTGCCGGGTGATGCGGCAAGAAATTCGGACGATTCTGATGCGGACGGGCTACCGGAATTCCTGCGTTAACCTGTTCCATCGTGGTGATCCCGTTTCCCGAAAAGCCAGAACCCACTGGCGACGGATTTCGGTTCATGATTCGTTCTGGTCACGCCGTGCCATGAGAGCCGGGAAAGTCCGCCAGTAACTGGGCTGAACACACCGTTGATGATCGCATGCCTGGGTGCTGTATCCTGCGGCTTTCGTCGTTACTGTTCCGGCATGTTGTTGGCGATCCGACGCATCTGCTCACGGTCAAAGTTAACCATCTGTGCGGGGAGTGTTTTCATAATCCACCCCGTAAATCCAGTCTGTTTGTCAGGTCGAGTTTTGGTTTGCTGGCTGGCTGTCACGCCTGCCTGTTGCTTGTTACGGTTGATTCGAGTTGGGTCCACTTATCGCGCGGAGTTTGGCCGGCTCAGCACGTCGTTACCGACCAGGAAGTTTGTCCTGGCATGCCAGCGGAACAGCACAGGGTCTTCTAGGGTGGTTACGTCCGTCTACGTTCACGCATCAGCGTGGATATCGTTAGCCCGCAGCAAGTTAAATCGGTTTTCTGGCTGATGGTGCGTATAGTCTTCTTCACGTCAAACATCCACTCTGCGGCGGTCAGGTCTTCTGCCATGCATGTCCCACTTGCTGCCGCTCTGAATTGCAGCATCCGGTTTCACCACAAGAATAGTCGTTTTCTGGCTGGTCAGGATTCACAGAATTCGTGAATAATCTCTTTCTTTTCTTTTGTAATAGTGTCTTTTTGTCTCCGTTTTGAGGGATAGCAATCCCAGATTGAGGGATGTTTTATCCCTCGTTTAGGGATTTTCCAGCGTTTTGAGGGATGCACCATTCTGAGCAATGTTTTATTTGGTCCAAACATGCCGCCTTGCTGCTTGATAATTCATTCTGACGATTCTAACTTGGCTTCATTGCACCCGTTTGACAGGTAACTTTGTAATCTCGCTAAGTTGAGAATCGGTGAGTCACTCTGTCCATTGGTTTATTCCACCCATTATAGTTTTACGGCAGAATGGCAAGCAGCATAATTTAAAACTGTCGCTTGGTCAGATCTGCGCCCGATGAATAAGCCTCAAGCCGAAGCATATTTGATAGTCTGGCGTAACCATCATGAGATCTGCCATTACGCTCCTGTCCGGCAAAGTCTCCTGCCGAAGTTGAGTATTTTGCTGTATTTGATAATGACTCCTGTTGATAGATCCAGTAATGACCTCAGAACTCCATCTGGATTTGTTCGAACGCTCGGTTGCCGGATGCCGCGTTGATTGGTAGAATCGCAGCAACTTGTCGCGCCAATCGAGCCATGTCAACGTCGATAGATCCCATTCAAGAACAGCAAGCAGCATGCGTGAAAACTTTGGAATCCGGTTCTCCTTCCAAGCCTTGATCTTAGACTTATCAACGCCCACAGCTTCCATGTCTTCTTTGATCGTTTCCAAGCATTGCGATTTTGTTAAGCAACGCACTCTGGATTCTCCGTAGAGCCTCGTTGCGTTTGGCTTTTGCACGAAACCATATGTAAGTATTTCCTTAGATAACAATTGATTGAATGGTCCCAAATAAATGCAAGACGAGGTGGTTTAATTTGATGCCCTTTTCAGGGCTGGAATGGTTGTAAGAGCGGGGTTATTTATGCTGTTGTTTTGTTACTCGGGGAAGGGCAGTTACCTTCTTCCGGCAGAATTCCATCAGGACGCGTTTGAGTCGATGGTTAGTAAAATCCGGCACTTAAATGGCCTTTAATCGAGGATTTGATCGGCCCGCGTATTCTAGCTGTCTTTGGTTTGCCCAAAGCGCATTGGATAAAGAGAGTT\t*\ttp:A:P\tcm:i:196\ts1:i:1832\ts
2:i:0\tNM:i:2496\tms:i:6820\tAS:i:6820\tnn:i:0\n'
b
diff -r 000000000000 -r 1c2e93f2d7c0 test-data/sample_reads.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sample_reads.fasta Mon Jun 11 16:39:36 2018 -0400
b
b'@@ -0,0 +1,472 @@\n+>1\n+AGGTAGCCTGTTTTATGAGTGGGGATTACAAAGGATGGTCATCGGTCACGTGACAGTACGGGTACCTGACGGCCGTCACACTGCTTTCACGCTGGCTAGGAAAAGCCGGCCCGCCTTTGTAGGGCCAATGTCCCCGACGATTTTCCGCCCTCAGCGTACCGTTTATCGTACAGTTTCAGCTATCGTCACATTACTGAGCGTCCCGGGGTTCGCATTCACACTGCCACACTGATATCCGCATTTTAGCGGTCATTTCAGTTTGCTGTGTCAGGGAAAGCGGAGGATTGCGCAGGCCTGTAGTAAGCGTGAGCGTCAGGCGGTGCTTCAGGAACACTTCTTCGTTCGCTGAATATCTGGTTGCCCTGCGCCAAACGACCGGCGTTCATTCCCGTTTGCCGTATAATAAATGCATCCCACGATTGGCGGCATGATCCAGAAACTGGGCTCAGTTTGCCTTCCTCCGTGTCCTCCATGCTCAGCGGACCCGCGACATAATGTTTGCCGTCTTTATTCTGCTCAATTTGACGACGCCCGGGCATTCACACTTATCGACTGGCGGCATCCTTCCACTCTGTTCGAAACCCTCCAGTGCTTAGTTATCCTCCGTCATAGCCGGACTTTTCCAGCAGCTCCTGCCGAGGTATGAGGATTGCTTCTTGCCTTTGGAAAATCGAGGTAACCTTCCGCATCATGCCGCCCGACCGACGGCCTCCACGAATGCCGATTTGCCAACGTGTTCCACTGCGAGATAAACATAATCGCTGGCCCGGTTTGATATTGATACTGCGGCTATCCAGTACAGCGCCGTACCAAGATAACGCGTGCTGGTTTCAATGGCTGTCTGATATCCGCAATCTGCTTTTCAGGGGACCAGAACTCAAACTGTACCGTCCGTATAAACGGCAAGATGCGGCGTGGCGGTTATCTGAAGACCCCGGCGTCAGCTCAATCCTCGACGGTGCTGCAGCAATCAGAACGGAATACCATAAGGACCCGCTTAATCGCGCGCCCGCATTTACCGCCCGGTGACTGTCGACCTGTAGTTCCCCAGCGCCAGTGCGTGAAGCGGTATGTGGTTTCCGTCGTCCGCTGCCGTGCTGACCAGCCGCTCACTGCCGTCGTCGTCCGTTACGGTCACGGCCAGCAGGAAACTCACGCCGGTCCCTAGGCTTCGGTGTGTCCCATCGCGCCAGCACCTGATATTCCATGTTGTAGCAGTACTTCTGCGGTCAGGTGCAGTGAGGGGCGGGCGGGATCACCATTCACCGTGCCACTCTGTTCGCCGTTACACTGCACCCGTTATCCACGATGGCCTCTTTTCCGGCACATGCTGCACGCGGGGCGATGGCATACGTGCCGTCGTCGTTCTCACGGATACTCACGCAGCGGAACAGTCACCTCTGGCTGGCGCAGCGAGCGGTTCGGCAAGCTTCAGCTCCCATACGGTGGGTCAGCAACACCGTCAGGAACACGGCTCACTTTACCTTCAGCCGTCGGTGACGACTGAACCTCCACGCTGACCGGATTGCCATTTCCGTCAACCCGAGGGATGACGGGGTCAAGGAGGATGGCAGCGTGATTCAATCCGTCGAGCGTCAGCGTCCGGTATTGGCTGTTCACACAGGCACACGACCACCGGTTAACTGATACCGGCATCATAGTCATCATGGCGCAGATTTCAATAACATCGCCCGGTACCATGGGGCAACGGATTCTGCGCCGACGGTATGAAATCCACGTCCGTTTCCAGCAGTTCTTGTTTTAATCATAGCCACATGCCCGGCGCGGTGCCTGCCCCGGCTGGTACAGCCAAAGGCATCCATCTTCGTAACATTACGACCTGTAACGGGCAATGGCCTGCGTATCTTCAACAAGCTCTGTCGCCGTCTCGAGTAGATAC\n+>2\n+ATCTTGATAGAGATTTCTAGGGGTATGCGTTAATGATCAGAAGCTCCCAATCAGGTTCAGTCAGG
CTGGCGGCATCATTTCCGGCAAAATACGGTAATTATTTTCGCCGTGTAGAAAGCCCTGCCACATAGGCTAGAGTCGCAAGCTTCTTCGGTTGTTTACCCGCAAGCGTTAGTCATGGTGGTGGTAGCCAAAATCTGGATCATTCTCCCGAGCGCTGCGGCCAGTTCATTCAGCGTATTCAGTTGCGTCAGGTGACGCGTCGATAACATCTGCTGCAATCGCGGCCAGTACAAAAGCGGTTTCGCAATCTGGGTTTGTTTGTTCCTTGACATCCGGTTGGTGCTGTTGGCGTTCCGGTCAGTGCCGGACTGTTGAGGTTGGCTTTTTCTGTTCGTTTCATCCATTACCACCTTAACCGCCTTTGGCGTTGCAGCAAGCGTTTCAGACGTGCTGTTGGTTGCACTGCTGAGCTGCTATCCGGATTTCTCGTTGTCCGCATCCTCAAGCGCGACAGCTGAAGCTATATCTTCTGCACGTTTTGCCGAATTTGCACGTATTGCCGCCGCTTCTGCCGCGCTCGCATTTGCTCTGCGATGCTGATACCGCACTTCCCGCAGCCTCCCTTCCCTTCGTGATGCCGTTGACGGCACTCCCCGCCGCCGCTGTTTGCGTCGTGCCCCGGCAGGATGAGGGGCGCGTTCCATGCTGTTTCAGATGACCTGGCATTGCGTCTCGGACGTTTTGCCTCACTGGCAGAATTTCTGCCGCCGTTGCCGAGGAAGCTGCACGACTCGGCACTTGATGATGCGTTCGTTTCTGATGATTTTGTGCCTCTTGTTGTACCGGGCATCTCGTGCTGAAGGAGTGGGGGCCTCTGACGCTTTCGTGGCCATGCGGAGGCAGAATTGGCTGATCTTTTAGTCGACTTTGGCTTAGCAGCATTCGTTTCTGTAACGTTTTCGCCGCACCGGCACTGGGCCGCCCGCGTTTTGAGAGAACTCTGCGGCTGCGGCACTTTTCCGCTTCAGTGGCCTTGCTGATGCCGCCTCTTCTGCCGCTACGGGCAGCTTCCTGAGCTGACGGATGCAGCCTGTCCGGCGGACGTGCTGTGGCGGCGCGTCGGGTCAGTTGCATCAGAGTCACAAGCTAGGCCGCGACCTGAGCAGCTGATGCACTGGCATCGCCGGCTGATTTCTTCGCGTCTGCCGTACTCTGTGCCACCACGAAGACGCGTTACGCTGGGAGCTCTTCCACCATGAGTTCGACGAAGCGACGCAGCACCTCCATGGATGGCATCATCCTCGCGTCATGGCACACAGAGAAACCTTCAGCGTCCCCGGTTGTGAATCTTCATACGGTGATGGTCCCGGCGTGCGATGGAAAACCCGTCAACCTGCAGGATATCTGACACTGTACTGACCGTACTCCACATCCATGCTGTAACGCCCGGCTTCATCCGGATTCTCTGAGCCCACCGTGTTTGCCCCACCACCGTGGTGCTGTTAATGTCTGGCTTTCAGCTGAATGGTGCAGTTCTTGACTAGTTTTCCTGTGCCTATCTTTCAGACTCCTGAAATCTTTACTGCCATATTCACCGCAAAAGCCCACCGGTTCCGGCGGGCTGTCATAACACTGTGTTACGCCTGGCTAATCAGAATTTATAACCGACCCCAACGATGAATCCGTTTAGATCGCCAGTCGCCACTGCCGGCCCAGCCTTCATAGACAGCAAGATAATGAACGGACGGACGCTGCCGGATTAATCTGTATACCTGCACTCCACGCCAACCAGGTATGCCGCATTGCATTTCGTCCCTGGCAGTGGTCGTCTCTTATCTTTCAATACCCGGGAGTGATTTCCGTCTTACGGTAATGCGGCTTGTACTGCCGGATAAGCGACTGTGAGCCACTCCATGGCTGAGAAGCCGCACTGATTTACTGATTTGTAAAACCGGTCCGGCCATCACGCCCTAACTAACGTCCACGCAGGCTCTCATAGTGAAGAAACGTATCCTCCCCGGTCATCACTGTGCTTGCTCTTTTCGACGGTGGGGACCCCAGG
GAAGC'..b'GGAAGCGGTTATCTTCTTTGCATTCACGCACCGATAACATCTCCGCATCATGCAGCTTCCTCCCGAAGTCGAAATCAATACATGCTTCCCAAATATTCGCGCATGACTCGAACAAGAGCCGGTATCGAATCTTTTAGCTCGTACCATGTCCTGATACAGGGCTTGATAATCAGGATTTCTGAATACATTTCGCGATACCGTCCCAGCGACATTCTTCCTCGGTACATAATCTCCTTTAGCGTTTCCGATGTCCGTCAAAGGCACATGGGATCCCGTGATGACCTCATTAAAACACGCTGCAATCCAATATTCCCTCATCTTTGCAGGCAAGTCCGATTTGCGTTGATTTTAATGCAGAATATGCAGTTACCGAGATGTTCCGGTATTTGCAGCAAATGAATGGTTGTTGCTTCCACCATGCGAGGATATCTTCCTTCTCAAAGTCTGACAGTTCAGCAAGATATCTGATTCCAGGCTTTGGCTTCGGCCATTCGGTTCATCAGCTCTATCCCAATCTCCACGATCTTAATTCCTCACCCGAAATGGTCATCACAGTATTTGGTGAAGGGAACGAGTTGTCAATCTGTCAGTGCAGAACGCGCCGGACGTATGGAGTGCCATATTTTCTTTACCATATCGATAAATGGCTTCGAACAGGCATTCGCGTCTGAATATCCTTTGGTTCCCATACCGTATACCCATTTGGCTGTCCAAGCTCCGGGTTGATATCATCACTGCAATGATACCGGTGAGCCGGTATCCAGAACTTCACAACTTCCCTGACAAACCGATATGTCATTGGATGTTCACAACCTGTATCCATGAAAACGTAATGCGTCTTTACCTGCCGTCGCTTTGCTCCATTAGCCAGAGCAAATAGTTGCTGACGTCTCATGCCACCGGAGAAACTAACGACATTTATCATGCAGCCTGTCTCTCCCCATCGCTTTCCACTCCGAGCCAGTCTCGCTTCGTCTGACCACCTTAACGCCACGCTCTGTACCCGAATTAATGACTGCCTGTATAAGCTCTAATATGCTCCCAAATTCGCCTACACGCATCCTGCTGGTTGACTGGCATAGATCACACAGCCATTCCCGGCAAGGTTAGAATAACATCCTGCTGCTTTAATGCTGCGGTAAACACACTTCCAGCCAGCTTTCTGCATCCAGCCAGCGACCATGCCATTCAACCTGACGGAGACGTCACCTAAGCAGGCCCATAGCTTCCTGTTTGGTCTAAGCTGCGGTTGCGTTTCCTGAAGAATGGGTTACTACGATTGGTTTGGTTGGGTCTGAGAAGGATTTGCTTACTGTGAATAGCGTTTTGCTGATGTGCTGGAGAGTACCGAATTTCAAAGGTTAGTTTTCATGACTTCCCTCTCCCCCAAATAAAGCGCCTGCGATTACCAGCAAGGCCGTTGATCAGTAATGTAGATGGTCATCTTTTAACTCCATATACCGCCAATACCCCGTTTCATCGCGGCACTCTGGCGACATCTCCTTAAAACCAGGTTCGTGCTCATCTTTCCTTCCCGTTCTTCCCTGGAGCAAACCGGTAATACCACCGTTCAGACCTTACTTCGATAACCAGAAGACCTGCCCGTGCCATTTTAGCCGCGGCCTGATTTATGCTGGTTACTCGGTTGCGCCTGTTAGCGCGGCAACGCTTCTAGGGCGCACAGAATAGATTATGGTCGCGTCTCCCCAGGTAATATGAATAGATTGCCTCCTTTGCCCGTCATACATGTGCTCCTTTCAGTCCGAACTTAGGGTTTGATTTCCTGCGATCTTCACAGCCTGTGCACGATTTAGAGGTCTACGCCCATGACAGGAAGTTGTTTTACTGGTTCTCATAGGGATCGCCTCACCACCACGGTTAATTCTCGCAAGTCATATGGACAAGCTCATCTGCGGCCTTATAAAGCGTAATTCACGAATACGGGCACCGCATGCCGCATGTTCTGATACAGGTCGTGATACCGATAGAG
TAGTGCGCGTTTGATTTCACTCGATAAGACTCCGCATTGGATGGAGCGCTTCCGGCAATACTCGTAAACCATATCAAACCAGCTCGCTGACGTTTGGCAGTCACGGCGGTAACGATGCTTCTTCCCCGGCACCATGCAACAAACTGCCGGGTGATGCGGCAAGAAATTCGGACGATTCTGATGCGGACGGGCTACCGGAATTCCTGCGTTAACCTGTTCCATCGTGGTGATCCCGTTTCCCGAAAAGCCAGAACCCACTGGCGACGGATTTCGGTTCATGATTCGTTCTGGTCACGCCGTGCCATGAGAGCCGGGAAAGTCCGCCAGTAACTGGGCTGAACACACCGTTGATGATCGCATGCCTGGGTGCTGTATCCTGCGGCTTTCGTCGTTACTGTTCCGGCATGTTGTTGGCGATCCGACGCATCTGCTCACGGTCAAAGTTAACCATCTGTGCGGGGAGTGTTTTCATAATCCACCCCGTAAATCCAGTCTGTTTGTCAGGTCGAGTTTTGGTTTGCTGGCTGGCTGTCACGCCTGCCTGTTGCTTGTTACGGTTGATTCGAGTTGGGTCCACTTATCGCGCGGAGTTTGGCCGGCTCAGCACGTCGTTACCGACCAGGAAGTTTGTCCTGGCATGCCAGCGGAACAGCACAGGGTCTTCTAGGGTGGTTACGTCCGTCTACGTTCACGCATCAGCGTGGATATCGTTAGCCCGCAGCAAGTTAAATCGGTTTTCTGGCTGATGGTGCGTATAGTCTTCTTCACGTCAAACATCCACTCTGCGGCGGTCAGGTCTTCTGCCATGCATGTCCCACTTGCTGCCGCTCTGAATTGCAGCATCCGGTTTCACCACAAGAATAGTCGTTTTCTGGCTGGTCAGGATTCACAGAATTCGTGAATAATCTCTTTCTTTTCTTTTGTAATAGTGTCTTTTTGTCTCCGTTTTGAGGGATAGCAATCCCAGATTGAGGGATGTTTTATCCCTCGTTTAGGGATTTTCCAGCGTTTTGAGGGATGCACCATTCTGAGCAATGTTTTATTTGGTCCAAACATGCCGCCTTGCTGCTTGATAATTCATTCTGACGATTCTAACTTGGCTTCATTGCACCCGTTTGACAGGTAACTTTGTAATCTCGCTAAGTTGAGAATCGGTGAGTCACTCTGTCCATTGGTTTATTCCACCCATTATAGTTTTACGGCAGAATGGCAAGCAGCATAATTTAAAACTGTCGCTTGGTCAGATCTGCGCCCGATGAATAAGCCTCAAGCCGAAGCATATTTGATAGTCTGGCGTAACCATCATGAGATCTGCCATTACGCTCCTGTCCGGCAAAGTCTCCTGCCGAAGTTGAGTATTTTGCTGTATTTGATAATGACTCCTGTTGATAGATCCAGTAATGACCTCAGAACTCCATCTGGATTTGTTCGAACGCTCGGTTGCCGGATGCCGCGTTGATTGGTAGAATCGCAGCAACTTGTCGCGCCAATCGAGCCATGTCAACGTCGATAGATCCCATTCAAGAACAGCAAGCAGCATGCGTGAAAACTTTGGAATCCGGTTCTCCTTCCAAGCCTTGATCTTAGACTTATCAACGCCCACAGCTTCCATGTCTTCTTTGATCGTTTCCAAGCATTGCGATTTTGTTAAGCAACGCACTCTGGATTCTCCGTAGAGCCTCGTTGCGTTTGGCTTTTGCACGAAACCATATGTAAGTATTTCCTTAGATAACAATTGATTGAATGGTCCCAAATAAATGCAAGACGAGGTGGTTTAATTTGATGCCCTTTTCAGGGCTGGAATGGTTGTAAGAGCGGGGTTATTTATGCTGTTGTTTTGTTACTCGGGGAAGGGCAGTTACCTTCTTCCGGCAGAATTCCATCAGGACGCGTTTGAGTCGATGGTTAGTAAAATCCGGCACTTAAATGGCCTTTAATCGAGGATTTGATCGGCCCGCGTATTCTAGCTGTCTTTGGTTTGCCCAAAGCGCATTGGATAA
AGAGAGTT\n'