changeset 16:856cafcbf422 draft

Uploaded
author pjbriggs
date Tue, 15 May 2018 07:24:18 -0400
parents a3af1ff4cad1
children 831c838927c7
files fastq_subset.py test-data/454_microsats.out.re_match~ test-data/illuminaPE_filtered_microsats.out.re_match~ test-data/illuminaPE_filtered_microsats_occurrences.out.re_match~ test-data/illuminaPE_filtered_microsats_primers.out.re_match~ test-data/illuminaPE_filtered_microsats_rankmotifs.out.re_match~ test-data/illuminaPE_microsat_types.out.re_match~ test-data/illuminaPE_microsats.out.re_match~
diffstat 8 files changed, 74 insertions(+), 49 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/fastq_subset.py	Tue May 15 07:24:18 2018 -0400
@@ -0,0 +1,74 @@
+#!/usr/bin/env python
+
+import argparse
+import random
+from Bio.SeqIO.QualityIO import FastqGeneralIterator
+
+def count_reads(fastq):
+    """
+    Count number of reads in a Fastq file
+
+    The count is the number of lines in the file
+    divided by four (each Fastq record is assumed
+    to occupy exactly four lines); any incomplete
+    trailing record is ignored.
+
+    Arguments:
+      fastq: path to the Fastq file
+
+    Returns:
+      Integer number of reads.
+    """
+    nlines = 0
+    last_char = '\n'
+    with open(fastq,'r') as fq:
+        # Read in fixed-size chunks so that large files
+        # are never loaded into memory in one go
+        for chunk in iter(lambda: fq.read(1024*1024),""):
+            nlines += chunk.count('\n')
+            last_char = chunk[-1]
+    # A final line without a terminating newline is
+    # still a line and must be counted
+    if last_char != '\n':
+        nlines += 1
+    return nlines//4
+
+def fastq_subset(fastq_in,fastq_out,indices):
+    """
+    Output a subset of reads from a Fastq file
+
+    The reads to output are specified by a collection
+    of integer indices; only reads at those positions
+    in the input file (counting from zero) will be
+    written to the output, in their original order.
+
+    Arguments:
+      fastq_in: path to the input Fastq file
+      fastq_out: path to the output Fastq file (will
+        be overwritten if it already exists)
+      indices: iterable of integer read positions
+    """
+    # Membership tests on a set are constant time, whereas
+    # testing against a list for every read is quadratic
+    wanted = set(indices)
+    # Both handles are managed by 'with' so that the output
+    # is closed even if parsing the input fails part way
+    with open(fastq_in,'r') as fq_in, open(fastq_out,'w') as fq_out:
+        reads = FastqGeneralIterator(fq_in)
+        for i,(title,seq,qual) in enumerate(reads):
+            if i in wanted:
+                fq_out.write("@%s\n%s\n+\n%s\n" % (title,
+                                                   seq,
+                                                   qual))
+
+if __name__ == "__main__":
+
+    # Command line: a pair of Fastq files (R1 and R2) plus
+    # an optional subset size and random number seed
+    p = argparse.ArgumentParser()
+    p.add_argument("fastq_r1")
+    p.add_argument("fastq_r2")
+    p.add_argument("-n",
+                   dest="subset_size",
+                   default=None,
+                   help="subset size")
+    p.add_argument("-s",
+                   dest="seed",
+                   type=int,
+                   default=None,
+                   help="seed for random number generator")
+    args = p.parse_args()
+
+    print "Processing fastq pair:"
+    print "\t%s" % args.fastq_r1
+    print "\t%s" % args.fastq_r2
+
+    # Only R1 is counted; R2 is assumed to hold the same
+    # number of reads in the same order
+    nreads = count_reads(args.fastq_r1)
+    print "Counted %d reads in %s" % (nreads,args.fastq_r1)
+
+    if args.subset_size is not None:
+        # Report bad values as usage errors rather than
+        # letting them surface as a traceback
+        try:
+            subset_size = float(args.subset_size)
+        except ValueError:
+            p.error("subset size must be a number")
+        if subset_size < 0.0:
+            p.error("subset size must not be negative")
+        # Values below 1.0 are a fraction of the total reads,
+        # anything else is an absolute number of reads
+        if subset_size < 1.0:
+            subset_size = int(nreads*subset_size)
+        else:
+            subset_size = int(subset_size)
+        if subset_size > nreads:
+            # random.sample() raises ValueError when asked for
+            # more items than the population holds
+            print "Subset size exceeds number of reads, using all %d" % nreads
+            subset_size = nreads
+        print "Extracting subset of reads: %s" % subset_size
+        if args.seed is not None:
+            print "Random number generator seed: %d" % args.seed
+            random.seed(args.seed)
+        subset = random.sample(xrange(nreads),subset_size)
+        # The same indices are used for both files so that
+        # the read pairs stay in step with each other
+        fastq_subset(args.fastq_r1,"subset_r1.fq",subset)
+        fastq_subset(args.fastq_r2,"subset_r2.fq",subset)
--- a/test-data/454_microsats.out.re_match~	Mon May 14 11:10:19 2018 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,2 +0,0 @@
-SequenceID\	Repeat\ Motif\ Size\	Repeat\ Motif\	Number\ Tandem\ Repeats\	Primer\ Designed\ \(1\=y\,0\=n\)\	F\ Primer\ Name\	Forward\ Primer\	R\ Primer\ Name\	Reverse\ Primer\	Total\ Repeats\ In\ Amplicon\	Occurances\ of\ Forward\ Primer\ in\ Reads\	Occurances\ of\ Reverse\ Primer\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ PALs
-FW1N29Q04EP35X\	2\	AC\	18\	0\	\	\	\	\	\	\	\	\	
--- a/test-data/illuminaPE_filtered_microsats.out.re_match~	Mon May 14 11:10:19 2018 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,4 +0,0 @@
-readPairID\	Motifs\(bases\)\	Bases\ in\ all\ Motifs\	Possible\ Extended\	Possible\ Spanning\	Primers\ found\ \(1\=y\,0\=n\)\	F\ Primer\ Name\	Forward\ Primer\	R\ Primer\ Name\	Reverse\ Primer\	Amplicon\ Motifs\	Number\ motif\ bases\ in\ amplicon\	Primers\ on\ sep\ reads\	Extend\ with\ primers\	Spand\ with\ primers\	Occurances\ of\ Forward\ Primer\ in\ Reads\	Occurances\ of\ Reverse\ Primer\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ PALs\	R1\_Sequence\_ID\	R1\_Sequence\	R2\_Sequence\_ID\	R2\_Sequence
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\	AC\(12\)\ \	12\	\	\	1\	test\_3\	AAGTACAGTGGGGAGGCTGG\	test\_6\	TTTTCTACACAGCTCAAGTAGCCC\	AC\(12\)\ \	12\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\ 1\:N\:0\:TCCTGA\	TACTAGTCTAATAATTGCAGGCAGCTGAACTAGATAGGTCCTAAAGTACAGTGGGGAGGCTGGTGTGTGTGTGTGCATGGGATTGTCAGCCTTACCATCAGTCCTGATTTGTAGGT\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\ 2\:N\:0\:TCCTGA\	TAAACAACCAAATGAAACCATCTTTTCTACACAGCTCAAGTAGCCCTACATACAACACAAGCCACCTACAAATCAGGACTGATGGTAAGGCTGACAATCCAATCCACCACAACAAC
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\	AC\(12\)\ \	12\	\	\	1\	test\_7\	GCAGTAAACAAAGGCAAAGGG\	test\_4\	CCTGGGCAGAGGTGTTCC\	AC\(12\)\ \	12\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\ 1\:N\:0\:TCCTGA\	TCATAAGAATGAGCAGTAAACAAAGGCAAAGGGGAGATAACACACACACACAAAATAAAAAAACATCAATTTCTAATACACGCCTTTATTATAAAGAAATAAATCACTGAAAAACA\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\ 2\:N\:0\:TCCTGA\	TCCTCTGACTAGGCAACAACAGCTTTTTTGCTCCTGGGCAGAGGTGTTCCGAGTGTATATTTTTTATAATTACGGCGCGCATTGGAAATTGATGTTATTTTATTTTGCGTGTGTGT
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\	AG\(14\)\ \	14\	\	\	1\	test\_5\	TTCTCCCACTATATTTTGCATTGG\	test\_1\	TCCAGACTGAAGCTACCCTGG\	AG\(14\)\ \	14\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\ 1\:N\:0\:TCCTGA\	TACTGTTTAGAATAGACTGTTCTCCCACTATATTTTGCATTGGTGCATACTCAGCTTTAGTAATAAGTGTGATTCTGGTAGAGAGAGAGAGAGATACCAACCTCTTCTTCCCACTA\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\ 2\:N\:0\:TCCTGA\	TACTGTTTAGAAAGCCTGTTCCAGAACTTGATCACTGTCACAGAAAATCTTTCTTACTATCCAGACTGAAGCTACCCTGGTGCAGCTTTGTGCTGTTACCTTGAGTCATGTCATCA
--- a/test-data/illuminaPE_filtered_microsats_occurrences.out.re_match~	Mon May 14 11:10:19 2018 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,4 +0,0 @@
-readPairID\	Motifs\(bases\)\	Bases\ in\ all\ Motifs\	Possible\ Extended\	Possible\ Spanning\	Primers\ found\ \(1\=y\,0\=n\)\	F\ Primer\ Name\	Forward\ Primer\	R\ Primer\ Name\	Reverse\ Primer\	Amplicon\ Motifs\	Number\ motif\ bases\ in\ amplicon\	Primers\ on\ sep\ reads\	Extend\ with\ primers\	Spand\ with\ primers\	Occurances\ of\ Forward\ Primer\ in\ Reads\	Occurances\ of\ Reverse\ Primer\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ PALs\	R1\_Sequence\_ID\	R1\_Sequence\	R2\_Sequence\_ID\	R2\_Sequence
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\	AG\(14\)\ \	14\	\	\	1\	test\_7\	TTCTCCCACTATATTTTGCATTGG\	test\_6\	TCCAGACTGAAGCTACCCTGG\	AG\(14\)\ \	14\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\ 1\:N\:0\:TCCTGA\	TACTGTTTAGAATAGACTGTTCTCCCACTATATTTTGCATTGGTGCATACTCAGCTTTAGTAATAAGTGTGATTCTGGTAGAGAGAGAGAGAGATACCAACCTCTTCTTCCCACTA\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\ 2\:N\:0\:TCCTGA\	TACTGTTTAGAAAGCCTGTTCCAGAACTTGATCACTGTCACAGAAAATCTTTCTTACTATCCAGACTGAAGCTACCCTGGTGCAGCTTTGTGCTGTTACCTTGAGTCATGTCATCA
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\	AC\(12\)\ \	12\	\	\	1\	test\_5\	GCAGTAAACAAAGGCAAAGGG\	test\_2\	CCTGGGCAGAGGTGTTCC\	AC\(12\)\ \	12\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\ 1\:N\:0\:TCCTGA\	TCATAAGAATGAGCAGTAAACAAAGGCAAAGGGGAGATAACACACACACACAAAATAAAAAAACATCAATTTCTAATACACGCCTTTATTATAAAGAAATAAATCACTGAAAAACA\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\ 2\:N\:0\:TCCTGA\	TCCTCTGACTAGGCAACAACAGCTTTTTTGCTCCTGGGCAGAGGTGTTCCGAGTGTATATTTTTTATAATTACGGCGCGCATTGGAAATTGATGTTATTTTATTTTGCGTGTGTGT
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\	AC\(12\)\ \	12\	\	\	1\	test\_8\	AAGTACAGTGGGGAGGCTGG\	test\_4\	TTTTCTACACAGCTCAAGTAGCCC\	AC\(12\)\ \	12\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\ 1\:N\:0\:TCCTGA\	TACTAGTCTAATAATTGCAGGCAGCTGAACTAGATAGGTCCTAAAGTACAGTGGGGAGGCTGGTGTGTGTGTGTGCATGGGATTGTCAGCCTTACCATCAGTCCTGATTTGTAGGT\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\ 2\:N\:0\:TCCTGA\	TAAACAACCAAATGAAACCATCTTTTCTACACAGCTCAAGTAGCCCTACATACAACACAAGCCACCTACAAATCAGGACTGATGGTAAGGCTGACAATCCAATCCACCACAACAAC
--- a/test-data/illuminaPE_filtered_microsats_primers.out.re_match~	Mon May 14 11:10:19 2018 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,5 +0,0 @@
-readPairID\	Motifs\(bases\)\	Bases\ in\ all\ Motifs\	Possible\ Extended\	Possible\ Spanning\	Primers\ found\ \(1\=y\,0\=n\)\	F\ Primer\ Name\	Forward\ Primer\	R\ Primer\ Name\	Reverse\ Primer\	Amplicon\ Motifs\	Number\ motif\ bases\ in\ amplicon\	Primers\ on\ sep\ reads\	Extend\ with\ primers\	Spand\ with\ primers\	Occurances\ of\ Forward\ Primer\ in\ Reads\	Occurances\ of\ Reverse\ Primer\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ PALs\	R1\_Sequence\_ID\	R1\_Sequence\	R2\_Sequence\_ID\	R2\_Sequence
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\	AG\(14\)\ \	14\	\	\	1\	test\_7\	TTCTCCCACTATATTTTGCATTGG\	test\_2\	TCCAGACTGAAGCTACCCTGG\	AG\(14\)\ \	14\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\ 1\:N\:0\:TCCTGA\	TACTGTTTAGAATAGACTGTTCTCCCACTATATTTTGCATTGGTGCATACTCAGCTTTAGTAATAAGTGTGATTCTGGTAGAGAGAGAGAGAGATACCAACCTCTTCTTCCCACTA\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\ 2\:N\:0\:TCCTGA\	TACTGTTTAGAAAGCCTGTTCCAGAACTTGATCACTGTCACAGAAAATCTTTCTTACTATCCAGACTGAAGCTACCCTGGTGCAGCTTTGTGCTGTTACCTTGAGTCATGTCATCA
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\	TG\(12\)\ \	12\	\	\	1\	test\_5\	GCAGTAAACAAAGGCAAAGGG\	test\_3\	CCTGGGCAGAGGTGTTCC\	TG\(12\)\ \	12\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\ 1\:N\:0\:TCCTGA\	TCATAAGAATGAGCAGTAAACAAAGGCAAAGGGGAGATAACACACACACACAAAATAAAAAAACATCAATTTCTAATACACGCCTTTATTATAAAGAAATAAATCACTGAAAAACA\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\ 2\:N\:0\:TCCTGA\	TCCTCTGACTAGGCAACAACAGCTTTTTTGCTCCTGGGCAGAGGTGTTCCGAGTGTATATTTTTTATAATTACGGCGCGCATTGGAAATTGATGTTATTTTATTTTGCGTGTGTGT
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\	TG\(12\)\ \	12\	\	\	1\	test\_4\	AAGTACAGTGGGGAGGCTGG\	test\_6\	TTTTCTACACAGCTCAAGTAGCCC\	TG\(12\)\ \	12\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\ 1\:N\:0\:TCCTGA\	TACTAGTCTAATAATTGCAGGCAGCTGAACTAGATAGGTCCTAAAGTACAGTGGGGAGGCTGGTGTGTGTGTGTGCATGGGATTGTCAGCCTTACCATCAGTCCTGATTTGTAGGT\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\ 2\:N\:0\:TCCTGA\	TAAACAACCAAATGAAACCATCTTTTCTACACAGCTCAAGTAGCCCTACATACAACACAAGCCACCTACAAATCAGGACTGATGGTAAGGCTGACAATCCAATCCACCACAACAAC
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8899\:1514\	TG\(12\)\ TG\(12\)\ \	24\	\	\	1\	test\_8\	TCTTTATCTAAACACATCCTGAAATACC\	test\_1\	AAACGCAATTATTTTGAGATGTCC\	TG\(12\)\ TG\(12\)\ \	24\	1\	\	\	1\	2\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8899\:1514\ 1\:N\:0\:TCCTGA\	TCTTTATCTAAACACATCCTGAAATACCATCTGTTACACACACACACAGCAGTGGAAGTATAAAAAAAAATCTGGACATCTCAAAATAATTGCGTTTCTGAAGTGTTACATTTTTC\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8899\:1514\ 2\:N\:0\:TCCTGA\	TATCATTGAAATTTTTATAAAAACTGTGAAGAGAAAAATGTAACACTTCAGAAACGCAATTATTTTGAGATGTCCAGATTTTTTTTTATACTTCCACTGCTGTGTGTGTGTGTAAC
--- a/test-data/illuminaPE_filtered_microsats_rankmotifs.out.re_match~	Mon May 14 11:10:19 2018 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,8 +0,0 @@
-readPairID\	Motifs\(bases\)\	Bases\ in\ all\ Motifs\	Possible\ Extended\	Possible\ Spanning\	Primers\ found\ \(1\=y\,0\=n\)\	F\ Primer\ Name\	Forward\ Primer\	R\ Primer\ Name\	Reverse\ Primer\	Amplicon\ Motifs\	Number\ motif\ bases\ in\ amplicon\	Primers\ on\ sep\ reads\	Extend\ with\ primers\	Spand\ with\ primers\	Occurances\ of\ Forward\ Primer\ in\ Reads\	Occurances\ of\ Reverse\ Primer\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ PALs\	R1\_Sequence\_ID\	R1\_Sequence\	R2\_Sequence\_ID\	R2\_Sequence
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\	AC\(12\)\ \	12\	\	\	1\	test\_3\	AAGTACAGTGGGGAGGCTGG\	test\_4\	TTTTCTACACAGCTCAAGTAGCCC\	AC\(12\)\ \	12\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\ 1\:N\:0\:TCCTGA\	TACTAGTCTAATAATTGCAGGCAGCTGAACTAGATAGGTCCTAAAGTACAGTGGGGAGGCTGGTGTGTGTGTGTGCATGGGATTGTCAGCCTTACCATCAGTCCTGATTTGTAGGT\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\ 2\:N\:0\:TCCTGA\	TAAACAACCAAATGAAACCATCTTTTCTACACAGCTCAAGTAGCCCTACATACAACACAAGCCACCTACAAATCAGGACTGATGGTAAGGCTGACAATCCAATCCACCACAACAAC
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8044\:1926\	AT\(12\)\ \	12\	\	\	0\	\	\	\	\	\	\	\	\	\	\	\	\	\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8044\:1926\ 1\:N\:0\:TCCTGA\	TAGATTTTTTTTTTTATATATATATAAATATAGATGTACATATATTTATATAAATATAAAAGCACAGCATCCTCCTGTCTCTCCTCCTGATTTATTATGGTTAAAGCTTGTGACAG\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8044\:1926\ 2\:N\:0\:TCCTGA\	TCAGGCAAGGTCACTGCCACCACTGGGGAGTGCCTGTTTCTGAAGGGCCCAGCCAACTCTGTCACAAGCTTTAACCATAATAAATCAGGAGGAGAGACAGGAGGATGCTGTGCTTT
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:6204\:1090\	TC\(12\)\ \	12\	\	\	0\	\	\	\	\	\	\	\	\	\	\	\	\	\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:6204\:1090\ 1\:N\:0\:TCCTGA\	TGCTTTGGTTCTAAGAGAAAAACAATTATTATAAATGTTTATAATTGATGATAAGCATTTTTGTACAAAGCCAAGACCATTCTGAATGAAGCACCCAAAAAGCCCGGAGGCAACAA\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:6204\:1090\ 2\:N\:0\:TCCTGA\	TGCTTTGGTTCTAAGAGAAAAACAAGTGATGCACAAGCAATTCCTCGCCACCACCCAACTGATGCCCAGCCACCCCCCCAAGCAGTGAAAGAGAGAGAGAGATGAACCCCCTTCAA
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:5879\:1238\	AT\(12\)\ \	12\	\	\	0\	\	\	\	\	\	\	\	\	\	\	\	\	\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:5879\:1238\ 1\:N\:0\:TCCTGA\	TCCCCACCCTGTCATGGTTCTATGTTTTTGTTTTTGTTTTTGTTTTTATGGTTTCCGTATTCCACATTAAAACCTTATGTAACGTACGGGCCAATAAATAGTTACTCGCCATATCC\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:5879\:1238\ 2\:N\:0\:TCCTGA\	TCCCCACCCTGTCATGGTTCTATGTATATATATATAGCCATGTGTGTGGTACCAGGGATAGGTACCTGGGATTGGGGCAGTGACACTTTAGTGCCCCGTACACTACATGATGTTTT
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\	AC\(12\)\ \	12\	\	\	1\	test\_6\	GCAGTAAACAAAGGCAAAGGG\	test\_1\	CCTGGGCAGAGGTGTTCC\	AC\(12\)\ \	12\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\ 1\:N\:0\:TCCTGA\	TCATAAGAATGAGCAGTAAACAAAGGCAAAGGGGAGATAACACACACACACAAAATAAAAAAACATCAATTTCTAATACACGCCTTTATTATAAAGAAATAAATCACTGAAAAACA\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\ 2\:N\:0\:TCCTGA\	TCCTCTGACTAGGCAACAACAGCTTTTTTGCTCCTGGGCAGAGGTGTTCCGAGTGTATATTTTTTATAATTACGGCGCGCATTGGAAATTGATGTTATTTTATTTTGCGTGTGTGT
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:17449\:1584\	AC\(36\)\ \	36\	\	\	0\	\	\	\	\	\	\	\	\	\	\	\	\	\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:17449\:1584\ 1\:N\:0\:TCCTGA\	TCGTAGCATGTGTATGCTTTGGGGTTTCATGCTGTTGATTCATAACTGCTGCTGGCTGTAGACTGAACCTTCTGGGTAGGAGGAATATGCTTAGACAAGCACACCAGTCAGCCCGA\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:17449\:1584\ 2\:N\:0\:TCCTGA\	TCTGTGTGTGAGCACACACACACACACACACACACACACACACACACATGCAGGTACTTGCTCTGCCACCCCTGGCGGGCTGCGTGGTGTGCCTGACGACGTATTCTAATCCTACA
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\	TC\(14\)\ \	14\	\	\	1\	test\_7\	TTCTCCCACTATATTTTGCATTGG\	test\_2\	TCCAGACTGAAGCTACCCTGG\	TC\(14\)\ \	14\	1\	\	\	1\	1\	1\	1\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\ 1\:N\:0\:TCCTGA\	TACTGTTTAGAATAGACTGTTCTCCCACTATATTTTGCATTGGTGCATACTCAGCTTTAGTAATAAGTGTGATTCTGGTAGAGAGAGAGAGAGATACCAACCTCTTCTTCCCACTA\	\>ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\ 2\:N\:0\:TCCTGA\	TACTGTTTAGAAAGCCTGTTCCAGAACTTGATCACTGTCACAGAAAATCTTTCTTACTATCCAGACTGAAGCTACCCTGGTGCAGCTTTGTGCTGTTACCTTGAGTCATGTCATCA
--- a/test-data/illuminaPE_microsat_types.out.re_match~	Mon May 14 11:10:19 2018 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,15 +0,0 @@
-allExtended\:\	0
-allSpan\:\	0
-broken\:\	2
-compound\:\	2
-readsWithMicrosat\:\	13
-totalBases\:\	2320
-totalReads\:\	20\	\(2\ x\ 10\)
-
-
-Microsat\ Type\	monomer\ length\	total\ loci\	loci\ w\/\ primers\	reads\ with\ loci\	total\ bases\	extended\	extended\ w\/\ primers\	spanning\	spanning\ w\/\ primers
-AC\	2\	7\	4\	7\	116\	0\	0\	0\	0
-AG\	2\	0\	0\	0\	0\	0\	0\	0\	0
-AT\	2\	8\	0\	6\	106\	0\	0\	0\	0
-CG\	2\	0\	0\	0\	0\	0\	0\	0\	0
-TC\	2\	2\	1\	2\	26\	\	\	\	
--- a/test-data/illuminaPE_microsats.out.re_match~	Mon May 14 11:10:19 2018 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,11 +0,0 @@
-readPairID\	Motifs\(bases\)\	Bases\ in\ all\ Motifs\	Possible\ Extended\	Possible\ Spanning\	Primers\ found\ \(1\=y\,0\=n\)\	F\ Primer\ Name\	Forward\ Primer\	R\ Primer\ Name\	Reverse\ Primer\	Amplicon\ Motifs\	Number\ motif\ bases\ in\ amplicon\	Primers\ on\ sep\ reads\	Extend\ with\ primers\	Spand\ with\ primers\	Occurances\ of\ Forward\ Primer\ in\ Reads\	Occurances\ of\ Reverse\ Primer\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ Reads\	Occurances\ of\ Amplifiable\ Primer\ Pair\ in\ PALs
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:10979\:1695\	TC\(14\)\ \	14\	\	\	1\	test\_7\	TTCTCCCACTATATTTTGCATTGG\	test\_2\	TCCAGACTGAAGCTACCCTGG\	TC\(14\)\ \	14\	1\	\	\	1\	1\	1\	1
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:17449\:1584\	AC\(36\)\ \	36\	\	\	0\	\	\	\	\	\	\	\	\	\	\	\	\	
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:19063\:1614\	AT\(14\)\ AT\(14\)\ AT\(14\)\ AT\(14\)\ \	56\	\	\	0\	\	\	\	\	\	\	\	\	\	\	\	\	
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:1978\:1220\	AC\(12\)\ \	12\	\	\	1\	test\_6\	GCAGTAAACAAAGGCAAAGGG\	test\_1\	CCTGGGCAGAGGTGTTCC\	AC\(12\)\ \	12\	1\	\	\	1\	1\	1\	1
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:5626\:1554\	AT\(14\)\ AC\(16\)\ AC\(16\)\ AT\(12\)\ \	58\	\	\	0\	\	\	\	\	\	\	\	\	\	\	\	\	
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:5879\:1238\	AT\(12\)\ \	12\	\	\	0\	\	\	\	\	\	\	\	\	\	\	\	\	
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:6204\:1090\	TC\(12\)\ \	12\	\	\	0\	\	\	\	\	\	\	\	\	\	\	\	\	
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8044\:1926\	AT\(12\)\ \	12\	\	\	0\	\	\	\	\	\	\	\	\	\	\	\	\	
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8157\:1636\	AC\(12\)\ \	12\	\	\	1\	test\_3\	AAGTACAGTGGGGAGGCTGG\	test\_4\	TTTTCTACACAGCTCAAGTAGCCC\	AC\(12\)\ \	12\	1\	\	\	1\	1\	1\	1
-ILLUMINA\-545855\:49\:FC61RLR\:2\:1\:8899\:1514\	AC\(12\)\ AC\(12\)\ \	24\	\	\	1\	test\_8\	TCTTTATCTAAACACATCCTGAAATACC\	test\_5\	AAACGCAATTATTTTGAGATGTCC\	AC\(12\)\ AC\(12\)\ \	24\	1\	\	\	1\	2\	1\	1