# HG changeset patch # User davidvanzessen # Date 1458302570 14400 # Node ID 1558fbbc19efbb04dff442ff0706052d0a2415a3 # Parent 79696e273853a1c9268a0f6be30ab8ca407c9f54 Uploaded diff -r 79696e273853 -r 1558fbbc19ef gene_identification.py --- a/gene_identification.py Wed Mar 16 11:18:55 2016 -0400 +++ b/gene_identification.py Fri Mar 18 08:02:50 2016 -0400 @@ -40,10 +40,12 @@ print "Number of input sequences:", len(dic) +#old cm sequence: gggagtgcatccgccccaacccttttccccctcgtctcctgtgagaattccc + #lambda/kappa reference sequence searchstrings = {"ca": "catccccgaccagccccaaggtcttcccgctgagcctctgcagcacccagccagatgggaacgtggtcatcgcctgcctgg", "cg": "ctccaccaagggcccatcggtcttccccctggcaccctcctccaagagcacctctgggggcacagcggccctgggctgcctggtcaaggactacttccccgaaccggtgacggtgtcgtggaactcaggcgccctgaccag", - "cm": "gggagtgcatccgccccaacccttttccccctcgtctcctgtgagaattccc"} + "cm": "gggagtgcatccgccccaacc"} #new (shorter) cm sequence compiledregex = {"ca": [], "cg": [],