Mercurial > repos > dfornika > micall_lite
annotate resistance.py @ 29:4ff24c044fed draft default tip
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit 9d563c366233a5de79429ac1fa8f994f5d8f785d-dirty"
| author | dfornika | 
|---|---|
| date | Thu, 27 Feb 2020 22:31:32 +0000 | 
| parents | 033e0a3674bc | 
| children | 
| rev | line source | 
|---|---|
| 23 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 1 #!/usr/bin/env python | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 2 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 3 from __future__ import print_function | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 4 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 5 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 6 import argparse | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 7 from pprint import pprint | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 8 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 9 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 10 import yaml | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 11 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 12 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 13 HCV_RULES_VERSION = "1.8" | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 14 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 15 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 16 def load_rules_config(rules_config, genotype, backup_genotype=None): | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 17 rules = { | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 18 'drug_class': {}, | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 19 'drugs': {} | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 20 } | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 21 rules['alg_name'] = 'HCV_RULES' | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 22 rules['alg_version'] = HCV_RULES_VERSION | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 23 rules['level_def'] = { | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 24 '-1': 'Resistance Interpretation Not Available', | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 25 '0': 'Sequence does not meet quality-control standards', | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 26 '1': 'Likely Susceptible', | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 27 '2': 'Not Indicated', | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 28 '3': 'Mutations Detected; Effect Unknown', | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 29 '4': 'Resistance Possible', | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 30 '5': 'Resistance Likely' | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 31 } | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 32 rules['global_range'] = [('-INF', '3', '1'), ('4', '7', '4'), ('8', 'INF', '5')] | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 33 for drug in rules_config: | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 34 drug_code = drug['code'] | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 35 drug_rules = [] | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 36 region = None | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 37 for genotype_config in drug['genotypes']: | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 38 region = genotype_config['region'] | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 39 rule_text = genotype_config['rules'] | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 40 if genotype_config['genotype'] == genotype: | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 41 rules['gene_def'][genotype_config['reference']] = [region] | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 42 break | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 43 elif genotype_config['genotype'] == backup_genotype: | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 44 rules['gene_def'].setdefault(genotype_config['reference'], [region]) | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 45 break | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 46 else: | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 47 rule_text = 'SCORE FROM ( TRUE => "Not available" )' | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 48 drug_rules.append((rule_text, [('scorerange', 'useglobalrange')])) | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 49 try: | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 50 rules['drug_class'][region].append(drug_code) | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 51 except KeyError: | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 52 rules['drug_class'][region] = [drug_code] | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 53 rules['drugs'][drug_code] = (drug['name'], drug_rules) | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 54 return rules | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 55 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 56 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 57 def main(args): | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 58 with open(args.rules) as f: | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 59 rules = load_rules_config(yaml.safe_load(f), None) | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 60 pprint(rules) | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 61 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 62 | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 63 if __name__ == '__main__': | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 64 parser = argparse.ArgumentParser() | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 65 parser.add_argument("consensus", help="Consensus fasta") | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 66 parser.add_argument("--rules", help="Rules file (yaml)") | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 67 args = parser.parse_args() | 
| 
033e0a3674bc
"planemo upload for repository https://github.com/public-health-bioinformatics/galaxy_tools/blob/master/tools/micall-lite commit d5fd8bc70d31d99c2354f1e8ec2e34d147cfa048-dirty"
 dfornika parents: diff
changeset | 68 main(args) | 
