# HG changeset patch
# User dfornika
# Date 1582331435 0
# Node ID 647eedfd155646135c2fa7d6ad9ccfea51b7f14e
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/data_managers/data_manager_mash_sketch_builder/ commit 20558d9de7b6dd375a8835698f231cbc0c83446d-dirty"
diff -r 000000000000 -r 647eedfd1556 data_manager/mash_sketch_builder.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/data_manager/mash_sketch_builder.py Sat Feb 22 00:30:35 2020 +0000
@@ -0,0 +1,105 @@
+#!/usr/bin/env python
+"""Galaxy data manager: build a Mash sketch and emit its data table entry."""
+
+import argparse
+import errno
+import json
+import os
+import subprocess
+import sys
+import uuid
+
+
+DATA_TABLE_NAME = "mash_sketches"
+
+
+def mash_sketch(mash_sketch_args, sketch_name, target_directory, data_table_name=DATA_TABLE_NAME):
+    """Run ``mash sketch`` and return the data manager JSON payload.
+
+    mash_sketch_args -- dict with "kmer_size" and "sketch_size"; optional
+        "threads" (defaults to 1) and "fasta" (input sequence file).
+    sketch_name -- display name stored in the data table row.
+    target_directory -- existing directory; a UUID-named sub-directory is
+        created in it and mash is run with it as the working directory.
+    data_table_name -- name of the data table the row is filed under.
+
+    Raises subprocess.CalledProcessError if mash exits with a non-zero status.
+    """
+    UUID = str(uuid.uuid4())
+
+    os.mkdir(os.path.join(target_directory, UUID))
+
+    # Kept relative to target_directory: it is both the -o prefix (mash runs
+    # with cwd=target_directory) and the "path" value written to the table.
+    # mash appends ".msh" to this prefix when writing the sketch.
+    sketch_path = os.path.join(UUID, "sketch")
+
+    args = [
+        '-p', str(mash_sketch_args.get("threads", 1)),
+        '-k', str(mash_sketch_args["kmer_size"]),
+        '-s', str(mash_sketch_args["sketch_size"]),
+        '-o', sketch_path,
+    ]
+
+    # NOTE(review): mash sketch needs at least one input file; confirm the
+    # tool wrapper supplies it via --fasta.
+    fasta = mash_sketch_args.get("fasta")
+    if fasta:
+        # Absolute path, because mash is run from target_directory.
+        args.append(os.path.abspath(fasta))
+
+    subprocess.check_call(['mash', 'sketch'] + args, cwd=target_directory)
+
+    data_table_entry = {
+        'data_tables': {
+            data_table_name: [
+                {
+                    "value": UUID,
+                    "name": sketch_name,
+                    "path": sketch_path,
+                }
+            ]
+        }
+    }
+
+    return data_table_entry
+
+
+def main():
+    """Parse the command line, build the sketch and rewrite the data manager JSON."""
+    parser = argparse.ArgumentParser()
+    parser.add_argument('data_manager_json')
+    parser.add_argument('--fasta', dest='fasta', default=None, help='FASTA file to sketch')
+    parser.add_argument('--kmer-size', dest='kmer_size', type=int, default=21, help='k-mer size (1-32)')
+    parser.add_argument('--sketch-size', dest='sketch_size', type=int, default=1000, help='sketch size')
+    parser.add_argument('--threads', dest='threads', type=int, default=1, help='threads')
+    parser.add_argument('--sketch-name', dest='sketch_name', help='Name for sketch')
+    args = parser.parse_args()
+
+    with open(args.data_manager_json) as fh:
+        data_manager_input = json.load(fh)
+
+    target_directory = data_manager_input['output_data'][0]['extra_files_path']
+
+    try:
+        os.mkdir(target_directory)
+    except OSError as exc:
+        # An already existing directory is fine; anything else is an error.
+        if not (exc.errno == errno.EEXIST and os.path.isdir(target_directory)):
+            raise
+
+    mash_sketch_args = {
+        "kmer_size": args.kmer_size,
+        "sketch_size": args.sketch_size,
+        "threads": args.threads,
+        "fasta": args.fasta,
+    }
+
+    data_manager_output = mash_sketch(mash_sketch_args, args.sketch_name, target_directory)
+
+    with open(args.data_manager_json, 'w') as fh:
+        fh.write(json.dumps(data_manager_output, sort_keys=True))
+
+
+if __name__ == "__main__":
+    main()
diff -r 000000000000 -r 647eedfd1556 data_manager/mash_sketch_builder.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/data_manager/mash_sketch_builder.xml Sat Feb 22 00:30:35 2020 +0000
@@ -0,0 +1,93 @@
+
+
+
+
+
+
+
+
+
+
+ database builder
+
+ mash
+ python
+
+ mash --version
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ 10.1186/s13059-016-0997-x
+
+
diff -r 000000000000 -r 647eedfd1556 data_manager_conf.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/data_manager_conf.xml Sat Feb 22 00:30:35 2020 +0000
@@ -0,0 +1,18 @@
+
+
+
+
+
+
+
+
+ ${path}
+ mash_sketches/${path}
+
+ ${GALAXY_DATA_MANAGER_DATA_PATH}/mash_sketches/${path}
+ abspath
+
+
+
+
+
diff -r 000000000000 -r 647eedfd1556 test-data/mash_sketch_data_manager.json
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/mash_sketch_data_manager.json Sat Feb 22 00:30:35 2020 +0000
@@ -0,0 +1,1 @@
+{"data_tables": {"mash_sketches": [{"name": "sketch", "path": "sketch", "value": "sketch"}]}}
diff -r 000000000000 -r 647eedfd1556 test-data/test_assembly.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_assembly.fasta Sat Feb 22 00:30:35 2020 +0000
@@ -0,0 +1,3 @@
+>test
+GCATGTCGATCTGTGTGCTAGTCGTAGTCGATCGATCTGATCGATCTGTCAGTCAGTAGT
+CTCAGCGATGCATTATTATATTATATTATCGATCGATGCTGATCGATTATATTCGATCTG
diff -r 000000000000 -r 647eedfd1556 tool-data/mash_sketches.loc.sample
diff -r 000000000000 -r 647eedfd1556 tool_data_table_conf.xml.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.sample Sat Feb 22 00:30:35 2020 +0000
@@ -0,0 +1,8 @@
+
+
+
+
+ value, name, path
+
+
+