Repository 'matchms'
hg clone https://eddie.galaxyproject.org/repos/recetox/matchms

Changeset 10:c3dd958cc4a5 (2022-01-28)
Previous changeset 9:f06923bdd2f2 (2022-01-10) Next changeset 11:ba9410f612bc (2022-03-17)
Commit message:
"planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit 9bc547872c98a9c13c561d15e8990fe82bdc0e72"
added:
macros.xml
matchms_similarity.xml
matchms_similarity_wrapper.py
test-data/filtering/clean_metadata.msp
test-data/filtering/default_filters.msp
test-data/filtering/input.msp
test-data/filtering/mz_range.msp
test-data/filtering/normalise_intensities.msp
test-data/filtering/relative_intensity.msp
test-data/formatter/test2_threshold_formatting.tsv
test-data/formatter/test2_topk_formatting.tsv
test-data/similarity/fill.mgf
test-data/similarity/fill.msp
test-data/similarity/matches_test1_out.tsv
test-data/similarity/matches_test3_out.tsv
test-data/similarity/matches_test4_out.tsv
test-data/similarity/matches_test5_out.tsv
test-data/similarity/recetox_gc-ei_ms_20201028.msp
test-data/similarity/recetox_gc-ei_ms_20201028_with_precursor_mz.msp
test-data/similarity/scores_test1_out.tsv
test-data/similarity/scores_test3_out.tsv
test-data/similarity/scores_test4_out.tsv
test-data/similarity/scores_test5_out.tsv
removed:
matchms.xml
matchms_wrapper.py
test-data/fill.mgf
test-data/fill.msp
test-data/matches_test1_out.tsv
test-data/matches_test3_out.tsv
test-data/matches_test4_out.tsv
test-data/matches_test5_out.tsv
test-data/matches_test6_out.tsv
test-data/matches_test7_out.tsv
test-data/recetox_gc-ei_ms_20201028.msp
test-data/scores_test1_out.tsv
test-data/scores_test3_out.tsv
test-data/scores_test4_out.tsv
test-data/scores_test5_out.tsv
test-data/scores_test6_out.tsv
test-data/scores_test7_out.tsv
test-data/test2_threshold_formatting.tsv
test-data/test2_topk_formatting.tsv
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Fri Jan 28 16:22:06 2022 +0000
[
@@ -0,0 +1,70 @@
+<macros>
+    <token name="@TOOL_VERSION@">0.11.0</token>
+
+    <xml name="creator">
+        <creator>
+            <person
+                givenName="Helge"
+                familyName="Hecht"
+                url="https://github.com/hechth"
+                identifier="0000-0001-6744-996X" />
+            <organization
+                url="https://www.recetox.muni.cz/"
+                email="GalaxyToolsDevelopmentandDeployment@space.muni.cz"
+                name="RECETOX MUNI" />
+        </creator>
+    </xml>
+
+    <token name="@HELP_matchms@">
+        <![CDATA[
+            Documentation
+                For documentation on the tool see https://github.com/matchms/matchms/blob/master/README.rst
+                and https://matchms.readthedocs.io/en/latest/.
+
+            Upstream Tools
+                +-----------+---------------+--------+-----------+
+                | Name      | Output File   | Format | Parameter |
+                +===========+===============+========+===========+
+                | RAMClustR | Mass spectra  | msp    | references|
+                +-----------+---------------+--------+-----------+
+                | RAMClustR | Mass spectra  | msp    | queries   |
+                +-----------+---------------+--------+-----------+
+
+            Downstream Tools
+                The outputs are two tsv datasets: one containing the similarity scores and the other the number of matched peaks.
+        ]]>
+    </token>
+
+    <token name="@HELP_formatter@">
+        <![CDATA[
+            Usage
+                This tool creates user-friendly tables from the data matrices produced by matchms.
+                The tool can be operated in two modes based on (i) thresholds or (ii) top k matches.
+
+            Input Table Format
+                The tool expects two data matrices with the format as depicted below.
+                The tool expects the reference compound labels as row labels and the query labels as column labels (as output by matchms).
+
+                +----------+------+------+-----+
+                |          | C001 | C002 | ... |
+                +==========+======+======+=====+
+                | Perylene | 0.1  | 0.0  | ... |
+                +----------+------+------+-----+
+                | Glycine  | 0.5  | 0.34 | ... |
+                +----------+------+------+-----+
+                |   ...    | ...  | ...  | ... |
+                +----------+------+------+-----+
+
+            Output Table Format
+                +----------+-----------+---------+--------+
+                | query    | reference | matches | scores |
+                +==========+===========+=========+========+
+                | C001     | Glycine   |      6  | 0.5    |
+                +----------+-----------+---------+--------+
+                | C002     | Glycine   |     3   | 0.34   |
+                +----------+-----------+---------+--------+
+                |   ...    | ...       | ...     | ...    |
+                +----------+-----------+---------+--------+
+        ]]>
+    </token>
+</macros>
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 matchms.xml
--- a/matchms.xml Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b'@@ -1,148 +0,0 @@\n-<tool id="matchms" name="matchMS" version="0.9.2+galaxy1">\n-    <description>calculate the similarity score and matched peaks</description>\n-    <requirements>\n-        <requirement type="package" version="0.9.2">matchms</requirement>\n-        <requirement type="package" version="1.1.4">pandas</requirement>\n-    </requirements>\n-\n-    <environment_variables>\n-        <environment_variable name="MPLCONFIGDIR">/tmp</environment_variable>\n-    </environment_variables>\n-\n-    <command detect_errors="exit_code"><![CDATA[\n-        sh ${matchms_python_cli}\n-    ]]> </command>\n-\n-    <configfiles>\n-        <configfile name="matchms_python_cli">\n-            python3 ${__tool_directory__}/matchms_wrapper.py \\\n-            $default_filters \\\n-            $normalize_intensities \\\n-            #if $symmetric.is_symmetric\n-                -s \\\n-            #else\n-                --ref "$references" \\\n-                --ref_format "$references.ext" \\\n-            #end if\n-            "$queries" \\\n-            "$queries.ext" \\\n-            "$similarity_metric" \\\n-            "$algorithm.tolerance" \\\n-            "$algorithm.mz_power" \\\n-            "$algorithm.intensity_power" \\\n-            "$similarity_scores" \\\n-            "$similarity_matches"\n-        </configfile>\n-    </configfiles>\n-\n-    <inputs>\n-        <param label="Queries spectra" name="queries" type="data" format="msp,mgf" help="Query mass spectra to match against references." />\n-        <conditional name="symmetric">\n-            <param name="is_symmetric" label="Symmetric" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="false" />\n-        <when value="FALSE">\n-            <param label="Reference spectra" name="references" type="data" format="msp,mgf" help="Reference mass spectra to match against as library." 
/>\n-        </when>\n-        </conditional>\n-        <param label="Similarity metric" name="similarity_metric" type="select" display="radio" help="Similarity metric to use for score computation.">\n-            <option value="CosineGreedy" selected="true">CosineGreedy</option>\n-            <option value="CosineHungarian">CosineHungarian</option>\n-            <option value="ModifiedCosine">ModifiedCosine </option>\n-        </param>\n-\n-        <section name="algorithm" title="Algorithm Parameters" expanded="true">\n-            <param label="tolerance" name="tolerance" type="float" value="0.1" help="Peaks will be considered a match when less than tolerance apart. Absolute m/z value, not in ppm." />\n-            <param label="mz_power" name="mz_power" type="float" value="0.0" help="The power to raise mz to in the cosine function." />\n-            <param label="intensity_power" name="intensity_power" type="float" value="1.0" help="The power to raise intensity to in the cosine function." 
/>\n-        </section>\n-        <param name="default_filters" label="Default Filters" type="boolean" truevalue="-f" falsevalue="" checked="false"\n-            help="Apply default filters (make_charge_int, make_ionmode_lowercase, set_ionmode_na_when_missing, add_compound_name,\n-             derive_adduct_from_name, derive_formula_from_name, clean_compound_name, add_precursor_mz, derive_ionmode, correct_charge)."\n-        />\n-        <param name="normalize_intensities" label="Normalize Intensities" type="boolean" truevalue="-n" falsevalue="" checked="false" \n-            help="Filter to normalize intensities."/>\n-\n-    </inputs>\n-\n-    <outputs>\n-        <data label="$similarity_metric scores of ${on_string}" name="similarity_scores" format="tsv" />\n-        <data label="$similarity_metric matches of ${on_string}" name="similarity_matches" format="tsv" />\n-    </outputs>\n-\n-    <tests>\n-        <test>\n-            <param name="references" value="fill.mgf" ftype="mgf"/>\n-            <param name="queries" value="fill.msp" ftype="msp"/>\n-            <param name="similarity_metric" value="CosineGreedy"/>\n-            <output name="similarity_scores" file="scores_test1'..b'</test>\n-        <test>\n-            <param name="references" value="recetox_gc-ei_ms_20201028.msp" ftype="msp"/>\n-            <param name="queries" value="fill.msp" ftype="msp"/>\n-            <param name="similarity_metric" value="CosineGreedy"/>\n-            <output name="similarity_scores" file="scores_test2_out.tsv" ftype="tsv" checksum="md5$d2a5a01d9980636ce6a246d68834b84e"/>\n-            <output name="similarity_matches" file="matches_test2_out.tsv" ftype="tsv" checksum="md5$28dc16ce45105234437e53d59e240046"/>\n-        </test>\n-        <test>\n-            <param name="references" value="recetox_gc-ei_ms_20201028.msp" ftype="msp"/>\n-            <param name="queries" value="fill.msp" ftype="msp"/>\n-            <param name="similarity_metric" 
value="CosineHungarian"/>\n-            <param name="default_filters" value="TRUE" />\n-            <output name="similarity_scores" file="scores_test3_out.tsv" ftype="tsv" checksum="md5$1341369778036e0a267ff723f8cfca9c"/>\n-            <output name="similarity_matches" file="matches_test3_out.tsv" ftype="tsv" checksum="md5$28dc16ce45105234437e53d59e240046"/>\n-        </test>\n-        <test>\n-            <param name="references" value="recetox_gc-ei_ms_20201028.msp" ftype="msp"/>\n-            <param name="queries" value="recetox_gc-ei_ms_20201028.msp" ftype="msp"/>\n-            <param name="similarity_metric" value="ModifiedCosine"/>\n-            <output name="similarity_scores" file="scores_test4_out.tsv" ftype="tsv"/>\n-            <output name="similarity_matches" file="matches_test4_out.tsv" ftype="tsv"/>\n-        </test>\n-        <test>\n-            <param name="queries" value="fill.msp" ftype="msp"/>\n-            <param name="similarity_metric" value="CosineHungarian"/>\n-            <param name="is_symmetric" value="TRUE"/>\n-            <output name="similarity_scores" file="scores_test5_out.tsv" ftype="tsv"/>\n-            <output name="similarity_matches" file="matches_test5_out.tsv" ftype="tsv"/>\n-        </test>\n-        <test>\n-            <param name="references" value="recetox_gc-ei_ms_20201028.msp" ftype="msp"/>\n-            <param name="queries" value="recetox_gc-ei_ms_20201028.msp" ftype="msp"/>\n-            <param name="similarity_metric" value="ModifiedCosine"/>\n-            <param name="normalize_intensities" value="TRUE"/>\n-            <output name="similarity_scores" file="scores_test6_out.tsv" ftype="tsv"/>\n-            <output name="similarity_matches" file="matches_test6_out.tsv" ftype="tsv"/>\n-        </test>\n-            <test>\n-            <param name="references" value="recetox_gc-ei_ms_20201028.msp" ftype="msp"/>\n-            <param name="queries" value="fill.msp" ftype="msp"/>\n-            <param 
name="normalize_intensities" value="TRUE"/>\n-            <param name="similarity_metric" value="CosineHungarian"/>\n-            <output name="similarity_scores" file="scores_test7_out.tsv" ftype="tsv"/>\n-            <output name="similarity_matches" file="matches_test7_out.tsv" ftype="tsv"/>\n-        </test>\n-    </tests>\n-\n-    <help><![CDATA[\n-    Documentation\n-        For documentation on the tool see https://github.com/matchms/matchms/blob/master/README.rst and https://matchms.readthedocs.io/en/latest/.\n-\n-    Upstream Tools\n-        +-----------+---------------+--------+-----------+\n-        | Name      | Output File   | Format | Parameter |\n-        +===========+===============+========+===========+\n-        | RAMClustR | Mass spectra  | msp    | references|\n-        +-----------+---------------+--------+-----------+\n-        | RAMClustR | Mass spectra  | msp    | queries   |\n-        +-----------+---------------+--------+-----------+\n-\n-    Downstream Tools\n-        The outputs are two tsv datasets. One containing the similarity scores and the other number of matched peaks.\n-    ]]></help>\n-\n-\n-    <citations>\n-        <citation type="doi">10.5281/zenodo.4589154</citation>\n-        <citation type="doi">10.21105/joss.02411</citation>\n-    </citations>\n-</tool>\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 matchms_similarity.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/matchms_similarity.xml Fri Jan 28 16:22:06 2022 +0000
[
@@ -0,0 +1,129 @@
+<tool id="matchms" name="matchMS similarity" version="@TOOL_VERSION@+galaxy1">
+    <description>calculate the similarity score and matched peaks</description>
+
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+    <expand macro="creator"/>
+
+    <requirements>
+        <requirement type="package" version="@TOOL_VERSION@">matchms</requirement>
+        <requirement type="package" version="1.1.4">pandas</requirement>
+    </requirements>
+
+    <environment_variables>
+        <environment_variable name="MPLCONFIGDIR">/tmp</environment_variable>
+    </environment_variables>
+
+    <!-- The command only launches the generated config file below; paths are
+         single-quoted so that whitespace in the job or tool directory does not
+         split them into several shell words. -->
+    <command detect_errors="exit_code"><![CDATA[
+        sh '${matchms_python_cli}'
+    ]]> </command>
+
+    <configfiles>
+        <!-- Shell script assembling the wrapper call: optional reference
+             arguments first, followed by the positional arguments in the
+             order the wrapper's argument parser declares them. -->
+        <configfile name="matchms_python_cli">
+            python3 '${__tool_directory__}/matchms_similarity_wrapper.py' \
+            #if $symmetric.is_symmetric
+            -s \
+            #else
+            --ref "$references" \
+            --ref_format "$references.ext" \
+            #end if
+            "$queries" \
+            "$queries.ext" \
+            "$similarity_metric" \
+            "$algorithm.tolerance" \
+            "$algorithm.mz_power" \
+            "$algorithm.intensity_power" \
+            "$similarity_scores" \
+            "$similarity_matches"
+        </configfile>
+    </configfiles>
+
+    <inputs>
+        <param label="Queries spectra" name="queries" type="data" format="msp,mgf"
+               help="Query mass spectra to match against references."/>
+        <conditional name="symmetric">
+            <param name="is_symmetric" label="Symmetric" type="boolean" truevalue="TRUE" falsevalue="FALSE"
+                   checked="false"/>
+            <when value="FALSE">
+                <param label="Reference spectra" name="references" type="data" format="msp,mgf"
+                       help="Reference mass spectra to match against as library."/>
+            </when>
+        </conditional>
+        <param label="Similarity metric" name="similarity_metric" type="select" display="radio"
+               help="Similarity metric to use for score computation.">
+            <option value="CosineGreedy" selected="true">CosineGreedy</option>
+            <option value="CosineHungarian">CosineHungarian</option>
+            <option value="ModifiedCosine">ModifiedCosine</option>
+        </param>
+
+        <section name="algorithm" title="Algorithm Parameters" expanded="true">
+            <param label="tolerance" name="tolerance" type="float" value="0.1"
+                   help="Peaks will be considered a match when less than tolerance apart. Absolute m/z value, not in ppm."/>
+            <param label="mz_power" name="mz_power" type="float" value="0.0"
+                   help="The power to raise mz to in the cosine function."/>
+            <param label="intensity_power" name="intensity_power" type="float" value="1.0"
+                   help="The power to raise intensity to in the cosine function."/>
+        </section>
+    </inputs>
+
+    <outputs>
+        <data label="$similarity_metric scores of ${on_string}" name="similarity_scores" format="tsv"/>
+        <data label="$similarity_metric matches of ${on_string}" name="similarity_matches" format="tsv"/>
+    </outputs>
+
+    <tests>
+        <test>
+            <param name="references" value="similarity/fill.mgf" ftype="mgf"/>
+            <param name="queries" value="similarity/fill.msp" ftype="msp"/>
+            <param name="similarity_metric" value="CosineGreedy"/>
+            <output name="similarity_scores" file="similarity/scores_test1_out.tsv" ftype="tsv"
+                    checksum="md5$1aff8d0777e2f4e565be2b1b393547ef"/>
+            <output name="similarity_matches" file="similarity/matches_test1_out.tsv" ftype="tsv"
+                    checksum="md5$aab26ef4a0e80a53699832db72c06340"/>
+        </test>
+        <test>
+            <param name="references" value="similarity/recetox_gc-ei_ms_20201028.msp" ftype="msp"/>
+            <param name="queries" value="similarity/fill.msp" ftype="msp"/>
+            <param name="similarity_metric" value="CosineGreedy"/>
+            <output name="similarity_scores" file="scores_test2_out.tsv" ftype="tsv"
+                    checksum="md5$d2a5a01d9980636ce6a246d68834b84e"/>
+            <output name="similarity_matches" file="matches_test2_out.tsv" ftype="tsv"
+                    checksum="md5$28dc16ce45105234437e53d59e240046"/>
+        </test>
+        <test>
+            <param name="references" value="similarity/recetox_gc-ei_ms_20201028.msp" ftype="msp"/>
+            <param name="queries" value="similarity/fill.msp" ftype="msp"/>
+            <param name="similarity_metric" value="CosineHungarian"/>
+            <output name="similarity_scores" file="similarity/scores_test3_out.tsv" ftype="tsv"
+                    checksum="md5$1341369778036e0a267ff723f8cfca9c"/>
+            <output name="similarity_matches" file="similarity/matches_test3_out.tsv" ftype="tsv"
+                    checksum="md5$28dc16ce45105234437e53d59e240046"/>
+        </test>
+        <test>
+            <param name="references" value="similarity/recetox_gc-ei_ms_20201028_with_precursor_mz.msp" ftype="msp"/>
+            <param name="queries" value="similarity/recetox_gc-ei_ms_20201028_with_precursor_mz.msp" ftype="msp"/>
+            <param name="similarity_metric" value="ModifiedCosine"/>
+            <output name="similarity_scores" file="similarity/scores_test4_out.tsv" ftype="tsv"/>
+            <output name="similarity_matches" file="similarity/matches_test4_out.tsv" ftype="tsv"/>
+        </test>
+        <test>
+            <param name="queries" value="similarity/fill.msp" ftype="msp"/>
+            <param name="similarity_metric" value="CosineHungarian"/>
+            <param name="is_symmetric" value="TRUE"/>
+            <output name="similarity_scores" file="similarity/scores_test5_out.tsv" ftype="tsv"/>
+            <output name="similarity_matches" file="similarity/matches_test5_out.tsv" ftype="tsv"/>
+        </test>
+    </tests>
+
+    <help>
+        <![CDATA[
+            @HELP_matchms@
+        ]]>
+    </help>
+
+    <citations>
+        <citation type="doi">10.5281/zenodo.4589154</citation>
+        <citation type="doi">10.21105/joss.02411</citation>
+    </citations>
+</tool>
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 matchms_similarity_wrapper.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/matchms_similarity_wrapper.py Fri Jan 28 16:22:06 2022 +0000
[
@@ -0,0 +1,100 @@
+import argparse
+import sys
+
+from matchms import calculate_scores
+from matchms.importing import load_from_mgf, load_from_msp
+from matchms.similarity import (
+    CosineGreedy,
+    CosineHungarian,
+    ModifiedCosine,
+)
+from pandas import DataFrame
+
+
+def convert_precursor_mz(spectrum):
+    """
+    Ensure the spectrum carries a numeric precursor m/z, which the ModifiedCosine similarity metric needs.
+
+    The "precursor_mz" metadata entry is converted to float and written back to the spectrum, which is then
+    returned. A ValueError is raised when the entry is absent.
+    """
+
+    # Guard clause: without the entry there is nothing to convert.
+    if "precursor_mz" not in spectrum.metadata:
+        raise ValueError("Precursor_mz missing. Apply 'add_precursor_mz' filter first.")
+
+    # Work on the metadata object and assign it back as a whole.
+    updated = spectrum.metadata
+    updated["precursor_mz"] = float(updated["precursor_mz"])
+    spectrum.metadata = updated
+    return spectrum
+
+
+def main(argv):
+    """
+    Compute similarity scores and matched-peak counts between query and reference spectra.
+
+    :param argv: command-line arguments without the program name (e.g. ``sys.argv[1:]``).
+    :return: 0 after the outputs were written, -1 if the similarity metric name is not recognised.
+    :raises ValueError: if a spectra file format is neither 'msp' nor 'mgf', or (raised by
+        convert_precursor_mz) if a spectrum lacks precursor_mz while ModifiedCosine is selected.
+    """
+    parser = argparse.ArgumentParser(description="Compute MSP similarity scores")
+    parser.add_argument("-s", dest="symmetric", action='store_true', help="Computation is symmetric.")
+    parser.add_argument("--ref", dest="references_filename", type=str, help="Path to reference spectra library.")
+    parser.add_argument("--ref_format", dest="references_format", type=str, help="Reference spectra library file format.")
+    parser.add_argument("queries_filename", type=str, help="Path to query spectra.")
+    parser.add_argument("queries_format", type=str, help="Query spectra file format.")
+    parser.add_argument("similarity_metric", type=str, help='Metric to use for matching.')
+    parser.add_argument("tolerance", type=float, help="Tolerance to use for peak matching.")
+    parser.add_argument("mz_power", type=float, help="The power to raise mz to in the cosine function.")
+    parser.add_argument("intensity_power", type=float, help="The power to raise intensity to in the cosine function.")
+    parser.add_argument("output_filename_scores", type=str, help="Path where to store the output .tsv scores.")
+    parser.add_argument("output_filename_matches", type=str, help="Path where to store the output .tsv matches.")
+    # Parse the arguments handed to main() instead of implicitly reading sys.argv,
+    # so the function honours its parameter and can be called programmatically.
+    args = parser.parse_args(argv)
+
+    if args.queries_format == 'msp':
+        queries_spectra = list(load_from_msp(args.queries_filename))
+    elif args.queries_format == 'mgf':
+        queries_spectra = list(load_from_mgf(args.queries_filename))
+    else:
+        raise ValueError(f'File format {args.queries_format} not supported for query spectra.')
+
+    # In symmetric mode no reference library is loaded; the queries are scored
+    # against themselves further below.
+    if args.symmetric:
+        reference_spectra = []
+    else:
+        if args.references_format == 'msp':
+            reference_spectra = list(load_from_msp(args.references_filename))
+        elif args.references_format == 'mgf':
+            reference_spectra = list(load_from_mgf(args.references_filename))
+        else:
+            raise ValueError(f'File format {args.references_format} not supported for reference spectra library.')
+
+    if args.similarity_metric == 'CosineGreedy':
+        similarity_metric = CosineGreedy(args.tolerance, args.mz_power, args.intensity_power)
+    elif args.similarity_metric == 'CosineHungarian':
+        similarity_metric = CosineHungarian(args.tolerance, args.mz_power, args.intensity_power)
+    elif args.similarity_metric == 'ModifiedCosine':
+        similarity_metric = ModifiedCosine(args.tolerance, args.mz_power, args.intensity_power)
+        # ModifiedCosine needs a float precursor_mz on every spectrum.
+        reference_spectra = list(map(convert_precursor_mz, reference_spectra))
+        queries_spectra = list(map(convert_precursor_mz, queries_spectra))
+    else:
+        # Unknown metric name: signal failure through the return value.
+        return -1
+
+    print("Calculating scores...")
+    scores = calculate_scores(
+        references=queries_spectra if args.symmetric else reference_spectra,
+        queries=queries_spectra,
+        similarity_function=similarity_metric,
+        is_symmetric=args.symmetric
+    )
+
+    write_outputs(args, scores)
+    return 0
+
+
+def write_outputs(args, scores):
+    """
+    Store the score matrix and the matched-peaks matrix as tab-separated files.
+
+    Rows are labelled with the reference spectrum names and columns with the query spectrum names,
+    both read from the 'name' entry of each spectrum's metadata.
+    """
+    print("Storing outputs...")
+    column_labels = [query.metadata['name'] for query in scores.queries]
+    row_labels = [reference.metadata['name'] for reference in scores.references]
+
+    # Every record of scores.scores is indexed by "score" and "matches";
+    # each field goes to its own file, scores first.
+    targets = (
+        ("score", args.output_filename_scores),
+        ("matches", args.output_filename_matches),
+    )
+    for field, destination in targets:
+        matrix = [record[field] for record in scores.scores]
+        DataFrame(data=matrix, index=row_labels, columns=column_labels).to_csv(destination, sep='\t')
+
+
+if __name__ == "__main__":
+    # Propagate main()'s return value as the process exit status, so that a
+    # failure (-1 for an unrecognised similarity metric) is visible to the
+    # caller instead of the script always exiting with status 0.
+    sys.exit(main(argv=sys.argv[1:]))
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 matchms_wrapper.py
--- a/matchms_wrapper.py Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
@@ -1,98 +0,0 @@
-import argparse
-import sys
-
-from matchms import calculate_scores
-from matchms.filtering import add_precursor_mz, default_filters, normalize_intensities
-from matchms.importing import load_from_mgf, load_from_msp
-from matchms.similarity import (
-    CosineGreedy,
-    CosineHungarian,
-    ModifiedCosine,
-)
-from pandas import DataFrame
-
-
-def main(argv):
-    parser = argparse.ArgumentParser(description="Compute MSP similarity scores")
-    parser.add_argument("-f", dest="default_filters", action='store_true', help="Apply default filters")
-    parser.add_argument("-n", dest="normalize_intensities", action='store_true', help="Normalize intensities.")
-    parser.add_argument("-s", dest="symmetric", action='store_true', help="Computation is symmetric.")
-    parser.add_argument("--ref", dest="references_filename", type=str, help="Path to reference spectra library.")
-    parser.add_argument("--ref_format", dest="references_format", type=str, help="Reference spectra library file format.")
-    parser.add_argument("queries_filename", type=str, help="Path to query spectra.")
-    parser.add_argument("queries_format", type=str, help="Query spectra file format.")
-    parser.add_argument("similarity_metric", type=str, help='Metric to use for matching.')
-    parser.add_argument("tolerance", type=float, help="Tolerance to use for peak matching.")
-    parser.add_argument("mz_power", type=float, help="The power to raise mz to in the cosine function.")
-    parser.add_argument("intensity_power", type=float, help="The power to raise intensity to in the cosine function.")
-    parser.add_argument("output_filename_scores", type=str, help="Path where to store the output .tsv scores.")
-    parser.add_argument("output_filename_matches", type=str, help="Path where to store the output .tsv matches.")
-    args = parser.parse_args()
-
-    if args.queries_format == 'msp':
-        queries_spectra = list(load_from_msp(args.queries_filename))
-    elif args.queries_format == 'mgf':
-        queries_spectra = list(load_from_mgf(args.queries_filename))
-    else:
-        raise ValueError(f'File format {args.queries_format} not supported for query spectra.')
-
-    if args.symmetric:
-        reference_spectra = []
-    else:
-        if args.references_format == 'msp':
-            reference_spectra = list(load_from_msp(args.references_filename))
-        elif args.references_format == 'mgf':
-            reference_spectra = list(load_from_mgf(args.references_filename))
-        else:
-            raise ValueError(f'File format {args.references_format} not supported for reference spectra library.')
-
-    if args.default_filters is True:
-        print("Applying default filters...")
-        queries_spectra = list(map(default_filters, queries_spectra))
-        reference_spectra = list(map(default_filters, reference_spectra))
-
-    if args.normalize_intensities is True:
-        print("Normalizing intensities...")
-        queries_spectra = list(map(normalize_intensities, queries_spectra))
-        reference_spectra = list(map(normalize_intensities, reference_spectra))
-
-    if args.similarity_metric == 'CosineGreedy':
-        similarity_metric = CosineGreedy(args.tolerance, args.mz_power, args.intensity_power)
-    elif args.similarity_metric == 'CosineHungarian':
-        similarity_metric = CosineHungarian(args.tolerance, args.mz_power, args.intensity_power)
-    elif args.similarity_metric == 'ModifiedCosine':
-        similarity_metric = ModifiedCosine(args.tolerance, args.mz_power, args.intensity_power)
-        reference_spectra = list(map(add_precursor_mz, reference_spectra))
-        queries_spectra = list(map(add_precursor_mz, queries_spectra))
-    else:
-        return -1
-
-    print("Calculating scores...")
-    scores = calculate_scores(
-        references=queries_spectra if args.symmetric else reference_spectra,
-        queries=queries_spectra,
-        similarity_function=similarity_metric,
-        is_symmetric=args.symmetric
-    )
-
-    write_outputs(args, scores)
-    return 0
-
-
-def write_outputs(args, scores):
-    print("Storing outputs...")
-    query_names = [spectra.metadata['name'] for spectra in scores.queries]
-    reference_names = [spectra.metadata['name'] for spectra in scores.references]
-
-    # Write scores to dataframe
-    dataframe_scores = DataFrame(data=[entry["score"] for entry in scores.scores], index=reference_names, columns=query_names)
-    dataframe_scores.to_csv(args.output_filename_scores, sep='\t')
-
-    # Write number of matches to dataframe
-    dataframe_matches = DataFrame(data=[entry["matches"] for entry in scores.scores], index=reference_names, columns=query_names)
-    dataframe_matches.to_csv(args.output_filename_matches, sep='\t')
-
-
-if __name__ == "__main__":
-    main(argv=sys.argv[1:])
-    pass
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/fill.mgf
--- a/test-data/fill.mgf Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,2513 +0,0 @@\n-BEGIN IONS\n-NAME=C001\n-IONMODE=Negative\n-RETENTIONTIME=38.74\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=57\n-138.9121 10186226.0 \n-148.9337 1008656.0 \n-175.0641 26780143.0 \n-186.1095 2675456.0 \n-196.8658 21390430.0 \n-198.8647 21688594.0 \n-200.8848 7742528.0 \n-206.9034 26130980.0 \n-216.9205 32607700.0 \n-234.0134 2550129.0 \n-254.8252 23747536.0 \n-256.8215 31377637.0 \n-258.8237 15532799.0 \n-266.8652 9805546.0 \n-268.8537 3090354.0 \n-306.9914 3169316.0 \n-312.7841 10051801.0 \n-316.7777 10734168.0 \n-322.8157 6317648.0 \n-324.9549 8619910.0 \n-334.849 4178412.0 \n-342.8093 3285552.0 \n-349.9455 2050695.0 \n-350.9875 6150799.0 \n-351.941 1965882.0 \n-366.8281 3253770.0 \n-370.7418 9765463.0 \n-372.7383 19374863.0 \n-382.8218 12815572.0 \n-384.8177 8311500.0 \n-392.7685 10913351.0 \n-413.2664 3965867.0 \n-426.7772 5431633.0 \n-428.7834 8554675.0 \n-434.7287 9943329.0 \n-436.8161 3705247.0 \n-440.7322 10603010.0 \n-442.7401 8271752.0 \n-450.7016 8762673.0 \n-460.7076 4528973.0 \n-462.7862 2123666.0 \n-484.7242 4273989.0 \n-486.7743 4886062.0 \n-488.6825 12267966.0 \n-492.744 7662344.0 \n-494.8953 7188793.0 \n-498.8794 6811405.0 \n-500.8484 6520691.0 \n-502.7832 3567833.0 \n-510.763 4989757.0 \n-518.7415 4243468.0 \n-546.6093 7177067.0 \n-550.6949 6104789.0 \n-566.5977 5171811.0 \n-612.6927 2005587.0 \n-676.6436 1982714.0 \n-800.4451 2792137.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C002\n-IONMODE=Negative\n-RETENTIONTIME=520.25\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=35\n-131.1733 1971789.0 \n-267.2688 6103973.0 \n-279.0196 1946255.0 \n-289.6491 46498377.0 \n-301.1565 15185412.0 \n-309.1649 18045974.0 \n-310.1623 295359836.0 \n-311.1658 13124727.0 \n-312.0296 38757284.0 \n-330.6757 12666597.0 \n-525.375 1073323842.0 \n-526.3783 181668883.0 \n-527.3812 23642795.0 \n-551.3321 111616808.0 \n-552.3348 28340614.0 \n-553.3314 2609936.0 \n-562.3269 7538206.0 \n-578.2905 7578406.0 \n-619.3008 4742103.0 \n-624.296 
11790213.0 \n-813.5403 25060147.0 \n-814.5336 5865975.0 \n-955.1171 2322927.0 \n-1047.7378 150394804.0 \n-1048.7399 90978863.0 \n-1049.7432 29946438.0 \n-1050.7453 6807767.0 \n-1069.7158 5074652.0 \n-1074.1979 3402288.0 \n-1075.1968 33352763.0 \n-1076.2004 10417953.0 \n-1101.6535 2023916.0 \n-1206.3127 3738816.0 \n-1216.8041 4439324.0 \n-1217.807 3565334.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C003\n-IONMODE=Negative\n-RETENTIONTIME=483.67\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=26\n-265.2529 11366224.0 \n-266.2564 1420444.0 \n-279.6362 29849749.0 \n-280.6546 8848921.0 \n-288.6414 202172046.0 \n-378.2093 15309961.0 \n-379.1966 2902366.0 \n-522.3565 4089569222.0 \n-523.354 1201714423.0 \n-549.3267 63300808.0 \n-576.2749 7386007.0 \n-577.3074 2354251.0 \n-617.2778 2323470.0 \n-625.4543 4040374.0 \n-796.9808 13576738.0 \n-797.9841 6368973.0 \n-809.9883 12596682.0 \n-810.9916 6601055.0 \n-1043.7028 144351468.0 \n-1044.7068 83271854.0 \n-1045.706 27998321.0 \n-1046.7131 6505178.0 \n-1058.1594 20718345.0 \n-1059.1626 6608764.0 \n-1071.1639 15461047.0 \n-1072.1671 5096642.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C004\n-IONMODE=Negative\n-RETENTIONTIME=473.48\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=24\n-124.1405 6517662.0 \n-170.2437 1237313.0 \n-275.6336 28001849.0 \n-296.147 190395687.0 \n-482.3247 145772322.0 \n-483.3283 36245876.0 \n-496.34 12577588056.0 \n-497.3442 3337125302.0 \n-498.3462 532285213.0 \n-499.3493 68176083.0 \n-770.964 49250157.0 \n-771.9675 22666873.0 \n-783.9721 9839299.0 \n-784.9749 3622908.0 \n-949.6233 8009033.0 \n-950.6274 3674694.0 \n-991.6726 1420557258.0 \n-992.6749 763118028.0 \n-993.6787 239161906.0 \n-994.6801 53549573.0 \n-1017.6897 168186952.0 \n-1018.6656 120599518.0 \n-1019.6555 57647644.0 \n-1020.6591 12469103.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C005\n-IONMODE=Negative\n-RETENTIONTIME=41.72\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=20\n-218.1386 14009249.0 \n-337.0623 88672453.0 \n-338.0654 8770055.0 
\n-353.0361 37061354.0 \n-359.0443 48435582.0 \n-360.0459 5025128.0 \n-375.018 29159485.0 \n-376.0216 2740193.0 \n-381.0261 13522755.0 \n-396.9999 10317665.0 \n-417.0027 13822994.0 \n-418.9966 4386311.0 \n-432'..b'TRUMTYPE=Centroid\n-NUM PEAKS=2\n-328.2481 11119434.0 \n-329.2519 2068394.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C152\n-IONMODE=Negative\n-RETENTIONTIME=385.78\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-409.1497 1369551.0 \n-427.1607 2275086.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C153\n-IONMODE=Negative\n-RETENTIONTIME=401.39\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-107.0557 2271180.0 \n-197.1612 1286942.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C154\n-IONMODE=Negative\n-RETENTIONTIME=388.72\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-239.1276 1743749.0 \n-286.9585 1645545.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C155\n-IONMODE=Negative\n-RETENTIONTIME=373.67\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-507.1617 6285930.0 \n-508.1657 1535734.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C156\n-IONMODE=Negative\n-RETENTIONTIME=378.37\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-257.2254 3302868.0 \n-777.6928 4522421.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C157\n-IONMODE=Negative\n-RETENTIONTIME=473.08\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-267.6425 11780168.0 \n-534.2949 13399261.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C158\n-IONMODE=Negative\n-RETENTIONTIME=508.15\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-380.2992 5790633.0 \n-423.2518 1386850.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C159\n-IONMODE=Negative\n-RETENTIONTIME=471.89\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-304.2357 21716257.0 \n-306.1523 8327492.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C160\n-IONMODE=Negative\n-RETENTIONTIME=465.45\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-193.1239 1274413.0 \n-295.1974 20379534.0 \n-END IONS\n-\n-BEGIN 
IONS\n-NAME=C161\n-IONMODE=Negative\n-RETENTIONTIME=488.7\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-667.4214 3075774.0 \n-1189.7766 2040172.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C162\n-IONMODE=Negative\n-RETENTIONTIME=471.97\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-316.6601 7221684.0 \n-393.2201 8389493.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C163\n-IONMODE=Negative\n-RETENTIONTIME=465.16\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-422.3267 4962906.0 \n-431.3157 12163271.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C164\n-IONMODE=Negative\n-RETENTIONTIME=474.29\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-239.1779 8236995.0 \n-398.3268 11918127.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C165\n-IONMODE=Negative\n-RETENTIONTIME=477.74\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-249.1858 1576729.0 \n-307.15 1941191.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C166\n-IONMODE=Negative\n-RETENTIONTIME=494.51\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-355.2846 54372680.0 \n-373.2951 6108864.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C167\n-IONMODE=Negative\n-RETENTIONTIME=497.67\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-474.3486 2732000.0 \n-649.4483 2434649.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C168\n-IONMODE=Negative\n-RETENTIONTIME=498.02\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-459.2569 3550909.0 \n-539.4163 5285541.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C169\n-IONMODE=Negative\n-RETENTIONTIME=492.45\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-732.5452 4526953.0 \n-733.5465 1043642.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C170\n-IONMODE=Negative\n-RETENTIONTIME=497.3\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-450.3586 4210116.0 \n-451.3631 6446370.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C171\n-IONMODE=Negative\n-RETENTIONTIME=467.81\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-185.0776 5067455.0 \n-200.203 1398415.0 \n-END IONS\n-\n-BEGIN 
IONS\n-NAME=C172\n-IONMODE=Negative\n-RETENTIONTIME=457.02\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-263.2347 3933284.0 \n-615.2633 1132491.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C173\n-IONMODE=Negative\n-RETENTIONTIME=443.89\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-370.2956 41596161.0 \n-371.304 9966707.0 \n-END IONS\n-\n-BEGIN IONS\n-NAME=C174\n-IONMODE=Negative\n-RETENTIONTIME=438.81\n-RETENTIONINDEX=\n-SPECTRUMTYPE=Centroid\n-NUM PEAKS=2\n-330.2563 5274387.0 \n-579.2938 6044865.0 \n-END IONS\n-\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/fill.msp
--- a/test-data/fill.msp Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,2165 +0,0 @@\n-NAME:C001\n-IONMODE:Negative\n-RETENTIONTIME:38.74\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:57\n-216.9205 32607700\n-256.8215 31377637\n-175.0641 26780143\n-206.9034 26130980\n-254.8252 23747536\n-198.8647 21688594\n-196.8658 21390430\n-372.7383 19374863\n-258.8237 15532799\n-382.8218 12815572\n-488.6825 12267966\n-392.7685 10913351\n-316.7777 10734168\n-440.7322 10603010\n-138.9121 10186226\n-312.7841 10051801\n-434.7287 9943329\n-266.8652 9805546\n-370.7418 9765463\n-450.7016 8762673\n-324.9549 8619910\n-428.7834 8554675\n-384.8177 8311500\n-442.7401 8271752\n-200.8848 7742528\n-492.744 7662344\n-494.8953 7188793\n-546.6093 7177067\n-498.8794 6811405\n-500.8484 6520691\n-322.8157 6317648\n-350.9875 6150799\n-550.6949 6104789\n-426.7772 5431633\n-566.5977 5171811\n-510.763 4989757\n-486.7743 4886062\n-460.7076 4528973\n-484.7242 4273989\n-518.7415 4243468\n-334.849 4178412\n-413.2664 3965867\n-436.8161 3705247\n-502.7832 3567833\n-342.8093 3285552\n-366.8281 3253770\n-306.9914 3169316\n-268.8537 3090354\n-800.4451 2792137\n-186.1095 2675456\n-234.0134 2550129\n-462.7862 2123666\n-349.9455 2050695\n-612.6927 2005587\n-676.6436 1982714\n-351.941 1965882\n-148.9337 1008656\n-\n-NAME:C002\n-IONMODE:Negative\n-RETENTIONTIME:520.25\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:35\n-525.375 1073323842\n-310.1623 295359836\n-526.3783 181668883\n-1047.7378 150394804\n-551.3321 111616808\n-1048.7399 90978863\n-289.6491 46498377\n-312.0296 38757284\n-1075.1968 33352763\n-1049.7432 29946438\n-552.3348 28340614\n-813.5403 25060147\n-527.3812 23642795\n-309.1649 18045974\n-301.1565 15185412\n-311.1658 13124727\n-330.6757 12666597\n-624.296 11790213\n-1076.2004 10417953\n-578.2905 7578406\n-562.3269 7538206\n-1050.7453 6807767\n-267.2688 6103973\n-814.5336 5865975\n-1069.7158 5074652\n-619.3008 4742103\n-1216.8041 4439324\n-1206.3127 3738816\n-1217.807 3565334\n-1074.1979 3402288\n-553.3314 2609936\n-955.1171 2322927\n-1101.6535 
2023916\n-131.1733 1971789\n-279.0196 1946255\n-\n-NAME:C003\n-IONMODE:Negative\n-RETENTIONTIME:483.67\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:26\n-522.3565 4089569222\n-523.354 1201714423\n-288.6414 202172046\n-1043.7028 144351468\n-1044.7068 83271854\n-549.3267 63300808\n-279.6362 29849749\n-1045.706 27998321\n-1058.1594 20718345\n-1071.1639 15461047\n-378.2093 15309961\n-796.9808 13576738\n-809.9883 12596682\n-265.2529 11366224\n-280.6546 8848921\n-576.2749 7386007\n-1059.1626 6608764\n-810.9916 6601055\n-1046.7131 6505178\n-797.9841 6368973\n-1072.1671 5096642\n-625.4543 4040374\n-379.1966 2902366\n-577.3074 2354251\n-617.2778 2323470\n-266.2564 1420444\n-\n-NAME:C004\n-IONMODE:Negative\n-RETENTIONTIME:473.48\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:24\n-496.34 12577588056\n-497.3442 3337125302\n-991.6726 1420557258\n-992.6749 763118028\n-498.3462 532285213\n-993.6787 239161906\n-296.147 190395687\n-1017.6897 168186952\n-482.3247 145772322\n-1018.6656 120599518\n-499.3493 68176083\n-1019.6555 57647644\n-994.6801 53549573\n-770.964 49250157\n-483.3283 36245876\n-275.6336 28001849\n-771.9675 22666873\n-1020.6591 12469103\n-783.9721 9839299\n-949.6233 8009033\n-124.1405 6517662\n-950.6274 3674694\n-784.9749 3622908\n-170.2437 1237313\n-\n-NAME:C005\n-IONMODE:Negative\n-RETENTIONTIME:41.72\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:20\n-337.0623 88672453\n-359.0443 48435582\n-353.0361 37061354\n-375.018 29159485\n-218.1386 14009249\n-417.0027 13822994\n-381.0261 13522755\n-438.9851 11307111\n-396.9999 10317665\n-454.9592 9820452\n-432.9764 9779399\n-338.0654 8770055\n-360.0459 5025128\n-418.9966 4386311\n-512.8989 4072570\n-456.9603 3774845\n-470.9263 3632486\n-572.871 3485486\n-440.9796 3364168\n-376.0216 2740193\n-\n-NAME:C006\n-IONMODE:Negative\n-RETENTIONTIME:452.08\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:19\n-494.3249 803829845\n-495.3278 207959661\n-542.3239 193323900\n-543.3276 55501736\n-1087.6715 
34676828\n-516.3076 24092471\n-274.6257 21694276\n-1088.6773 21466528\n-1001.658 11852076\n-1089.682 9948820\n-290.6256 9704443\n-1061.6562 9417442\n-987.6411 7453650\n-1037.6578 7076912\n-1062.6592 5657208\n-484.3311 5283943\n-265.6196 '..b'5.2288 1932289\n-\n-NAME:C147\n-IONMODE:Negative\n-RETENTIONTIME:563.22\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-282.2792 241362345\n-256.2615 19433189\n-\n-NAME:C148\n-IONMODE:Negative\n-RETENTIONTIME:548.47\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-305.2468 9633582\n-329.249 5814756\n-\n-NAME:C149\n-IONMODE:Negative\n-RETENTIONTIME:350.93\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-130.0643 7419216\n-190.0865 4433780\n-\n-NAME:C150\n-IONMODE:Negative\n-RETENTIONTIME:365.37\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-490.2083 5275418\n-465.1226 1763287\n-\n-NAME:C151\n-IONMODE:Negative\n-RETENTIONTIME:394.87\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-328.2481 11119434\n-329.2519 2068394\n-\n-NAME:C152\n-IONMODE:Negative\n-RETENTIONTIME:385.78\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-427.1607 2275086\n-409.1497 1369551\n-\n-NAME:C153\n-IONMODE:Negative\n-RETENTIONTIME:401.39\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-107.0557 2271180\n-197.1612 1286942\n-\n-NAME:C154\n-IONMODE:Negative\n-RETENTIONTIME:388.72\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-239.1276 1743749\n-286.9585 1645545\n-\n-NAME:C155\n-IONMODE:Negative\n-RETENTIONTIME:373.67\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-507.1617 6285930\n-508.1657 1535734\n-\n-NAME:C156\n-IONMODE:Negative\n-RETENTIONTIME:378.37\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-777.6928 4522421\n-257.2254 3302868\n-\n-NAME:C157\n-IONMODE:Negative\n-RETENTIONTIME:473.08\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-534.2949 13399261\n-267.6425 
11780168\n-\n-NAME:C158\n-IONMODE:Negative\n-RETENTIONTIME:508.15\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-380.2992 5790633\n-423.2518 1386850\n-\n-NAME:C159\n-IONMODE:Negative\n-RETENTIONTIME:471.89\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-304.2357 21716257\n-306.1523 8327492\n-\n-NAME:C160\n-IONMODE:Negative\n-RETENTIONTIME:465.45\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-295.1974 20379534\n-193.1239 1274413\n-\n-NAME:C161\n-IONMODE:Negative\n-RETENTIONTIME:488.7\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-667.4214 3075774\n-1189.7766 2040172\n-\n-NAME:C162\n-IONMODE:Negative\n-RETENTIONTIME:471.97\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-393.2201 8389493\n-316.6601 7221684\n-\n-NAME:C163\n-IONMODE:Negative\n-RETENTIONTIME:465.16\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-431.3157 12163271\n-422.3267 4962906\n-\n-NAME:C164\n-IONMODE:Negative\n-RETENTIONTIME:474.29\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-398.3268 11918127\n-239.1779 8236995\n-\n-NAME:C165\n-IONMODE:Negative\n-RETENTIONTIME:477.74\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-307.15 1941191\n-249.1858 1576729\n-\n-NAME:C166\n-IONMODE:Negative\n-RETENTIONTIME:494.51\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-355.2846 54372680\n-373.2951 6108864\n-\n-NAME:C167\n-IONMODE:Negative\n-RETENTIONTIME:497.67\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-474.3486 2732000\n-649.4483 2434649\n-\n-NAME:C168\n-IONMODE:Negative\n-RETENTIONTIME:498.02\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-539.4163 5285541\n-459.2569 3550909\n-\n-NAME:C169\n-IONMODE:Negative\n-RETENTIONTIME:492.45\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-732.5452 4526953\n-733.5465 1043642\n-\n-NAME:C170\n-IONMODE:Negative\n-RETENTIONTIME:497.3\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-451.3631 6446370\n-450.3586 
4210116\n-\n-NAME:C171\n-IONMODE:Negative\n-RETENTIONTIME:467.81\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-185.0776 5067455\n-200.203 1398415\n-\n-NAME:C172\n-IONMODE:Negative\n-RETENTIONTIME:457.02\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-263.2347 3933284\n-615.2633 1132491\n-\n-NAME:C173\n-IONMODE:Negative\n-RETENTIONTIME:443.89\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-370.2956 41596161\n-371.304 9966707\n-\n-NAME:C174\n-IONMODE:Negative\n-RETENTIONTIME:438.81\n-RETENTIONINDEX:\n-SPECTRUMTYPE:Centroid\n-Num Peaks:2\n-579.2938 6044865\n-330.2563 5274387\n-\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/filtering/clean_metadata.msp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtering/clean_metadata.msp Fri Jan 28 16:22:06 2022 +0000
b
@@ -0,0 +1,212 @@
+NAME: C001
+IONMODE: Negative
+RETENTIONTIME: 38.74
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+COMPOUND_NAME: C001
+RETENTION_INDEX: None
+RETENTION_TIME: 38.74
+NUM PEAKS: 57
+138.9121 10186226.0
+148.9337 1008656.0
+175.0641 26780143.0
+186.1095 2675456.0
+196.8658 21390430.0
+198.8647 21688594.0
+200.8848 7742528.0
+206.9034 26130980.0
+216.9205 32607700.0
+234.0134 2550129.0
+254.8252 23747536.0
+256.8215 31377637.0
+258.8237 15532799.0
+266.8652 9805546.0
+268.8537 3090354.0
+306.9914 3169316.0
+312.7841 10051801.0
+316.7777 10734168.0
+322.8157 6317648.0
+324.9549 8619910.0
+334.849 4178412.0
+342.8093 3285552.0
+349.9455 2050695.0
+350.9875 6150799.0
+351.941 1965882.0
+366.8281 3253770.0
+370.7418 9765463.0
+372.7383 19374863.0
+382.8218 12815572.0
+384.8177 8311500.0
+392.7685 10913351.0
+413.2664 3965867.0
+426.7772 5431633.0
+428.7834 8554675.0
+434.7287 9943329.0
+436.8161 3705247.0
+440.7322 10603010.0
+442.7401 8271752.0
+450.7016 8762673.0
+460.7076 4528973.0
+462.7862 2123666.0
+484.7242 4273989.0
+486.7743 4886062.0
+488.6825 12267966.0
+492.744 7662344.0
+494.8953 7188793.0
+498.8794 6811405.0
+500.8484 6520691.0
+502.7832 3567833.0
+510.763 4989757.0
+518.7415 4243468.0
+546.6093 7177067.0
+550.6949 6104789.0
+566.5977 5171811.0
+612.6927 2005587.0
+676.6436 1982714.0
+800.4451 2792137.0
+
+NAME: C002
+IONMODE: Negative
+RETENTIONTIME: 520.25
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+COMPOUND_NAME: C002
+RETENTION_INDEX: None
+RETENTION_TIME: 520.25
+NUM PEAKS: 35
+131.1733 1971789.0
+267.2688 6103973.0
+279.0196 1946255.0
+289.6491 46498377.0
+301.1565 15185412.0
+309.1649 18045974.0
+310.1623 295359836.0
+311.1658 13124727.0
+312.0296 38757284.0
+330.6757 12666597.0
+525.375 1073323842.0
+526.3783 181668883.0
+527.3812 23642795.0
+551.3321 111616808.0
+552.3348 28340614.0
+553.3314 2609936.0
+562.3269 7538206.0
+578.2905 7578406.0
+619.3008 4742103.0
+624.296 11790213.0
+813.5403 25060147.0
+814.5336 5865975.0
+955.1171 2322927.0
+1047.7378 150394804.0
+1048.7399 90978863.0
+1049.7432 29946438.0
+1050.7453 6807767.0
+1069.7158 5074652.0
+1074.1979 3402288.0
+1075.1968 33352763.0
+1076.2004 10417953.0
+1101.6535 2023916.0
+1206.3127 3738816.0
+1216.8041 4439324.0
+1217.807 3565334.0
+
+NAME: C003
+IONMODE: Negative
+RETENTIONTIME: 483.67
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+COMPOUND_NAME: C003
+RETENTION_INDEX: None
+RETENTION_TIME: 483.67
+NUM PEAKS: 26
+265.2529 11366224.0
+266.2564 1420444.0
+279.6362 29849749.0
+280.6546 8848921.0
+288.6414 202172046.0
+378.2093 15309961.0
+379.1966 2902366.0
+522.3565 4089569222.0
+523.354 1201714423.0
+549.3267 63300808.0
+576.2749 7386007.0
+577.3074 2354251.0
+617.2778 2323470.0
+625.4543 4040374.0
+796.9808 13576738.0
+797.9841 6368973.0
+809.9883 12596682.0
+810.9916 6601055.0
+1043.7028 144351468.0
+1044.7068 83271854.0
+1045.706 27998321.0
+1046.7131 6505178.0
+1058.1594 20718345.0
+1059.1626 6608764.0
+1071.1639 15461047.0
+1072.1671 5096642.0
+
+NAME: C004
+IONMODE: Negative
+RETENTIONTIME: 473.48
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+COMPOUND_NAME: C004
+RETENTION_INDEX: None
+RETENTION_TIME: 473.48
+NUM PEAKS: 24
+124.1405 6517662.0
+170.2437 1237313.0
+275.6336 28001849.0
+296.147 190395687.0
+482.3247 145772322.0
+483.3283 36245876.0
+496.34 12577588056.0
+497.3442 3337125302.0
+498.3462 532285213.0
+499.3493 68176083.0
+770.964 49250157.0
+771.9675 22666873.0
+783.9721 9839299.0
+784.9749 3622908.0
+949.6233 8009033.0
+950.6274 3674694.0
+991.6726 1420557258.0
+992.6749 763118028.0
+993.6787 239161906.0
+994.6801 53549573.0
+1017.6897 168186952.0
+1018.6656 120599518.0
+1019.6555 57647644.0
+1020.6591 12469103.0
+
+NAME: C005
+IONMODE: Negative
+RETENTIONTIME: 41.72
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+COMPOUND_NAME: C005
+RETENTION_INDEX: None
+RETENTION_TIME: 41.72
+NUM PEAKS: 20
+218.1386 14009249.0
+337.0623 88672453.0
+338.0654 8770055.0
+353.0361 37061354.0
+359.0443 48435582.0
+360.0459 5025128.0
+375.018 29159485.0
+376.0216 2740193.0
+381.0261 13522755.0
+396.9999 10317665.0
+417.0027 13822994.0
+418.9966 4386311.0
+432.9764 9779399.0
+438.9851 11307111.0
+440.9796 3364168.0
+454.9592 9820452.0
+456.9603 3774845.0
+470.9263 3632486.0
+512.8989 4072570.0
+572.871 3485486.0
+
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/filtering/default_filters.msp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtering/default_filters.msp Fri Jan 28 16:22:06 2022 +0000
b
@@ -0,0 +1,207 @@
+NAME: C001
+IONMODE: negative
+RETENTIONTIME: 38.74
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+COMPOUND_NAME: C001
+CHARGE: -1
+NUM PEAKS: 57
+138.9121 10186226.0
+148.9337 1008656.0
+175.0641 26780143.0
+186.1095 2675456.0
+196.8658 21390430.0
+198.8647 21688594.0
+200.8848 7742528.0
+206.9034 26130980.0
+216.9205 32607700.0
+234.0134 2550129.0
+254.8252 23747536.0
+256.8215 31377637.0
+258.8237 15532799.0
+266.8652 9805546.0
+268.8537 3090354.0
+306.9914 3169316.0
+312.7841 10051801.0
+316.7777 10734168.0
+322.8157 6317648.0
+324.9549 8619910.0
+334.849 4178412.0
+342.8093 3285552.0
+349.9455 2050695.0
+350.9875 6150799.0
+351.941 1965882.0
+366.8281 3253770.0
+370.7418 9765463.0
+372.7383 19374863.0
+382.8218 12815572.0
+384.8177 8311500.0
+392.7685 10913351.0
+413.2664 3965867.0
+426.7772 5431633.0
+428.7834 8554675.0
+434.7287 9943329.0
+436.8161 3705247.0
+440.7322 10603010.0
+442.7401 8271752.0
+450.7016 8762673.0
+460.7076 4528973.0
+462.7862 2123666.0
+484.7242 4273989.0
+486.7743 4886062.0
+488.6825 12267966.0
+492.744 7662344.0
+494.8953 7188793.0
+498.8794 6811405.0
+500.8484 6520691.0
+502.7832 3567833.0
+510.763 4989757.0
+518.7415 4243468.0
+546.6093 7177067.0
+550.6949 6104789.0
+566.5977 5171811.0
+612.6927 2005587.0
+676.6436 1982714.0
+800.4451 2792137.0
+
+NAME: C002
+IONMODE: negative
+RETENTIONTIME: 520.25
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+COMPOUND_NAME: C002
+CHARGE: -1
+NUM PEAKS: 35
+131.1733 1971789.0
+267.2688 6103973.0
+279.0196 1946255.0
+289.6491 46498377.0
+301.1565 15185412.0
+309.1649 18045974.0
+310.1623 295359836.0
+311.1658 13124727.0
+312.0296 38757284.0
+330.6757 12666597.0
+525.375 1073323842.0
+526.3783 181668883.0
+527.3812 23642795.0
+551.3321 111616808.0
+552.3348 28340614.0
+553.3314 2609936.0
+562.3269 7538206.0
+578.2905 7578406.0
+619.3008 4742103.0
+624.296 11790213.0
+813.5403 25060147.0
+814.5336 5865975.0
+955.1171 2322927.0
+1047.7378 150394804.0
+1048.7399 90978863.0
+1049.7432 29946438.0
+1050.7453 6807767.0
+1069.7158 5074652.0
+1074.1979 3402288.0
+1075.1968 33352763.0
+1076.2004 10417953.0
+1101.6535 2023916.0
+1206.3127 3738816.0
+1216.8041 4439324.0
+1217.807 3565334.0
+
+NAME: C003
+IONMODE: negative
+RETENTIONTIME: 483.67
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+COMPOUND_NAME: C003
+CHARGE: -1
+NUM PEAKS: 26
+265.2529 11366224.0
+266.2564 1420444.0
+279.6362 29849749.0
+280.6546 8848921.0
+288.6414 202172046.0
+378.2093 15309961.0
+379.1966 2902366.0
+522.3565 4089569222.0
+523.354 1201714423.0
+549.3267 63300808.0
+576.2749 7386007.0
+577.3074 2354251.0
+617.2778 2323470.0
+625.4543 4040374.0
+796.9808 13576738.0
+797.9841 6368973.0
+809.9883 12596682.0
+810.9916 6601055.0
+1043.7028 144351468.0
+1044.7068 83271854.0
+1045.706 27998321.0
+1046.7131 6505178.0
+1058.1594 20718345.0
+1059.1626 6608764.0
+1071.1639 15461047.0
+1072.1671 5096642.0
+
+NAME: C004
+IONMODE: negative
+RETENTIONTIME: 473.48
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+COMPOUND_NAME: C004
+CHARGE: -1
+NUM PEAKS: 24
+124.1405 6517662.0
+170.2437 1237313.0
+275.6336 28001849.0
+296.147 190395687.0
+482.3247 145772322.0
+483.3283 36245876.0
+496.34 12577588056.0
+497.3442 3337125302.0
+498.3462 532285213.0
+499.3493 68176083.0
+770.964 49250157.0
+771.9675 22666873.0
+783.9721 9839299.0
+784.9749 3622908.0
+949.6233 8009033.0
+950.6274 3674694.0
+991.6726 1420557258.0
+992.6749 763118028.0
+993.6787 239161906.0
+994.6801 53549573.0
+1017.6897 168186952.0
+1018.6656 120599518.0
+1019.6555 57647644.0
+1020.6591 12469103.0
+
+NAME: C005
+IONMODE: negative
+RETENTIONTIME: 41.72
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+COMPOUND_NAME: C005
+CHARGE: -1
+NUM PEAKS: 20
+218.1386 14009249.0
+337.0623 88672453.0
+338.0654 8770055.0
+353.0361 37061354.0
+359.0443 48435582.0
+360.0459 5025128.0
+375.018 29159485.0
+376.0216 2740193.0
+381.0261 13522755.0
+396.9999 10317665.0
+417.0027 13822994.0
+418.9966 4386311.0
+432.9764 9779399.0
+438.9851 11307111.0
+440.9796 3364168.0
+454.9592 9820452.0
+456.9603 3774845.0
+470.9263 3632486.0
+512.8989 4072570.0
+572.871 3485486.0
+
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/filtering/input.msp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtering/input.msp Fri Jan 28 16:22:06 2022 +0000
b
@@ -0,0 +1,196 @@
+NAME:C001
+IONMODE:Negative
+RETENTIONTIME:38.74
+RETENTIONINDEX:
+SPECTRUMTYPE:Centroid
+Num Peaks:57
+216.9205 32607700
+256.8215 31377637
+175.0641 26780143
+206.9034 26130980
+254.8252 23747536
+198.8647 21688594
+196.8658 21390430
+372.7383 19374863
+258.8237 15532799
+382.8218 12815572
+488.6825 12267966
+392.7685 10913351
+316.7777 10734168
+440.7322 10603010
+138.9121 10186226
+312.7841 10051801
+434.7287 9943329
+266.8652 9805546
+370.7418 9765463
+450.7016 8762673
+324.9549 8619910
+428.7834 8554675
+384.8177 8311500
+442.7401 8271752
+200.8848 7742528
+492.744 7662344
+494.8953 7188793
+546.6093 7177067
+498.8794 6811405
+500.8484 6520691
+322.8157 6317648
+350.9875 6150799
+550.6949 6104789
+426.7772 5431633
+566.5977 5171811
+510.763 4989757
+486.7743 4886062
+460.7076 4528973
+484.7242 4273989
+518.7415 4243468
+334.849 4178412
+413.2664 3965867
+436.8161 3705247
+502.7832 3567833
+342.8093 3285552
+366.8281 3253770
+306.9914 3169316
+268.8537 3090354
+800.4451 2792137
+186.1095 2675456
+234.0134 2550129
+462.7862 2123666
+349.9455 2050695
+612.6927 2005587
+676.6436 1982714
+351.941 1965882
+148.9337 1008656
+
+NAME:C002
+IONMODE:Negative
+RETENTIONTIME:520.25
+RETENTIONINDEX:
+SPECTRUMTYPE:Centroid
+Num Peaks:35
+525.375 1073323842
+310.1623 295359836
+526.3783 181668883
+1047.7378 150394804
+551.3321 111616808
+1048.7399 90978863
+289.6491 46498377
+312.0296 38757284
+1075.1968 33352763
+1049.7432 29946438
+552.3348 28340614
+813.5403 25060147
+527.3812 23642795
+309.1649 18045974
+301.1565 15185412
+311.1658 13124727
+330.6757 12666597
+624.296 11790213
+1076.2004 10417953
+578.2905 7578406
+562.3269 7538206
+1050.7453 6807767
+267.2688 6103973
+814.5336 5865975
+1069.7158 5074652
+619.3008 4742103
+1216.8041 4439324
+1206.3127 3738816
+1217.807 3565334
+1074.1979 3402288
+553.3314 2609936
+955.1171 2322927
+1101.6535 2023916
+131.1733 1971789
+279.0196 1946255
+
+NAME:C003
+IONMODE:Negative
+RETENTIONTIME:483.67
+RETENTIONINDEX:
+SPECTRUMTYPE:Centroid
+Num Peaks:26
+522.3565 4089569222
+523.354 1201714423
+288.6414 202172046
+1043.7028 144351468
+1044.7068 83271854
+549.3267 63300808
+279.6362 29849749
+1045.706 27998321
+1058.1594 20718345
+1071.1639 15461047
+378.2093 15309961
+796.9808 13576738
+809.9883 12596682
+265.2529 11366224
+280.6546 8848921
+576.2749 7386007
+1059.1626 6608764
+810.9916 6601055
+1046.7131 6505178
+797.9841 6368973
+1072.1671 5096642
+625.4543 4040374
+379.1966 2902366
+577.3074 2354251
+617.2778 2323470
+266.2564 1420444
+
+NAME:C004
+IONMODE:Negative
+RETENTIONTIME:473.48
+RETENTIONINDEX:
+SPECTRUMTYPE:Centroid
+Num Peaks:24
+496.34 12577588056
+497.3442 3337125302
+991.6726 1420557258
+992.6749 763118028
+498.3462 532285213
+993.6787 239161906
+296.147 190395687
+1017.6897 168186952
+482.3247 145772322
+1018.6656 120599518
+499.3493 68176083
+1019.6555 57647644
+994.6801 53549573
+770.964 49250157
+483.3283 36245876
+275.6336 28001849
+771.9675 22666873
+1020.6591 12469103
+783.9721 9839299
+949.6233 8009033
+124.1405 6517662
+950.6274 3674694
+784.9749 3622908
+170.2437 1237313
+
+NAME:C005
+IONMODE:Negative
+RETENTIONTIME:41.72
+RETENTIONINDEX:
+SPECTRUMTYPE:Centroid
+Num Peaks:20
+337.0623 88672453
+359.0443 48435582
+353.0361 37061354
+375.018 29159485
+218.1386 14009249
+417.0027 13822994
+381.0261 13522755
+438.9851 11307111
+396.9999 10317665
+454.9592 9820452
+432.9764 9779399
+338.0654 8770055
+360.0459 5025128
+418.9966 4386311
+512.8989 4072570
+456.9603 3774845
+470.9263 3632486
+572.871 3485486
+440.9796 3364168
+376.0216 2740193
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/filtering/mz_range.msp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtering/mz_range.msp Fri Jan 28 16:22:06 2022 +0000
b
@@ -0,0 +1,132 @@
+NAME: C001
+IONMODE: Negative
+RETENTIONTIME: 38.74
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 41
+306.9914 3169316.0
+312.7841 10051801.0
+316.7777 10734168.0
+322.8157 6317648.0
+324.9549 8619910.0
+334.849 4178412.0
+342.8093 3285552.0
+349.9455 2050695.0
+350.9875 6150799.0
+351.941 1965882.0
+366.8281 3253770.0
+370.7418 9765463.0
+372.7383 19374863.0
+382.8218 12815572.0
+384.8177 8311500.0
+392.7685 10913351.0
+413.2664 3965867.0
+426.7772 5431633.0
+428.7834 8554675.0
+434.7287 9943329.0
+436.8161 3705247.0
+440.7322 10603010.0
+442.7401 8271752.0
+450.7016 8762673.0
+460.7076 4528973.0
+462.7862 2123666.0
+484.7242 4273989.0
+486.7743 4886062.0
+488.6825 12267966.0
+492.744 7662344.0
+494.8953 7188793.0
+498.8794 6811405.0
+500.8484 6520691.0
+502.7832 3567833.0
+510.763 4989757.0
+518.7415 4243468.0
+546.6093 7177067.0
+550.6949 6104789.0
+566.5977 5171811.0
+612.6927 2005587.0
+676.6436 1982714.0
+
+NAME: C002
+IONMODE: Negative
+RETENTIONTIME: 520.25
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 16
+301.1565 15185412.0
+309.1649 18045974.0
+310.1623 295359836.0
+311.1658 13124727.0
+312.0296 38757284.0
+330.6757 12666597.0
+525.375 1073323842.0
+526.3783 181668883.0
+527.3812 23642795.0
+551.3321 111616808.0
+552.3348 28340614.0
+553.3314 2609936.0
+562.3269 7538206.0
+578.2905 7578406.0
+619.3008 4742103.0
+624.296 11790213.0
+
+NAME: C003
+IONMODE: Negative
+RETENTIONTIME: 483.67
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 11
+378.2093 15309961.0
+379.1966 2902366.0
+522.3565 4089569222.0
+523.354 1201714423.0
+549.3267 63300808.0
+576.2749 7386007.0
+577.3074 2354251.0
+617.2778 2323470.0
+625.4543 4040374.0
+796.9808 13576738.0
+797.9841 6368973.0
+
+NAME: C004
+IONMODE: Negative
+RETENTIONTIME: 473.48
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 10
+482.3247 145772322.0
+483.3283 36245876.0
+496.34 12577588056.0
+497.3442 3337125302.0
+498.3462 532285213.0
+499.3493 68176083.0
+770.964 49250157.0
+771.9675 22666873.0
+783.9721 9839299.0
+784.9749 3622908.0
+
+NAME: C005
+IONMODE: Negative
+RETENTIONTIME: 41.72
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 19
+337.0623 88672453.0
+338.0654 8770055.0
+353.0361 37061354.0
+359.0443 48435582.0
+360.0459 5025128.0
+375.018 29159485.0
+376.0216 2740193.0
+381.0261 13522755.0
+396.9999 10317665.0
+417.0027 13822994.0
+418.9966 4386311.0
+432.9764 9779399.0
+438.9851 11307111.0
+440.9796 3364168.0
+454.9592 9820452.0
+456.9603 3774845.0
+470.9263 3632486.0
+512.8989 4072570.0
+572.871 3485486.0
+
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/filtering/normalise_intensities.msp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtering/normalise_intensities.msp Fri Jan 28 16:22:06 2022 +0000
b
@@ -0,0 +1,197 @@
+NAME: C001
+IONMODE: Negative
+RETENTIONTIME: 38.74
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 57
+138.9121 0.31238713555387226
+148.9337 0.03093306182282099
+175.0641 0.8212827951680125
+186.1095 0.08204982258791635
+196.8658 0.6559932163262051
+198.8647 0.6651371915222478
+200.8848 0.23744477531380626
+206.9034 0.8013745219687375
+216.9205 1.0
+234.0134 0.0782063439003671
+254.8252 0.7282800074828951
+256.8215 0.9622769161885076
+258.8237 0.4763537140000675
+266.8652 0.30071259242448867
+268.8537 0.09477374975849262
+306.9914 0.09719532503059093
+312.7841 0.30826464301376666
+316.7777 0.3291912033047409
+322.8157 0.1937471210787636
+324.9549 0.2643519782137348
+334.849 0.12814188059875428
+342.8093 0.10076000453880525
+349.9455 0.06288990023828728
+350.9875 0.18863026217733847
+351.941 0.06028888882073866
+366.8281 0.09978532677864431
+370.7418 0.29948334289140294
+372.7383 0.5941806076478868
+382.8218 0.3930228749651156
+384.8177 0.2548937827568335
+392.7685 0.33468631642219476
+413.2664 0.1216236349083192
+426.7772 0.1665751647616974
+428.7834 0.262351377128715
+434.7287 0.3049380667756389
+436.8161 0.11363104420121628
+440.7322 0.32516890182380237
+442.7401 0.25367480687076976
+450.7016 0.268730177228078
+460.7076 0.13889274619185038
+462.7862 0.06512774590050817
+484.7242 0.13107299809554185
+486.7743 0.14984380989766222
+488.6825 0.376229111528872
+492.744 0.23498572423077985
+494.8953 0.22046305013846423
+498.8794 0.20888946475832396
+500.8484 0.19997396320500985
+502.7832 0.10941688619559184
+510.763 0.15302388699601627
+518.7415 0.13013699218282798
+546.6093 0.2201034418250904
+550.6949 0.18721924576097057
+566.5977 0.15860704680182902
+612.6927 0.061506545999871196
+676.6436 0.06080508591528995
+800.4451 0.08562814917948829
+
+NAME: C002
+IONMODE: Negative
+RETENTIONTIME: 520.25
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 35
+131.1733 0.0018370867419900284
+267.2688 0.005686981655625982
+279.0196 0.0018132970906277511
+289.6491 0.04332185234360982
+301.1565 0.014148024487841387
+309.1649 0.01681316793110052
+310.1623 0.2751824048272655
+311.1658 0.012228114653210135
+312.0296 0.03610959011940033
+330.6757 0.011801281686240601
+525.375 1.0
+526.3783 0.16925822001818533
+527.3812 0.022027643545069038
+551.3321 0.10399173449088443
+552.3348 0.026404532249270578
+553.3314 0.00243163889393971
+562.3269 0.0070232353973927655
+578.2905 0.007060689144739971
+619.3008 0.004418147454139941
+624.296 0.010984767633625341
+813.5403 0.023348169508005768
+814.5336 0.005465242427736922
+955.1171 0.0021642368399005527
+1047.7378 0.1401206216753359
+1048.7399 0.08476366539149328
+1049.7432 0.027900654796038715
+1050.7453 0.006342696149667753
+1069.7158 0.004727978454800783
+1074.1979 0.0031698615710057058
+1075.1968 0.03107427758042852
+1076.2004 0.009706253222314986
+1101.6535 0.0018856526994021623
+1206.3127 0.003483399747305716
+1216.8041 0.004136052723591693
+1217.807 0.0033217691254826334
+
+NAME: C003
+IONMODE: Negative
+RETENTIONTIME: 483.67
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 26
+265.2529 0.0027793206039538215
+266.2564 0.00034733340430054716
+279.6362 0.0072989959038771346
+280.6546 0.002163778266032735
+288.6414 0.049436024927126176
+378.2093 0.0037436610481220017
+379.1966 0.0007096996877780199
+522.3565 1.0
+523.354 0.29384865685493955
+549.3267 0.015478600450010918
+576.2749 0.0018060599048590942
+577.3074 0.0005756721239330571
+617.2778 0.0005681454143142512
+625.4543 0.0009879705613649104
+796.9808 0.0033198455052339984
+797.9841 0.0015573701420036753
+809.9883 0.0030801977705220513
+810.9916 0.0016141198844341264
+1043.7028 0.035297475152995465
+1044.7068 0.020362011126266247
+1045.706 0.0068462763386867055
+1046.7131 0.0015906756058816994
+1058.1594 0.00506614361447774
+1059.1626 0.0016160049240511426
+1071.1639 0.0037806052815603864
+1072.1671 0.0012462539997079428
+
+NAME: C004
+IONMODE: Negative
+RETENTIONTIME: 473.48
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 24
+124.1405 0.0005181964913289414
+170.2437 9.837442556482469e-05
+275.6336 0.002226328996889195
+296.147 0.015137694616192635
+482.3247 0.011589847063758851
+483.3283 0.00288178272643532
+496.34 1.0
+497.3442 0.2653231515567137
+498.3462 0.04232013408533278
+499.3493 0.005420441717160338
+770.964 0.003915707588825487
+771.9675 0.0018021637295703144
+783.9721 0.0007822882222085712
+784.9749 0.0002880447335267696
+949.6233 0.0006367701791743273
+950.6274 0.00029216205711611197
+991.6726 0.11294353509394345
+992.6749 0.06067284320350776
+993.6787 0.01901492598860482
+994.6801 0.004257539105397458
+1017.6897 0.013371955835345416
+1018.6656 0.00958844553208827
+1019.6555 0.004583362385803359
+1020.6591 0.0009913747329363162
+
+NAME: C005
+IONMODE: Negative
+RETENTIONTIME: 41.72
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 20
+218.1386 0.15798873862212878
+337.0623 1.0
+338.0654 0.09890394032518758
+353.0361 0.4179579198062785
+359.0443 0.5462303157441691
+360.0459 0.0566706776455141
+375.018 0.3288449119592981
+376.0216 0.03090241565776916
+381.0261 0.15250232222627247
+396.9999 0.1163570494660839
+417.0027 0.1558882553976487
+418.9966 0.049466444781898614
+432.9764 0.11028677643551825
+438.9851 0.12751548668671656
+440.9796 0.037939268467062706
+454.9592 0.11074974998154162
+456.9603 0.042570661713847026
+470.9263 0.04096521385282981
+512.8989 0.04592824335196862
+572.871 0.03930742730214083
+
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/filtering/relative_intensity.msp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/filtering/relative_intensity.msp Fri Jan 28 16:22:06 2022 +0000
b
@@ -0,0 +1,54 @@
+NAME: C001
+IONMODE: Negative
+RETENTIONTIME: 38.74
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 16
+138.9121 0.31238713555387226
+175.0641 0.8212827951680125
+196.8658 0.6559932163262051
+198.8647 0.6651371915222478
+206.9034 0.8013745219687375
+254.8252 0.7282800074828951
+258.8237 0.4763537140000675
+266.8652 0.30071259242448867
+312.7841 0.30826464301376666
+316.7777 0.3291912033047409
+372.7383 0.5941806076478868
+382.8218 0.3930228749651156
+392.7685 0.33468631642219476
+434.7287 0.3049380667756389
+440.7322 0.32516890182380237
+488.6825 0.376229111528872
+
+NAME: C002
+IONMODE: Negative
+RETENTIONTIME: 520.25
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 0
+
+NAME: C003
+IONMODE: Negative
+RETENTIONTIME: 483.67
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 0
+
+NAME: C004
+IONMODE: Negative
+RETENTIONTIME: 473.48
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 0
+
+NAME: C005
+IONMODE: Negative
+RETENTIONTIME: 41.72
+RETENTIONINDEX: 
+SPECTRUMTYPE: Centroid
+NUM PEAKS: 3
+353.0361 0.4179579198062785
+359.0443 0.5462303157441691
+375.018 0.3288449119592981
+
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/formatter/test2_threshold_formatting.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/formatter/test2_threshold_formatting.tsv Fri Jan 28 16:22:06 2022 +0000
[
@@ -0,0 +1,19 @@
+query reference matches score
+C007 Benzo[b]naphtho[2,1-d]thiophene 3 0.4302304171927885
+C023 Butylated hydroxytoluene 3 0.4899347755610658
+C016 Drometrizole 3 0.5535081364244014
+C040 Deltamethrin 4 0.5995685829585914
+C040 cis-Cypermethrin_isomer1 3 0.7514936043388737
+C040 cis-Cypermethrin_isomer2 3 0.6205879323732599
+C043 Carbofuran phenol 3 0.5173781620618291
+C023 Alachlor 4 0.4289634841639738
+C012 Chlorpyrifos 3 0.43976068904478827
+C016 Atrazine 5 0.4399647084473271
+C029 Metolachlor 3 0.8624580271763471
+C073 Praziquantel 3 0.6840766738581763
+C034 Carbaryl 3 0.4781026376526427
+C043 Carbofuran 3 0.5212598550187718
+C013 Indoxacarb 5 0.4827488304818007
+C073 Oxadixyl 4 0.7910256109540179
+C073 Amitraz 4 0.5270236660009217
+C008 Spirotetramat 5 0.40641914075077024
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/formatter/test2_topk_formatting.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/formatter/test2_topk_formatting.tsv Fri Jan 28 16:22:06 2022 +0000
[
b"@@ -0,0 +1,523 @@\n+query\treference\tmatches\tscore\n+C001\tChlorpyrifos\t7\t0.2439698460078672\n+C001\ttrans-Chlordane\t10\t0.1709889053423956\n+C001\tcis-Chlordane\t10\t0.16934374734008048\n+C002\tCarfentrazone-ethyl\t1\t0.023438813553203555\n+C002\t2,2',3,3',4,5',6,6'-Octachlorobiphenyl\t2\t0.012935401162453864\n+C002\tPyridaben\t4\t0.011168624908917228\n+C003\tPerylene_2H12\t2\t0.0005256270959446041\n+C003\tMetalaxyl\t1\t1.7567415612900304e-06\n+C003\tPerylene\t0\t0.0\n+C004\t17-alpha-Ethynylestradiol\t2\t0.002716713573623163\n+C004\tCoronene\t1\t0.0009680981940665212\n+C004\tProgesterone\t2\t0.0007924296222333303\n+C005\tTetraconazole\t3\t0.12154746411094572\n+C005\tSulfentrazone\t1\t0.05393598836706972\n+C005\tIndoxacarb\t1\t0.0441412960627566\n+C006\tTris(4-tert-butylphenyl) phosphate\t2\t0.12426514943875827\n+C006\tPerylene_2H12\t0\t0.0\n+C006\tPerylene\t0\t0.0\n+C007\tBenzo[b]naphtho[2,1-d]thiophene\t3\t0.4302304171927885\n+C007\t2-Chlorobiphenyl\t2\t0.30327152545734354\n+C007\tRetene\t3\t0.16318259462298138\n+C008\tSpirotetramat\t5\t0.40641914075077024\n+C008\tEthofumesate\t4\t0.17576877383827938\n+C008\t2,4-Di-tert-butyl-6-(5-chloro-2H-benzotriazol-2-yl)phenol\t3\t0.1419543758042326\n+C009\tPicoxystrobin\t1\t0.0006870380110630028\n+C009\tTris(isopropylphenyl)phosphate\t1\t0.00023550942343171069\n+C009\tTebufenpyrad\t1\t0.00017257075992195458\n+C010\tcis-Permethrin\t1\t0.008724226797557697\n+C010\ttrans-Permethrin\t1\t0.008418860878033153\n+C010\tcis-Phenothrin\t1\t0.005882714253167312\n+C011\tFuberidazole\t1\t0.2308319926807784\n+C011\tPrometryn\t2\t0.1773186209832549\n+C011\tBenzoximate\t1\t0.07676637011355666\n+C012\tChlorpyrifos\t3\t0.43976068904478827\n+C012\tTerbufos\t1\t0.4006683041096004\n+C012\t2,6-Dichloro-4-nitroaniline\t1\t0.20998341159494333\n+C013\tIndoxacarb\t5\t0.4827488304818007\n+C013\tTemephos\t2\t0.32810153796559577\n+C013\tNuarimol\t2\t0.2936210041931014\n+C014\tChlorferone\t1\t0.5119124308782732\n+C014\tPiperonyl 
butoxide\t1\t0.4857177881241794\n+C014\t2,6-Dichloro-4-nitroaniline\t2\t0.33898957004708385\n+C015\tMetazachlor\t1\t0.0011434403294572687\n+C015\talpha-Amylcinnamyl alcohol\t1\t0.0005805859933790689\n+C015\tPendimethalin\t1\t0.0005015386924657569\n+C016\tDrometrizole\t3\t0.5535081364244014\n+C016\tAcenaphthylene\t2\t0.540073031173669\n+C016\tAtrazine\t5\t0.4399647084473271\n+C017\t4-tert-Octylphenol\t1\t0.9088788152148044\n+C017\tPropargite_isomer2\t1\t0.8953233485170952\n+C017\tPropargite_isomer1\t1\t0.8942159049307404\n+C018\tTris(4-tert-butylphenyl) phosphate\t1\t0.189695375366971\n+C018\tPerylene_2H12\t0\t0.0\n+C018\tPerylene\t0\t0.0\n+C019\tTriclosan\t1\t0.13434903881343435\n+C019\tTerbufos\t1\t0.08080384965580391\n+C019\tEpoxiconazole\t2\t0.07313225916488224\n+C020\tTris(isopropylphenyl)phosphate\t2\t0.2520159660977677\n+C020\tAmitraz\t2\t0.1245102870796828\n+C020\tMetribuzin\t1\t0.05224979683560159\n+C021\tTebuthiuron\t2\t0.9340205348244696\n+C021\t1,5-Dimethylnaphthalene\t1\t0.6803608761410861\n+C021\t2,6-Dimethylnaphthalene\t1\t0.6264160291669295\n+C022\t2-Bromoallyl(2,4,6-tribromophenyl) ether\t1\t0.11311229152083695\n+C022\t2,3,4,5,6-Pentabromobenzyl alcohol\t2\t0.07003350703850979\n+C022\tAllyl 2,4,6-tribromophenyl ether\t1\t0.06571493640420596\n+C023\tPhenanthrene_2H10\t1\t0.7408591267092633\n+C023\t2-Chlorobiphenyl\t1\t0.6159214014775711\n+C023\tButylated hydroxytoluene\t3\t0.4899347755610658\n+C024\tMepronil\t2\t0.18000248105004787\n+C024\tSpirotetramat\t8\t0.17523909122675907\n+C024\tEstrone\t7\t0.17146514923780354\n+C025\tTris(4-tert-butylphenyl) phosphate\t2\t0.2957673370199089\n+C025\tPerylene_2H12\t0\t0.0\n+C025\tPerylene\t0\t0.0\n+C026\tIsodecyl diphenyl 
phosphate\t2\t0.4122773057565717\n+C026\tDicofol\t1\t0.32235849897575225\n+C026\tTris(isopropylphenyl)phosphate\t2\t0.18207675907106227\n+C027\tFenobucarb\t1\t0.058048257187677615\n+C027\tIsoprocarb\t1\t0.056638368345330564\n+C027\tDioxacarb\t1\t0.041723437047250914\n+C028\tPhosmet\t1\t0.7848313885767587\n+C028\tAlachlor\t1\t0.5400260886224933\n+C028\tButafenacil\t2\t0.5287006460619553\n+C029\tMetolachlor\t3\t0.8624580271763471\n+C029\tSafrole\t2\t0.591167446764124\n+C029\tAmitraz\t2\t0.4100617029164697\n+C030\tEthofumesate\t2\t0.1283368182166788\n+C030\tIprovalicarb isomer 1\t1\t0.1278518291141877\n+C030\tAcephate\t4\t0.12723099231343524\n+C031\tProgesterone\t1\t1.642699424"..b"\n+C138\tPhenanthrene_2H10\t0\t0.0\n+C139\tPerylene_2H12\t0\t0.0\n+C139\tPerylene\t0\t0.0\n+C139\tPhenanthrene_2H10\t0\t0.0\n+C140\tRotenone\t1\t0.0015990284859575886\n+C140\tPerylene_2H12\t0\t0.0\n+C140\tPerylene\t0\t0.0\n+C141\tTebufenpyrad\t2\t0.2938100129854653\n+C141\tTris(isopropylphenyl)phosphate\t2\t0.020202034111700597\n+C141\tIpconazole\t1\t0.017041584156450424\n+C142\tPerylene_2H12\t0\t0.0\n+C142\tPerylene\t0\t0.0\n+C142\tPhenanthrene_2H10\t0\t0.0\n+C143\tDimethomorph_isomer2\t1\t0.16685279162562694\n+C143\tDimethomorph _isomer1\t1\t0.16482807037456434\n+C143\t2,3,4,5,6-Pentabromotoluene\t1\t0.032682863992618404\n+C144\tEtoxazole\t2\t0.1027909809180103\n+C144\t2,4-Di-tert-butyl-6-(5-chloro-2H-benzotriazol-2-yl)phenol\t2\t0.04732776045289416\n+C144\tAzoxystrobin\t2\t0.035630773587232864\n+C145\tPerylene_2H12\t0\t0.0\n+C145\tPerylene\t0\t0.0\n+C145\tPhenanthrene_2H10\t0\t0.0\n+C146\tPropargite_isomer1\t1\t0.0633083562823998\n+C146\tPropargite_isomer2\t1\t0.05654738208679003\n+C146\t2,2',3,3',4,5',6,6'-Octachlorobiphenyl\t1\t0.035712333462604294\n+C147\t2,2',3,4,4',5',6-Heptabromodiphenyl 
ether\t1\t0.03047378825096018\n+C147\tChlorferone\t1\t0.01855122445019196\n+C147\tProgesterone\t2\t0.007867919703105094\n+C148\tBuprofezin\t1\t0.01875857752389424\n+C148\tPerylene_2H12\t0\t0.0\n+C148\tPerylene\t0\t0.0\n+C149\tMetalaxyl\t2\t0.29742589743178666\n+C149\t1,4-Naphthoquinone\t1\t0.2740480911849054\n+C149\tPraziquantel\t1\t0.260732240603901\n+C150\ttrans-Prallethrin\t1\t0.00633664692361121\n+C150\tPerylene_2H12\t0\t0.0\n+C150\tPerylene\t0\t0.0\n+C151\tSpirotetramat\t1\t0.011452966094891676\n+C151\tPerylene_2H12\t0\t0.0\n+C151\tPerylene\t0\t0.0\n+C152\tTris(3,5-xylenyl)phosphate\t1\t0.05756111981021594\n+C152\tTris(isopropylphenyl)phosphate\t1\t0.0449470954588726\n+C152\tPerylene_2H12\t0\t0.0\n+C153\tEthiofencarb\t1\t0.8284613374855048\n+C153\t1,1-Dibromo-2,3,3,4,4,5-hexachloro-2-cyclopenta-2,4-dien-1-ylcyclooctane\t1\t0.4257874890609336\n+C153\tIsomethyl-alpha-ionone\t1\t0.36103138237616267\n+C154\t7,12-Dimethylbenz[a]anthracene\t1\t0.29226381053937395\n+C154\tEnzacamene\t1\t0.14396940230197552\n+C154\tTriflumizole\t1\t0.10858411907186044\n+C155\tPerylene_2H12\t0\t0.0\n+C155\tPerylene\t0\t0.0\n+C155\tPhenanthrene_2H10\t0\t0.0\n+C156\t7,12-Dimethylbenz[a]anthracene\t1\t0.08248293081186396\n+C156\tMethoprotryne\t1\t0.0432082364937662\n+C156\tProgesterone\t1\t0.02316539180928352\n+C157\tPerylene_2H12\t0\t0.0\n+C157\tPerylene\t0\t0.0\n+C157\tPhenanthrene_2H10\t0\t0.0\n+C158\tTris(4-tert-butylphenyl) 
phosphate\t1\t0.012341356867974116\n+C158\tPerylene_2H12\t0\t0.0\n+C158\tPerylene\t0\t0.0\n+C159\tTrifluralin\t1\t0.1883562158254524\n+C159\tFenpropathrin\t1\t0.015975881134824614\n+C159\tEthiprole\t1\t0.007596489095240584\n+C160\tBumetrizole\t1\t0.04337092323628775\n+C160\ttrans-Cypermethrin_isomer2\t1\t0.030241071137562938\n+C160\tPerylene_2H12\t1\t0.029465908012253836\n+C161\tPerylene_2H12\t0\t0.0\n+C161\tPerylene\t0\t0.0\n+C161\tPhenanthrene_2H10\t0\t0.0\n+C162\tPerylene_2H12\t0\t0.0\n+C162\tPerylene\t0\t0.0\n+C162\tPhenanthrene_2H10\t0\t0.0\n+C163\tPerylene_2H12\t0\t0.0\n+C163\tPerylene\t0\t0.0\n+C163\tPhenanthrene_2H10\t0\t0.0\n+C164\t7,12-Dimethylbenz[a]anthracene\t1\t0.2284760273276565\n+C164\tEnzacamene\t1\t0.112547485896346\n+C164\tFenamidone\t1\t0.0486288864876461\n+C165\tBoscalid\t1\t0.08498662209290331\n+C165\tBuprofezin\t1\t0.08205704595848827\n+C165\tIpconazole\t1\t0.08152620214218925\n+C166\tTris(2-butoxyethyl) phosphate\t1\t0.008342150525801997\n+C166\tRotenone\t1\t0.0015006556689027325\n+C166\tPerylene_2H12\t0\t0.0\n+C167\tPerylene_2H12\t0\t0.0\n+C167\tPerylene\t0\t0.0\n+C167\tPhenanthrene_2H10\t0\t0.0\n+C168\tPerylene_2H12\t0\t0.0\n+C168\tPerylene\t0\t0.0\n+C168\tPhenanthrene_2H10\t0\t0.0\n+C169\tPerylene_2H12\t0\t0.0\n+C169\tPerylene\t0\t0.0\n+C169\tPhenanthrene_2H10\t0\t0.0\n+C170\tPerylene_2H12\t0\t0.0\n+C170\tPerylene\t0\t0.0\n+C170\tPhenanthrene_2H10\t0\t0.0\n+C171\t2,4-D butyl ester\t1\t0.6610587362108564\n+C171\tTerbutryn\t1\t0.6012657870951452\n+C171\tEstrone\t2\t0.31623371975319553\n+C172\tPerylene_2H12\t1\t0.06765194944236241\n+C172\t17-alpha-Ethynylestradiol\t1\t0.01884162876915315\n+C172\tProgesterone\t1\t0.01306130902820296\n+C173\tSpiromesifen\t1\t0.016586079079264453\n+C173\tRotenone\t1\t0.0025109428261963678\n+C173\tPerylene_2H12\t0\t0.0\n+C174\tPerylene_2H12\t0\t0.0\n+C174\tPerylene\t0\t0.0\n+C174\tPhenanthrene_2H10\t0\t0.0\n"
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/matches_test1_out.tsv
--- a/test-data/matches_test1_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,175 +0,0 @@\n-\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n-C001\t57\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C002\t0\t35\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C003\t0\t0\t26\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C004\t0\t0\t0\t24\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C005\t0\t0\t0\t0\t20\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C006\t0\t0\t0\t0\t0\t19\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C007\t0\t0\t0\t0\t0\t0\t15\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C008\t0\t1\t0\t0\t0\t0\t0\t15\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C009\t0\t0\t0\t0\t0\t0\t0\t0\t14\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t'..b'\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C164\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C165\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C166\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\n-C167\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\n-C168\t0\t0\
t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\n-C169\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\n-C170\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\n-C171\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\n-C172\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\n-C173\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\n-C174\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/matches_test3_out.tsv
--- a/test-data/matches_test3_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,387 +0,0 @@\n-\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n-Perylene_2H12\t0\t0\t2\t0\t1\t0\t0\t1\t0\t0\t0\t0\t2\t0\t0\t3\t0\t0\t0\t1\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\n-Perylene\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t0\t1\t1\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\
t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Phenanthrene_2H10\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t2\t0\t1\t0\t0\t0\t0\t1\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\n-Phenanthrene\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Anthracene\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t2\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Acenaphthylene\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\
t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Acenaphthene\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t3\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Fluoranthene\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t1\t0\t1\t0\t0\t0\t2\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Pyrene\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t2\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0'..b'ph_isomer2\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Spirodiclofen\t3\t2\t0\t0\t0\t0\t4\t1\t0\t0\t1\t1\t4\t0\t0\t4\t3\t0\t1\t2\t4\t0\t2\t0\t0\t1\t0\t0\t2\t1\t0\t0\t3\t1\t0\t0\t1\t1\t1\t1\t0\t0\t2\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t3\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t1\t1\t1\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Spiromesifen\t1\t1\t0\t1\t0\t0\t2\t2\t0\t1\t1\t0\t2\t1\t0\t5\t0\t0\t0\t1\t3\t0\t3\t4\t0\t1\t2\t1\t2\t1\t0\t0\t1\t7\t0\t0\t2\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t3\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t2\t0\t1\t0\t0\t0\t0\t1\t2\t0\t1\t0\t0\t0\t0\t0\t2\t0\t0\t3\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\n-Spirotetramat\t2\t2\t0\t1\t0\t0\t2\t5\t0\t2\t1\t0\t6\t1\t0\t7\t1\t0\t1\t2\t4\t0\t4\t8\t0\t3\t2\t1\t2\t1\t0\t0\t3\t7\t0\t0\t3\t0\t0\t4\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t3\t0\t0\t3\t0\t0\t3\t0\t0\t1\t0\t0\t1\t0\t0\t3\t1\t3\t0\t0\t0\t0\t0\t2\t2\t3\t0\t1\t0\t0\t1\t0\t0\t3\t0\t2\t3\t2\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t2\t1\t0\t1\t1\t0\t0\t1\t2\t0\t1\t0\t2\t0\t0\t1\t1\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t1\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\n-17-alpha-Ethynylestradiol\t1\t0\t0\t2\t0\t0\t2\t2\t0\t1\t1\t0\t4\t1\t1\t5\t1\t0\t0\t1\t2\t0\t3\t4\t0\t2\t2\t1\t2\t1\t0\t0\t3\t7\t0\t0\t1\t1\t0\t4\t0\t0\t2\t0\t0\t0\t0\t
0\t0\t1\t0\t1\t0\t0\t0\t2\t0\t1\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t1\t0\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t2\t1\t0\t3\t1\t0\t0\t0\t0\t0\t1\t0\t0\t2\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t2\t1\t0\t0\n-Bisphenol A\t0\t0\t0\t0\t0\t0\t1\t1\t0\t1\t0\t0\t1\t0\t0\t3\t1\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t3\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-4-tert-Octylphenol\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Estrone\t1\t0\t0\t0\t0\t0\t1\t1\t0\t1\t1\t0\t3\t1\t1\t6\t0\t0\t0\t2\t1\t0\t2\t7\t0\t1\t3\t1\t2\t1\t0\t0\t3\t7\t0\t0\t0\t1\t0\t3\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t1\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t3\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t1\t0\t1\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\n-17-beta
-Estradiol\t2\t0\t0\t0\t0\t0\t4\t2\t0\t1\t1\t0\t2\t0\t1\t4\t0\t0\t0\t0\t1\t0\t4\t4\t0\t0\t0\t1\t1\t0\t1\t0\t1\t6\t0\t0\t1\t1\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t1\t0\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t2\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Progesterone\t2\t3\t0\t2\t0\t0\t3\t3\t0\t2\t2\t0\t4\t2\t1\t6\t1\t0\t0\t2\t2\t0\t4\t9\t0\t4\t3\t1\t5\t2\t1\t0\t3\t6\t0\t0\t3\t0\t2\t4\t0\t0\t2\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t1\t1\t1\t1\t1\t2\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t2\t1\t4\t0\t1\t0\t0\t1\t2\t2\t2\t0\t1\t0\t0\t2\t0\t0\t2\t2\t3\t3\t2\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t2\t1\t0\t0\t1\t0\t1\t0\t2\t0\t1\t0\t1\t0\t0\t1\t2\t2\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t2\t0\t0\t0\t2\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t2\t1\t0\t0\n-Testosterone\t1\t1\t0\t1\t1\t0\t0\t2\t0\t1\t1\t0\t4\t1\t1\t5\t0\t0\t0\t1\t2\t0\t3\t7\t0\t2\t2\t1\t4\t1\t0\t0\t3\t3\t0\t0\t1\t0\t1\t2\t0\t0\t3\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t1\t1\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t4\t0\t1\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t2\t0\t0\t2\t2\t3\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t1\t0\t2\t0\t2\t0\t1\t0\t0\t0\t0\t1\t1\t2\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t2\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/matches_test4_out.tsv
--- a/test-data/matches_test4_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b"@@ -1,387 +0,0 @@\n-\tPerylene_2H12\tPerylene\tPhenanthrene_2H10\tPhenanthrene\tAnthracene\tAcenaphthylene\tAcenaphthene\tFluoranthene\tPyrene\tpara-Terphenyl\tRetene\tBenzo[b]naphtho[2,1-d]thiophene\t2,3-Benzofluorene\tBenzo[ghi]fluoranthene\tTriphenylene\tBenzanthracene/Benzophenanthrene\tBenzofluoranthene\tBenzo(k)fluoranthene\tBenzo[e]pyrene\tBenzo(a)pyrene\tIndeno[1,2,3-cd]pyrene\tBenzo(g,h,i)perylene\tAnthanthrene\tDibenzanthracene\tCoronene\tDicofol\tBenzophenone\t2-tert-Butyl-4-methoxyphenol\tButylated hydroxytoluene\tBumetrizole\t4-Methylbenzophenone\t2,4,6-Tribromophenol\t2,6-Dichloro-4-nitroaniline\t1-Methylphenanthrene\tTriclosan\tDrometrizole\tEnzacamene\t2,4-Di-tert-butyl-6-(5-chloro-2H-benzotriazol-2-yl)phenol\tOctrizole\t1,2,7,9-Tetrachlorodibenzofuran\t2,2',3,4,5,5',6-Heptachlorobiphenyl\t2,4,6-Trichlorobiphenyl\t2,2',3,3',4,5',6,6'-Octachlorobiphenyl\tMirex\tbeta-Hexachlorocyclohexane\talpha-1,2,3,4,5,6-Hexachlorocyclohexane\tLindane\tdelta-Hexachlorocyclohexane\tepsilon-Hexachlorocyclohexane\tPentachlorobenzene\tHexachlorobenzene\t2,4'-Dichlorodiphenyldichloroethylene\t2,4'-Dichlorodiphenyldichloroethane\t2,4'-Dichlorodiphenyltrichloroethane\t1,2,7,9-Tetrachlorodibenzo-p-dioxin\t2,4,4'-Trichlorobiphenyl\t2,2',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5-Pentachlorobiphenyl\t2,2',3,4,4',5'-Hexachlorobiphenyl\t2,2',4,4',5,5'-Hexachlorobiphenyl\t2,2',3,4,4',5,5'-Heptachlorobiphenyl\t2,2',5,5'-Tetrachlorobiphenyl\t2,3',4,6-Tetrachlorobiphenyl\t2,3',5',6-Tetrachlorobiphenyl\t2,2',3,4',5-Pentachlorobiphenyl\t2,3,3',4,5-Pentachlorobiphenyl\t3,3',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5',6-Hexachlorobiphenyl\t2,3,3',4,5,6-Hexachlorobiphenyl\t2,3,3',4',5',6-Hexachlorobiphenyl\t2,3,3',4',5,6-Hexachlorobiphenyl\t2,3,3',4',5,5',6-Heptachlorobiphenyl\tcis-Prallethrin\ttrans-Prallethrin\tcis-Resmethrin\ttrans-Resmethrin\tcis-Tetramethrin\ttrans-Tetramethrin\tBifenthrin\tFenpropathrin\tcis-Phenothrin\ttrans-Phenothrin\tcis-Cyphenothrin\ttrans-Cyphenothrin\tFlucythri
nate_isomer1\tFlucythrinate_isomer2\tcis-Fenvalerate\ttrans-Fenvalerate\tDeltamethrin\tChlorpyrifos oxon\tlambda-Cyhalothrin\tTefluthrin\tTransfluthrin\tcis-Permethrin\ttrans-Permethrin\tcis-Allethrin\ttrans-Allethrin\tcis-Cypermethrin_isomer1\ttrans-Cypermethrin_isomer1\tcis-Cypermethrin_isomer2\ttrans-Cypermethrin_isomer2\tcis-Cyfluthrin_isomer1\ttrans-Cyfluthrin_isomer1\tcis-Cyfluthrin_isomer2\ttrans-Cyfluthrin_Isomer2\t1,2,3,4,7,8-Hexachlorodibenzo-p-dioxin\t1,2,3,4,6,7,8-Heptachlorodibenzo-p-dioxin\tOctachlorodibenzo-p-dioxin\tOctachlorodibenzofuran\t1,2,3,7,8-Pentachlorodibenzofuran\t1,2,3,4,7,8-Hexachlorodibenzofuran\t1,2,3,4,6,7,8-Heptachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzo-p-dioxin\t1,2,3,7,8-Pentachlorodibenzo-p-dioxin\t2,3,4,5-Tetrabromo-6-chlorotoluene\t2,3,4,5,6-Pentabromotoluene\t2,3,4,5,6-Pentabromoethylbenzene\t2,3,5,6-Tetrabromo-p-xylene\tAllyl 2,4,6-tribromophenyl ether\t2-Bromoallyl(2,4,6-tribromophenyl) ether\tPentabromobenzene\tHexabromobenzene\t2,3,4,5,6-Pentabromobenzyl alcohol\t2-Ethylhexyl 2,3,4,5-Tetrabromobenzoate\tsyn-Dechlorane plus\tanti-Dechlorane plus\talpha-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\tbeta-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\t1,2,5,6-Tetrabromocyclooctane\t1,1-Dibromo-2,3,3,4,4,5-hexachloro-2-cyclopenta-2,4-dien-1-ylcyclooctane\talpha-Amylcinnamaldehyde\ttrans-Cinnamaldehyde\tCitral (Geranial)\t1-Fluronaphthalene\talpha-Hexylcinnamaldehyde\tLilial\talpha-Amylcinnamyl alcohol\tEugenol\tIsoeugenol\t4-Methoxybenzyl alcohol\tMethyleugenol\tCinnamyl alcohol\tBenzyl alcohol\tEstragole\tBenzyl benzoate\tBenzyl cinnamate\tBenzyl salicylate\tCamphor\tEucalyptol\tCoumarin\tLimonene\tIsomethyl-alpha-ionone\tdelta-Iraldeine\tSafrole\tCashmeran\tCelestolide\tPhantolide\tTonalide\tTraseolide\tGalaxolide\tAldrin\tEndosulfan\tHeptachlor\tcis-Heptachlor epoxide\tEndosulfan sulphate\tEndrin ketone\ttrans-Chlordane\tcis-Chlordane\tEndrin 
aldehyde\tEndrin\t4,4'-Dichlorodiphenyldichloroethylene\tMethoxychlor\t4,4'-Dichlorodiphenyldichloroethane\t4,4'-Dichlorodiphenyltrichloroethane\tTris(4-tert-butylphenyl) phosphate\tTri-n-butyl-phosphate\tTris(1,3-dichloro-2-propy"..b'39\t11\t10\t27\t32\t19\t34\t20\t25\t21\t47\t11\t36\t46\t25\t47\t36\t44\t37\t31\t33\t34\t39\t61\t9\t23\t30\t44\t15\t19\t21\t18\t18\t22\t14\t18\t22\t21\t24\t17\t16\t24\t29\t34\t31\t22\t45\t37\t26\t34\t36\t12\t12\t17\t49\t22\t30\t29\t13\t22\t57\t14\t33\t16\t17\t18\t22\t12\t6\t8\t17\t10\t55\t34\t40\t15\t9\t13\t49\t34\t22\t35\t7\t10\t19\t18\t26\t45\t23\t47\t38\t22\t19\t20\t7\t13\t37\t23\t7\t30\t22\t7\t12\t55\t52\t41\t39\t26\t37\t8\t12\t18\t16\t36\t32\t19\t31\t17\t2\t6\t35\t40\t19\t35\t29\t20\t16\t35\t47\t16\t31\t35\t18\t20\t19\t38\t24\t42\t27\t28\t17\t25\t60\t19\t20\t20\t34\t28\t36\t11\t16\t19\t14\t27\t21\t20\t13\t17\t30\t46\t75\t36\t3\t29\t10\t23\t45\t31\t21\t35\t18\t34\t10\t28\t51\t61\t56\t48\t62\t16\t8\t11\t44\t68\t80\t78\t26\t13\t88\t56\t85\t72\n-17-beta-Estradiol\t11\t11\t7\t12\t13\t9\t7\t13\t12\t16\t17\t15\t12\t12\t13\t14\t11\t12\t12\t12\t9\t9\t24\t12\t15\t16\t14\t28\t34\t34\t16\t18\t24\t13\t26\t21\t53\t22\t13\t13\t18\t13\t38\t1\t19\t19\t18\t20\t21\t4\t6\t11\t13\t10\t22\t12\t15\t12\t18\t18\t17\t13\t13\t12\t17\t13\t11\t15\t14\t15\t11\t17\t18\t22\t30\t27\t16\t7\t12\t30\t27\t25\t21\t19\t37\t28\t26\t27\t34\t18\t19\t12\t18\t19\t20\t13\t11\t31\t24\t26\t40\t23\t31\t28\t33\t9\t8\t8\t9\t13\t11\t12\t11\t13\t11\t6\t6\t10\t7\t31\t14\t9\t6\t21\t12\t16\t13\t7\t10\t5\t27\t38\t10\t23\t10\t25\t30\t31\t24\t27\t13\t29\t19\t10\t19\t17\t22\t6\t13\t21\t7\t13\t24\t19\t20\t42\t32\t29\t35\t13\t42\t21\t22\t16\t12\t9\t26\t7\t10\t48\t37\t11\t18\t12\t11\t20\t9\t6\t26\t27\t24\t12\t29\t20\t16\t18\t14\t1\t18\t14\t37\t17\t35\t14\t30\t8\t7\t21\t25\t15\t26\t17\t19\t25\t28\t11\t26\t30\t19\t39\t24\t35\t30\t23\t22\t28\t23\t50\t6\t14\t27\t37\t9\t20\t16\t14\t14\t15\t9\t14\t18\t16\t15\t11\t13\t18\t21\t25\t24\t16\t34\t31\t22\t23\t28\t11\t8\t13\t38\t14\t26\t26\t11\t18\t44\t9\t
22\t10\t14\t13\t14\t10\t4\t4\t17\t7\t39\t31\t34\t15\t8\t11\t34\t27\t18\t30\t5\t9\t14\t16\t20\t35\t15\t37\t34\t17\t15\t13\t6\t14\t24\t13\t5\t28\t16\t6\t9\t46\t27\t31\t31\t18\t34\t6\t8\t15\t11\t27\t22\t12\t27\t15\t2\t6\t27\t28\t11\t34\t20\t11\t11\t20\t34\t13\t19\t26\t11\t14\t10\t31\t19\t35\t21\t20\t10\t16\t42\t17\t15\t16\t33\t17\t33\t12\t13\t14\t7\t17\t21\t13\t8\t13\t17\t30\t58\t28\t1\t17\t11\t23\t33\t28\t20\t24\t17\t28\t6\t26\t38\t47\t46\t41\t47\t12\t7\t11\t32\t50\t63\t63\t24\t9\t56\t67\t62\t60\n-Progesterone\t18\t10\t17\t16\t18\t13\t10\t14\t12\t23\t35\t19\t16\t13\t18\t17\t12\t13\t14\t13\t11\t10\t31\t14\t24\t28\t21\t46\t42\t64\t23\t38\t56\t21\t50\t27\t103\t32\t16\t21\t19\t28\t71\t2\t45\t42\t44\t42\t43\t12\t10\t24\t26\t24\t35\t20\t25\t19\t19\t22\t20\t25\t24\t21\t26\t18\t20\t21\t20\t20\t13\t18\t40\t51\t55\t48\t34\t21\t15\t59\t47\t45\t54\t47\t59\t48\t43\t55\t63\t38\t28\t21\t31\t24\t30\t47\t39\t52\t47\t51\t74\t42\t53\t52\t67\t20\t18\t14\t15\t16\t17\t20\t20\t17\t16\t13\t9\t18\t11\t61\t23\t13\t8\t51\t31\t22\t22\t15\t21\t15\t40\t48\t14\t43\t13\t40\t38\t39\t38\t39\t24\t43\t28\t16\t27\t19\t33\t8\t21\t33\t9\t24\t31\t31\t28\t65\t42\t40\t45\t16\t57\t50\t68\t27\t29\t21\t55\t17\t22\t112\t78\t29\t29\t23\t24\t30\t10\t15\t50\t41\t41\t17\t57\t44\t32\t32\t21\t5\t26\t37\t84\t30\t44\t22\t44\t11\t9\t29\t38\t20\t34\t23\t26\t42\t56\t15\t45\t68\t29\t62\t46\t58\t61\t34\t42\t41\t57\t81\t10\t30\t39\t56\t27\t24\t26\t28\t26\t28\t24\t21\t21\t22\t26\t20\t20\t21\t39\t45\t40\t22\t55\t39\t29\t43\t51\t12\t15\t25\t68\t25\t43\t42\t18\t20\t77\t14\t47\t24\t20\t18\t26\t14\t7\t9\t22\t14\t80\t44\t49\t19\t13\t10\t54\t34\t20\t43\t10\t14\t28\t20\t35\t59\t27\t58\t49\t31\t10\t24\t6\t15\t43\t34\t11\t40\t29\t9\t14\t83\t52\t50\t44\t35\t44\t9\t13\t21\t23\t44\t37\t27\t35\t19\t7\t16\t42\t52\t15\t46\t49\t34\t21\t52\t69\t18\t47\t44\t16\t37\t29\t51\t33\t52\t40\t38\t21\t30\t91\t23\t22\t29\t46\t36\t44\t14\t22\t31\t27\t32\t32\t28\t20\t28\t44\t59\t103\t43\t9\t33\t24\t44\t63\t43\t34\t55\t36\t52\t15\t43\t80\t101\t84\t86\t100\t16
\t9\t14\t80\t81\t125\t95\t29\t13\t85\t62\t168\t125\n-Testosterone\t14\t8\t13\t13\t15\t12\t10\t14\t12\t24\t36\t18\t16\t10\t17\t16\t9\t9\t10\t9\t10\t9\t28\t12\t22\t25\t19\t44\t39\t48\t22\t35\t46\t19\t38\t25\t101\t27\t15\t18\t17\t26\t51\t2\t38\t36\t39\t37\t37\t8\t6\t20\t22\t21\t25\t18\t21\t16\t17\t15\t18\t23\t24\t19\t21\t15\t15\t16\t16\t16\t9\t15\t39\t46\t43\t44\t29\t20\t10\t46\t37\t36\t40\t34\t43\t36\t30\t41\t51\t33\t19\t20\t24\t17\t22\t41\t35\t38\t33\t36\t65\t34\t39\t36\t52\t13\t12\t10\t11\t11\t11\t13\t14\t14\t11\t7\t3\t10\t5\t51\t19\t7\t3\t41\t25\t19\t16\t11\t17\t14\t35\t48\t14\t41\t15\t35\t37\t37\t38\t37\t22\t44\t26\t15\t29\t16\t29\t8\t21\t32\t10\t24\t32\t30\t28\t63\t38\t34\t42\t16\t49\t41\t46\t19\t20\t15\t44\t13\t16\t91\t63\t24\t21\t19\t20\t27\t10\t13\t32\t27\t27\t15\t51\t30\t21\t27\t19\t3\t23\t35\t72\t29\t44\t18\t37\t8\t8\t26\t33\t17\t31\t21\t23\t32\t47\t13\t44\t56\t28\t60\t39\t52\t60\t37\t39\t38\t48\t78\t10\t26\t40\t49\t24\t22\t22\t24\t21\t24\t18\t15\t17\t18\t21\t15\t17\t17\t33\t39\t35\t18\t48\t38\t29\t39\t42\t12\t14\t18\t60\t23\t36\t36\t16\t16\t61\t13\t42\t21\t19\t16\t26\t14\t7\t8\t19\t14\t64\t41\t42\t19\t12\t11\t46\t34\t19\t40\t7\t15\t27\t20\t29\t49\t27\t55\t41\t30\t10\t21\t6\t15\t38\t28\t12\t37\t28\t7\t14\t75\t37\t43\t43\t33\t43\t9\t12\t20\t14\t39\t33\t21\t33\t18\t5\t13\t41\t45\t10\t44\t44\t28\t20\t43\t57\t15\t41\t38\t15\t30\t27\t46\t30\t49\t39\t36\t20\t27\t70\t22\t20\t25\t44\t27\t45\t13\t18\t26\t18\t26\t30\t21\t18\t25\t34\t45\t86\t38\t7\t24\t22\t32\t50\t37\t25\t48\t34\t47\t14\t37\t66\t81\t71\t74\t84\t15\t8\t12\t68\t60\t96\t82\t27\t13\t72\t60\t125\t130\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/matches_test5_out.tsv
--- a/test-data/matches_test5_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,175 +0,0 @@\n-\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n-C001\t57\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C002\t0\t35\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C003\t0\t0\t26\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C004\t0\t0\t0\t24\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C005\t0\t0\t0\t0\t20\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C006\t0\t0\t0\t0\t0\t19\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C007\t0\t0\t0\t0\t0\t0\t15\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C008\t0\t1\t0\t0\t0\t0\t0\t15\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C009\t0\t0\t0\t0\t0\t0\t0\t0\t14\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t'..b'\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C164\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C165\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-C166\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\n-C167\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\n-C168\t0\t0\
t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\n-C169\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\n-C170\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\n-C171\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\n-C172\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\n-C173\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\n-C174\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/matches_test6_out.tsv
--- a/test-data/matches_test6_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b"@@ -1,387 +0,0 @@\n-\tPerylene_2H12\tPerylene\tPhenanthrene_2H10\tPhenanthrene\tAnthracene\tAcenaphthylene\tAcenaphthene\tFluoranthene\tPyrene\tpara-Terphenyl\tRetene\tBenzo[b]naphtho[2,1-d]thiophene\t2,3-Benzofluorene\tBenzo[ghi]fluoranthene\tTriphenylene\tBenzanthracene/Benzophenanthrene\tBenzofluoranthene\tBenzo(k)fluoranthene\tBenzo[e]pyrene\tBenzo(a)pyrene\tIndeno[1,2,3-cd]pyrene\tBenzo(g,h,i)perylene\tAnthanthrene\tDibenzanthracene\tCoronene\tDicofol\tBenzophenone\t2-tert-Butyl-4-methoxyphenol\tButylated hydroxytoluene\tBumetrizole\t4-Methylbenzophenone\t2,4,6-Tribromophenol\t2,6-Dichloro-4-nitroaniline\t1-Methylphenanthrene\tTriclosan\tDrometrizole\tEnzacamene\t2,4-Di-tert-butyl-6-(5-chloro-2H-benzotriazol-2-yl)phenol\tOctrizole\t1,2,7,9-Tetrachlorodibenzofuran\t2,2',3,4,5,5',6-Heptachlorobiphenyl\t2,4,6-Trichlorobiphenyl\t2,2',3,3',4,5',6,6'-Octachlorobiphenyl\tMirex\tbeta-Hexachlorocyclohexane\talpha-1,2,3,4,5,6-Hexachlorocyclohexane\tLindane\tdelta-Hexachlorocyclohexane\tepsilon-Hexachlorocyclohexane\tPentachlorobenzene\tHexachlorobenzene\t2,4'-Dichlorodiphenyldichloroethylene\t2,4'-Dichlorodiphenyldichloroethane\t2,4'-Dichlorodiphenyltrichloroethane\t1,2,7,9-Tetrachlorodibenzo-p-dioxin\t2,4,4'-Trichlorobiphenyl\t2,2',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5-Pentachlorobiphenyl\t2,2',3,4,4',5'-Hexachlorobiphenyl\t2,2',4,4',5,5'-Hexachlorobiphenyl\t2,2',3,4,4',5,5'-Heptachlorobiphenyl\t2,2',5,5'-Tetrachlorobiphenyl\t2,3',4,6-Tetrachlorobiphenyl\t2,3',5',6-Tetrachlorobiphenyl\t2,2',3,4',5-Pentachlorobiphenyl\t2,3,3',4,5-Pentachlorobiphenyl\t3,3',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5',6-Hexachlorobiphenyl\t2,3,3',4,5,6-Hexachlorobiphenyl\t2,3,3',4',5',6-Hexachlorobiphenyl\t2,3,3',4',5,6-Hexachlorobiphenyl\t2,3,3',4',5,5',6-Heptachlorobiphenyl\tcis-Prallethrin\ttrans-Prallethrin\tcis-Resmethrin\ttrans-Resmethrin\tcis-Tetramethrin\ttrans-Tetramethrin\tBifenthrin\tFenpropathrin\tcis-Phenothrin\ttrans-Phenothrin\tcis-Cyphenothrin\ttrans-Cyphenothrin\tFlucythri
nate_isomer1\tFlucythrinate_isomer2\tcis-Fenvalerate\ttrans-Fenvalerate\tDeltamethrin\tChlorpyrifos oxon\tlambda-Cyhalothrin\tTefluthrin\tTransfluthrin\tcis-Permethrin\ttrans-Permethrin\tcis-Allethrin\ttrans-Allethrin\tcis-Cypermethrin_isomer1\ttrans-Cypermethrin_isomer1\tcis-Cypermethrin_isomer2\ttrans-Cypermethrin_isomer2\tcis-Cyfluthrin_isomer1\ttrans-Cyfluthrin_isomer1\tcis-Cyfluthrin_isomer2\ttrans-Cyfluthrin_Isomer2\t1,2,3,4,7,8-Hexachlorodibenzo-p-dioxin\t1,2,3,4,6,7,8-Heptachlorodibenzo-p-dioxin\tOctachlorodibenzo-p-dioxin\tOctachlorodibenzofuran\t1,2,3,7,8-Pentachlorodibenzofuran\t1,2,3,4,7,8-Hexachlorodibenzofuran\t1,2,3,4,6,7,8-Heptachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzo-p-dioxin\t1,2,3,7,8-Pentachlorodibenzo-p-dioxin\t2,3,4,5-Tetrabromo-6-chlorotoluene\t2,3,4,5,6-Pentabromotoluene\t2,3,4,5,6-Pentabromoethylbenzene\t2,3,5,6-Tetrabromo-p-xylene\tAllyl 2,4,6-tribromophenyl ether\t2-Bromoallyl(2,4,6-tribromophenyl) ether\tPentabromobenzene\tHexabromobenzene\t2,3,4,5,6-Pentabromobenzyl alcohol\t2-Ethylhexyl 2,3,4,5-Tetrabromobenzoate\tsyn-Dechlorane plus\tanti-Dechlorane plus\talpha-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\tbeta-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\t1,2,5,6-Tetrabromocyclooctane\t1,1-Dibromo-2,3,3,4,4,5-hexachloro-2-cyclopenta-2,4-dien-1-ylcyclooctane\talpha-Amylcinnamaldehyde\ttrans-Cinnamaldehyde\tCitral (Geranial)\t1-Fluronaphthalene\talpha-Hexylcinnamaldehyde\tLilial\talpha-Amylcinnamyl alcohol\tEugenol\tIsoeugenol\t4-Methoxybenzyl alcohol\tMethyleugenol\tCinnamyl alcohol\tBenzyl alcohol\tEstragole\tBenzyl benzoate\tBenzyl cinnamate\tBenzyl salicylate\tCamphor\tEucalyptol\tCoumarin\tLimonene\tIsomethyl-alpha-ionone\tdelta-Iraldeine\tSafrole\tCashmeran\tCelestolide\tPhantolide\tTonalide\tTraseolide\tGalaxolide\tAldrin\tEndosulfan\tHeptachlor\tcis-Heptachlor epoxide\tEndosulfan sulphate\tEndrin ketone\ttrans-Chlordane\tcis-Chlordane\tEndrin 
aldehyde\tEndrin\t4,4'-Dichlorodiphenyldichloroethylene\tMethoxychlor\t4,4'-Dichlorodiphenyldichloroethane\t4,4'-Dichlorodiphenyltrichloroethane\tTris(4-tert-butylphenyl) phosphate\tTri-n-butyl-phosphate\tTris(1,3-dichloro-2-propy"..b'39\t11\t10\t27\t32\t19\t34\t20\t25\t21\t47\t11\t36\t46\t25\t47\t36\t44\t37\t31\t33\t34\t39\t61\t9\t23\t30\t44\t15\t19\t21\t18\t18\t22\t14\t18\t22\t21\t24\t17\t16\t24\t29\t34\t31\t22\t45\t37\t26\t34\t36\t12\t12\t17\t49\t22\t30\t29\t13\t22\t57\t14\t33\t16\t17\t18\t22\t12\t6\t8\t17\t10\t55\t34\t40\t15\t9\t13\t49\t34\t22\t35\t7\t10\t19\t18\t26\t45\t23\t47\t38\t22\t19\t20\t7\t13\t37\t23\t7\t30\t22\t7\t12\t55\t52\t41\t39\t26\t37\t8\t12\t18\t16\t36\t32\t19\t31\t17\t2\t6\t35\t40\t19\t35\t29\t20\t16\t35\t47\t16\t31\t35\t18\t20\t19\t38\t24\t42\t27\t28\t17\t25\t60\t19\t20\t20\t34\t28\t36\t11\t16\t19\t14\t27\t21\t20\t13\t17\t30\t46\t75\t36\t3\t29\t10\t23\t45\t31\t21\t35\t18\t34\t10\t28\t51\t61\t56\t48\t62\t16\t8\t11\t44\t68\t80\t78\t26\t13\t88\t56\t85\t72\n-17-beta-Estradiol\t11\t11\t7\t12\t13\t9\t7\t13\t12\t16\t17\t15\t12\t12\t13\t14\t11\t12\t12\t12\t9\t9\t24\t12\t15\t16\t14\t28\t34\t34\t16\t18\t24\t13\t26\t21\t53\t22\t13\t13\t18\t13\t38\t1\t19\t19\t18\t20\t21\t4\t6\t11\t13\t10\t22\t12\t15\t12\t18\t18\t17\t13\t13\t12\t17\t13\t11\t15\t14\t15\t11\t17\t18\t22\t30\t27\t16\t7\t12\t30\t27\t25\t21\t19\t37\t28\t26\t27\t34\t18\t19\t12\t18\t19\t20\t13\t11\t31\t24\t26\t40\t23\t31\t28\t33\t9\t8\t8\t9\t13\t11\t12\t11\t13\t11\t6\t6\t10\t7\t31\t14\t9\t6\t21\t12\t16\t13\t7\t10\t5\t27\t38\t10\t23\t10\t25\t30\t31\t24\t27\t13\t29\t19\t10\t19\t17\t22\t6\t13\t21\t7\t13\t24\t19\t20\t42\t32\t29\t35\t13\t42\t21\t22\t16\t12\t9\t26\t7\t10\t48\t37\t11\t18\t12\t11\t20\t9\t6\t26\t27\t24\t12\t29\t20\t16\t18\t14\t1\t18\t14\t37\t17\t35\t14\t30\t8\t7\t21\t25\t15\t26\t17\t19\t25\t28\t11\t26\t30\t19\t39\t24\t35\t30\t23\t22\t28\t23\t50\t6\t14\t27\t37\t9\t20\t16\t14\t14\t15\t9\t14\t18\t16\t15\t11\t13\t18\t21\t25\t24\t16\t34\t31\t22\t23\t28\t11\t8\t13\t38\t14\t26\t26\t11\t18\t44\t9\t
22\t10\t14\t13\t14\t10\t4\t4\t17\t7\t39\t31\t34\t15\t8\t11\t34\t27\t18\t30\t5\t9\t14\t16\t20\t35\t15\t37\t34\t17\t15\t13\t6\t14\t24\t13\t5\t28\t16\t6\t9\t46\t27\t31\t31\t18\t34\t6\t8\t15\t11\t27\t22\t12\t27\t15\t2\t6\t27\t28\t11\t34\t20\t11\t11\t20\t34\t13\t19\t26\t11\t14\t10\t31\t19\t35\t21\t20\t10\t16\t42\t17\t15\t16\t33\t17\t33\t12\t13\t14\t7\t17\t21\t13\t8\t13\t17\t30\t58\t28\t1\t17\t11\t23\t33\t28\t20\t24\t17\t28\t6\t26\t38\t47\t46\t41\t47\t12\t7\t11\t32\t50\t63\t63\t24\t9\t56\t67\t62\t60\n-Progesterone\t18\t10\t17\t16\t18\t13\t10\t14\t12\t23\t35\t19\t16\t13\t18\t17\t12\t13\t14\t13\t11\t10\t31\t14\t24\t28\t21\t46\t42\t64\t23\t38\t56\t21\t50\t27\t103\t32\t16\t21\t19\t28\t71\t2\t45\t42\t44\t42\t43\t12\t10\t24\t26\t24\t35\t20\t25\t19\t19\t22\t20\t25\t24\t21\t26\t18\t20\t21\t20\t20\t13\t18\t40\t51\t55\t48\t34\t21\t15\t59\t47\t45\t54\t47\t59\t48\t43\t55\t63\t38\t28\t21\t31\t24\t30\t47\t39\t52\t47\t51\t74\t42\t53\t52\t67\t20\t18\t14\t15\t16\t17\t20\t20\t17\t16\t13\t9\t18\t11\t61\t23\t13\t8\t51\t31\t22\t22\t15\t21\t15\t40\t48\t14\t43\t13\t40\t38\t39\t38\t39\t24\t43\t28\t16\t27\t19\t33\t8\t21\t33\t9\t24\t31\t31\t28\t65\t42\t40\t45\t16\t57\t50\t68\t27\t29\t21\t55\t17\t22\t112\t78\t29\t29\t23\t24\t30\t10\t15\t50\t41\t41\t17\t57\t44\t32\t32\t21\t5\t26\t37\t84\t30\t44\t22\t44\t11\t9\t29\t38\t20\t34\t23\t26\t42\t56\t15\t45\t68\t29\t62\t46\t58\t61\t34\t42\t41\t57\t81\t10\t30\t39\t56\t27\t24\t26\t28\t26\t28\t24\t21\t21\t22\t26\t20\t20\t21\t39\t45\t40\t22\t55\t39\t29\t43\t51\t12\t15\t25\t68\t25\t43\t42\t18\t20\t77\t14\t47\t24\t20\t18\t26\t14\t7\t9\t22\t14\t80\t44\t49\t19\t13\t10\t54\t34\t20\t43\t10\t14\t28\t20\t35\t59\t27\t58\t49\t31\t10\t24\t6\t15\t43\t34\t11\t40\t29\t9\t14\t83\t52\t50\t44\t35\t44\t9\t13\t21\t23\t44\t37\t27\t35\t19\t7\t16\t42\t52\t15\t46\t49\t34\t21\t52\t69\t18\t47\t44\t16\t37\t29\t51\t33\t52\t40\t38\t21\t30\t91\t23\t22\t29\t46\t36\t44\t14\t22\t31\t27\t32\t32\t28\t20\t28\t44\t59\t103\t43\t9\t33\t24\t44\t63\t43\t34\t55\t36\t52\t15\t43\t80\t101\t84\t86\t100\t16
\t9\t14\t80\t81\t125\t95\t29\t13\t85\t62\t168\t125\n-Testosterone\t14\t8\t13\t13\t15\t12\t10\t14\t12\t24\t36\t18\t16\t10\t17\t16\t9\t9\t10\t9\t10\t9\t28\t12\t22\t25\t19\t44\t39\t48\t22\t35\t46\t19\t38\t25\t101\t27\t15\t18\t17\t26\t51\t2\t38\t36\t39\t37\t37\t8\t6\t20\t22\t21\t25\t18\t21\t16\t17\t15\t18\t23\t24\t19\t21\t15\t15\t16\t16\t16\t9\t15\t39\t46\t43\t44\t29\t20\t10\t46\t37\t36\t40\t34\t43\t36\t30\t41\t51\t33\t19\t20\t24\t17\t22\t41\t35\t38\t33\t36\t65\t34\t39\t36\t52\t13\t12\t10\t11\t11\t11\t13\t14\t14\t11\t7\t3\t10\t5\t51\t19\t7\t3\t41\t25\t19\t16\t11\t17\t14\t35\t48\t14\t41\t15\t35\t37\t37\t38\t37\t22\t44\t26\t15\t29\t16\t29\t8\t21\t32\t10\t24\t32\t30\t28\t63\t38\t34\t42\t16\t49\t41\t46\t19\t20\t15\t44\t13\t16\t91\t63\t24\t21\t19\t20\t27\t10\t13\t32\t27\t27\t15\t51\t30\t21\t27\t19\t3\t23\t35\t72\t29\t44\t18\t37\t8\t8\t26\t33\t17\t31\t21\t23\t32\t47\t13\t44\t56\t28\t60\t39\t52\t60\t37\t39\t38\t48\t78\t10\t26\t40\t49\t24\t22\t22\t24\t21\t24\t18\t15\t17\t18\t21\t15\t17\t17\t33\t39\t35\t18\t48\t38\t29\t39\t42\t12\t14\t18\t60\t23\t36\t36\t16\t16\t61\t13\t42\t21\t19\t16\t26\t14\t7\t8\t19\t14\t64\t41\t42\t19\t12\t11\t46\t34\t19\t40\t7\t15\t27\t20\t29\t49\t27\t55\t41\t30\t10\t21\t6\t15\t38\t28\t12\t37\t28\t7\t14\t75\t37\t43\t43\t33\t43\t9\t12\t20\t14\t39\t33\t21\t33\t18\t5\t13\t41\t45\t10\t44\t44\t28\t20\t43\t57\t15\t41\t38\t15\t30\t27\t46\t30\t49\t39\t36\t20\t27\t70\t22\t20\t25\t44\t27\t45\t13\t18\t26\t18\t26\t30\t21\t18\t25\t34\t45\t86\t38\t7\t24\t22\t32\t50\t37\t25\t48\t34\t47\t14\t37\t66\t81\t71\t74\t84\t15\t8\t12\t68\t60\t96\t82\t27\t13\t72\t60\t125\t130\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/matches_test7_out.tsv
--- a/test-data/matches_test7_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,387 +0,0 @@\n-\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n-Perylene_2H12\t0\t0\t2\t0\t1\t0\t0\t1\t0\t0\t0\t0\t2\t0\t0\t3\t0\t0\t0\t1\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\n-Perylene\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t0\t1\t1\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\
t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Phenanthrene_2H10\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t2\t0\t1\t0\t0\t0\t0\t1\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\n-Phenanthrene\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Anthracene\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t2\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Acenaphthylene\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\
t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Acenaphthene\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t3\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Fluoranthene\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t1\t0\t1\t0\t0\t0\t2\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Pyrene\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t2\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0'..b'ph_isomer2\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Spirodiclofen\t3\t2\t0\t0\t0\t0\t4\t1\t0\t0\t1\t1\t4\t0\t0\t4\t3\t0\t1\t2\t4\t0\t2\t0\t0\t1\t0\t0\t2\t1\t0\t0\t3\t1\t0\t0\t1\t1\t1\t1\t0\t0\t2\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t3\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t1\t1\t1\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Spiromesifen\t1\t1\t0\t1\t0\t0\t2\t2\t0\t1\t1\t0\t2\t1\t0\t5\t0\t0\t0\t1\t3\t0\t3\t4\t0\t1\t2\t1\t2\t1\t0\t0\t1\t7\t0\t0\t2\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t3\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t2\t0\t1\t0\t0\t0\t0\t1\t2\t0\t1\t0\t0\t0\t0\t0\t2\t0\t0\t3\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\n-Spirotetramat\t2\t2\t0\t1\t0\t0\t2\t5\t0\t2\t1\t0\t6\t1\t0\t7\t1\t0\t1\t2\t4\t0\t4\t8\t0\t3\t2\t1\t2\t1\t0\t0\t3\t7\t0\t0\t3\t0\t0\t4\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t3\t0\t0\t3\t0\t0\t3\t0\t0\t1\t0\t0\t1\t0\t0\t3\t1\t3\t0\t0\t0\t0\t0\t2\t2\t3\t0\t1\t0\t0\t1\t0\t0\t3\t0\t2\t3\t2\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t2\t1\t0\t1\t1\t0\t0\t1\t2\t0\t1\t0\t2\t0\t0\t1\t1\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t1\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\n-17-alpha-Ethynylestradiol\t1\t0\t0\t2\t0\t0\t2\t2\t0\t1\t1\t0\t4\t1\t1\t5\t1\t0\t0\t1\t2\t0\t3\t4\t0\t2\t2\t1\t2\t1\t0\t0\t3\t7\t0\t0\t1\t1\t0\t4\t0\t0\t2\t0\t0\t0\t0\t
0\t0\t1\t0\t1\t0\t0\t0\t2\t0\t1\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t1\t0\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t2\t1\t0\t3\t1\t0\t0\t0\t0\t0\t1\t0\t0\t2\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t2\t1\t0\t0\n-Bisphenol A\t0\t0\t0\t0\t0\t0\t1\t1\t0\t1\t0\t0\t1\t0\t0\t3\t1\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t3\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-4-tert-Octylphenol\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Estrone\t1\t0\t0\t0\t0\t0\t1\t1\t0\t1\t1\t0\t3\t1\t1\t6\t0\t0\t0\t2\t1\t0\t2\t7\t0\t1\t3\t1\t2\t1\t0\t0\t3\t7\t0\t0\t0\t1\t0\t3\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t1\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t3\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t1\t0\t1\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\n-17-beta
-Estradiol\t2\t0\t0\t0\t0\t0\t4\t2\t0\t1\t1\t0\t2\t0\t1\t4\t0\t0\t0\t0\t1\t0\t4\t4\t0\t0\t0\t1\t1\t0\t1\t0\t1\t6\t0\t0\t1\t1\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t1\t0\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t2\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n-Progesterone\t2\t3\t0\t2\t0\t0\t3\t3\t0\t2\t2\t0\t4\t2\t1\t6\t1\t0\t0\t2\t2\t0\t4\t9\t0\t4\t3\t1\t5\t2\t1\t0\t3\t6\t0\t0\t3\t0\t2\t4\t0\t0\t2\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t1\t1\t1\t1\t1\t2\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t2\t1\t4\t0\t1\t0\t0\t1\t2\t2\t2\t0\t1\t0\t0\t2\t0\t0\t2\t2\t3\t3\t2\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t2\t1\t0\t0\t1\t0\t1\t0\t2\t0\t1\t0\t1\t0\t0\t1\t2\t2\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t2\t0\t0\t0\t2\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t2\t1\t0\t0\n-Testosterone\t1\t1\t0\t1\t1\t0\t0\t2\t0\t1\t1\t0\t4\t1\t1\t5\t0\t0\t0\t1\t2\t0\t3\t7\t0\t2\t2\t1\t4\t1\t0\t0\t3\t3\t0\t0\t1\t0\t1\t2\t0\t0\t3\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t1\t1\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t4\t0\t1\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t2\t0\t0\t2\t2\t3\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t1\t0\t2\t0\t2\t0\t1\t0\t0\t0\t0\t1\t1\t2\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t2\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/recetox_gc-ei_ms_20201028.msp
--- a/test-data/recetox_gc-ei_ms_20201028.msp Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b'@@ -1,31986 +0,0 @@\n-NAME: Perylene_2H12\r\n-SCANNUMBER: -1\r\n-RETENTIONTIME: -1\r\n-RETENTIONINDEX: 2876\r\n-PRECURSORMZ: 264.16858\r\n-PRECURSORTYPE: [M]+\r\n-IONMODE: Positive\r\n-SPECTRUMTYPE: Centroid\r\n-FORMULA: C20H12\r\n-INCHIKEY: CSHWQDPOILHKBI-AQZSQYOVSA-N\r\n-INCHI: \r\n-SMILES: [2H]C1=C(C2=C3C(=C1[2H])C4=C(C(=C(C5=C4C(=C(C(=C5[2H])[2H])[2H])C3=C(C(=C2[2H])[2H])[2H])[2H])[2H])[2H])[2H]\r\n-AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\r\n-COLLISIONENERGY: 70eV\r\n-INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\r\n-INSTRUMENTTYPE: GC-EI-Orbitrap\r\n-IONIZATION: EI+\r\n-LICENSE: CC BY-NC\r\n-COMMENT: \r\n-Num Peaks: 33\r\n-116.05576\t29277\r\n-118.06992\t49651\r\n-128.0558\t37001\r\n-130.06996\t78584\r\n-130.57159\t17533\r\n-132.08408\t65686\r\n-132.5858\t12593\r\n-207.0322\t39569\r\n-222.08282\t13141\r\n-223.06346\t20762\r\n-225.04277\t18058\r\n-227.02202\t26370\r\n-232.11204\t30354\r\n-236.1405\t22796\r\n-252.09322\t8564\r\n-256.11212\t41765\r\n-257.11557\t8688\r\n-258.12622\t21742\r\n-259.13446\t11564\r\n-260.14041\t248997\r\n-261.14358\t51721\r\n-262.15466\t33597\r\n-263.16254\t63732\r\n-264.16858\t829577\r\n-265.01968\t18286\r\n-265.17191\t176460\r\n-266.17523\t18876\r\n-283.03036\t10261\r\n-287.00632\t11352\r\n-295.10288\t26727\r\n-299.06152\t33379\r\n-359.0282\t67046\r\n-400.98447\t17406\r\n-\r\n-NAME: Perylene\r\n-SCANNUMBER: -1\r\n-RETENTIONTIME: -1\r\n-RETENTIONINDEX: 2886.9\r\n-PRECURSORMZ: 252.09323\r\n-PRECURSORTYPE: [M]+\r\n-IONMODE: Positive\r\n-SPECTRUMTYPE: Centroid\r\n-FORMULA: C20H12\r\n-INCHIKEY: CSHWQDPOILHKBI-UHFFFAOYSA-N\r\n-INCHI: \r\n-SMILES: C1=CC2=C3C(=C1)C1=CC=CC4=C1C(=CC=C4)C3=CC=C2\r\n-AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\r\n-COLLISIONENERGY: 70eV\r\n-INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\r\n-INSTRUMENTTYPE: GC-EI-Orbitrap\r\n-IONIZATION: EI+\r\n-LICENSE: CC BY-NC\r\n-COMMENT: \r\n-Num Peaks: 19\r\n-112.03071\t49892\r\n-113.03854\t87510\t"Theoretical m/z 113.039125, Mass diff 0 (0 ppm), 
Formula C9H5"\r\n-124.03076\t100146\r\n-124.53242\t24923\r\n-125.03855\t179254\t"Theoretical m/z 125.039125, Mass diff 0 (0 ppm), Formula C10H5"\r\n-125.54019\t49039\r\n-126.04636\t131679\r\n-126.54804\t36313\r\n-222.04645\t28905\r\n-224.06192\t55632\r\n-226.04175\t37413\r\n-246.04646\t23286\r\n-248.06204\t140007\r\n-249.07072\t62236\t"Theoretical m/z 249.070425, Mass diff -0.001 (0 ppm), Formula C20H9"\r\n-250.07765\t641789\r\n-251.07967\t137600\r\n-252.09323\t1955166\t"Theoretical m/z 252.093354, Mass diff 0 (0.49 ppm), SMILES C1=CC=2C=CC=C3C4=CC=CC5=CC=CC(C(=C1)C23)=C54, Annotation [C20H12]+, Rule of HR False"\r\n-253.09656\t402252\r\n-254.09985\t39987\r\n-\r\n-NAME: Phenanthrene_2H10\r\n-SCANNUMBER: -1\r\n-RETENTIONTIME: -1\r\n-RETENTIONINDEX: 1827.1\r\n-PRECURSORMZ: 188.14029\r\n-PRECURSORTYPE: [M]+\r\n-IONMODE: Positive\r\n-SPECTRUMTYPE: Centroid\r\n-FORMULA: C14H10\r\n-INCHIKEY: YNPNZTXNASCQKK-LHNTUAQVSA-N\r\n-INCHI: \r\n-SMILES: [2H]C1=C(C(=C2C(=C1[2H])C(=C(C3=C(C(=C(C(=C32)[2H])[2H])[2H])[2H])[2H])[2H])[2H])[2H]\r\n-AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\r\n-COLLISIONENERGY: 70eV\r\n-INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\r\n-INSTRUMENTTYPE: GC-EI-Orbitrap\r\n-IONIZATION: EI+\r\n-LICENSE: CC BY-NC\r\n-COMMENT: \r\n-Num Peaks: 17\r\n-76.02767\t185421\r\n-78.0418\t256858\r\n-80.05586\t881271\r\n-90.04181\t200162\r\n-92.06206\t537968\r\n-94.06999\t628791\r\n-156.08402\t836513\r\n-158.09808\t477819\r\n-160.11218\t2421148\r\n-161.11554\t310248\r\n-176.10866\t308983\r\n-184.11224\t2784543\r\n-185.11562\t445833\r\n-186.12637\t1283282\r\n-188.14029\t15115275\r\n-189.1436\t2312386\r\n-190.14688\t151400\r\n-\r\n-NAME: Phenanthrene\r\n-SCANNUMBER: -1\r\n-RETENTIONTIME: -1\r\n-RETENTIONINDEX: 1832.9\r\n-PRECURSORMZ: 178.0775\r\n-PRECURSORTYPE: [M]+\r\n-IONMODE: Positive\r\n-SPECTRUMTYPE: Centroid\r\n-FORMULA: C14H10\r\n-INCHIKEY: YNPNZTXNASCQKK-UHFFFAOYSA-N\r\n-INCHI: \r\n-SMILES: C1=CC2=C(C=C1)C1=C(C=CC=C1)C=C2\r\n-AUTHORS: Price et al., 
RECETOX, Masaryk University (CZ)\r\n-COLLISIONENERGY: 70eV\r\n-INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\r\n-INSTRUMENTTYPE: GC-EI-Orbitrap\r\n-IONIZATION: EI+\r\n-LICENSE: CC BY-NC\r\n-COMMENT: \r\n-Num Peaks: 19\r\n-74.01508\t137808\t"Theoretical m/z 74.01565, Mass diff 0 (0 ppm), Formula C6H2"\r\n-75.02295\t278714\t"Theoretical m/z 75.023475, Mass diff 0 (0 ppm), Formula C6H3"\r\n-76.03075\t6'..b'pm), SMILES C=C2CCC1CC(C)CCC1C2(C)C, Annotation [C14H24-7H]+, Rule of HR True"\r\n-187.14806\t422332\t"Theoretical m/z 187.148122, Mass diff 0 (0.33 ppm), SMILES CC2CCC1C(CCCC1(C)(C))C2(C), Annotation [C14H26-7H]+, Rule of HR True"\r\n-188.1559\t151252\t"Theoretical m/z 188.155947, Mass diff 0 (0.25 ppm), SMILES CC2CCC1C(CCCC1(C)(C))C2(C), Annotation [C14H26-6H]+, Rule of HR False"\r\n-189.12735\t68862\t"Theoretical m/z 189.127389, Mass diff 0 (0.21 ppm), SMILES O=C2C=C1CCCC(CC)C1(C)CC2, Annotation [C13H20O-3H]+, Rule of HR True"\r\n-189.16364\t163919\t"Theoretical m/z 189.163772, Mass diff 0 (0.7 ppm), SMILES CC2CCC1C(CCCC1(C)(C))C2(C), Annotation [C14H26-5H]+, Rule of HR True"\r\n-190.13504\t97146\r\n-195.11685\t57370\t"Theoretical m/z 195.117375, Mass diff 0 (0 ppm), Formula C15H15"\r\n-197.13249\t50230\t"Theoretical m/z 197.132481, Mass diff 0 (0.04 ppm), SMILES C=C3CCC2C(CCC1CCCC12)C3C, Annotation [C15H24-7H]+, Rule of HR True"\r\n-199.14803\t221936\t"Theoretical m/z 199.148122, Mass diff 0 (0.46 ppm), SMILES C=C2CCC1C(C)C(C)CCC1C2(C)C, Annotation [C15H26-7H]+, Rule of HR True"\r\n-200.15579\t108028\r\n-201.16364\t216321\t"Theoretical m/z 201.163772, Mass diff 0 (0.65 ppm), SMILES C=C2CCC1C(C)C(C)CCC1C2(C)C, Annotation [C15H26-5H]+, Rule of HR True"\r\n-202.17162\t208618\r\n-203.14304\t1200123\t"Theoretical m/z 203.143035, Mass diff 0 (0.02 ppm), SMILES OC3CCC2C3(CCC1C(C)CCCC12), Annotation [C14H24O-5H]+, Rule of HR True"\r\n-204.14627\t283454\r\n-206.16646\t32118\r\n-209.13243\t45976\t"Theoretical m/z 209.133026, Mass diff 0 (0 ppm), Formula 
C16H17"\r\n-211.14809\t272618\t"Theoretical m/z 211.148132, Mass diff 0 (-0.2 ppm), SMILES CC1=C(C)C2=C([CH+]CCC=C(C)\\C=C/2)C=C1, Annotation [C16H19]+, Rule of HR True"\r\n-212.15134\t57168\r\n-213.16373\t355360\t"Theoretical m/z 213.163773, Mass diff 0 (-0.2 ppm), SMILES CC1=C(C)C2=C([CH+]CCC=C(C)CC2)C=C1, Annotation [C16H21]+, Rule of HR True"\r\n-214.16698\t92310\r\n-215.143\t60304\t"Theoretical m/z 215.143035, Mass diff 0 (0.16 ppm), SMILES OC3CCC2C3(CCC1C(C(=C)CCC12)C), Annotation [C15H24O-5H]+, Rule of HR True"\r\n-216.15102\t55312\r\n-217.15874\t113508\t"Theoretical m/z 217.158691, Mass diff 0 (0.23 ppm), SMILES OC3CCC2C3(CCC1C2(CCCC1(C)(C))), Annotation [C15H26O-5H]+, Rule of HR True"\r\n-218.16704\t51076\r\n-226.17177\t37673\r\n-227.1797\t204277\t"Theoretical m/z 227.179433, Mass diff 0 (1.18 ppm), SMILES C=C2CCC1C(CC)C(C)CCC1C2(C)CC, Annotation [C17H30-7H]+, Rule of HR True"\r\n-228.1873\t842856\r\n-229.1588\t359919\t"Theoretical m/z 229.158691, Mass diff 0 (0.48 ppm), SMILES OC3CCC2C3(CCC1C2(CCC(=C)C1(C)(C))), Annotation [C16H26O-5H]+, Rule of HR True"\r\n-230.16186\t41138\r\n-231.17433\t428563\t"Theoretical m/z 231.174335, Mass diff 0 (0.02 ppm), SMILES O=C3C=C2CCC1C(C)CCCC1C2(C)CC3, Annotation [C16H24O-H]+, Rule of HR True"\r\n-232.17703\t61957\r\n-237.16373\t184777\t"Theoretical m/z 237.164326, Mass diff 0 (0 ppm), Formula C18H21"\r\n-238.16693\t38109\r\n-241.15854\t66162\t"Theoretical m/z 241.158691, Mass diff 0 (0.62 ppm), SMILES O=C3C=C2CCC1C(CC)CCCC1C2(C)CC3, Annotation [C17H26O-5H]+, Rule of HR True"\r\n-242.16649\t51489\r\n-245.19052\t102650\t"Theoretical m/z 245.189996, Mass diff 0.001 (2.14 ppm), SMILES OC1CCC2C3CCC(=C)C(C)(C)C3(CCC12(C)), Annotation [C17H28O-3H]+, Rule of HR True"\r\n-246.19786\t1126362\r\n-247.2011\t212107\r\n-252.18724\t143505\r\n-255.17436\t288345\t"Theoretical m/z 255.174341, Mass diff 0 (0.08 ppm), SMILES O=C3C=C2CCC1C4CCCC4(CCC1C2(C)CC3), Annotation [C18H26O-3H]+, Rule of HR 
True"\r\n-256.17764\t54890\r\n-259.16943\t50245\t"Theoretical m/z 259.169244, Mass diff 0 (0.72 ppm), SMILES O=C3C=C2CCC1C(C)C(CO)CCC1C2(C)CC3, Annotation [C17H26O2-3H]+, Rule of HR True"\r\n-260.17758\t70396\r\n-270.19791\t397018\r\n-271.20062\t89701\r\n-273.18549\t199263\t"Theoretical m/z 273.184894, Mass diff 0.001 (2.18 ppm), SMILES O=C3C=C2CCC1C4CCC(O)C4(CCC1C2(C)CC3), Annotation [C18H26O2-H]+, Rule of HR True"\r\n-274.18863\t88305\r\n-288.20841\t1123316\t"Theoretical m/z 288.208375, Mass diff 0 (0.12 ppm), SMILES O=C4C=C3CCC1C(CCC2(C)(C(O)CCC12))C3(C)CC4, Annotation [C19H28O2]+, Rule of HR False"\r\n-289.21173\t220898\r\n-\r\n-\r\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/scores_test1_out.tsv
--- a/test-data/scores_test1_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,175 +0,0 @@\n-\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n-C001\t1.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.01131824210476606\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.048050183216295894\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-C002\t0.0\t1.0\t0.0\t
0.0\t0.0\t0.0\t0.0\t9.826519226227062e-05\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.058818978905494305\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.012123553350886735\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.003604401443170206\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-C003\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.001996725260781092\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.003441767933265955\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-C004\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0
\t0.0\t0.0\t0.0\t0.0\t2.962804993140071e-05\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0040278645118103865\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-C005\t0.0\t0.0\t0.0\t0.0\t0.9999999999999992\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t'..b'.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.18149359661870704\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-C170\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.2793597601790586\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0
\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\t0.0\n-C171\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.030541540271258622\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\n-C172\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.9156381551854462\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.
0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\n-C173\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.00045173712879657656\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.14221557456489292\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\n-C174\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/scores_test3_out.tsv
--- a/test-data/scores_test3_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,387 +0,0 @@\n-\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n-Perylene_2H12\t0.0\t0.0\t0.0005256270959446041\t0.0\t0.03073097535576865\t0.0\t0.0\t6.245570704427149e-05\t0.0\t0.0\t0.0\t0.0\t0.004564716964324222\t0.0\t0.0\t0.013203066603708824\t0.0\t0.0\t0.0\t0.00039214513461787934\t0.0\t0.0\t0.0007918167287744314\t0.0\t0.0\t0.0004447561432835879\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.014053019016690342\t0.0\t0.0\t0.0\t0.0\t0.0\t0.010864712316628122\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.1457986453664692\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.07136533213674005\t0.0\t0.0\t0.0\t0.0\t0.0\t0.008502864326957613\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.008332485011325066\t0.06707997408159612\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.014331972335452473\t0.0\t0.00279044697331512\t0.0\t0.0\t0.0\t0.0\t0.08644538826313944\t0.0\t0.0230
223502665467\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.05194618366505897\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.07451431952403163\t0.0\t0.0\t0.0\t0.0\t0.008606424963572753\t0.0\t0.0\t0.0\t0.0\t0.0\t0.029465908012253836\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.06765194944236241\t0.0\t0.0\n-Perylene\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0032741303817077237\t0.0\t0.01059895859620056\t0.0\t0.0\t0.011988179251417755\t0.004445067503941489\t0.0\t0.0\t0.0\t0.0\t0.0\t0.010205422020394999\t0.0\t0.0\t0.07094451588225481\t0.0\t0.0\t0.0012435925952213776\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0028113782310797255\t0.0\t0.0\t0.0015057844692663734\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.015722861787553524\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.04875136828344371\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.023395854503055747\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.07014255094522087\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-Phenanthrene_2H10\t0.0024478437470211957\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.044583058787688194\t0.0\t0.0\t0.010556784103056164\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.053243824199748255\t0.0\t0.7408591267092633\t0.0\t0.0\t0.0\t0.0\t0.12202560685242986\t0.04568269717012136\t0.004157278401108382\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\
t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.028649962860904238\t0.0\t0.0391645806143903\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.008485163950429123\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.004892255878207329\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.027071584755955534\t0.0\t0.0\t0.0\n-Phenanthrene\t0.00561720665430217\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0014924956391185538\t0.12453944133920959\t0.0\t0.087078422418'..b'5369148999\t0.0\t0.0\t0.0\t0.05477359359289294\t0.014982137997848574\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.011712224528606202\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-Progesterone\t0.009204773873174418\t0.0003433200025161085\t0.0\t0.0007924296222333302\t0.0\t0.0\t0.009441153443328694\t0.005947519671344408\t0.0\t0.0005356814581771544\t0.006215857342936553\t0.0\t0.009417667003961789\t0.009918679539108183\t0.00023339501999512072\t0.02671768716952186\t0.00030790986345821436\t0.0\t0.0\t0.0013743163821902838\t0.01723317359032806\t0.0\t0.031565466787107484\t0.012448459343477094\t0.0\t0.007750527312298496\t0.0070234525583043545\t0.02059761160321701\t0.023913761352649478\t0.011281962106545012\t1.6426994248357484e-05\t0.0\t0.03697516657930819\t0.033662224880288756\t0.0\t0.0\t0.023540677910418206\t0.0\t0.036138976947232074\t0.02542494090112982\t0.0\t0.0\t0.011503400057545196\t0.0\t0.00020822196303031898\t0.0\t0.0\t0.0\t0.0\t0.0014763317286047445\t0.0\t0.0012583838846539634\t0.0\t0.003999037208194656\t0.013710430439412245\t0.0013524730258847118\t0.007867754340786993\t0.040527384587716785\t0.010996257146538806\t0.0\t0.0\t0.06835446607134321\t0.0\t0.0\t0.008591363167784043\t0.0\t0.0\t0.0\t0.0\t0.0\t0.007090284250167511\t0.008465564938609326\t0.080408
14196887734\t0.0\t0.028294996723359764\t0.0\t0.0\t0.0038398141926578064\t0.16023981186600048\t0.04805946943116568\t0.037035561711554706\t0.0\t0.0005120942309216829\t0.0\t0.0\t0.03494182656191998\t0.0\t0.0\t0.027888357150312005\t0.01258535522221259\t0.03740123828771993\t0.008517825868349588\t0.00913703375472102\t0.0\t0.0\t0.0\t0.0\t0.0\t0.029300775267851735\t0.0\t0.0\t0.0\t0.01295087988307018\t0.0005955124138932553\t0.0\t0.0\t0.0\t0.005304965226057589\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.039134050766579234\t0.2714869727438596\t0.003527160692631183\t0.0\t0.0\t0.020497841819279862\t0.0\t0.002511329287084922\t0.0\t0.3500845873047567\t0.0\t0.002239902702309837\t0.0\t0.005491138035803363\t0.0\t0.0\t0.011672805021412769\t0.02568290039984708\t0.07006608189710377\t0.018632962351792192\t0.0\t0.04153373284622605\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.00786791970310509\t0.0\t0.047481418502903334\t0.0\t0.0\t0.0\t0.10974594417370813\t0.034291658672408076\t0.0\t0.023165391809283516\t0.0\t0.0\t0.0\t0.0002833417563650782\t0.0\t0.0\t0.0\t0.026807362599866824\t0.003975994609085822\t0.0\t0.0\t0.0\t0.0\t0.0\t0.06458445415629567\t0.013061309028202963\t0.0\t0.0\n-Testosterone\t0.00963321193050066\t0.00024864315729290006\t0.0\t0.00023222574210458811\t0.0009261428396286391\t0.0\t0.0\t0.00040034384039336243\t0.0\t6.734322542065858e-05\t0.0016889974488375878\t0.0\t0.1780813812315969\t0.007271975837211051\t0.0001534940265342155\t0.027912903539727703\t0.0\t0.0\t0.0\t0.0005797401705402813\t0.01109882605223559\t0.0\t0.024485309434567656\t0.020836980610370613\t0.0\t0.004730656796420955\t0.009055625850088012\t0.01764485751937845\t0.0342974876068616\t0.003171910470299864\t0.0\t0.0\t0.039580956813763224\t0.008699485073663131\t0.0\t0.0\t0.027921629937492445\t0.0\t0.011883152521337894\t0.00473955367711716\t0.0\t0.0\t0.06041370798509162\t0.0\t0.042697154051077546\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0028714022903154834\t0.021418156386493012\t0.0015186515255164064\t0.006270179831850896\t0
.029915893967898583\t0.00688460931497788\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.001333543171051696\t0.0\t0.08702752210600657\t0.0\t0.03171198034450119\t0.0\t0.0\t0.0\t0.0\t0.0007660193758873158\t0.010813507002141582\t0.0\t0.0\t0.0\t0.0\t0.004200894168035819\t0.0\t0.0\t0.02349484368553467\t0.01816654272894712\t0.06339867284692742\t0.00859117181156952\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.11646566920503162\t0.0\t0.0\t0.0\t0.0\t0.0031342530947578136\t0.0\t0.15489171142643712\t0.0\t0.013048242174815912\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.001658310433454475\t0.03949452321180806\t0.0\t0.0\t0.0\t0.021990926351807643\t0.0\t0.13014922112429483\t0.0\t0.18331721895001493\t0.0\t0.0014411200837741657\t0.0\t0.0\t0.0\t0.0\t0.010921053413542842\t0.00943243671087211\t0.06421886680272976\t0.025882956568067213\t0.0\t0.03618383380922253\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0006655628265325035\t0.0\t0.026485058850513155\t0.0\t0.0\t0.0\t0.10783284756046711\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.12344754627650137\t0.0\t0.0\t0.0\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/scores_test4_out.tsv
--- a/test-data/scores_test4_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b"@@ -1,387 +0,0 @@\n-\tPerylene_2H12\tPerylene\tPhenanthrene_2H10\tPhenanthrene\tAnthracene\tAcenaphthylene\tAcenaphthene\tFluoranthene\tPyrene\tpara-Terphenyl\tRetene\tBenzo[b]naphtho[2,1-d]thiophene\t2,3-Benzofluorene\tBenzo[ghi]fluoranthene\tTriphenylene\tBenzanthracene/Benzophenanthrene\tBenzofluoranthene\tBenzo(k)fluoranthene\tBenzo[e]pyrene\tBenzo(a)pyrene\tIndeno[1,2,3-cd]pyrene\tBenzo(g,h,i)perylene\tAnthanthrene\tDibenzanthracene\tCoronene\tDicofol\tBenzophenone\t2-tert-Butyl-4-methoxyphenol\tButylated hydroxytoluene\tBumetrizole\t4-Methylbenzophenone\t2,4,6-Tribromophenol\t2,6-Dichloro-4-nitroaniline\t1-Methylphenanthrene\tTriclosan\tDrometrizole\tEnzacamene\t2,4-Di-tert-butyl-6-(5-chloro-2H-benzotriazol-2-yl)phenol\tOctrizole\t1,2,7,9-Tetrachlorodibenzofuran\t2,2',3,4,5,5',6-Heptachlorobiphenyl\t2,4,6-Trichlorobiphenyl\t2,2',3,3',4,5',6,6'-Octachlorobiphenyl\tMirex\tbeta-Hexachlorocyclohexane\talpha-1,2,3,4,5,6-Hexachlorocyclohexane\tLindane\tdelta-Hexachlorocyclohexane\tepsilon-Hexachlorocyclohexane\tPentachlorobenzene\tHexachlorobenzene\t2,4'-Dichlorodiphenyldichloroethylene\t2,4'-Dichlorodiphenyldichloroethane\t2,4'-Dichlorodiphenyltrichloroethane\t1,2,7,9-Tetrachlorodibenzo-p-dioxin\t2,4,4'-Trichlorobiphenyl\t2,2',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5-Pentachlorobiphenyl\t2,2',3,4,4',5'-Hexachlorobiphenyl\t2,2',4,4',5,5'-Hexachlorobiphenyl\t2,2',3,4,4',5,5'-Heptachlorobiphenyl\t2,2',5,5'-Tetrachlorobiphenyl\t2,3',4,6-Tetrachlorobiphenyl\t2,3',5',6-Tetrachlorobiphenyl\t2,2',3,4',5-Pentachlorobiphenyl\t2,3,3',4,5-Pentachlorobiphenyl\t3,3',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5',6-Hexachlorobiphenyl\t2,3,3',4,5,6-Hexachlorobiphenyl\t2,3,3',4',5',6-Hexachlorobiphenyl\t2,3,3',4',5,6-Hexachlorobiphenyl\t2,3,3',4',5,5',6-Heptachlorobiphenyl\tcis-Prallethrin\ttrans-Prallethrin\tcis-Resmethrin\ttrans-Resmethrin\tcis-Tetramethrin\ttrans-Tetramethrin\tBifenthrin\tFenpropathrin\tcis-Phenothrin\ttrans-Phenothrin\tcis-Cyphenothrin\ttrans-Cyphenothrin\tFlucythri
nate_isomer1\tFlucythrinate_isomer2\tcis-Fenvalerate\ttrans-Fenvalerate\tDeltamethrin\tChlorpyrifos oxon\tlambda-Cyhalothrin\tTefluthrin\tTransfluthrin\tcis-Permethrin\ttrans-Permethrin\tcis-Allethrin\ttrans-Allethrin\tcis-Cypermethrin_isomer1\ttrans-Cypermethrin_isomer1\tcis-Cypermethrin_isomer2\ttrans-Cypermethrin_isomer2\tcis-Cyfluthrin_isomer1\ttrans-Cyfluthrin_isomer1\tcis-Cyfluthrin_isomer2\ttrans-Cyfluthrin_Isomer2\t1,2,3,4,7,8-Hexachlorodibenzo-p-dioxin\t1,2,3,4,6,7,8-Heptachlorodibenzo-p-dioxin\tOctachlorodibenzo-p-dioxin\tOctachlorodibenzofuran\t1,2,3,7,8-Pentachlorodibenzofuran\t1,2,3,4,7,8-Hexachlorodibenzofuran\t1,2,3,4,6,7,8-Heptachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzo-p-dioxin\t1,2,3,7,8-Pentachlorodibenzo-p-dioxin\t2,3,4,5-Tetrabromo-6-chlorotoluene\t2,3,4,5,6-Pentabromotoluene\t2,3,4,5,6-Pentabromoethylbenzene\t2,3,5,6-Tetrabromo-p-xylene\tAllyl 2,4,6-tribromophenyl ether\t2-Bromoallyl(2,4,6-tribromophenyl) ether\tPentabromobenzene\tHexabromobenzene\t2,3,4,5,6-Pentabromobenzyl alcohol\t2-Ethylhexyl 2,3,4,5-Tetrabromobenzoate\tsyn-Dechlorane plus\tanti-Dechlorane plus\talpha-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\tbeta-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\t1,2,5,6-Tetrabromocyclooctane\t1,1-Dibromo-2,3,3,4,4,5-hexachloro-2-cyclopenta-2,4-dien-1-ylcyclooctane\talpha-Amylcinnamaldehyde\ttrans-Cinnamaldehyde\tCitral (Geranial)\t1-Fluronaphthalene\talpha-Hexylcinnamaldehyde\tLilial\talpha-Amylcinnamyl alcohol\tEugenol\tIsoeugenol\t4-Methoxybenzyl alcohol\tMethyleugenol\tCinnamyl alcohol\tBenzyl alcohol\tEstragole\tBenzyl benzoate\tBenzyl cinnamate\tBenzyl salicylate\tCamphor\tEucalyptol\tCoumarin\tLimonene\tIsomethyl-alpha-ionone\tdelta-Iraldeine\tSafrole\tCashmeran\tCelestolide\tPhantolide\tTonalide\tTraseolide\tGalaxolide\tAldrin\tEndosulfan\tHeptachlor\tcis-Heptachlor epoxide\tEndosulfan sulphate\tEndrin ketone\ttrans-Chlordane\tcis-Chlordane\tEndrin 
aldehyde\tEndrin\t4,4'-Dichlorodiphenyldichloroethylene\tMethoxychlor\t4,4'-Dichlorodiphenyldichloroethane\t4,4'-Dichlorodiphenyltrichloroethane\tTris(4-tert-butylphenyl) phosphate\tTri-n-butyl-phosphate\tTris(1,3-dichloro-2-propy"..b'99004\t0.25699522150266857\t0.10086896866641386\t0.19470204063894617\t0.11098877289750769\t0.006075991834095414\t0.12927366381808264\t0.2082286991025265\t0.27240094810916426\t0.1654349689057302\t0.19840999142874\t0.16569982850423232\t0.2161122709425279\t0.14188794086609754\t0.13892041895889107\t0.163316162934255\t0.19714612348281121\t0.11328276368401106\t0.1797393737639574\t0.11912510425789868\t0.1513410655357927\t0.17376963876857818\t0.11727276196549535\t0.18242398225791773\t0.42587475586474854\t0.26019712746688456\t0.14368704499704515\t0.2071878076412335\t0.09453837918890001\t0.17883495196186588\t0.230407695094039\t0.2003708220640954\t0.28221288790938787\t0.1632240149541304\t0.33569524175870596\t0.3064105089065634\t0.06757663229398125\t0.1875387758604876\t0.14809372567415943\t0.0852574772349589\t0.038518437729193764\t0.1694183013806351\t0.15289185256222845\t0.1323269305931256\t0.14183815846488648\t0.11892832652180535\t0.12040055943475189\t0.055133306975097635\t0.059734777165814525\t0.0566711436003959\t0.10411276944449463\t0.09983202384693853\t0.038921466584489514\t0.0866119306764878\t0.06992238111265867\t0.09431159408139042\t0.0938643626333852\t0.08034523157647287\t0.30621301093750836\t0.1961893280957181\t0.1611360617918086\t0.23758939346985095\t0.12271395237074852\t0.1430157698712594\t0.0833933983294341\t0.035843502317569234\t0.1633740133739675\t0.1483671806190231\t0.13613729576468475\t0.13641339521522466\t0.10219746530932572\t0.24528101783913517\t0.22010021314888892\t0.17232404535039347\t0.17930641471345765\t0.15547769438760414\t0.1764623247344844\t0.08065948881320073\t0.19144552461877729\t0.3183099871734532\t0.06306342224555873\t0.05987974210984678\t0.05740354384209485\t0.20721138046115542\t0.328456758896439\t0.32098885468030136\t
0.23821868337793292\t0.07145396369303544\t0.19081119513093286\t0.057616601871621285\t0.2340183931599587\t0.23822558856834722\t0.06797270073648182\t0.43003853617809873\t0.02792424887822149\t0.18822156250959438\t0.16114686619257262\t0.22810608062777601\t0.0838224184080167\t0.08443319924123477\t0.1894850392430079\t0.265083072227541\t0.10874839217026484\t0.21783385621466414\t0.006793839193263404\t0.08475249990448121\t0.12988582068761828\t0.2837084520725496\t0.07764215735572715\t0.08398679648212394\t0.09380315448372266\t0.21450922103222061\t0.27742281155579906\t0.04435157844941482\t0.35472454340204307\t0.3010423011492258\t0.06572111033523048\t0.35449933960739016\t0.184212014644299\t0.16510341696367972\t0.22650136131747978\t0.08545503348016772\t0.054746540083621745\t0.07158142375321293\t0.05222918108605921\t0.29873505869435935\t0.1592048730563699\t0.12242150172343544\t0.06834825436267856\t0.11787482883203612\t0.06533075716795377\t0.29220597270428633\t0.3204987910247821\t0.23075740046511872\t0.16013387140172308\t0.1031810078648983\t0.11609557607181138\t0.06536501695877456\t0.07528353746322132\t0.14631099884719126\t0.31686299036015636\t0.15686508283056178\t0.2502894060505306\t0.15632555985381263\t0.06157073783891902\t0.17850524434839174\t0.15082352190116588\t0.10496525194001774\t0.0328681907045638\t0.24179240409750177\t0.20560588522808376\t0.2271655674450096\t0.218989372412798\t0.09854462852017379\t0.1117782001836314\t0.32586231433297036\t0.16492586594387235\t0.1863221551020623\t0.23621550072877454\t0.12483921692480258\t0.16889581762525904\t0.03249926663036536\t0.015295084861858975\t0.20368054392043403\t0.18965962379608556\t0.1016530064450796\t0.12816683398762763\t0.06555661306024704\t0.022930759762077174\t0.019231613914197573\t0.15747279820504434\t0.088105124422038\t0.34732800952940357\t0.12915213761674713\t0.026497694389320044\t0.07320003712462311\t0.15992895420273134\t0.04418658553634053\t0.22031587132600947\t0.10334439566995825\t0.054857312240601364\t0.14588090116315752
\t0.0720775597079632\t0.2322377084263006\t0.009182131128330325\t0.08725499132616112\t0.23335439715459685\t0.26456927574996886\t0.20593724958472245\t0.16953436023943352\t0.2915911520785385\t0.1972305838560561\t0.061557676013784396\t0.08503438513801481\t0.16053915107475406\t0.14738299237590127\t0.3485715331892874\t0.331614755581215\t0.149139047638064\t0.14441111333967438\t0.3881349843527812\t0.3574090148392564\t0.8662836910447197\t1.0\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/scores_test5_out.tsv
--- a/test-data/scores_test5_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,175 +0,0 @@\n-\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n-C001\t1.0000000000000002\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.011318242104766061\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0480501832162959\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-C002\t0
.0\t1.0\t0.0\t0.0\t0.0\t0.0\t0.0\t9.826519226227063e-05\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.05881897890549432\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.012123553350886737\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0036044014431702073\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-C003\t0.0\t0.0\t0.9999999999999999\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.001996725260781092\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0034417679332659546\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-C004\t0.0\t0.0\t0.0\t0.9999999999999998\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0
\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t2.96280499314007e-05\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0040278645118103865\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-C005\t0.0\t0.0\t0.0\t0.0\t0.9999999999999999\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t'..b'0.0\t0.0\t0.0\t0.0\t0.18149359661870704\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.9999999999999998\t0.0\t0.0\t0.0\t0.0\t0.0\n-C170\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.2793597601790586\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0
\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\t0.0\n-C171\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.030541540271258626\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0000000000000002\t0.0\t0.0\t0.0\n-C172\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.9156381551854463\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.
0\t1.0000000000000002\t0.0\t0.0\n-C173\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.00045173712879657656\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.14221557456489292\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0000000000000002\t0.0\n-C174\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0000000000000002\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/scores_test6_out.tsv
--- a/test-data/scores_test6_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b"@@ -1,387 +0,0 @@\n-\tPerylene_2H12\tPerylene\tPhenanthrene_2H10\tPhenanthrene\tAnthracene\tAcenaphthylene\tAcenaphthene\tFluoranthene\tPyrene\tpara-Terphenyl\tRetene\tBenzo[b]naphtho[2,1-d]thiophene\t2,3-Benzofluorene\tBenzo[ghi]fluoranthene\tTriphenylene\tBenzanthracene/Benzophenanthrene\tBenzofluoranthene\tBenzo(k)fluoranthene\tBenzo[e]pyrene\tBenzo(a)pyrene\tIndeno[1,2,3-cd]pyrene\tBenzo(g,h,i)perylene\tAnthanthrene\tDibenzanthracene\tCoronene\tDicofol\tBenzophenone\t2-tert-Butyl-4-methoxyphenol\tButylated hydroxytoluene\tBumetrizole\t4-Methylbenzophenone\t2,4,6-Tribromophenol\t2,6-Dichloro-4-nitroaniline\t1-Methylphenanthrene\tTriclosan\tDrometrizole\tEnzacamene\t2,4-Di-tert-butyl-6-(5-chloro-2H-benzotriazol-2-yl)phenol\tOctrizole\t1,2,7,9-Tetrachlorodibenzofuran\t2,2',3,4,5,5',6-Heptachlorobiphenyl\t2,4,6-Trichlorobiphenyl\t2,2',3,3',4,5',6,6'-Octachlorobiphenyl\tMirex\tbeta-Hexachlorocyclohexane\talpha-1,2,3,4,5,6-Hexachlorocyclohexane\tLindane\tdelta-Hexachlorocyclohexane\tepsilon-Hexachlorocyclohexane\tPentachlorobenzene\tHexachlorobenzene\t2,4'-Dichlorodiphenyldichloroethylene\t2,4'-Dichlorodiphenyldichloroethane\t2,4'-Dichlorodiphenyltrichloroethane\t1,2,7,9-Tetrachlorodibenzo-p-dioxin\t2,4,4'-Trichlorobiphenyl\t2,2',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5-Pentachlorobiphenyl\t2,2',3,4,4',5'-Hexachlorobiphenyl\t2,2',4,4',5,5'-Hexachlorobiphenyl\t2,2',3,4,4',5,5'-Heptachlorobiphenyl\t2,2',5,5'-Tetrachlorobiphenyl\t2,3',4,6-Tetrachlorobiphenyl\t2,3',5',6-Tetrachlorobiphenyl\t2,2',3,4',5-Pentachlorobiphenyl\t2,3,3',4,5-Pentachlorobiphenyl\t3,3',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5',6-Hexachlorobiphenyl\t2,3,3',4,5,6-Hexachlorobiphenyl\t2,3,3',4',5',6-Hexachlorobiphenyl\t2,3,3',4',5,6-Hexachlorobiphenyl\t2,3,3',4',5,5',6-Heptachlorobiphenyl\tcis-Prallethrin\ttrans-Prallethrin\tcis-Resmethrin\ttrans-Resmethrin\tcis-Tetramethrin\ttrans-Tetramethrin\tBifenthrin\tFenpropathrin\tcis-Phenothrin\ttrans-Phenothrin\tcis-Cyphenothrin\ttrans-Cyphenothrin\tFlucythri
nate_isomer1\tFlucythrinate_isomer2\tcis-Fenvalerate\ttrans-Fenvalerate\tDeltamethrin\tChlorpyrifos oxon\tlambda-Cyhalothrin\tTefluthrin\tTransfluthrin\tcis-Permethrin\ttrans-Permethrin\tcis-Allethrin\ttrans-Allethrin\tcis-Cypermethrin_isomer1\ttrans-Cypermethrin_isomer1\tcis-Cypermethrin_isomer2\ttrans-Cypermethrin_isomer2\tcis-Cyfluthrin_isomer1\ttrans-Cyfluthrin_isomer1\tcis-Cyfluthrin_isomer2\ttrans-Cyfluthrin_Isomer2\t1,2,3,4,7,8-Hexachlorodibenzo-p-dioxin\t1,2,3,4,6,7,8-Heptachlorodibenzo-p-dioxin\tOctachlorodibenzo-p-dioxin\tOctachlorodibenzofuran\t1,2,3,7,8-Pentachlorodibenzofuran\t1,2,3,4,7,8-Hexachlorodibenzofuran\t1,2,3,4,6,7,8-Heptachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzo-p-dioxin\t1,2,3,7,8-Pentachlorodibenzo-p-dioxin\t2,3,4,5-Tetrabromo-6-chlorotoluene\t2,3,4,5,6-Pentabromotoluene\t2,3,4,5,6-Pentabromoethylbenzene\t2,3,5,6-Tetrabromo-p-xylene\tAllyl 2,4,6-tribromophenyl ether\t2-Bromoallyl(2,4,6-tribromophenyl) ether\tPentabromobenzene\tHexabromobenzene\t2,3,4,5,6-Pentabromobenzyl alcohol\t2-Ethylhexyl 2,3,4,5-Tetrabromobenzoate\tsyn-Dechlorane plus\tanti-Dechlorane plus\talpha-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\tbeta-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\t1,2,5,6-Tetrabromocyclooctane\t1,1-Dibromo-2,3,3,4,4,5-hexachloro-2-cyclopenta-2,4-dien-1-ylcyclooctane\talpha-Amylcinnamaldehyde\ttrans-Cinnamaldehyde\tCitral (Geranial)\t1-Fluronaphthalene\talpha-Hexylcinnamaldehyde\tLilial\talpha-Amylcinnamyl alcohol\tEugenol\tIsoeugenol\t4-Methoxybenzyl alcohol\tMethyleugenol\tCinnamyl alcohol\tBenzyl alcohol\tEstragole\tBenzyl benzoate\tBenzyl cinnamate\tBenzyl salicylate\tCamphor\tEucalyptol\tCoumarin\tLimonene\tIsomethyl-alpha-ionone\tdelta-Iraldeine\tSafrole\tCashmeran\tCelestolide\tPhantolide\tTonalide\tTraseolide\tGalaxolide\tAldrin\tEndosulfan\tHeptachlor\tcis-Heptachlor epoxide\tEndosulfan sulphate\tEndrin ketone\ttrans-Chlordane\tcis-Chlordane\tEndrin 
aldehyde\tEndrin\t4,4'-Dichlorodiphenyldichloroethylene\tMethoxychlor\t4,4'-Dichlorodiphenyldichloroethane\t4,4'-Dichlorodiphenyltrichloroethane\tTris(4-tert-butylphenyl) phosphate\tTri-n-butyl-phosphate\tTris(1,3-dichloro-2-propy"..b'26685\t0.10086896866641389\t0.1947020406389462\t0.11098877289750769\t0.006075991834095411\t0.12927366381808267\t0.20822869910252648\t0.2724009481091642\t0.16543496890573017\t0.19840999142874002\t0.1656998285042323\t0.2161122709425279\t0.1418879408660975\t0.13892041895889104\t0.1633161629342549\t0.19714612348281121\t0.11328276368401105\t0.1797393737639574\t0.1191251042578987\t0.15134106553579268\t0.17376963876857826\t0.11727276196549538\t0.1824239822579177\t0.4258747558647484\t0.26019712746688456\t0.14368704499704518\t0.20718780764123357\t0.09453837918889996\t0.17883495196186594\t0.23040769509403897\t0.20037082206409543\t0.2822128879093878\t0.1632240149541304\t0.33569524175870596\t0.30641050890656346\t0.06757663229398125\t0.18753877586048753\t0.14809372567415943\t0.0852574772349589\t0.03851843772919378\t0.1694183013806351\t0.15289185256222845\t0.13232693059312559\t0.14183815846488648\t0.11892832652180534\t0.12040055943475188\t0.05513330697509764\t0.059734777165814525\t0.0566711436003959\t0.10411276944449462\t0.09983202384693853\t0.038921466584489514\t0.08661193067648779\t0.06992238111265867\t0.09431159408139039\t0.09386436263338525\t0.08034523157647287\t0.30621301093750825\t0.19618932809571804\t0.16113606179180862\t0.23758939346985095\t0.12271395237074857\t0.1430157698712594\t0.08339339832943408\t0.03584350231756923\t0.1633740133739675\t0.14836718061902307\t0.13613729576468475\t0.13641339521522464\t0.1021974653093257\t0.24528101783913503\t0.220100213148889\t0.1723240453503934\t0.17930641471345757\t0.15547769438760414\t0.1764623247344844\t0.08065948881320074\t0.1914455246187773\t0.31830998717345316\t0.06306342224555872\t0.05987974210984676\t0.057403543842094853\t0.20721138046115545\t0.328456758896439\t0.3209888546803013\t0.23821868337793
287\t0.07145396369303543\t0.19081119513093284\t0.05761660187162128\t0.2340183931599587\t0.2382255885683472\t0.06797270073648182\t0.43003853617809906\t0.02792424887822149\t0.1882215625095944\t0.1611468661925726\t0.2281060806277761\t0.08382241840801669\t0.08443319924123475\t0.18948503924300789\t0.26508307222754085\t0.10874839217026484\t0.2178338562146641\t0.006793839193263404\t0.08475249990448121\t0.12988582068761825\t0.2837084520725496\t0.07764215735572716\t0.08398679648212394\t0.09380315448372264\t0.2145092210322206\t0.27742281155579906\t0.04435157844941482\t0.35472454340204307\t0.30104230114922564\t0.06572111033523048\t0.35449933960739\t0.18421201464429898\t0.16510341696367972\t0.22650136131747978\t0.08545503348016771\t0.05474654008362175\t0.0715814237532129\t0.052229181086059215\t0.2987350586943593\t0.15920487305636982\t0.12242150172343545\t0.06834825436267859\t0.11787482883203612\t0.06533075716795375\t0.2922059727042863\t0.32049879102478224\t0.23075740046511867\t0.16013387140172314\t0.10318100786489835\t0.11609557607181131\t0.06536501695877454\t0.07528353746322129\t0.14631099884719126\t0.31686299036015625\t0.15686508283056178\t0.25028940605053057\t0.15632555985381263\t0.061570737838919025\t0.17850524434839174\t0.15082352190116585\t0.10496525194001774\t0.03286819070456378\t0.24179240409750166\t0.20560588522808373\t0.22716556744500943\t0.21898937241279798\t0.09854462852017383\t0.11177820018363145\t0.3258623143329703\t0.16492586594387235\t0.18632215510206235\t0.2362155007287745\t0.12483921692480261\t0.16889581762525907\t0.03249926663036536\t0.015295084861858977\t0.20368054392043405\t0.1896596237960856\t0.10165300644507959\t0.12816683398762765\t0.065556613060247\t0.022930759762077178\t0.019231613914197577\t0.15747279820504434\t0.08810512442203798\t0.3473280095294035\t0.12915213761674713\t0.026497694389320044\t0.0732000371246231\t0.15992895420273126\t0.044186585536340514\t0.2203158713260095\t0.10334439566995822\t0.05485731224060137\t0.14588090116315747\t0.072077559707
9632\t0.23223770842630054\t0.009182131128330325\t0.08725499132616109\t0.23335439715459674\t0.2645692757499689\t0.20593724958472245\t0.1695343602394335\t0.2915911520785384\t0.19723058385605607\t0.06155767601378439\t0.0850343851380148\t0.16053915107475394\t0.14738299237590127\t0.3485715331892873\t0.3316147555812152\t0.14913904763806404\t0.14441111333967438\t0.388134984352781\t0.3574090148392564\t0.8662836910447191\t0.9999999999999992\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/scores_test7_out.tsv
--- a/test-data/scores_test7_out.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,387 +0,0 @@\n-\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n-Perylene_2H12\t0.0\t0.0\t0.0005256270959446022\t0.0\t0.030730975355768627\t0.0\t0.0\t6.245570704430632e-05\t0.0\t0.0\t0.0\t0.0\t0.00456471696432429\t0.0\t0.0\t0.013203066603708858\t0.0\t0.0\t0.0\t0.00039214513461791224\t0.0\t0.0\t0.0007918167287744574\t0.0\t0.0\t0.00044475614328358696\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.014053019016690354\t0.0\t0.0\t0.0\t0.0\t0.0\t0.010864712316628151\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.1457986453664692\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.07136533213674011\t0.0\t0.0\t0.0\t0.0\t0.0\t0.008502864326957616\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.008332485011325061\t0.06707997408159616\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.01433197233545246\t0.0\t0.0027904469733151184\t0.0\t0.0\t0.0\t0.0\t0.08644538826313945\t0.0\t0.02
3022350266546702\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.05194618366505899\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.07451431952403163\t0.0\t0.0\t0.0\t0.0\t0.008606424963572739\t0.0\t0.0\t0.0\t0.0\t0.0\t0.029465908012253867\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.06765194944236244\t0.0\t0.0\n-Perylene\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0032741303817076985\t0.0\t0.010598958596200674\t0.0\t0.0\t0.011988179251417768\t0.004445067503941529\t0.0\t0.0\t0.0\t0.0\t0.0\t0.01020542202039499\t0.0\t0.0\t0.07094451588225487\t0.0\t0.0\t0.0012435925952213516\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.002811378231079725\t0.0\t0.0\t0.0015057844692663723\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.015722861787553544\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.048751368283443716\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.023395854503055768\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.07014255094522091\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-Phenanthrene_2H10\t0.0024478437470211766\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.04458305878768816\t0.0\t0.0\t0.010556784103056174\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0532438241997481\t0.0\t0.7408591267092633\t0.0\t0.0\t0.0\t0.0\t0.12202560685242984\t0.04568269717012124\t0.0041572784011083466\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.
0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.028649962860904203\t0.0\t0.039164580614390335\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.008485163950429093\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.004892255878207331\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.027071584755955516\t0.0\t0.0\t0.0\n-Phenanthrene\t0.0056172066543021745\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0014924956391185894\t0.12453944133920962\t0.0\t0.087078'..b'9148988\t0.0\t0.0\t0.0\t0.05477359359289298\t0.014982137997848585\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.011712224528606234\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n-Progesterone\t0.009204773873174423\t0.0003433200025161091\t0.0\t0.0007924296222333437\t0.0\t0.0\t0.009441153443328711\t0.005947519671344486\t0.0\t0.0005356814581771492\t0.006215857342936542\t0.0\t0.009417667003961776\t0.009918679539108202\t0.00023339501999512595\t0.02671768716952178\t0.00030790986345822244\t0.0\t0.0\t0.0013743163821902551\t0.017233173590328076\t0.0\t0.03156546678710745\t0.012448459343477037\t0.0\t0.007750527312298441\t0.007023452558304406\t0.020597611603217016\t0.023913761352649537\t0.011281962106545067\t1.6426994248360046e-05\t0.0\t0.036975166579308216\t0.03366222488028883\t0.0\t0.0\t0.023540677910418275\t0.0\t0.03613897694723206\t0.025424940901129782\t0.0\t0.0\t0.011503400057545235\t0.0\t0.00020822196303032738\t0.0\t0.0\t0.0\t0.0\t0.0014763317286047319\t0.0\t0.0012583838846539571\t0.0\t0.003999037208194644\t0.01371043043941223\t0.0013524730258847192\t0.007867754340786983\t0.040527384587716805\t0.010996257146538875\t0.0\t0.0\t0.06835446607134321\t0.0\t0.0\t0.008591363167784047\t0.0\t0.0\t0.0\t0.0\t0.0\t0.007090284250167495\t0.008465564938609312\t0.0804081419
688773\t0.0\t0.028294996723359767\t0.0\t0.0\t0.0038398141926578038\t0.16023981186600045\t0.048059469431165694\t0.037035561711554706\t0.0\t0.0005120942309216938\t0.0\t0.0\t0.03494182656192\t0.0\t0.0\t0.027888357150311995\t0.012585355222212598\t0.03740123828771999\t0.008517825868349625\t0.009137033754720997\t0.0\t0.0\t0.0\t0.0\t0.0\t0.029300775267851718\t0.0\t0.0\t0.0\t0.012950879883070195\t0.0005955124138932699\t0.0\t0.0\t0.0\t0.005304965226057578\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.039134050766579234\t0.27148697274385963\t0.0035271606926311947\t0.0\t0.0\t0.020497841819279865\t0.0\t0.0025113292870849193\t0.0\t0.3500845873047569\t0.0\t0.0022399027023098433\t0.0\t0.005491138035803351\t0.0\t0.0\t0.011672805021412765\t0.025682900399847042\t0.07006608189710375\t0.018632962351792206\t0.0\t0.041533732846226044\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.007867919703105077\t0.0\t0.04748141850290333\t0.0\t0.0\t0.0\t0.10974594417370812\t0.034291658672408076\t0.0\t0.02316539180928352\t0.0\t0.0\t0.0\t0.00028334175636508574\t0.0\t0.0\t0.0\t0.026807362599866817\t0.003975994609085816\t0.0\t0.0\t0.0\t0.0\t0.0\t0.06458445415629566\t0.013061309028202977\t0.0\t0.0\n-Testosterone\t0.00963321193050065\t0.0002486431572929109\t0.0\t0.00023222574210456643\t0.0009261428396286549\t0.0\t0.0\t0.0004003438403933666\t0.0\t6.734322542067866e-05\t0.0016889974488375967\t0.0\t0.1780813812315968\t0.0072719758372110635\t0.00015349402653421068\t0.027912903539727803\t0.0\t0.0\t0.0\t0.0005797401705402625\t0.011098826052235526\t0.0\t0.024485309434567667\t0.020836980610370554\t0.0\t0.004730656796420984\t0.009055625850088003\t0.01764485751937844\t0.03429748760686156\t0.0031719104702998832\t0.0\t0.0\t0.0395809568137632\t0.008699485073663105\t0.0\t0.0\t0.027921629937492448\t0.0\t0.011883152521337885\t0.0047395536771171875\t0.0\t0.0\t0.06041370798509152\t0.0\t0.04269715405107753\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.002871402290315492\t0.021418156386493005\t0.001518651525516398\t0.006270179831850886\
t0.02991589396789859\t0.006884609314977859\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0013335431710517\t0.0\t0.08702752210600646\t0.0\t0.031711980344501185\t0.0\t0.0\t0.0\t0.0\t0.0007660193758873304\t0.010813507002141598\t0.0\t0.0\t0.0\t0.0\t0.004200894168035754\t0.0\t0.0\t0.023494843685534682\t0.018166542728947157\t0.06339867284692752\t0.008591171811569502\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.11646566920503164\t0.0\t0.0\t0.0\t0.0\t0.003134253094757806\t0.0\t0.15489171142643712\t0.0\t0.013048242174815932\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0016583104334544857\t0.03949452321180806\t0.0\t0.0\t0.0\t0.021990926351807622\t0.0\t0.13014922112429486\t0.0\t0.183317218950015\t0.0\t0.0014411200837741863\t0.0\t0.0\t0.0\t0.0\t0.010921053413542851\t0.009432436710872127\t0.06421886680272977\t0.02588295656806723\t0.0\t0.03618383380922252\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0006655628265324854\t0.0\t0.0264850588505131\t0.0\t0.0\t0.0\t0.10783284756046718\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.12344754627650141\t0.0\t0.0\t0.0\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/fill.mgf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/fill.mgf Fri Jan 28 16:22:06 2022 +0000
b
b'@@ -0,0 +1,2513 @@\n+BEGIN IONS\n+NAME=C001\n+IONMODE=Negative\n+RETENTIONTIME=38.74\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=57\n+138.9121 10186226.0 \n+148.9337 1008656.0 \n+175.0641 26780143.0 \n+186.1095 2675456.0 \n+196.8658 21390430.0 \n+198.8647 21688594.0 \n+200.8848 7742528.0 \n+206.9034 26130980.0 \n+216.9205 32607700.0 \n+234.0134 2550129.0 \n+254.8252 23747536.0 \n+256.8215 31377637.0 \n+258.8237 15532799.0 \n+266.8652 9805546.0 \n+268.8537 3090354.0 \n+306.9914 3169316.0 \n+312.7841 10051801.0 \n+316.7777 10734168.0 \n+322.8157 6317648.0 \n+324.9549 8619910.0 \n+334.849 4178412.0 \n+342.8093 3285552.0 \n+349.9455 2050695.0 \n+350.9875 6150799.0 \n+351.941 1965882.0 \n+366.8281 3253770.0 \n+370.7418 9765463.0 \n+372.7383 19374863.0 \n+382.8218 12815572.0 \n+384.8177 8311500.0 \n+392.7685 10913351.0 \n+413.2664 3965867.0 \n+426.7772 5431633.0 \n+428.7834 8554675.0 \n+434.7287 9943329.0 \n+436.8161 3705247.0 \n+440.7322 10603010.0 \n+442.7401 8271752.0 \n+450.7016 8762673.0 \n+460.7076 4528973.0 \n+462.7862 2123666.0 \n+484.7242 4273989.0 \n+486.7743 4886062.0 \n+488.6825 12267966.0 \n+492.744 7662344.0 \n+494.8953 7188793.0 \n+498.8794 6811405.0 \n+500.8484 6520691.0 \n+502.7832 3567833.0 \n+510.763 4989757.0 \n+518.7415 4243468.0 \n+546.6093 7177067.0 \n+550.6949 6104789.0 \n+566.5977 5171811.0 \n+612.6927 2005587.0 \n+676.6436 1982714.0 \n+800.4451 2792137.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C002\n+IONMODE=Negative\n+RETENTIONTIME=520.25\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=35\n+131.1733 1971789.0 \n+267.2688 6103973.0 \n+279.0196 1946255.0 \n+289.6491 46498377.0 \n+301.1565 15185412.0 \n+309.1649 18045974.0 \n+310.1623 295359836.0 \n+311.1658 13124727.0 \n+312.0296 38757284.0 \n+330.6757 12666597.0 \n+525.375 1073323842.0 \n+526.3783 181668883.0 \n+527.3812 23642795.0 \n+551.3321 111616808.0 \n+552.3348 28340614.0 \n+553.3314 2609936.0 \n+562.3269 7538206.0 \n+578.2905 7578406.0 \n+619.3008 4742103.0 \n+624.296 
11790213.0 \n+813.5403 25060147.0 \n+814.5336 5865975.0 \n+955.1171 2322927.0 \n+1047.7378 150394804.0 \n+1048.7399 90978863.0 \n+1049.7432 29946438.0 \n+1050.7453 6807767.0 \n+1069.7158 5074652.0 \n+1074.1979 3402288.0 \n+1075.1968 33352763.0 \n+1076.2004 10417953.0 \n+1101.6535 2023916.0 \n+1206.3127 3738816.0 \n+1216.8041 4439324.0 \n+1217.807 3565334.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C003\n+IONMODE=Negative\n+RETENTIONTIME=483.67\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=26\n+265.2529 11366224.0 \n+266.2564 1420444.0 \n+279.6362 29849749.0 \n+280.6546 8848921.0 \n+288.6414 202172046.0 \n+378.2093 15309961.0 \n+379.1966 2902366.0 \n+522.3565 4089569222.0 \n+523.354 1201714423.0 \n+549.3267 63300808.0 \n+576.2749 7386007.0 \n+577.3074 2354251.0 \n+617.2778 2323470.0 \n+625.4543 4040374.0 \n+796.9808 13576738.0 \n+797.9841 6368973.0 \n+809.9883 12596682.0 \n+810.9916 6601055.0 \n+1043.7028 144351468.0 \n+1044.7068 83271854.0 \n+1045.706 27998321.0 \n+1046.7131 6505178.0 \n+1058.1594 20718345.0 \n+1059.1626 6608764.0 \n+1071.1639 15461047.0 \n+1072.1671 5096642.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C004\n+IONMODE=Negative\n+RETENTIONTIME=473.48\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=24\n+124.1405 6517662.0 \n+170.2437 1237313.0 \n+275.6336 28001849.0 \n+296.147 190395687.0 \n+482.3247 145772322.0 \n+483.3283 36245876.0 \n+496.34 12577588056.0 \n+497.3442 3337125302.0 \n+498.3462 532285213.0 \n+499.3493 68176083.0 \n+770.964 49250157.0 \n+771.9675 22666873.0 \n+783.9721 9839299.0 \n+784.9749 3622908.0 \n+949.6233 8009033.0 \n+950.6274 3674694.0 \n+991.6726 1420557258.0 \n+992.6749 763118028.0 \n+993.6787 239161906.0 \n+994.6801 53549573.0 \n+1017.6897 168186952.0 \n+1018.6656 120599518.0 \n+1019.6555 57647644.0 \n+1020.6591 12469103.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C005\n+IONMODE=Negative\n+RETENTIONTIME=41.72\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=20\n+218.1386 14009249.0 \n+337.0623 88672453.0 \n+338.0654 8770055.0 
\n+353.0361 37061354.0 \n+359.0443 48435582.0 \n+360.0459 5025128.0 \n+375.018 29159485.0 \n+376.0216 2740193.0 \n+381.0261 13522755.0 \n+396.9999 10317665.0 \n+417.0027 13822994.0 \n+418.9966 4386311.0 \n+432'..b'TRUMTYPE=Centroid\n+NUM PEAKS=2\n+328.2481 11119434.0 \n+329.2519 2068394.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C152\n+IONMODE=Negative\n+RETENTIONTIME=385.78\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+409.1497 1369551.0 \n+427.1607 2275086.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C153\n+IONMODE=Negative\n+RETENTIONTIME=401.39\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+107.0557 2271180.0 \n+197.1612 1286942.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C154\n+IONMODE=Negative\n+RETENTIONTIME=388.72\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+239.1276 1743749.0 \n+286.9585 1645545.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C155\n+IONMODE=Negative\n+RETENTIONTIME=373.67\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+507.1617 6285930.0 \n+508.1657 1535734.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C156\n+IONMODE=Negative\n+RETENTIONTIME=378.37\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+257.2254 3302868.0 \n+777.6928 4522421.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C157\n+IONMODE=Negative\n+RETENTIONTIME=473.08\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+267.6425 11780168.0 \n+534.2949 13399261.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C158\n+IONMODE=Negative\n+RETENTIONTIME=508.15\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+380.2992 5790633.0 \n+423.2518 1386850.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C159\n+IONMODE=Negative\n+RETENTIONTIME=471.89\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+304.2357 21716257.0 \n+306.1523 8327492.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C160\n+IONMODE=Negative\n+RETENTIONTIME=465.45\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+193.1239 1274413.0 \n+295.1974 20379534.0 \n+END IONS\n+\n+BEGIN 
IONS\n+NAME=C161\n+IONMODE=Negative\n+RETENTIONTIME=488.7\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+667.4214 3075774.0 \n+1189.7766 2040172.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C162\n+IONMODE=Negative\n+RETENTIONTIME=471.97\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+316.6601 7221684.0 \n+393.2201 8389493.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C163\n+IONMODE=Negative\n+RETENTIONTIME=465.16\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+422.3267 4962906.0 \n+431.3157 12163271.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C164\n+IONMODE=Negative\n+RETENTIONTIME=474.29\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+239.1779 8236995.0 \n+398.3268 11918127.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C165\n+IONMODE=Negative\n+RETENTIONTIME=477.74\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+249.1858 1576729.0 \n+307.15 1941191.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C166\n+IONMODE=Negative\n+RETENTIONTIME=494.51\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+355.2846 54372680.0 \n+373.2951 6108864.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C167\n+IONMODE=Negative\n+RETENTIONTIME=497.67\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+474.3486 2732000.0 \n+649.4483 2434649.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C168\n+IONMODE=Negative\n+RETENTIONTIME=498.02\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+459.2569 3550909.0 \n+539.4163 5285541.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C169\n+IONMODE=Negative\n+RETENTIONTIME=492.45\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+732.5452 4526953.0 \n+733.5465 1043642.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C170\n+IONMODE=Negative\n+RETENTIONTIME=497.3\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+450.3586 4210116.0 \n+451.3631 6446370.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C171\n+IONMODE=Negative\n+RETENTIONTIME=467.81\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+185.0776 5067455.0 \n+200.203 1398415.0 \n+END IONS\n+\n+BEGIN 
IONS\n+NAME=C172\n+IONMODE=Negative\n+RETENTIONTIME=457.02\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+263.2347 3933284.0 \n+615.2633 1132491.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C173\n+IONMODE=Negative\n+RETENTIONTIME=443.89\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+370.2956 41596161.0 \n+371.304 9966707.0 \n+END IONS\n+\n+BEGIN IONS\n+NAME=C174\n+IONMODE=Negative\n+RETENTIONTIME=438.81\n+RETENTIONINDEX=\n+SPECTRUMTYPE=Centroid\n+NUM PEAKS=2\n+330.2563 5274387.0 \n+579.2938 6044865.0 \n+END IONS\n+\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/fill.msp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/fill.msp Fri Jan 28 16:22:06 2022 +0000
b
b'@@ -0,0 +1,2165 @@\n+NAME:C001\n+IONMODE:Negative\n+RETENTIONTIME:38.74\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:57\n+216.9205 32607700\n+256.8215 31377637\n+175.0641 26780143\n+206.9034 26130980\n+254.8252 23747536\n+198.8647 21688594\n+196.8658 21390430\n+372.7383 19374863\n+258.8237 15532799\n+382.8218 12815572\n+488.6825 12267966\n+392.7685 10913351\n+316.7777 10734168\n+440.7322 10603010\n+138.9121 10186226\n+312.7841 10051801\n+434.7287 9943329\n+266.8652 9805546\n+370.7418 9765463\n+450.7016 8762673\n+324.9549 8619910\n+428.7834 8554675\n+384.8177 8311500\n+442.7401 8271752\n+200.8848 7742528\n+492.744 7662344\n+494.8953 7188793\n+546.6093 7177067\n+498.8794 6811405\n+500.8484 6520691\n+322.8157 6317648\n+350.9875 6150799\n+550.6949 6104789\n+426.7772 5431633\n+566.5977 5171811\n+510.763 4989757\n+486.7743 4886062\n+460.7076 4528973\n+484.7242 4273989\n+518.7415 4243468\n+334.849 4178412\n+413.2664 3965867\n+436.8161 3705247\n+502.7832 3567833\n+342.8093 3285552\n+366.8281 3253770\n+306.9914 3169316\n+268.8537 3090354\n+800.4451 2792137\n+186.1095 2675456\n+234.0134 2550129\n+462.7862 2123666\n+349.9455 2050695\n+612.6927 2005587\n+676.6436 1982714\n+351.941 1965882\n+148.9337 1008656\n+\n+NAME:C002\n+IONMODE:Negative\n+RETENTIONTIME:520.25\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:35\n+525.375 1073323842\n+310.1623 295359836\n+526.3783 181668883\n+1047.7378 150394804\n+551.3321 111616808\n+1048.7399 90978863\n+289.6491 46498377\n+312.0296 38757284\n+1075.1968 33352763\n+1049.7432 29946438\n+552.3348 28340614\n+813.5403 25060147\n+527.3812 23642795\n+309.1649 18045974\n+301.1565 15185412\n+311.1658 13124727\n+330.6757 12666597\n+624.296 11790213\n+1076.2004 10417953\n+578.2905 7578406\n+562.3269 7538206\n+1050.7453 6807767\n+267.2688 6103973\n+814.5336 5865975\n+1069.7158 5074652\n+619.3008 4742103\n+1216.8041 4439324\n+1206.3127 3738816\n+1217.807 3565334\n+1074.1979 3402288\n+553.3314 2609936\n+955.1171 2322927\n+1101.6535 
2023916\n+131.1733 1971789\n+279.0196 1946255\n+\n+NAME:C003\n+IONMODE:Negative\n+RETENTIONTIME:483.67\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:26\n+522.3565 4089569222\n+523.354 1201714423\n+288.6414 202172046\n+1043.7028 144351468\n+1044.7068 83271854\n+549.3267 63300808\n+279.6362 29849749\n+1045.706 27998321\n+1058.1594 20718345\n+1071.1639 15461047\n+378.2093 15309961\n+796.9808 13576738\n+809.9883 12596682\n+265.2529 11366224\n+280.6546 8848921\n+576.2749 7386007\n+1059.1626 6608764\n+810.9916 6601055\n+1046.7131 6505178\n+797.9841 6368973\n+1072.1671 5096642\n+625.4543 4040374\n+379.1966 2902366\n+577.3074 2354251\n+617.2778 2323470\n+266.2564 1420444\n+\n+NAME:C004\n+IONMODE:Negative\n+RETENTIONTIME:473.48\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:24\n+496.34 12577588056\n+497.3442 3337125302\n+991.6726 1420557258\n+992.6749 763118028\n+498.3462 532285213\n+993.6787 239161906\n+296.147 190395687\n+1017.6897 168186952\n+482.3247 145772322\n+1018.6656 120599518\n+499.3493 68176083\n+1019.6555 57647644\n+994.6801 53549573\n+770.964 49250157\n+483.3283 36245876\n+275.6336 28001849\n+771.9675 22666873\n+1020.6591 12469103\n+783.9721 9839299\n+949.6233 8009033\n+124.1405 6517662\n+950.6274 3674694\n+784.9749 3622908\n+170.2437 1237313\n+\n+NAME:C005\n+IONMODE:Negative\n+RETENTIONTIME:41.72\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:20\n+337.0623 88672453\n+359.0443 48435582\n+353.0361 37061354\n+375.018 29159485\n+218.1386 14009249\n+417.0027 13822994\n+381.0261 13522755\n+438.9851 11307111\n+396.9999 10317665\n+454.9592 9820452\n+432.9764 9779399\n+338.0654 8770055\n+360.0459 5025128\n+418.9966 4386311\n+512.8989 4072570\n+456.9603 3774845\n+470.9263 3632486\n+572.871 3485486\n+440.9796 3364168\n+376.0216 2740193\n+\n+NAME:C006\n+IONMODE:Negative\n+RETENTIONTIME:452.08\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:19\n+494.3249 803829845\n+495.3278 207959661\n+542.3239 193323900\n+543.3276 55501736\n+1087.6715 
34676828\n+516.3076 24092471\n+274.6257 21694276\n+1088.6773 21466528\n+1001.658 11852076\n+1089.682 9948820\n+290.6256 9704443\n+1061.6562 9417442\n+987.6411 7453650\n+1037.6578 7076912\n+1062.6592 5657208\n+484.3311 5283943\n+265.6196 '..b'5.2288 1932289\n+\n+NAME:C147\n+IONMODE:Negative\n+RETENTIONTIME:563.22\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+282.2792 241362345\n+256.2615 19433189\n+\n+NAME:C148\n+IONMODE:Negative\n+RETENTIONTIME:548.47\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+305.2468 9633582\n+329.249 5814756\n+\n+NAME:C149\n+IONMODE:Negative\n+RETENTIONTIME:350.93\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+130.0643 7419216\n+190.0865 4433780\n+\n+NAME:C150\n+IONMODE:Negative\n+RETENTIONTIME:365.37\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+490.2083 5275418\n+465.1226 1763287\n+\n+NAME:C151\n+IONMODE:Negative\n+RETENTIONTIME:394.87\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+328.2481 11119434\n+329.2519 2068394\n+\n+NAME:C152\n+IONMODE:Negative\n+RETENTIONTIME:385.78\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+427.1607 2275086\n+409.1497 1369551\n+\n+NAME:C153\n+IONMODE:Negative\n+RETENTIONTIME:401.39\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+107.0557 2271180\n+197.1612 1286942\n+\n+NAME:C154\n+IONMODE:Negative\n+RETENTIONTIME:388.72\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+239.1276 1743749\n+286.9585 1645545\n+\n+NAME:C155\n+IONMODE:Negative\n+RETENTIONTIME:373.67\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+507.1617 6285930\n+508.1657 1535734\n+\n+NAME:C156\n+IONMODE:Negative\n+RETENTIONTIME:378.37\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+777.6928 4522421\n+257.2254 3302868\n+\n+NAME:C157\n+IONMODE:Negative\n+RETENTIONTIME:473.08\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+534.2949 13399261\n+267.6425 
11780168\n+\n+NAME:C158\n+IONMODE:Negative\n+RETENTIONTIME:508.15\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+380.2992 5790633\n+423.2518 1386850\n+\n+NAME:C159\n+IONMODE:Negative\n+RETENTIONTIME:471.89\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+304.2357 21716257\n+306.1523 8327492\n+\n+NAME:C160\n+IONMODE:Negative\n+RETENTIONTIME:465.45\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+295.1974 20379534\n+193.1239 1274413\n+\n+NAME:C161\n+IONMODE:Negative\n+RETENTIONTIME:488.7\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+667.4214 3075774\n+1189.7766 2040172\n+\n+NAME:C162\n+IONMODE:Negative\n+RETENTIONTIME:471.97\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+393.2201 8389493\n+316.6601 7221684\n+\n+NAME:C163\n+IONMODE:Negative\n+RETENTIONTIME:465.16\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+431.3157 12163271\n+422.3267 4962906\n+\n+NAME:C164\n+IONMODE:Negative\n+RETENTIONTIME:474.29\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+398.3268 11918127\n+239.1779 8236995\n+\n+NAME:C165\n+IONMODE:Negative\n+RETENTIONTIME:477.74\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+307.15 1941191\n+249.1858 1576729\n+\n+NAME:C166\n+IONMODE:Negative\n+RETENTIONTIME:494.51\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+355.2846 54372680\n+373.2951 6108864\n+\n+NAME:C167\n+IONMODE:Negative\n+RETENTIONTIME:497.67\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+474.3486 2732000\n+649.4483 2434649\n+\n+NAME:C168\n+IONMODE:Negative\n+RETENTIONTIME:498.02\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+539.4163 5285541\n+459.2569 3550909\n+\n+NAME:C169\n+IONMODE:Negative\n+RETENTIONTIME:492.45\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+732.5452 4526953\n+733.5465 1043642\n+\n+NAME:C170\n+IONMODE:Negative\n+RETENTIONTIME:497.3\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+451.3631 6446370\n+450.3586 
4210116\n+\n+NAME:C171\n+IONMODE:Negative\n+RETENTIONTIME:467.81\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+185.0776 5067455\n+200.203 1398415\n+\n+NAME:C172\n+IONMODE:Negative\n+RETENTIONTIME:457.02\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+263.2347 3933284\n+615.2633 1132491\n+\n+NAME:C173\n+IONMODE:Negative\n+RETENTIONTIME:443.89\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+370.2956 41596161\n+371.304 9966707\n+\n+NAME:C174\n+IONMODE:Negative\n+RETENTIONTIME:438.81\n+RETENTIONINDEX:\n+SPECTRUMTYPE:Centroid\n+Num Peaks:2\n+579.2938 6044865\n+330.2563 5274387\n+\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/matches_test1_out.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/matches_test1_out.tsv Fri Jan 28 16:22:06 2022 +0000
b
b'@@ -0,0 +1,175 @@\n+\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n+C001\t57\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C002\t0\t35\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C003\t0\t0\t26\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C004\t0\t0\t0\t24\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C005\t0\t0\t0\t0\t20\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C006\t0\t0\t0\t0\t0\t19\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C007\t0\t0\t0\t0\t0\t0\t15\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C008\t0\t1\t0\t0\t0\t0\t0\t15\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C009\t0\t0\t0\t0\t0\t0\t0\t0\t14\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t'..b'\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C164\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C165\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C166\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\n+C167\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\n+C168\t0\t0\
t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\n+C169\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\n+C170\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\n+C171\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\n+C172\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\n+C173\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\n+C174\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/matches_test3_out.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/matches_test3_out.tsv Fri Jan 28 16:22:06 2022 +0000
b
b'@@ -0,0 +1,387 @@\n+\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n+Perylene_2H12\t0\t0\t2\t0\t1\t0\t0\t1\t0\t0\t0\t0\t2\t0\t0\t3\t0\t0\t0\t1\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\n+Perylene\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t0\t1\t1\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\
t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+Phenanthrene_2H10\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t2\t0\t1\t0\t0\t0\t0\t1\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\n+Phenanthrene\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+Anthracene\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t2\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+Acenaphthylene\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\
t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+Acenaphthene\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t3\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+Fluoranthene\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t1\t0\t1\t0\t0\t0\t2\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+Pyrene\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t2\t1\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0'..b'ph_isomer2\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+Spirodiclofen\t3\t2\t0\t0\t0\t0\t4\t1\t0\t0\t1\t1\t4\t0\t0\t4\t3\t0\t1\t2\t4\t0\t2\t0\t0\t1\t0\t0\t2\t1\t0\t0\t3\t1\t0\t0\t1\t1\t1\t1\t0\t0\t2\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t3\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t1\t1\t1\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+Spiromesifen\t1\t1\t0\t1\t0\t0\t2\t2\t0\t1\t1\t0\t2\t1\t0\t5\t0\t0\t0\t1\t3\t0\t3\t4\t0\t1\t2\t1\t2\t1\t0\t0\t1\t7\t0\t0\t2\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t3\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t2\t0\t1\t0\t0\t0\t0\t1\t2\t0\t1\t0\t0\t0\t0\t0\t2\t0\t0\t3\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\n+Spirotetramat\t2\t2\t0\t1\t0\t0\t2\t5\t0\t2\t1\t0\t6\t1\t0\t7\t1\t0\t1\t2\t4\t0\t4\t8\t0\t3\t2\t1\t2\t1\t0\t0\t3\t7\t0\t0\t3\t0\t0\t4\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t3\t0\t0\t3\t0\t0\t3\t0\t0\t1\t0\t0\t1\t0\t0\t3\t1\t3\t0\t0\t0\t0\t0\t2\t2\t3\t0\t1\t0\t0\t1\t0\t0\t3\t0\t2\t3\t2\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t2\t1\t0\t1\t1\t0\t0\t1\t2\t0\t1\t0\t2\t0\t0\t1\t1\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t1\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\n+17-alpha-Ethynylestradiol\t1\t0\t0\t2\t0\t0\t2\t2\t0\t1\t1\t0\t4\t1\t1\t5\t1\t0\t0\t1\t2\t0\t3\t4\t0\t2\t2\t1\t2\t1\t0\t0\t3\t7\t0\t0\t1\t1\t0\t4\t0\t0\t2\t0\t0\t0\t0\t
0\t0\t1\t0\t1\t0\t0\t0\t2\t0\t1\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t1\t0\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t2\t1\t0\t3\t1\t0\t0\t0\t0\t0\t1\t0\t0\t2\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t2\t1\t0\t0\n+Bisphenol A\t0\t0\t0\t0\t0\t0\t1\t1\t0\t1\t0\t0\t1\t0\t0\t3\t1\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t3\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+4-tert-Octylphenol\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+Estrone\t1\t0\t0\t0\t0\t0\t1\t1\t0\t1\t1\t0\t3\t1\t1\t6\t0\t0\t0\t2\t1\t0\t2\t7\t0\t1\t3\t1\t2\t1\t0\t0\t3\t7\t0\t0\t0\t1\t0\t3\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t1\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t3\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t1\t0\t1\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\n+17-beta
-Estradiol\t2\t0\t0\t0\t0\t0\t4\t2\t0\t1\t1\t0\t2\t0\t1\t4\t0\t0\t0\t0\t1\t0\t4\t4\t0\t0\t0\t1\t1\t0\t1\t0\t1\t6\t0\t0\t1\t1\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t3\t0\t1\t0\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t2\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t2\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+Progesterone\t2\t3\t0\t2\t0\t0\t3\t3\t0\t2\t2\t0\t4\t2\t1\t6\t1\t0\t0\t2\t2\t0\t4\t9\t0\t4\t3\t1\t5\t2\t1\t0\t3\t6\t0\t0\t3\t0\t2\t4\t0\t0\t2\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t1\t1\t1\t1\t1\t2\t0\t0\t2\t0\t0\t1\t0\t0\t0\t0\t0\t2\t1\t4\t0\t1\t0\t0\t1\t2\t2\t2\t0\t1\t0\t0\t2\t0\t0\t2\t2\t3\t3\t2\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t1\t2\t1\t0\t0\t1\t0\t1\t0\t2\t0\t1\t0\t1\t0\t0\t1\t2\t2\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t2\t0\t0\t0\t2\t1\t0\t1\t0\t0\t0\t1\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t2\t1\t0\t0\n+Testosterone\t1\t1\t0\t1\t1\t0\t0\t2\t0\t1\t1\t0\t4\t1\t1\t5\t0\t0\t0\t1\t2\t0\t3\t7\t0\t2\t2\t1\t4\t1\t0\t0\t3\t3\t0\t0\t1\t0\t1\t2\t0\t0\t3\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t1\t1\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t4\t0\t1\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t2\t0\t0\t2\t2\t3\t1\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t1\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t1\t0\t2\t0\t2\t0\t1\t0\t0\t0\t0\t1\t1\t2\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t2\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/matches_test4_out.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/matches_test4_out.tsv Fri Jan 28 16:22:06 2022 +0000
[
b"@@ -0,0 +1,387 @@\n+\tPerylene_2H12\tPerylene\tPhenanthrene_2H10\tPhenanthrene\tAnthracene\tAcenaphthylene\tAcenaphthene\tFluoranthene\tPyrene\tpara-Terphenyl\tRetene\tBenzo[b]naphtho[2,1-d]thiophene\t2,3-Benzofluorene\tBenzo[ghi]fluoranthene\tTriphenylene\tBenzanthracene/Benzophenanthrene\tBenzofluoranthene\tBenzo(k)fluoranthene\tBenzo[e]pyrene\tBenzo(a)pyrene\tIndeno[1,2,3-cd]pyrene\tBenzo(g,h,i)perylene\tAnthanthrene\tDibenzanthracene\tCoronene\tDicofol\tBenzophenone\t2-tert-Butyl-4-methoxyphenol\tButylated hydroxytoluene\tBumetrizole\t4-Methylbenzophenone\t2,4,6-Tribromophenol\t2,6-Dichloro-4-nitroaniline\t1-Methylphenanthrene\tTriclosan\tDrometrizole\tEnzacamene\t2,4-Di-tert-butyl-6-(5-chloro-2H-benzotriazol-2-yl)phenol\tOctrizole\t1,2,7,9-Tetrachlorodibenzofuran\t2,2',3,4,5,5',6-Heptachlorobiphenyl\t2,4,6-Trichlorobiphenyl\t2,2',3,3',4,5',6,6'-Octachlorobiphenyl\tMirex\tbeta-Hexachlorocyclohexane\talpha-1,2,3,4,5,6-Hexachlorocyclohexane\tLindane\tdelta-Hexachlorocyclohexane\tepsilon-Hexachlorocyclohexane\tPentachlorobenzene\tHexachlorobenzene\t2,4'-Dichlorodiphenyldichloroethylene\t2,4'-Dichlorodiphenyldichloroethane\t2,4'-Dichlorodiphenyltrichloroethane\t1,2,7,9-Tetrachlorodibenzo-p-dioxin\t2,4,4'-Trichlorobiphenyl\t2,2',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5-Pentachlorobiphenyl\t2,2',3,4,4',5'-Hexachlorobiphenyl\t2,2',4,4',5,5'-Hexachlorobiphenyl\t2,2',3,4,4',5,5'-Heptachlorobiphenyl\t2,2',5,5'-Tetrachlorobiphenyl\t2,3',4,6-Tetrachlorobiphenyl\t2,3',5',6-Tetrachlorobiphenyl\t2,2',3,4',5-Pentachlorobiphenyl\t2,3,3',4,5-Pentachlorobiphenyl\t3,3',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5',6-Hexachlorobiphenyl\t2,3,3',4,5,6-Hexachlorobiphenyl\t2,3,3',4',5',6-Hexachlorobiphenyl\t2,3,3',4',5,6-Hexachlorobiphenyl\t2,3,3',4',5,5',6-Heptachlorobiphenyl\tcis-Prallethrin\ttrans-Prallethrin\tcis-Resmethrin\ttrans-Resmethrin\tcis-Tetramethrin\ttrans-Tetramethrin\tBifenthrin\tFenpropathrin\tcis-Phenothrin\ttrans-Phenothrin\tcis-Cyphenothrin\ttrans-Cyphenothrin\tFlucythri
nate_isomer1\tFlucythrinate_isomer2\tcis-Fenvalerate\ttrans-Fenvalerate\tDeltamethrin\tChlorpyrifos oxon\tlambda-Cyhalothrin\tTefluthrin\tTransfluthrin\tcis-Permethrin\ttrans-Permethrin\tcis-Allethrin\ttrans-Allethrin\tcis-Cypermethrin_isomer1\ttrans-Cypermethrin_isomer1\tcis-Cypermethrin_isomer2\ttrans-Cypermethrin_isomer2\tcis-Cyfluthrin_isomer1\ttrans-Cyfluthrin_isomer1\tcis-Cyfluthrin_isomer2\ttrans-Cyfluthrin_Isomer2\t1,2,3,4,7,8-Hexachlorodibenzo-p-dioxin\t1,2,3,4,6,7,8-Heptachlorodibenzo-p-dioxin\tOctachlorodibenzo-p-dioxin\tOctachlorodibenzofuran\t1,2,3,7,8-Pentachlorodibenzofuran\t1,2,3,4,7,8-Hexachlorodibenzofuran\t1,2,3,4,6,7,8-Heptachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzo-p-dioxin\t1,2,3,7,8-Pentachlorodibenzo-p-dioxin\t2,3,4,5-Tetrabromo-6-chlorotoluene\t2,3,4,5,6-Pentabromotoluene\t2,3,4,5,6-Pentabromoethylbenzene\t2,3,5,6-Tetrabromo-p-xylene\tAllyl 2,4,6-tribromophenyl ether\t2-Bromoallyl(2,4,6-tribromophenyl) ether\tPentabromobenzene\tHexabromobenzene\t2,3,4,5,6-Pentabromobenzyl alcohol\t2-Ethylhexyl 2,3,4,5-Tetrabromobenzoate\tsyn-Dechlorane plus\tanti-Dechlorane plus\talpha-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\tbeta-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\t1,2,5,6-Tetrabromocyclooctane\t1,1-Dibromo-2,3,3,4,4,5-hexachloro-2-cyclopenta-2,4-dien-1-ylcyclooctane\talpha-Amylcinnamaldehyde\ttrans-Cinnamaldehyde\tCitral (Geranial)\t1-Fluronaphthalene\talpha-Hexylcinnamaldehyde\tLilial\talpha-Amylcinnamyl alcohol\tEugenol\tIsoeugenol\t4-Methoxybenzyl alcohol\tMethyleugenol\tCinnamyl alcohol\tBenzyl alcohol\tEstragole\tBenzyl benzoate\tBenzyl cinnamate\tBenzyl salicylate\tCamphor\tEucalyptol\tCoumarin\tLimonene\tIsomethyl-alpha-ionone\tdelta-Iraldeine\tSafrole\tCashmeran\tCelestolide\tPhantolide\tTonalide\tTraseolide\tGalaxolide\tAldrin\tEndosulfan\tHeptachlor\tcis-Heptachlor epoxide\tEndosulfan sulphate\tEndrin ketone\ttrans-Chlordane\tcis-Chlordane\tEndrin 
aldehyde\tEndrin\t4,4'-Dichlorodiphenyldichloroethylene\tMethoxychlor\t4,4'-Dichlorodiphenyldichloroethane\t4,4'-Dichlorodiphenyltrichloroethane\tTris(4-tert-butylphenyl) phosphate\tTri-n-butyl-phosphate\tTris(1,3-dichloro-2-propy"..b'39\t11\t10\t27\t32\t19\t34\t20\t25\t21\t47\t11\t36\t46\t25\t47\t36\t44\t37\t31\t33\t34\t39\t61\t9\t23\t30\t44\t15\t19\t21\t18\t18\t22\t14\t18\t22\t21\t24\t17\t16\t24\t29\t34\t31\t22\t45\t37\t26\t34\t36\t12\t12\t17\t49\t22\t30\t29\t13\t22\t57\t14\t33\t16\t17\t18\t22\t12\t6\t8\t17\t10\t55\t34\t40\t15\t9\t13\t49\t34\t22\t35\t7\t10\t19\t18\t26\t45\t23\t47\t38\t22\t19\t20\t7\t13\t37\t23\t7\t30\t22\t7\t12\t55\t52\t41\t39\t26\t37\t8\t12\t18\t16\t36\t32\t19\t31\t17\t2\t6\t35\t40\t19\t35\t29\t20\t16\t35\t47\t16\t31\t35\t18\t20\t19\t38\t24\t42\t27\t28\t17\t25\t60\t19\t20\t20\t34\t28\t36\t11\t16\t19\t14\t27\t21\t20\t13\t17\t30\t46\t75\t36\t3\t29\t10\t23\t45\t31\t21\t35\t18\t34\t10\t28\t51\t61\t56\t48\t62\t16\t8\t11\t44\t68\t80\t78\t26\t13\t88\t56\t85\t72\n+17-beta-Estradiol\t11\t11\t7\t12\t13\t9\t7\t13\t12\t16\t17\t15\t12\t12\t13\t14\t11\t12\t12\t12\t9\t9\t24\t12\t15\t16\t14\t28\t34\t34\t16\t18\t24\t13\t26\t21\t53\t22\t13\t13\t18\t13\t38\t1\t19\t19\t18\t20\t21\t4\t6\t11\t13\t10\t22\t12\t15\t12\t18\t18\t17\t13\t13\t12\t17\t13\t11\t15\t14\t15\t11\t17\t18\t22\t30\t27\t16\t7\t12\t30\t27\t25\t21\t19\t37\t28\t26\t27\t34\t18\t19\t12\t18\t19\t20\t13\t11\t31\t24\t26\t40\t23\t31\t28\t33\t9\t8\t8\t9\t13\t11\t12\t11\t13\t11\t6\t6\t10\t7\t31\t14\t9\t6\t21\t12\t16\t13\t7\t10\t5\t27\t38\t10\t23\t10\t25\t30\t31\t24\t27\t13\t29\t19\t10\t19\t17\t22\t6\t13\t21\t7\t13\t24\t19\t20\t42\t32\t29\t35\t13\t42\t21\t22\t16\t12\t9\t26\t7\t10\t48\t37\t11\t18\t12\t11\t20\t9\t6\t26\t27\t24\t12\t29\t20\t16\t18\t14\t1\t18\t14\t37\t17\t35\t14\t30\t8\t7\t21\t25\t15\t26\t17\t19\t25\t28\t11\t26\t30\t19\t39\t24\t35\t30\t23\t22\t28\t23\t50\t6\t14\t27\t37\t9\t20\t16\t14\t14\t15\t9\t14\t18\t16\t15\t11\t13\t18\t21\t25\t24\t16\t34\t31\t22\t23\t28\t11\t8\t13\t38\t14\t26\t26\t11\t18\t44\t9\t
22\t10\t14\t13\t14\t10\t4\t4\t17\t7\t39\t31\t34\t15\t8\t11\t34\t27\t18\t30\t5\t9\t14\t16\t20\t35\t15\t37\t34\t17\t15\t13\t6\t14\t24\t13\t5\t28\t16\t6\t9\t46\t27\t31\t31\t18\t34\t6\t8\t15\t11\t27\t22\t12\t27\t15\t2\t6\t27\t28\t11\t34\t20\t11\t11\t20\t34\t13\t19\t26\t11\t14\t10\t31\t19\t35\t21\t20\t10\t16\t42\t17\t15\t16\t33\t17\t33\t12\t13\t14\t7\t17\t21\t13\t8\t13\t17\t30\t58\t28\t1\t17\t11\t23\t33\t28\t20\t24\t17\t28\t6\t26\t38\t47\t46\t41\t47\t12\t7\t11\t32\t50\t63\t63\t24\t9\t56\t67\t62\t60\n+Progesterone\t18\t10\t17\t16\t18\t13\t10\t14\t12\t23\t35\t19\t16\t13\t18\t17\t12\t13\t14\t13\t11\t10\t31\t14\t24\t28\t21\t46\t42\t64\t23\t38\t56\t21\t50\t27\t103\t32\t16\t21\t19\t28\t71\t2\t45\t42\t44\t42\t43\t12\t10\t24\t26\t24\t35\t20\t25\t19\t19\t22\t20\t25\t24\t21\t26\t18\t20\t21\t20\t20\t13\t18\t40\t51\t55\t48\t34\t21\t15\t59\t47\t45\t54\t47\t59\t48\t43\t55\t63\t38\t28\t21\t31\t24\t30\t47\t39\t52\t47\t51\t74\t42\t53\t52\t67\t20\t18\t14\t15\t16\t17\t20\t20\t17\t16\t13\t9\t18\t11\t61\t23\t13\t8\t51\t31\t22\t22\t15\t21\t15\t40\t48\t14\t43\t13\t40\t38\t39\t38\t39\t24\t43\t28\t16\t27\t19\t33\t8\t21\t33\t9\t24\t31\t31\t28\t65\t42\t40\t45\t16\t57\t50\t68\t27\t29\t21\t55\t17\t22\t112\t78\t29\t29\t23\t24\t30\t10\t15\t50\t41\t41\t17\t57\t44\t32\t32\t21\t5\t26\t37\t84\t30\t44\t22\t44\t11\t9\t29\t38\t20\t34\t23\t26\t42\t56\t15\t45\t68\t29\t62\t46\t58\t61\t34\t42\t41\t57\t81\t10\t30\t39\t56\t27\t24\t26\t28\t26\t28\t24\t21\t21\t22\t26\t20\t20\t21\t39\t45\t40\t22\t55\t39\t29\t43\t51\t12\t15\t25\t68\t25\t43\t42\t18\t20\t77\t14\t47\t24\t20\t18\t26\t14\t7\t9\t22\t14\t80\t44\t49\t19\t13\t10\t54\t34\t20\t43\t10\t14\t28\t20\t35\t59\t27\t58\t49\t31\t10\t24\t6\t15\t43\t34\t11\t40\t29\t9\t14\t83\t52\t50\t44\t35\t44\t9\t13\t21\t23\t44\t37\t27\t35\t19\t7\t16\t42\t52\t15\t46\t49\t34\t21\t52\t69\t18\t47\t44\t16\t37\t29\t51\t33\t52\t40\t38\t21\t30\t91\t23\t22\t29\t46\t36\t44\t14\t22\t31\t27\t32\t32\t28\t20\t28\t44\t59\t103\t43\t9\t33\t24\t44\t63\t43\t34\t55\t36\t52\t15\t43\t80\t101\t84\t86\t100\t16
\t9\t14\t80\t81\t125\t95\t29\t13\t85\t62\t168\t125\n+Testosterone\t14\t8\t13\t13\t15\t12\t10\t14\t12\t24\t36\t18\t16\t10\t17\t16\t9\t9\t10\t9\t10\t9\t28\t12\t22\t25\t19\t44\t39\t48\t22\t35\t46\t19\t38\t25\t101\t27\t15\t18\t17\t26\t51\t2\t38\t36\t39\t37\t37\t8\t6\t20\t22\t21\t25\t18\t21\t16\t17\t15\t18\t23\t24\t19\t21\t15\t15\t16\t16\t16\t9\t15\t39\t46\t43\t44\t29\t20\t10\t46\t37\t36\t40\t34\t43\t36\t30\t41\t51\t33\t19\t20\t24\t17\t22\t41\t35\t38\t33\t36\t65\t34\t39\t36\t52\t13\t12\t10\t11\t11\t11\t13\t14\t14\t11\t7\t3\t10\t5\t51\t19\t7\t3\t41\t25\t19\t16\t11\t17\t14\t35\t48\t14\t41\t15\t35\t37\t37\t38\t37\t22\t44\t26\t15\t29\t16\t29\t8\t21\t32\t10\t24\t32\t30\t28\t63\t38\t34\t42\t16\t49\t41\t46\t19\t20\t15\t44\t13\t16\t91\t63\t24\t21\t19\t20\t27\t10\t13\t32\t27\t27\t15\t51\t30\t21\t27\t19\t3\t23\t35\t72\t29\t44\t18\t37\t8\t8\t26\t33\t17\t31\t21\t23\t32\t47\t13\t44\t56\t28\t60\t39\t52\t60\t37\t39\t38\t48\t78\t10\t26\t40\t49\t24\t22\t22\t24\t21\t24\t18\t15\t17\t18\t21\t15\t17\t17\t33\t39\t35\t18\t48\t38\t29\t39\t42\t12\t14\t18\t60\t23\t36\t36\t16\t16\t61\t13\t42\t21\t19\t16\t26\t14\t7\t8\t19\t14\t64\t41\t42\t19\t12\t11\t46\t34\t19\t40\t7\t15\t27\t20\t29\t49\t27\t55\t41\t30\t10\t21\t6\t15\t38\t28\t12\t37\t28\t7\t14\t75\t37\t43\t43\t33\t43\t9\t12\t20\t14\t39\t33\t21\t33\t18\t5\t13\t41\t45\t10\t44\t44\t28\t20\t43\t57\t15\t41\t38\t15\t30\t27\t46\t30\t49\t39\t36\t20\t27\t70\t22\t20\t25\t44\t27\t45\t13\t18\t26\t18\t26\t30\t21\t18\t25\t34\t45\t86\t38\t7\t24\t22\t32\t50\t37\t25\t48\t34\t47\t14\t37\t66\t81\t71\t74\t84\t15\t8\t12\t68\t60\t96\t82\t27\t13\t72\t60\t125\t130\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/matches_test5_out.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/matches_test5_out.tsv Fri Jan 28 16:22:06 2022 +0000
b
b'@@ -0,0 +1,175 @@\n+\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n+C001\t57\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C002\t0\t35\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C003\t0\t0\t26\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C004\t0\t0\t0\t24\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C005\t0\t0\t0\t0\t20\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C006\t0\t0\t0\t0\t0\t19\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C007\t0\t0\t0\t0\t0\t0\t15\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C008\t0\t1\t0\t0\t0\t0\t0\t15\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C009\t0\t0\t0\t0\t0\t0\t0\t0\t14\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t'..b'\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C164\t0\t0\t0\t0\t0\t0\t1\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C165\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\n+C166\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\n+C167\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\n+C168\t0\t0\
t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\n+C169\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\n+C170\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\t0\n+C171\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0
\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\t0\n+C172\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\t0\n+C173\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t1\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\t0\n+C174\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t0\t2\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/recetox_gc-ei_ms_20201028.msp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/recetox_gc-ei_ms_20201028.msp Fri Jan 28 16:22:06 2022 +0000
[
b'@@ -0,0 +1,31986 @@\n+NAME: Perylene_2H12\r\n+SCANNUMBER: -1\r\n+RETENTIONTIME: -1\r\n+RETENTIONINDEX: 2876\r\n+PRECURSORMZ: 264.16858\r\n+PRECURSORTYPE: [M]+\r\n+IONMODE: Positive\r\n+SPECTRUMTYPE: Centroid\r\n+FORMULA: C20H12\r\n+INCHIKEY: CSHWQDPOILHKBI-AQZSQYOVSA-N\r\n+INCHI: \r\n+SMILES: [2H]C1=C(C2=C3C(=C1[2H])C4=C(C(=C(C5=C4C(=C(C(=C5[2H])[2H])[2H])C3=C(C(=C2[2H])[2H])[2H])[2H])[2H])[2H])[2H]\r\n+AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\r\n+COLLISIONENERGY: 70eV\r\n+INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\r\n+INSTRUMENTTYPE: GC-EI-Orbitrap\r\n+IONIZATION: EI+\r\n+LICENSE: CC BY-NC\r\n+COMMENT: \r\n+Num Peaks: 33\r\n+116.05576\t29277\r\n+118.06992\t49651\r\n+128.0558\t37001\r\n+130.06996\t78584\r\n+130.57159\t17533\r\n+132.08408\t65686\r\n+132.5858\t12593\r\n+207.0322\t39569\r\n+222.08282\t13141\r\n+223.06346\t20762\r\n+225.04277\t18058\r\n+227.02202\t26370\r\n+232.11204\t30354\r\n+236.1405\t22796\r\n+252.09322\t8564\r\n+256.11212\t41765\r\n+257.11557\t8688\r\n+258.12622\t21742\r\n+259.13446\t11564\r\n+260.14041\t248997\r\n+261.14358\t51721\r\n+262.15466\t33597\r\n+263.16254\t63732\r\n+264.16858\t829577\r\n+265.01968\t18286\r\n+265.17191\t176460\r\n+266.17523\t18876\r\n+283.03036\t10261\r\n+287.00632\t11352\r\n+295.10288\t26727\r\n+299.06152\t33379\r\n+359.0282\t67046\r\n+400.98447\t17406\r\n+\r\n+NAME: Perylene\r\n+SCANNUMBER: -1\r\n+RETENTIONTIME: -1\r\n+RETENTIONINDEX: 2886.9\r\n+PRECURSORMZ: 252.09323\r\n+PRECURSORTYPE: [M]+\r\n+IONMODE: Positive\r\n+SPECTRUMTYPE: Centroid\r\n+FORMULA: C20H12\r\n+INCHIKEY: CSHWQDPOILHKBI-UHFFFAOYSA-N\r\n+INCHI: \r\n+SMILES: C1=CC2=C3C(=C1)C1=CC=CC4=C1C(=CC=C4)C3=CC=C2\r\n+AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\r\n+COLLISIONENERGY: 70eV\r\n+INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\r\n+INSTRUMENTTYPE: GC-EI-Orbitrap\r\n+IONIZATION: EI+\r\n+LICENSE: CC BY-NC\r\n+COMMENT: \r\n+Num Peaks: 19\r\n+112.03071\t49892\r\n+113.03854\t87510\t"Theoretical m/z 113.039125, Mass diff 0 (0 ppm), 
Formula C9H5"\r\n+124.03076\t100146\r\n+124.53242\t24923\r\n+125.03855\t179254\t"Theoretical m/z 125.039125, Mass diff 0 (0 ppm), Formula C10H5"\r\n+125.54019\t49039\r\n+126.04636\t131679\r\n+126.54804\t36313\r\n+222.04645\t28905\r\n+224.06192\t55632\r\n+226.04175\t37413\r\n+246.04646\t23286\r\n+248.06204\t140007\r\n+249.07072\t62236\t"Theoretical m/z 249.070425, Mass diff -0.001 (0 ppm), Formula C20H9"\r\n+250.07765\t641789\r\n+251.07967\t137600\r\n+252.09323\t1955166\t"Theoretical m/z 252.093354, Mass diff 0 (0.49 ppm), SMILES C1=CC=2C=CC=C3C4=CC=CC5=CC=CC(C(=C1)C23)=C54, Annotation [C20H12]+, Rule of HR False"\r\n+253.09656\t402252\r\n+254.09985\t39987\r\n+\r\n+NAME: Phenanthrene_2H10\r\n+SCANNUMBER: -1\r\n+RETENTIONTIME: -1\r\n+RETENTIONINDEX: 1827.1\r\n+PRECURSORMZ: 188.14029\r\n+PRECURSORTYPE: [M]+\r\n+IONMODE: Positive\r\n+SPECTRUMTYPE: Centroid\r\n+FORMULA: C14H10\r\n+INCHIKEY: YNPNZTXNASCQKK-LHNTUAQVSA-N\r\n+INCHI: \r\n+SMILES: [2H]C1=C(C(=C2C(=C1[2H])C(=C(C3=C(C(=C(C(=C32)[2H])[2H])[2H])[2H])[2H])[2H])[2H])[2H]\r\n+AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\r\n+COLLISIONENERGY: 70eV\r\n+INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\r\n+INSTRUMENTTYPE: GC-EI-Orbitrap\r\n+IONIZATION: EI+\r\n+LICENSE: CC BY-NC\r\n+COMMENT: \r\n+Num Peaks: 17\r\n+76.02767\t185421\r\n+78.0418\t256858\r\n+80.05586\t881271\r\n+90.04181\t200162\r\n+92.06206\t537968\r\n+94.06999\t628791\r\n+156.08402\t836513\r\n+158.09808\t477819\r\n+160.11218\t2421148\r\n+161.11554\t310248\r\n+176.10866\t308983\r\n+184.11224\t2784543\r\n+185.11562\t445833\r\n+186.12637\t1283282\r\n+188.14029\t15115275\r\n+189.1436\t2312386\r\n+190.14688\t151400\r\n+\r\n+NAME: Phenanthrene\r\n+SCANNUMBER: -1\r\n+RETENTIONTIME: -1\r\n+RETENTIONINDEX: 1832.9\r\n+PRECURSORMZ: 178.0775\r\n+PRECURSORTYPE: [M]+\r\n+IONMODE: Positive\r\n+SPECTRUMTYPE: Centroid\r\n+FORMULA: C14H10\r\n+INCHIKEY: YNPNZTXNASCQKK-UHFFFAOYSA-N\r\n+INCHI: \r\n+SMILES: C1=CC2=C(C=C1)C1=C(C=CC=C1)C=C2\r\n+AUTHORS: Price et al., 
RECETOX, Masaryk University (CZ)\r\n+COLLISIONENERGY: 70eV\r\n+INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\r\n+INSTRUMENTTYPE: GC-EI-Orbitrap\r\n+IONIZATION: EI+\r\n+LICENSE: CC BY-NC\r\n+COMMENT: \r\n+Num Peaks: 19\r\n+74.01508\t137808\t"Theoretical m/z 74.01565, Mass diff 0 (0 ppm), Formula C6H2"\r\n+75.02295\t278714\t"Theoretical m/z 75.023475, Mass diff 0 (0 ppm), Formula C6H3"\r\n+76.03075\t6'..b'pm), SMILES C=C2CCC1CC(C)CCC1C2(C)C, Annotation [C14H24-7H]+, Rule of HR True"\r\n+187.14806\t422332\t"Theoretical m/z 187.148122, Mass diff 0 (0.33 ppm), SMILES CC2CCC1C(CCCC1(C)(C))C2(C), Annotation [C14H26-7H]+, Rule of HR True"\r\n+188.1559\t151252\t"Theoretical m/z 188.155947, Mass diff 0 (0.25 ppm), SMILES CC2CCC1C(CCCC1(C)(C))C2(C), Annotation [C14H26-6H]+, Rule of HR False"\r\n+189.12735\t68862\t"Theoretical m/z 189.127389, Mass diff 0 (0.21 ppm), SMILES O=C2C=C1CCCC(CC)C1(C)CC2, Annotation [C13H20O-3H]+, Rule of HR True"\r\n+189.16364\t163919\t"Theoretical m/z 189.163772, Mass diff 0 (0.7 ppm), SMILES CC2CCC1C(CCCC1(C)(C))C2(C), Annotation [C14H26-5H]+, Rule of HR True"\r\n+190.13504\t97146\r\n+195.11685\t57370\t"Theoretical m/z 195.117375, Mass diff 0 (0 ppm), Formula C15H15"\r\n+197.13249\t50230\t"Theoretical m/z 197.132481, Mass diff 0 (0.04 ppm), SMILES C=C3CCC2C(CCC1CCCC12)C3C, Annotation [C15H24-7H]+, Rule of HR True"\r\n+199.14803\t221936\t"Theoretical m/z 199.148122, Mass diff 0 (0.46 ppm), SMILES C=C2CCC1C(C)C(C)CCC1C2(C)C, Annotation [C15H26-7H]+, Rule of HR True"\r\n+200.15579\t108028\r\n+201.16364\t216321\t"Theoretical m/z 201.163772, Mass diff 0 (0.65 ppm), SMILES C=C2CCC1C(C)C(C)CCC1C2(C)C, Annotation [C15H26-5H]+, Rule of HR True"\r\n+202.17162\t208618\r\n+203.14304\t1200123\t"Theoretical m/z 203.143035, Mass diff 0 (0.02 ppm), SMILES OC3CCC2C3(CCC1C(C)CCCC12), Annotation [C14H24O-5H]+, Rule of HR True"\r\n+204.14627\t283454\r\n+206.16646\t32118\r\n+209.13243\t45976\t"Theoretical m/z 209.133026, Mass diff 0 (0 ppm), Formula 
C16H17"\r\n+211.14809\t272618\t"Theoretical m/z 211.148132, Mass diff 0 (-0.2 ppm), SMILES CC1=C(C)C2=C([CH+]CCC=C(C)\\C=C/2)C=C1, Annotation [C16H19]+, Rule of HR True"\r\n+212.15134\t57168\r\n+213.16373\t355360\t"Theoretical m/z 213.163773, Mass diff 0 (-0.2 ppm), SMILES CC1=C(C)C2=C([CH+]CCC=C(C)CC2)C=C1, Annotation [C16H21]+, Rule of HR True"\r\n+214.16698\t92310\r\n+215.143\t60304\t"Theoretical m/z 215.143035, Mass diff 0 (0.16 ppm), SMILES OC3CCC2C3(CCC1C(C(=C)CCC12)C), Annotation [C15H24O-5H]+, Rule of HR True"\r\n+216.15102\t55312\r\n+217.15874\t113508\t"Theoretical m/z 217.158691, Mass diff 0 (0.23 ppm), SMILES OC3CCC2C3(CCC1C2(CCCC1(C)(C))), Annotation [C15H26O-5H]+, Rule of HR True"\r\n+218.16704\t51076\r\n+226.17177\t37673\r\n+227.1797\t204277\t"Theoretical m/z 227.179433, Mass diff 0 (1.18 ppm), SMILES C=C2CCC1C(CC)C(C)CCC1C2(C)CC, Annotation [C17H30-7H]+, Rule of HR True"\r\n+228.1873\t842856\r\n+229.1588\t359919\t"Theoretical m/z 229.158691, Mass diff 0 (0.48 ppm), SMILES OC3CCC2C3(CCC1C2(CCC(=C)C1(C)(C))), Annotation [C16H26O-5H]+, Rule of HR True"\r\n+230.16186\t41138\r\n+231.17433\t428563\t"Theoretical m/z 231.174335, Mass diff 0 (0.02 ppm), SMILES O=C3C=C2CCC1C(C)CCCC1C2(C)CC3, Annotation [C16H24O-H]+, Rule of HR True"\r\n+232.17703\t61957\r\n+237.16373\t184777\t"Theoretical m/z 237.164326, Mass diff 0 (0 ppm), Formula C18H21"\r\n+238.16693\t38109\r\n+241.15854\t66162\t"Theoretical m/z 241.158691, Mass diff 0 (0.62 ppm), SMILES O=C3C=C2CCC1C(CC)CCCC1C2(C)CC3, Annotation [C17H26O-5H]+, Rule of HR True"\r\n+242.16649\t51489\r\n+245.19052\t102650\t"Theoretical m/z 245.189996, Mass diff 0.001 (2.14 ppm), SMILES OC1CCC2C3CCC(=C)C(C)(C)C3(CCC12(C)), Annotation [C17H28O-3H]+, Rule of HR True"\r\n+246.19786\t1126362\r\n+247.2011\t212107\r\n+252.18724\t143505\r\n+255.17436\t288345\t"Theoretical m/z 255.174341, Mass diff 0 (0.08 ppm), SMILES O=C3C=C2CCC1C4CCCC4(CCC1C2(C)CC3), Annotation [C18H26O-3H]+, Rule of HR 
True"\r\n+256.17764\t54890\r\n+259.16943\t50245\t"Theoretical m/z 259.169244, Mass diff 0 (0.72 ppm), SMILES O=C3C=C2CCC1C(C)C(CO)CCC1C2(C)CC3, Annotation [C17H26O2-3H]+, Rule of HR True"\r\n+260.17758\t70396\r\n+270.19791\t397018\r\n+271.20062\t89701\r\n+273.18549\t199263\t"Theoretical m/z 273.184894, Mass diff 0.001 (2.18 ppm), SMILES O=C3C=C2CCC1C4CCC(O)C4(CCC1C2(C)CC3), Annotation [C18H26O2-H]+, Rule of HR True"\r\n+274.18863\t88305\r\n+288.20841\t1123316\t"Theoretical m/z 288.208375, Mass diff 0 (0.12 ppm), SMILES O=C4C=C3CCC1C(CCC2(C)(C(O)CCC12))C3(C)CC4, Annotation [C19H28O2]+, Rule of HR False"\r\n+289.21173\t220898\r\n+\r\n+\r\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/recetox_gc-ei_ms_20201028_with_precursor_mz.msp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/recetox_gc-ei_ms_20201028_with_precursor_mz.msp Fri Jan 28 16:22:06 2022 +0000
[
b'@@ -0,0 +1,32358 @@\n+NAME: Perylene_2H12\n+SCANNUMBER: -1\n+RETENTIONTIME: -1\n+RETENTIONINDEX: 2876\n+PRECURSORMZ: 264.16858\n+PRECURSORTYPE: [M]+\n+IONMODE: Positive\n+SPECTRUMTYPE: Centroid\n+FORMULA: C20H12\n+INCHIKEY: CSHWQDPOILHKBI-AQZSQYOVSA-N\n+INCHI: \n+SMILES: [2H]C1=C(C2=C3C(=C1[2H])C4=C(C(=C(C5=C4C(=C(C(=C5[2H])[2H])[2H])C3=C(C(=C2[2H])[2H])[2H])[2H])[2H])[2H])[2H]\n+AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\n+COLLISIONENERGY: 70eV\n+INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\n+INSTRUMENTTYPE: GC-EI-Orbitrap\n+IONIZATION: EI+\n+LICENSE: CC BY-NC\n+COMMENT: \n+PRECURSOR_MZ: 264.16858\n+NUM PEAKS: 33\n+116.05576\t29277.0\n+118.06992\t49651.0\n+128.0558\t37001.0\n+130.06996\t78584.0\n+130.57159\t17533.0\n+132.08408\t65686.0\n+132.5858\t12593.0\n+207.0322\t39569.0\n+222.08282\t13141.0\n+223.06346\t20762.0\n+225.04277\t18058.0\n+227.02202\t26370.0\n+232.11204\t30354.0\n+236.1405\t22796.0\n+252.09322\t8564.0\n+256.11212\t41765.0\n+257.11557\t8688.0\n+258.12622\t21742.0\n+259.13446\t11564.0\n+260.14041\t248997.0\n+261.14358\t51721.0\n+262.15466\t33597.0\n+263.16254\t63732.0\n+264.16858\t829577.0\n+265.01968\t18286.0\n+265.17191\t176460.0\n+266.17523\t18876.0\n+283.03036\t10261.0\n+287.00632\t11352.0\n+295.10288\t26727.0\n+299.06152\t33379.0\n+359.0282\t67046.0\n+400.98447\t17406.0\n+\n+NAME: Perylene\n+SCANNUMBER: -1\n+RETENTIONTIME: -1\n+RETENTIONINDEX: 2886.9\n+PRECURSORMZ: 252.09323\n+PRECURSORTYPE: [M]+\n+IONMODE: Positive\n+SPECTRUMTYPE: Centroid\n+FORMULA: C20H12\n+INCHIKEY: CSHWQDPOILHKBI-UHFFFAOYSA-N\n+INCHI: \n+SMILES: C1=CC2=C3C(=C1)C1=CC=CC4=C1C(=CC=C4)C3=CC=C2\n+AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\n+COLLISIONENERGY: 70eV\n+INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\n+INSTRUMENTTYPE: GC-EI-Orbitrap\n+IONIZATION: EI+\n+LICENSE: CC BY-NC\n+COMMENT: \n+PRECURSOR_MZ: 252.09323\n+NUM PEAKS: 
19\n+112.03071\t49892.0\n+113.03854\t87510.0\n+124.03076\t100146.0\n+124.53242\t24923.0\n+125.03855\t179254.0\n+125.54019\t49039.0\n+126.04636\t131679.0\n+126.54804\t36313.0\n+222.04645\t28905.0\n+224.06192\t55632.0\n+226.04175\t37413.0\n+246.04646\t23286.0\n+248.06204\t140007.0\n+249.07072\t62236.0\n+250.07765\t641789.0\n+251.07967\t137600.0\n+252.09323\t1955166.0\n+253.09656\t402252.0\n+254.09985\t39987.0\n+\n+NAME: Phenanthrene_2H10\n+SCANNUMBER: -1\n+RETENTIONTIME: -1\n+RETENTIONINDEX: 1827.1\n+PRECURSORMZ: 188.14029\n+PRECURSORTYPE: [M]+\n+IONMODE: Positive\n+SPECTRUMTYPE: Centroid\n+FORMULA: C14H10\n+INCHIKEY: YNPNZTXNASCQKK-LHNTUAQVSA-N\n+INCHI: \n+SMILES: [2H]C1=C(C(=C2C(=C1[2H])C(=C(C3=C(C(=C(C(=C32)[2H])[2H])[2H])[2H])[2H])[2H])[2H])[2H]\n+AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\n+COLLISIONENERGY: 70eV\n+INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\n+INSTRUMENTTYPE: GC-EI-Orbitrap\n+IONIZATION: EI+\n+LICENSE: CC BY-NC\n+COMMENT: \n+PRECURSOR_MZ: 188.14029\n+NUM PEAKS: 17\n+76.02767\t185421.0\n+78.0418\t256858.0\n+80.05586\t881271.0\n+90.04181\t200162.0\n+92.06206\t537968.0\n+94.06999\t628791.0\n+156.08402\t836513.0\n+158.09808\t477819.0\n+160.11218\t2421148.0\n+161.11554\t310248.0\n+176.10866\t308983.0\n+184.11224\t2784543.0\n+185.11562\t445833.0\n+186.12637\t1283282.0\n+188.14029\t15115275.0\n+189.1436\t2312386.0\n+190.14688\t151400.0\n+\n+NAME: Phenanthrene\n+SCANNUMBER: -1\n+RETENTIONTIME: -1\n+RETENTIONINDEX: 1832.9\n+PRECURSORMZ: 178.0775\n+PRECURSORTYPE: [M]+\n+IONMODE: Positive\n+SPECTRUMTYPE: Centroid\n+FORMULA: C14H10\n+INCHIKEY: YNPNZTXNASCQKK-UHFFFAOYSA-N\n+INCHI: \n+SMILES: C1=CC2=C(C=C1)C1=C(C=CC=C1)C=C2\n+AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\n+COLLISIONENERGY: 70eV\n+INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\n+INSTRUMENTTYPE: GC-EI-Orbitrap\n+IONIZATION: EI+\n+LICENSE: CC BY-NC\n+COMMENT: \n+PRECURSOR_MZ: 178.0775\n+NUM PEAKS: 
19\n+74.01508\t137808.0\n+75.02295\t278714.0\n+76.03075\t608417.0\n+87.02295\t304266.0\n+88.03076\t497050.0\n+89.03857\t441168.0\n+98.01511\t150478.0\n+150.04633\t868927.0\n+151.05415\t546351.0\n+152.0619\t2275502.0\n+153.06528\t276320.0\n+169.06468\t272559.0\n+174.04636\t365846.0\n+175.05423\t272039.0\n+176.062\t3370523.0\n+177.06982\t1751846.0\n+178.0775\t13724432.0\n+179.08078\t2250119.0\n+180.08412\t138203.0\n+\n+NAME: Anthracene\n+SCANNUMBER: -1\n+RETENTIONTIME: -1\n+R'..b'9912.0\n+227.17972\t5423840.0\n+228.18791\t2914893.0\n+229.15888\t32360466.0\n+230.16203\t6384102.0\n+231.1749\t1289341.0\n+232.18314\t332775.0\n+237.16412\t482606.0\n+238.172\t1003913.0\n+239.17972\t4289875.0\n+240.18282\t790788.0\n+241.15898\t818792.0\n+243.17453\t1942474.0\n+244.18245\t6361220.0\n+245.18564\t1031445.0\n+249.16392\t573775.0\n+251.17975\t407893.0\n+252.18788\t671025.0\n+253.19528\t4724411.0\n+254.20363\t4511072.0\n+255.20648\t1121372.0\n+256.18237\t1013544.0\n+257.19034\t3573622.0\n+258.19263\t594380.0\n+263.17984\t1236644.0\n+267.17474\t902087.0\n+269.19067\t342232.0\n+270.19833\t656479.0\n+271.20621\t2697450.0\n+272.21378\t25275140.0\n+273.21713\t5337242.0\n+274.22037\t493519.0\n+278.20316\t723267.0\n+281.19022\t3078032.0\n+282.19333\t636564.0\n+285.18503\t445716.0\n+286.19318\t505550.0\n+296.21365\t3914332.0\n+297.21619\t834583.0\n+299.20071\t17845166.0\n+300.20407\t3927878.0\n+301.20691\t386280.0\n+314.22427\t14435122.0\n+315.22732\t3171411.0\n+316.23056\t354527.0\n+447.34674\t509682.0\n+\n+NAME: Testosterone\n+SCANNUMBER: -1\n+RETENTIONTIME: -1\n+RETENTIONINDEX: 2733\n+PRECURSORMZ: 288.20841\n+PRECURSORTYPE: [M]+\n+IONMODE: Positive\n+SPECTRUMTYPE: Centroid\n+FORMULA: C19H28O2\n+INCHIKEY: MUMGGOZAMZWBJJ-DYKIIFRCSA-N\n+INCHI: \n+SMILES: CC12CCC3C(C1CCC2O)CCC4=CC(=O)CCC34C\n+AUTHORS: Price et al., RECETOX, Masaryk University (CZ)\n+COLLISIONENERGY: 70eV\n+INSTRUMENT: Q Exactive GC Orbitrap GC-MS/MS\n+INSTRUMENTTYPE: GC-EI-Orbitrap\n+IONIZATION: EI+\n+LICENSE: CC 
BY-NC\n+COMMENT: \n+PRECURSOR_MZ: 288.20841\n+NUM PEAKS: 130\n+67.05424\t425856.0\n+68.05758\t32423.0\n+69.06989\t40720.0\n+77.0386\t701107.0\n+78.04644\t206546.0\n+79.05425\t1677740.0\n+80.06205\t212420.0\n+81.06992\t591913.0\n+82.07324\t87864.0\n+83.08553\t132100.0\n+91.05427\t2712295.0\n+92.05762\t347222.0\n+93.06994\t1165998.0\n+94.07777\t348187.0\n+95.08556\t843191.0\n+96.05698\t438830.0\n+97.10123\t225039.0\n+103.05426\t164013.0\n+104.06209\t107889.0\n+105.06992\t1641197.0\n+106.07773\t362834.0\n+107.04917\t231952.0\n+107.08556\t791873.0\n+108.09338\t226494.0\n+109.06484\t1377189.0\n+110.07266\t295897.0\n+111.11686\t89809.0\n+115.05426\t293808.0\n+116.06208\t54416.0\n+117.0699\t705440.0\n+118.07771\t180876.0\n+119.08557\t1042378.0\n+120.09339\t283969.0\n+121.10119\t622111.0\n+122.07263\t346341.0\n+123.08047\t632087.0\n+124.0883\t3096347.0\n+125.09164\t287870.0\n+128.06206\t220792.0\n+129.06988\t580911.0\n+130.07767\t146160.0\n+131.08559\t960647.0\n+132.09337\t265447.0\n+133.10121\t554432.0\n+134.10901\t403802.0\n+135.11685\t343774.0\n+136.1247\t198902.0\n+137.0961\t277512.0\n+138.1039\t57211.0\n+141.06987\t131615.0\n+142.07773\t123164.0\n+143.08554\t501343.0\n+144.09331\t66154.0\n+145.10117\t268116.0\n+146.10899\t254486.0\n+147.0804\t95276.0\n+147.11679\t1285762.0\n+148.12456\t421900.0\n+149.09608\t321248.0\n+150.10381\t153636.0\n+151.11175\t129271.0\n+152.062\t37808.0\n+155.08546\t103204.0\n+156.09323\t64215.0\n+158.07256\t141873.0\n+159.11679\t250012.0\n+160.08816\t145963.0\n+161.13245\t257830.0\n+162.10376\t195492.0\n+163.14809\t122973.0\n+164.11951\t206339.0\n+165.12733\t237526.0\n+169.10114\t92813.0\n+171.11676\t144863.0\n+172.08818\t132181.0\n+173.1324\t250167.0\n+174.10378\t253404.0\n+175.11162\t210353.0\n+176.11943\t88738.0\n+177.1637\t38439.0\n+183.11676\t46215.0\n+185.13243\t817797.0\n+187.14806\t422332.0\n+188.1559\t151252.0\n+189.12735\t68862.0\n+189.16364\t163919.0\n+190.13504\t97146.0\n+195.11685\t57370.0\n+197.13249\t50230.0\n+199.14803\t221936.
0\n+200.15579\t108028.0\n+201.16364\t216321.0\n+202.17162\t208618.0\n+203.14304\t1200123.0\n+204.14627\t283454.0\n+206.16646\t32118.0\n+209.13243\t45976.0\n+211.14809\t272618.0\n+212.15134\t57168.0\n+213.16373\t355360.0\n+214.16698\t92310.0\n+215.143\t60304.0\n+216.15102\t55312.0\n+217.15874\t113508.0\n+218.16704\t51076.0\n+226.17177\t37673.0\n+227.1797\t204277.0\n+228.1873\t842856.0\n+229.1588\t359919.0\n+230.16186\t41138.0\n+231.17433\t428563.0\n+232.17703\t61957.0\n+237.16373\t184777.0\n+238.16693\t38109.0\n+241.15854\t66162.0\n+242.16649\t51489.0\n+245.19052\t102650.0\n+246.19786\t1126362.0\n+247.2011\t212107.0\n+252.18724\t143505.0\n+255.17436\t288345.0\n+256.17764\t54890.0\n+259.16943\t50245.0\n+260.17758\t70396.0\n+270.19791\t397018.0\n+271.20062\t89701.0\n+273.18549\t199263.0\n+274.18863\t88305.0\n+288.20841\t1123316.0\n+289.21173\t220898.0\n+\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/scores_test1_out.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/scores_test1_out.tsv Fri Jan 28 16:22:06 2022 +0000
b
b'@@ -0,0 +1,175 @@\n+\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n+C001\t1.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.01131824210476606\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.048050183216295894\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+C002\t0.0\t1.0\t0.0\t
0.0\t0.0\t0.0\t0.0\t9.826519226227062e-05\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.058818978905494305\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.012123553350886735\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.003604401443170206\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+C003\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.001996725260781092\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.003441767933265955\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+C004\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0
\t0.0\t0.0\t0.0\t0.0\t2.962804993140071e-05\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0040278645118103865\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+C005\t0.0\t0.0\t0.0\t0.0\t0.9999999999999992\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t'..b'.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.18149359661870704\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+C170\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.2793597601790586\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0
\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\t0.0\n+C171\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.030541540271258622\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\n+C172\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.9156381551854462\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.
0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\n+C173\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.00045173712879657656\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.14221557456489292\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\n+C174\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/scores_test3_out.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/scores_test3_out.tsv Fri Jan 28 16:22:06 2022 +0000
b
b'@@ -0,0 +1,387 @@\n+\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n+Perylene_2H12\t0.0\t0.0\t0.0005256270959446041\t0.0\t0.03073097535576865\t0.0\t0.0\t6.245570704427149e-05\t0.0\t0.0\t0.0\t0.0\t0.004564716964324222\t0.0\t0.0\t0.013203066603708824\t0.0\t0.0\t0.0\t0.00039214513461787934\t0.0\t0.0\t0.0007918167287744314\t0.0\t0.0\t0.0004447561432835879\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.014053019016690342\t0.0\t0.0\t0.0\t0.0\t0.0\t0.010864712316628122\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.1457986453664692\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.07136533213674005\t0.0\t0.0\t0.0\t0.0\t0.0\t0.008502864326957613\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.008332485011325066\t0.06707997408159612\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.014331972335452473\t0.0\t0.00279044697331512\t0.0\t0.0\t0.0\t0.0\t0.08644538826313944\t0.0\t0.0230
223502665467\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.05194618366505897\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.07451431952403163\t0.0\t0.0\t0.0\t0.0\t0.008606424963572753\t0.0\t0.0\t0.0\t0.0\t0.0\t0.029465908012253836\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.06765194944236241\t0.0\t0.0\n+Perylene\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0032741303817077237\t0.0\t0.01059895859620056\t0.0\t0.0\t0.011988179251417755\t0.004445067503941489\t0.0\t0.0\t0.0\t0.0\t0.0\t0.010205422020394999\t0.0\t0.0\t0.07094451588225481\t0.0\t0.0\t0.0012435925952213776\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0028113782310797255\t0.0\t0.0\t0.0015057844692663734\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.015722861787553524\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.04875136828344371\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.023395854503055747\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.07014255094522087\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+Phenanthrene_2H10\t0.0024478437470211957\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.044583058787688194\t0.0\t0.0\t0.010556784103056164\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.053243824199748255\t0.0\t0.7408591267092633\t0.0\t0.0\t0.0\t0.0\t0.12202560685242986\t0.04568269717012136\t0.004157278401108382\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\
t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.028649962860904238\t0.0\t0.0391645806143903\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.008485163950429123\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.004892255878207329\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.027071584755955534\t0.0\t0.0\t0.0\n+Phenanthrene\t0.00561720665430217\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0014924956391185538\t0.12453944133920959\t0.0\t0.087078422418'..b'5369148999\t0.0\t0.0\t0.0\t0.05477359359289294\t0.014982137997848574\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.011712224528606202\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+Progesterone\t0.009204773873174418\t0.0003433200025161085\t0.0\t0.0007924296222333302\t0.0\t0.0\t0.009441153443328694\t0.005947519671344408\t0.0\t0.0005356814581771544\t0.006215857342936553\t0.0\t0.009417667003961789\t0.009918679539108183\t0.00023339501999512072\t0.02671768716952186\t0.00030790986345821436\t0.0\t0.0\t0.0013743163821902838\t0.01723317359032806\t0.0\t0.031565466787107484\t0.012448459343477094\t0.0\t0.007750527312298496\t0.0070234525583043545\t0.02059761160321701\t0.023913761352649478\t0.011281962106545012\t1.6426994248357484e-05\t0.0\t0.03697516657930819\t0.033662224880288756\t0.0\t0.0\t0.023540677910418206\t0.0\t0.036138976947232074\t0.02542494090112982\t0.0\t0.0\t0.011503400057545196\t0.0\t0.00020822196303031898\t0.0\t0.0\t0.0\t0.0\t0.0014763317286047445\t0.0\t0.0012583838846539634\t0.0\t0.003999037208194656\t0.013710430439412245\t0.0013524730258847118\t0.007867754340786993\t0.040527384587716785\t0.010996257146538806\t0.0\t0.0\t0.06835446607134321\t0.0\t0.0\t0.008591363167784043\t0.0\t0.0\t0.0\t0.0\t0.0\t0.007090284250167511\t0.008465564938609326\t0.080408
14196887734\t0.0\t0.028294996723359764\t0.0\t0.0\t0.0038398141926578064\t0.16023981186600048\t0.04805946943116568\t0.037035561711554706\t0.0\t0.0005120942309216829\t0.0\t0.0\t0.03494182656191998\t0.0\t0.0\t0.027888357150312005\t0.01258535522221259\t0.03740123828771993\t0.008517825868349588\t0.00913703375472102\t0.0\t0.0\t0.0\t0.0\t0.0\t0.029300775267851735\t0.0\t0.0\t0.0\t0.01295087988307018\t0.0005955124138932553\t0.0\t0.0\t0.0\t0.005304965226057589\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.039134050766579234\t0.2714869727438596\t0.003527160692631183\t0.0\t0.0\t0.020497841819279862\t0.0\t0.002511329287084922\t0.0\t0.3500845873047567\t0.0\t0.002239902702309837\t0.0\t0.005491138035803363\t0.0\t0.0\t0.011672805021412769\t0.02568290039984708\t0.07006608189710377\t0.018632962351792192\t0.0\t0.04153373284622605\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.00786791970310509\t0.0\t0.047481418502903334\t0.0\t0.0\t0.0\t0.10974594417370813\t0.034291658672408076\t0.0\t0.023165391809283516\t0.0\t0.0\t0.0\t0.0002833417563650782\t0.0\t0.0\t0.0\t0.026807362599866824\t0.003975994609085822\t0.0\t0.0\t0.0\t0.0\t0.0\t0.06458445415629567\t0.013061309028202963\t0.0\t0.0\n+Testosterone\t0.00963321193050066\t0.00024864315729290006\t0.0\t0.00023222574210458811\t0.0009261428396286391\t0.0\t0.0\t0.00040034384039336243\t0.0\t6.734322542065858e-05\t0.0016889974488375878\t0.0\t0.1780813812315969\t0.007271975837211051\t0.0001534940265342155\t0.027912903539727703\t0.0\t0.0\t0.0\t0.0005797401705402813\t0.01109882605223559\t0.0\t0.024485309434567656\t0.020836980610370613\t0.0\t0.004730656796420955\t0.009055625850088012\t0.01764485751937845\t0.0342974876068616\t0.003171910470299864\t0.0\t0.0\t0.039580956813763224\t0.008699485073663131\t0.0\t0.0\t0.027921629937492445\t0.0\t0.011883152521337894\t0.00473955367711716\t0.0\t0.0\t0.06041370798509162\t0.0\t0.042697154051077546\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0028714022903154834\t0.021418156386493012\t0.0015186515255164064\t0.006270179831850896\t0
.029915893967898583\t0.00688460931497788\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.001333543171051696\t0.0\t0.08702752210600657\t0.0\t0.03171198034450119\t0.0\t0.0\t0.0\t0.0\t0.0007660193758873158\t0.010813507002141582\t0.0\t0.0\t0.0\t0.0\t0.004200894168035819\t0.0\t0.0\t0.02349484368553467\t0.01816654272894712\t0.06339867284692742\t0.00859117181156952\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.11646566920503162\t0.0\t0.0\t0.0\t0.0\t0.0031342530947578136\t0.0\t0.15489171142643712\t0.0\t0.013048242174815912\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.001658310433454475\t0.03949452321180806\t0.0\t0.0\t0.0\t0.021990926351807643\t0.0\t0.13014922112429483\t0.0\t0.18331721895001493\t0.0\t0.0014411200837741657\t0.0\t0.0\t0.0\t0.0\t0.010921053413542842\t0.00943243671087211\t0.06421886680272976\t0.025882956568067213\t0.0\t0.03618383380922253\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0006655628265325035\t0.0\t0.026485058850513155\t0.0\t0.0\t0.0\t0.10783284756046711\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.12344754627650137\t0.0\t0.0\t0.0\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/scores_test4_out.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/scores_test4_out.tsv Fri Jan 28 16:22:06 2022 +0000
[
b"@@ -0,0 +1,387 @@\n+\tPerylene_2H12\tPerylene\tPhenanthrene_2H10\tPhenanthrene\tAnthracene\tAcenaphthylene\tAcenaphthene\tFluoranthene\tPyrene\tpara-Terphenyl\tRetene\tBenzo[b]naphtho[2,1-d]thiophene\t2,3-Benzofluorene\tBenzo[ghi]fluoranthene\tTriphenylene\tBenzanthracene/Benzophenanthrene\tBenzofluoranthene\tBenzo(k)fluoranthene\tBenzo[e]pyrene\tBenzo(a)pyrene\tIndeno[1,2,3-cd]pyrene\tBenzo(g,h,i)perylene\tAnthanthrene\tDibenzanthracene\tCoronene\tDicofol\tBenzophenone\t2-tert-Butyl-4-methoxyphenol\tButylated hydroxytoluene\tBumetrizole\t4-Methylbenzophenone\t2,4,6-Tribromophenol\t2,6-Dichloro-4-nitroaniline\t1-Methylphenanthrene\tTriclosan\tDrometrizole\tEnzacamene\t2,4-Di-tert-butyl-6-(5-chloro-2H-benzotriazol-2-yl)phenol\tOctrizole\t1,2,7,9-Tetrachlorodibenzofuran\t2,2',3,4,5,5',6-Heptachlorobiphenyl\t2,4,6-Trichlorobiphenyl\t2,2',3,3',4,5',6,6'-Octachlorobiphenyl\tMirex\tbeta-Hexachlorocyclohexane\talpha-1,2,3,4,5,6-Hexachlorocyclohexane\tLindane\tdelta-Hexachlorocyclohexane\tepsilon-Hexachlorocyclohexane\tPentachlorobenzene\tHexachlorobenzene\t2,4'-Dichlorodiphenyldichloroethylene\t2,4'-Dichlorodiphenyldichloroethane\t2,4'-Dichlorodiphenyltrichloroethane\t1,2,7,9-Tetrachlorodibenzo-p-dioxin\t2,4,4'-Trichlorobiphenyl\t2,2',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5-Pentachlorobiphenyl\t2,2',3,4,4',5'-Hexachlorobiphenyl\t2,2',4,4',5,5'-Hexachlorobiphenyl\t2,2',3,4,4',5,5'-Heptachlorobiphenyl\t2,2',5,5'-Tetrachlorobiphenyl\t2,3',4,6-Tetrachlorobiphenyl\t2,3',5',6-Tetrachlorobiphenyl\t2,2',3,4',5-Pentachlorobiphenyl\t2,3,3',4,5-Pentachlorobiphenyl\t3,3',4,5,5'-Pentachlorobiphenyl\t2,3',4,4',5',6-Hexachlorobiphenyl\t2,3,3',4,5,6-Hexachlorobiphenyl\t2,3,3',4',5',6-Hexachlorobiphenyl\t2,3,3',4',5,6-Hexachlorobiphenyl\t2,3,3',4',5,5',6-Heptachlorobiphenyl\tcis-Prallethrin\ttrans-Prallethrin\tcis-Resmethrin\ttrans-Resmethrin\tcis-Tetramethrin\ttrans-Tetramethrin\tBifenthrin\tFenpropathrin\tcis-Phenothrin\ttrans-Phenothrin\tcis-Cyphenothrin\ttrans-Cyphenothrin\tFlucythri
nate_isomer1\tFlucythrinate_isomer2\tcis-Fenvalerate\ttrans-Fenvalerate\tDeltamethrin\tChlorpyrifos oxon\tlambda-Cyhalothrin\tTefluthrin\tTransfluthrin\tcis-Permethrin\ttrans-Permethrin\tcis-Allethrin\ttrans-Allethrin\tcis-Cypermethrin_isomer1\ttrans-Cypermethrin_isomer1\tcis-Cypermethrin_isomer2\ttrans-Cypermethrin_isomer2\tcis-Cyfluthrin_isomer1\ttrans-Cyfluthrin_isomer1\tcis-Cyfluthrin_isomer2\ttrans-Cyfluthrin_Isomer2\t1,2,3,4,7,8-Hexachlorodibenzo-p-dioxin\t1,2,3,4,6,7,8-Heptachlorodibenzo-p-dioxin\tOctachlorodibenzo-p-dioxin\tOctachlorodibenzofuran\t1,2,3,7,8-Pentachlorodibenzofuran\t1,2,3,4,7,8-Hexachlorodibenzofuran\t1,2,3,4,6,7,8-Heptachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzofuran\t2,3,7,8-Tetrachlorodibenzo-p-dioxin\t1,2,3,7,8-Pentachlorodibenzo-p-dioxin\t2,3,4,5-Tetrabromo-6-chlorotoluene\t2,3,4,5,6-Pentabromotoluene\t2,3,4,5,6-Pentabromoethylbenzene\t2,3,5,6-Tetrabromo-p-xylene\tAllyl 2,4,6-tribromophenyl ether\t2-Bromoallyl(2,4,6-tribromophenyl) ether\tPentabromobenzene\tHexabromobenzene\t2,3,4,5,6-Pentabromobenzyl alcohol\t2-Ethylhexyl 2,3,4,5-Tetrabromobenzoate\tsyn-Dechlorane plus\tanti-Dechlorane plus\talpha-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\tbeta-1,2-Dibromo-4-(1,2-dibromoethyl)cyclohexane\t1,2,5,6-Tetrabromocyclooctane\t1,1-Dibromo-2,3,3,4,4,5-hexachloro-2-cyclopenta-2,4-dien-1-ylcyclooctane\talpha-Amylcinnamaldehyde\ttrans-Cinnamaldehyde\tCitral (Geranial)\t1-Fluronaphthalene\talpha-Hexylcinnamaldehyde\tLilial\talpha-Amylcinnamyl alcohol\tEugenol\tIsoeugenol\t4-Methoxybenzyl alcohol\tMethyleugenol\tCinnamyl alcohol\tBenzyl alcohol\tEstragole\tBenzyl benzoate\tBenzyl cinnamate\tBenzyl salicylate\tCamphor\tEucalyptol\tCoumarin\tLimonene\tIsomethyl-alpha-ionone\tdelta-Iraldeine\tSafrole\tCashmeran\tCelestolide\tPhantolide\tTonalide\tTraseolide\tGalaxolide\tAldrin\tEndosulfan\tHeptachlor\tcis-Heptachlor epoxide\tEndosulfan sulphate\tEndrin ketone\ttrans-Chlordane\tcis-Chlordane\tEndrin 
aldehyde\tEndrin\t4,4'-Dichlorodiphenyldichloroethylene\tMethoxychlor\t4,4'-Dichlorodiphenyldichloroethane\t4,4'-Dichlorodiphenyltrichloroethane\tTris(4-tert-butylphenyl) phosphate\tTri-n-butyl-phosphate\tTris(1,3-dichloro-2-propy"..b'99004\t0.25699522150266857\t0.10086896866641386\t0.19470204063894617\t0.11098877289750769\t0.006075991834095414\t0.12927366381808264\t0.2082286991025265\t0.27240094810916426\t0.1654349689057302\t0.19840999142874\t0.16569982850423232\t0.2161122709425279\t0.14188794086609754\t0.13892041895889107\t0.163316162934255\t0.19714612348281121\t0.11328276368401106\t0.1797393737639574\t0.11912510425789868\t0.1513410655357927\t0.17376963876857818\t0.11727276196549535\t0.18242398225791773\t0.42587475586474854\t0.26019712746688456\t0.14368704499704515\t0.2071878076412335\t0.09453837918890001\t0.17883495196186588\t0.230407695094039\t0.2003708220640954\t0.28221288790938787\t0.1632240149541304\t0.33569524175870596\t0.3064105089065634\t0.06757663229398125\t0.1875387758604876\t0.14809372567415943\t0.0852574772349589\t0.038518437729193764\t0.1694183013806351\t0.15289185256222845\t0.1323269305931256\t0.14183815846488648\t0.11892832652180535\t0.12040055943475189\t0.055133306975097635\t0.059734777165814525\t0.0566711436003959\t0.10411276944449463\t0.09983202384693853\t0.038921466584489514\t0.0866119306764878\t0.06992238111265867\t0.09431159408139042\t0.0938643626333852\t0.08034523157647287\t0.30621301093750836\t0.1961893280957181\t0.1611360617918086\t0.23758939346985095\t0.12271395237074852\t0.1430157698712594\t0.0833933983294341\t0.035843502317569234\t0.1633740133739675\t0.1483671806190231\t0.13613729576468475\t0.13641339521522466\t0.10219746530932572\t0.24528101783913517\t0.22010021314888892\t0.17232404535039347\t0.17930641471345765\t0.15547769438760414\t0.1764623247344844\t0.08065948881320073\t0.19144552461877729\t0.3183099871734532\t0.06306342224555873\t0.05987974210984678\t0.05740354384209485\t0.20721138046115542\t0.328456758896439\t0.32098885468030136\t
0.23821868337793292\t0.07145396369303544\t0.19081119513093286\t0.057616601871621285\t0.2340183931599587\t0.23822558856834722\t0.06797270073648182\t0.43003853617809873\t0.02792424887822149\t0.18822156250959438\t0.16114686619257262\t0.22810608062777601\t0.0838224184080167\t0.08443319924123477\t0.1894850392430079\t0.265083072227541\t0.10874839217026484\t0.21783385621466414\t0.006793839193263404\t0.08475249990448121\t0.12988582068761828\t0.2837084520725496\t0.07764215735572715\t0.08398679648212394\t0.09380315448372266\t0.21450922103222061\t0.27742281155579906\t0.04435157844941482\t0.35472454340204307\t0.3010423011492258\t0.06572111033523048\t0.35449933960739016\t0.184212014644299\t0.16510341696367972\t0.22650136131747978\t0.08545503348016772\t0.054746540083621745\t0.07158142375321293\t0.05222918108605921\t0.29873505869435935\t0.1592048730563699\t0.12242150172343544\t0.06834825436267856\t0.11787482883203612\t0.06533075716795377\t0.29220597270428633\t0.3204987910247821\t0.23075740046511872\t0.16013387140172308\t0.1031810078648983\t0.11609557607181138\t0.06536501695877456\t0.07528353746322132\t0.14631099884719126\t0.31686299036015636\t0.15686508283056178\t0.2502894060505306\t0.15632555985381263\t0.06157073783891902\t0.17850524434839174\t0.15082352190116588\t0.10496525194001774\t0.0328681907045638\t0.24179240409750177\t0.20560588522808376\t0.2271655674450096\t0.218989372412798\t0.09854462852017379\t0.1117782001836314\t0.32586231433297036\t0.16492586594387235\t0.1863221551020623\t0.23621550072877454\t0.12483921692480258\t0.16889581762525904\t0.03249926663036536\t0.015295084861858975\t0.20368054392043403\t0.18965962379608556\t0.1016530064450796\t0.12816683398762763\t0.06555661306024704\t0.022930759762077174\t0.019231613914197573\t0.15747279820504434\t0.088105124422038\t0.34732800952940357\t0.12915213761674713\t0.026497694389320044\t0.07320003712462311\t0.15992895420273134\t0.04418658553634053\t0.22031587132600947\t0.10334439566995825\t0.054857312240601364\t0.14588090116315752
\t0.0720775597079632\t0.2322377084263006\t0.009182131128330325\t0.08725499132616112\t0.23335439715459685\t0.26456927574996886\t0.20593724958472245\t0.16953436023943352\t0.2915911520785385\t0.1972305838560561\t0.061557676013784396\t0.08503438513801481\t0.16053915107475406\t0.14738299237590127\t0.3485715331892874\t0.331614755581215\t0.149139047638064\t0.14441111333967438\t0.3881349843527812\t0.3574090148392564\t0.8662836910447197\t1.0\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/similarity/scores_test5_out.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/similarity/scores_test5_out.tsv Fri Jan 28 16:22:06 2022 +0000
b
b'@@ -0,0 +1,175 @@\n+\tC001\tC002\tC003\tC004\tC005\tC006\tC007\tC008\tC009\tC010\tC011\tC012\tC013\tC014\tC015\tC016\tC017\tC018\tC019\tC020\tC021\tC022\tC023\tC024\tC025\tC026\tC027\tC028\tC029\tC030\tC031\tC032\tC033\tC034\tC035\tC036\tC037\tC038\tC039\tC040\tC041\tC042\tC043\tC044\tC045\tC046\tC047\tC048\tC049\tC050\tC051\tC052\tC053\tC054\tC055\tC056\tC057\tC058\tC059\tC060\tC061\tC062\tC063\tC064\tC065\tC066\tC067\tC068\tC069\tC070\tC071\tC072\tC073\tC074\tC075\tC076\tC077\tC078\tC079\tC080\tC081\tC082\tC083\tC084\tC085\tC086\tC087\tC088\tC089\tC090\tC091\tC092\tC093\tC094\tC095\tC096\tC097\tC098\tC099\tC100\tC101\tC102\tC103\tC104\tC105\tC106\tC107\tC108\tC109\tC110\tC111\tC112\tC113\tC114\tC115\tC116\tC117\tC118\tC119\tC120\tC121\tC122\tC123\tC124\tC125\tC126\tC127\tC128\tC129\tC130\tC131\tC132\tC133\tC134\tC135\tC136\tC137\tC138\tC139\tC140\tC141\tC142\tC143\tC144\tC145\tC146\tC147\tC148\tC149\tC150\tC151\tC152\tC153\tC154\tC155\tC156\tC157\tC158\tC159\tC160\tC161\tC162\tC163\tC164\tC165\tC166\tC167\tC168\tC169\tC170\tC171\tC172\tC173\tC174\n+C001\t1.0000000000000002\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.011318242104766061\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0480501832162959\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+C002\t0
.0\t1.0\t0.0\t0.0\t0.0\t0.0\t0.0\t9.826519226227063e-05\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.05881897890549432\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.012123553350886737\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0036044014431702073\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+C003\t0.0\t0.0\t0.9999999999999999\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.001996725260781092\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0034417679332659546\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+C004\t0.0\t0.0\t0.0\t0.9999999999999998\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0
\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t2.96280499314007e-05\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0040278645118103865\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\n+C005\t0.0\t0.0\t0.0\t0.0\t0.9999999999999999\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t'..b'0.0\t0.0\t0.0\t0.0\t0.18149359661870704\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.9999999999999998\t0.0\t0.0\t0.0\t0.0\t0.0\n+C170\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.2793597601790586\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0
\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0\t0.0\t0.0\t0.0\t0.0\n+C171\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.030541540271258626\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0000000000000002\t0.0\t0.0\t0.0\n+C172\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.9156381551854463\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.
0\t1.0000000000000002\t0.0\t0.0\n+C173\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.00045173712879657656\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.14221557456489292\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0000000000000002\t0.0\n+C174\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t0.0\t1.0000000000000002\n'
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/test2_threshold_formatting.tsv
--- a/test-data/test2_threshold_formatting.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
@@ -1,19 +0,0 @@
-query reference matches score
-C007 Benzo[b]naphtho[2,1-d]thiophene 3 0.4302304171927885
-C023 Butylated hydroxytoluene 3 0.4899347755610658
-C016 Drometrizole 3 0.5535081364244014
-C040 Deltamethrin 4 0.5995685829585914
-C040 cis-Cypermethrin_isomer1 3 0.7514936043388737
-C040 cis-Cypermethrin_isomer2 3 0.6205879323732599
-C043 Carbofuran phenol 3 0.5173781620618291
-C023 Alachlor 4 0.4289634841639738
-C012 Chlorpyrifos 3 0.43976068904478827
-C016 Atrazine 5 0.4399647084473271
-C029 Metolachlor 3 0.8624580271763471
-C073 Praziquantel 3 0.6840766738581763
-C034 Carbaryl 3 0.4781026376526427
-C043 Carbofuran 3 0.5212598550187718
-C013 Indoxacarb 5 0.4827488304818007
-C073 Oxadixyl 4 0.7910256109540179
-C073 Amitraz 4 0.5270236660009217
-C008 Spirotetramat 5 0.40641914075077024
b
diff -r f06923bdd2f2 -r c3dd958cc4a5 test-data/test2_topk_formatting.tsv
--- a/test-data/test2_topk_formatting.tsv Mon Jan 10 12:21:43 2022 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b"@@ -1,523 +0,0 @@\n-query\treference\tmatches\tscore\n-C001\tChlorpyrifos\t7\t0.2439698460078672\n-C001\ttrans-Chlordane\t10\t0.1709889053423956\n-C001\tcis-Chlordane\t10\t0.16934374734008048\n-C002\tCarfentrazone-ethyl\t1\t0.023438813553203555\n-C002\t2,2',3,3',4,5',6,6'-Octachlorobiphenyl\t2\t0.012935401162453864\n-C002\tPyridaben\t4\t0.011168624908917228\n-C003\tPerylene_2H12\t2\t0.0005256270959446041\n-C003\tMetalaxyl\t1\t1.7567415612900304e-06\n-C003\tPerylene\t0\t0.0\n-C004\t17-alpha-Ethynylestradiol\t2\t0.002716713573623163\n-C004\tCoronene\t1\t0.0009680981940665212\n-C004\tProgesterone\t2\t0.0007924296222333303\n-C005\tTetraconazole\t3\t0.12154746411094572\n-C005\tSulfentrazone\t1\t0.05393598836706972\n-C005\tIndoxacarb\t1\t0.0441412960627566\n-C006\tTris(4-tert-butylphenyl) phosphate\t2\t0.12426514943875827\n-C006\tPerylene_2H12\t0\t0.0\n-C006\tPerylene\t0\t0.0\n-C007\tBenzo[b]naphtho[2,1-d]thiophene\t3\t0.4302304171927885\n-C007\t2-Chlorobiphenyl\t2\t0.30327152545734354\n-C007\tRetene\t3\t0.16318259462298138\n-C008\tSpirotetramat\t5\t0.40641914075077024\n-C008\tEthofumesate\t4\t0.17576877383827938\n-C008\t2,4-Di-tert-butyl-6-(5-chloro-2H-benzotriazol-2-yl)phenol\t3\t0.1419543758042326\n-C009\tPicoxystrobin\t1\t0.0006870380110630028\n-C009\tTris(isopropylphenyl)phosphate\t1\t0.00023550942343171069\n-C009\tTebufenpyrad\t1\t0.00017257075992195458\n-C010\tcis-Permethrin\t1\t0.008724226797557697\n-C010\ttrans-Permethrin\t1\t0.008418860878033153\n-C010\tcis-Phenothrin\t1\t0.005882714253167312\n-C011\tFuberidazole\t1\t0.2308319926807784\n-C011\tPrometryn\t2\t0.1773186209832549\n-C011\tBenzoximate\t1\t0.07676637011355666\n-C012\tChlorpyrifos\t3\t0.43976068904478827\n-C012\tTerbufos\t1\t0.4006683041096004\n-C012\t2,6-Dichloro-4-nitroaniline\t1\t0.20998341159494333\n-C013\tIndoxacarb\t5\t0.4827488304818007\n-C013\tTemephos\t2\t0.32810153796559577\n-C013\tNuarimol\t2\t0.2936210041931014\n-C014\tChlorferone\t1\t0.5119124308782732\n-C014\tPiperonyl 
butoxide\t1\t0.4857177881241794\n-C014\t2,6-Dichloro-4-nitroaniline\t2\t0.33898957004708385\n-C015\tMetazachlor\t1\t0.0011434403294572687\n-C015\talpha-Amylcinnamyl alcohol\t1\t0.0005805859933790689\n-C015\tPendimethalin\t1\t0.0005015386924657569\n-C016\tDrometrizole\t3\t0.5535081364244014\n-C016\tAcenaphthylene\t2\t0.540073031173669\n-C016\tAtrazine\t5\t0.4399647084473271\n-C017\t4-tert-Octylphenol\t1\t0.9088788152148044\n-C017\tPropargite_isomer2\t1\t0.8953233485170952\n-C017\tPropargite_isomer1\t1\t0.8942159049307404\n-C018\tTris(4-tert-butylphenyl) phosphate\t1\t0.189695375366971\n-C018\tPerylene_2H12\t0\t0.0\n-C018\tPerylene\t0\t0.0\n-C019\tTriclosan\t1\t0.13434903881343435\n-C019\tTerbufos\t1\t0.08080384965580391\n-C019\tEpoxiconazole\t2\t0.07313225916488224\n-C020\tTris(isopropylphenyl)phosphate\t2\t0.2520159660977677\n-C020\tAmitraz\t2\t0.1245102870796828\n-C020\tMetribuzin\t1\t0.05224979683560159\n-C021\tTebuthiuron\t2\t0.9340205348244696\n-C021\t1,5-Dimethylnaphthalene\t1\t0.6803608761410861\n-C021\t2,6-Dimethylnaphthalene\t1\t0.6264160291669295\n-C022\t2-Bromoallyl(2,4,6-tribromophenyl) ether\t1\t0.11311229152083695\n-C022\t2,3,4,5,6-Pentabromobenzyl alcohol\t2\t0.07003350703850979\n-C022\tAllyl 2,4,6-tribromophenyl ether\t1\t0.06571493640420596\n-C023\tPhenanthrene_2H10\t1\t0.7408591267092633\n-C023\t2-Chlorobiphenyl\t1\t0.6159214014775711\n-C023\tButylated hydroxytoluene\t3\t0.4899347755610658\n-C024\tMepronil\t2\t0.18000248105004787\n-C024\tSpirotetramat\t8\t0.17523909122675907\n-C024\tEstrone\t7\t0.17146514923780354\n-C025\tTris(4-tert-butylphenyl) phosphate\t2\t0.2957673370199089\n-C025\tPerylene_2H12\t0\t0.0\n-C025\tPerylene\t0\t0.0\n-C026\tIsodecyl diphenyl 
phosphate\t2\t0.4122773057565717\n-C026\tDicofol\t1\t0.32235849897575225\n-C026\tTris(isopropylphenyl)phosphate\t2\t0.18207675907106227\n-C027\tFenobucarb\t1\t0.058048257187677615\n-C027\tIsoprocarb\t1\t0.056638368345330564\n-C027\tDioxacarb\t1\t0.041723437047250914\n-C028\tPhosmet\t1\t0.7848313885767587\n-C028\tAlachlor\t1\t0.5400260886224933\n-C028\tButafenacil\t2\t0.5287006460619553\n-C029\tMetolachlor\t3\t0.8624580271763471\n-C029\tSafrole\t2\t0.591167446764124\n-C029\tAmitraz\t2\t0.4100617029164697\n-C030\tEthofumesate\t2\t0.1283368182166788\n-C030\tIprovalicarb isomer 1\t1\t0.1278518291141877\n-C030\tAcephate\t4\t0.12723099231343524\n-C031\tProgesterone\t1\t1.642699424"..b"\n-C138\tPhenanthrene_2H10\t0\t0.0\n-C139\tPerylene_2H12\t0\t0.0\n-C139\tPerylene\t0\t0.0\n-C139\tPhenanthrene_2H10\t0\t0.0\n-C140\tRotenone\t1\t0.0015990284859575886\n-C140\tPerylene_2H12\t0\t0.0\n-C140\tPerylene\t0\t0.0\n-C141\tTebufenpyrad\t2\t0.2938100129854653\n-C141\tTris(isopropylphenyl)phosphate\t2\t0.020202034111700597\n-C141\tIpconazole\t1\t0.017041584156450424\n-C142\tPerylene_2H12\t0\t0.0\n-C142\tPerylene\t0\t0.0\n-C142\tPhenanthrene_2H10\t0\t0.0\n-C143\tDimethomorph_isomer2\t1\t0.16685279162562694\n-C143\tDimethomorph _isomer1\t1\t0.16482807037456434\n-C143\t2,3,4,5,6-Pentabromotoluene\t1\t0.032682863992618404\n-C144\tEtoxazole\t2\t0.1027909809180103\n-C144\t2,4-Di-tert-butyl-6-(5-chloro-2H-benzotriazol-2-yl)phenol\t2\t0.04732776045289416\n-C144\tAzoxystrobin\t2\t0.035630773587232864\n-C145\tPerylene_2H12\t0\t0.0\n-C145\tPerylene\t0\t0.0\n-C145\tPhenanthrene_2H10\t0\t0.0\n-C146\tPropargite_isomer1\t1\t0.0633083562823998\n-C146\tPropargite_isomer2\t1\t0.05654738208679003\n-C146\t2,2',3,3',4,5',6,6'-Octachlorobiphenyl\t1\t0.035712333462604294\n-C147\t2,2',3,4,4',5',6-Heptabromodiphenyl 
ether\t1\t0.03047378825096018\n-C147\tChlorferone\t1\t0.01855122445019196\n-C147\tProgesterone\t2\t0.007867919703105094\n-C148\tBuprofezin\t1\t0.01875857752389424\n-C148\tPerylene_2H12\t0\t0.0\n-C148\tPerylene\t0\t0.0\n-C149\tMetalaxyl\t2\t0.29742589743178666\n-C149\t1,4-Naphthoquinone\t1\t0.2740480911849054\n-C149\tPraziquantel\t1\t0.260732240603901\n-C150\ttrans-Prallethrin\t1\t0.00633664692361121\n-C150\tPerylene_2H12\t0\t0.0\n-C150\tPerylene\t0\t0.0\n-C151\tSpirotetramat\t1\t0.011452966094891676\n-C151\tPerylene_2H12\t0\t0.0\n-C151\tPerylene\t0\t0.0\n-C152\tTris(3,5-xylenyl)phosphate\t1\t0.05756111981021594\n-C152\tTris(isopropylphenyl)phosphate\t1\t0.0449470954588726\n-C152\tPerylene_2H12\t0\t0.0\n-C153\tEthiofencarb\t1\t0.8284613374855048\n-C153\t1,1-Dibromo-2,3,3,4,4,5-hexachloro-2-cyclopenta-2,4-dien-1-ylcyclooctane\t1\t0.4257874890609336\n-C153\tIsomethyl-alpha-ionone\t1\t0.36103138237616267\n-C154\t7,12-Dimethylbenz[a]anthracene\t1\t0.29226381053937395\n-C154\tEnzacamene\t1\t0.14396940230197552\n-C154\tTriflumizole\t1\t0.10858411907186044\n-C155\tPerylene_2H12\t0\t0.0\n-C155\tPerylene\t0\t0.0\n-C155\tPhenanthrene_2H10\t0\t0.0\n-C156\t7,12-Dimethylbenz[a]anthracene\t1\t0.08248293081186396\n-C156\tMethoprotryne\t1\t0.0432082364937662\n-C156\tProgesterone\t1\t0.02316539180928352\n-C157\tPerylene_2H12\t0\t0.0\n-C157\tPerylene\t0\t0.0\n-C157\tPhenanthrene_2H10\t0\t0.0\n-C158\tTris(4-tert-butylphenyl) 
phosphate\t1\t0.012341356867974116\n-C158\tPerylene_2H12\t0\t0.0\n-C158\tPerylene\t0\t0.0\n-C159\tTrifluralin\t1\t0.1883562158254524\n-C159\tFenpropathrin\t1\t0.015975881134824614\n-C159\tEthiprole\t1\t0.007596489095240584\n-C160\tBumetrizole\t1\t0.04337092323628775\n-C160\ttrans-Cypermethrin_isomer2\t1\t0.030241071137562938\n-C160\tPerylene_2H12\t1\t0.029465908012253836\n-C161\tPerylene_2H12\t0\t0.0\n-C161\tPerylene\t0\t0.0\n-C161\tPhenanthrene_2H10\t0\t0.0\n-C162\tPerylene_2H12\t0\t0.0\n-C162\tPerylene\t0\t0.0\n-C162\tPhenanthrene_2H10\t0\t0.0\n-C163\tPerylene_2H12\t0\t0.0\n-C163\tPerylene\t0\t0.0\n-C163\tPhenanthrene_2H10\t0\t0.0\n-C164\t7,12-Dimethylbenz[a]anthracene\t1\t0.2284760273276565\n-C164\tEnzacamene\t1\t0.112547485896346\n-C164\tFenamidone\t1\t0.0486288864876461\n-C165\tBoscalid\t1\t0.08498662209290331\n-C165\tBuprofezin\t1\t0.08205704595848827\n-C165\tIpconazole\t1\t0.08152620214218925\n-C166\tTris(2-butoxyethyl) phosphate\t1\t0.008342150525801997\n-C166\tRotenone\t1\t0.0015006556689027325\n-C166\tPerylene_2H12\t0\t0.0\n-C167\tPerylene_2H12\t0\t0.0\n-C167\tPerylene\t0\t0.0\n-C167\tPhenanthrene_2H10\t0\t0.0\n-C168\tPerylene_2H12\t0\t0.0\n-C168\tPerylene\t0\t0.0\n-C168\tPhenanthrene_2H10\t0\t0.0\n-C169\tPerylene_2H12\t0\t0.0\n-C169\tPerylene\t0\t0.0\n-C169\tPhenanthrene_2H10\t0\t0.0\n-C170\tPerylene_2H12\t0\t0.0\n-C170\tPerylene\t0\t0.0\n-C170\tPhenanthrene_2H10\t0\t0.0\n-C171\t2,4-D butyl ester\t1\t0.6610587362108564\n-C171\tTerbutryn\t1\t0.6012657870951452\n-C171\tEstrone\t2\t0.31623371975319553\n-C172\tPerylene_2H12\t1\t0.06765194944236241\n-C172\t17-alpha-Ethynylestradiol\t1\t0.01884162876915315\n-C172\tProgesterone\t1\t0.01306130902820296\n-C173\tSpiromesifen\t1\t0.016586079079264453\n-C173\tRotenone\t1\t0.0025109428261963678\n-C173\tPerylene_2H12\t0\t0.0\n-C174\tPerylene_2H12\t0\t0.0\n-C174\tPerylene\t0\t0.0\n-C174\tPhenanthrene_2H10\t0\t0.0\n"