From d45c5b81b973d36d8d460066e79effe35643c8ed Mon Sep 17 00:00:00 2001 From: John Chilton Date: Tue, 30 Jul 2024 20:16:03 -0400 Subject: [PATCH] Untangle dependencies between tools.execute and tools.actions. --- lib/galaxy/tools/actions/__init__.py | 67 ++----------------------- lib/galaxy/tools/execute.py | 2 +- lib/galaxy/tools/execution_helpers.py | 70 +++++++++++++++++++++++++++ 3 files changed, 76 insertions(+), 63 deletions(-) create mode 100644 lib/galaxy/tools/execution_helpers.py diff --git a/lib/galaxy/tools/actions/__init__.py b/lib/galaxy/tools/actions/__init__.py index 1a16ed58af3c..d7278e4286c4 100644 --- a/lib/galaxy/tools/actions/__init__.py +++ b/lib/galaxy/tools/actions/__init__.py @@ -33,6 +33,11 @@ from galaxy.model.dataset_collections.builder import CollectionBuilder from galaxy.model.none_like import NoneDataset from galaxy.objectstore import ObjectStorePopulator +from galaxy.tools.execution_helpers import ( + ToolExecutionCache, + filter_output, + on_text_for_names, +) from galaxy.tools.parameters import update_dataset_ids from galaxy.tools.parameters.basic import ( DataCollectionToolParameter, @@ -54,34 +59,6 @@ log = logging.getLogger(__name__) -class ToolExecutionCache: - """An object mean to cache calculation caused by repeatedly evaluting - the same tool by the same user with slightly different parameters. - """ - - def __init__(self, trans): - self.trans = trans - self.current_user_roles = trans.get_current_user_roles() - self.chrom_info = {} - self.cached_collection_elements = {} - - def get_chrom_info(self, tool_id, input_dbkey): - genome_builds = self.trans.app.genome_builds - custom_build_hack_get_len_from_fasta_conversion = tool_id != "CONVERTER_fasta_to_len" - if custom_build_hack_get_len_from_fasta_conversion and input_dbkey in self.chrom_info: - return self.chrom_info[input_dbkey] - - chrom_info_pair = genome_builds.get_chrom_info( - input_dbkey, - trans=self.trans, - custom_build_hack_get_len_from_fasta_conversion=custom_build_hack_get_len_from_fasta_conversion, - ) - if custom_build_hack_get_len_from_fasta_conversion: - self.chrom_info[input_dbkey] = chrom_info_pair - - return chrom_info_pair - - class ToolAction: """ The actions to be taken when a tool is run (after parameters have @@ -1097,40 +1074,6 @@ def check_elements(elements): self.out_collection_instances[name] = hdca -def on_text_for_names(input_names): - # input_names may contain duplicates... this is because the first value in - # multiple input dataset parameters will appear twice once as param_name - # and once as param_name1. - unique_names = [] - for name in input_names: - if name not in unique_names: - unique_names.append(name) - input_names = unique_names - - # Build name for output datasets based on tool name and input names - if len(input_names) == 0: - on_text = "" - elif len(input_names) == 1: - on_text = input_names[0] - elif len(input_names) == 2: - on_text = "{} and {}".format(*input_names) - elif len(input_names) == 3: - on_text = "{}, {}, and {}".format(*input_names) - else: - on_text = "{}, {}, and others".format(*input_names[:2]) - return on_text - - -def filter_output(tool, output, incoming): - for filter in output.filters: - try: - if not eval(filter.text.strip(), globals(), incoming): - return True # do not create this dataset - except Exception as e: - log.debug(f"Tool {tool.id} output {output.name}: dataset output filter ({filter.text}) failed: {e}") - return False - - def get_ext_or_implicit_ext(hda): if hda.implicitly_converted_parent_datasets: # implicitly_converted_parent_datasets is a list of ImplicitlyConvertedDatasetAssociation diff --git a/lib/galaxy/tools/execute.py b/lib/galaxy/tools/execute.py index cca565294428..c81d57252843 100644 --- a/lib/galaxy/tools/execute.py +++ b/lib/galaxy/tools/execute.py @@ -29,7 +29,7 @@ tool_output_to_structure, ) from galaxy.tool_util.parser import ToolOutputCollectionPart -from galaxy.tools.actions import ( +from galaxy.tools.execution_helpers import ( filter_output, on_text_for_names, ToolExecutionCache, diff --git a/lib/galaxy/tools/execution_helpers.py b/lib/galaxy/tools/execution_helpers.py new file mode 100644 index 000000000000..147a47de186d --- /dev/null +++ b/lib/galaxy/tools/execution_helpers.py @@ -0,0 +1,70 @@ +"""Helpers meant to assist tool execution. + +Lower-level things that prevent interwoven dependencies between tool code, +tool execution code, and tool action code. +""" +import logging + +log = logging.getLogger(__name__) + + +class ToolExecutionCache: + """An object meant to cache calculation caused by repeatedly evaluting + the same tool by the same user with slightly different parameters. + """ + + def __init__(self, trans): + self.trans = trans + self.current_user_roles = trans.get_current_user_roles() + self.chrom_info = {} + self.cached_collection_elements = {} + + def get_chrom_info(self, tool_id, input_dbkey): + genome_builds = self.trans.app.genome_builds + custom_build_hack_get_len_from_fasta_conversion = tool_id != "CONVERTER_fasta_to_len" + if custom_build_hack_get_len_from_fasta_conversion and input_dbkey in self.chrom_info: + return self.chrom_info[input_dbkey] + + chrom_info_pair = genome_builds.get_chrom_info( + input_dbkey, + trans=self.trans, + custom_build_hack_get_len_from_fasta_conversion=custom_build_hack_get_len_from_fasta_conversion, + ) + if custom_build_hack_get_len_from_fasta_conversion: + self.chrom_info[input_dbkey] = chrom_info_pair + + return chrom_info_pair + + +def filter_output(tool, output, incoming): + for filter in output.filters: + try: + if not eval(filter.text.strip(), globals(), incoming): + return True # do not create this dataset + except Exception as e: + log.debug(f"Tool {tool.id} output {output.name}: dataset output filter ({filter.text}) failed: {e}") + return False + + +def on_text_for_names(input_names): + # input_names may contain duplicates... this is because the first value in + # multiple input dataset parameters will appear twice once as param_name + # and once as param_name1. + unique_names = [] + for name in input_names: + if name not in unique_names: + unique_names.append(name) + input_names = unique_names + + # Build name for output datasets based on tool name and input names + if len(input_names) == 0: + on_text = "" + elif len(input_names) == 1: + on_text = input_names[0] + elif len(input_names) == 2: + on_text = "{} and {}".format(*input_names) + elif len(input_names) == 3: + on_text = "{}, {}, and {}".format(*input_names) + else: + on_text = "{}, {}, and others".format(*input_names[:2]) + return on_text