Skip to content

Commit

Permalink
Improve error message for __EXTRACT_DATASET__ tool
Browse files Browse the repository at this point in the history
Provides a reasonable error message to users, instead of the internal
error https://sentry.galaxyproject.org/share/issue/a197159192b64b9db065a762ee5dbbfc/:
```
KeyError: 'Dataset collection has no element_identifier with key 2.'
  File "galaxy/tools/__init__.py", line 1972, in handle_single_execution
    rval = self.execute(
  File "galaxy/tools/__init__.py", line 2069, in execute
    return self.tool_action.execute(
  File "galaxy/tools/actions/model_operations.py", line 88, in execute
    self._produce_outputs(
  File "galaxy/tools/actions/model_operations.py", line 119, in _produce_outputs
    tool.produce_outputs(
  File "galaxy/tools/__init__.py", line 3351, in produce_outputs
    extracted_element = collection[incoming["which"]["identifier"]]
  File "galaxy/model/__init__.py", line 6434, in __getitem__
    raise KeyError(error_message)
```
Also makes the `identifier` parameter explicitly required (it is currently
inferred to be optional, because text parameters are optional by default
unless a validator raises an exception when validating an empty string).

That prevents the following error:
```
KeyError: 'Dataset collection has no element_identifier with key None.'
  File "galaxy/tools/__init__.py", line 1972, in handle_single_execution
    rval = self.execute(
  File "galaxy/tools/__init__.py", line 2069, in execute
    return self.tool_action.execute(
  File "galaxy/tools/actions/model_operations.py", line 88, in execute
    self._produce_outputs(
  File "galaxy/tools/actions/model_operations.py", line 119, in _produce_outputs
    tool.produce_outputs(
  File "galaxy/tools/__init__.py", line 3351, in produce_outputs
    extracted_element = collection[incoming["which"]["identifier"]]
  File "galaxy/model/__init__.py", line 6434, in __getitem__
    raise KeyError(error_message)
```
  • Loading branch information
mvdbeek committed May 2, 2024
1 parent 8f4968f commit acec4f6
Show file tree
Hide file tree
Showing 3 changed files with 32 additions and 7 deletions.
10 changes: 8 additions & 2 deletions lib/galaxy/tools/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -3356,9 +3356,15 @@ def produce_outputs(self, trans, out_data, output_collections, incoming, history
if how == "first":
extracted_element = collection.first_dataset_element
elif how == "by_identifier":
extracted_element = collection[incoming["which"]["identifier"]]
try:
extracted_element = collection[incoming["which"]["identifier"]]
except KeyError as e:
raise exceptions.MessageException(e.args[0])
elif how == "by_index":
extracted_element = collection[int(incoming["which"]["index"])]
try:
extracted_element = collection[int(incoming["which"]["index"])]
except KeyError as e:
raise exceptions.MessageException(e.args[0])
else:
raise exceptions.MessageException("Invalid tool parameters.")
extracted = extracted_element.element_object
Expand Down
6 changes: 3 additions & 3 deletions lib/galaxy/tools/extract_dataset.xml
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,7 @@
</param>
<when value="first" />
<when value="by_identifier">
<param name="identifier" label="Element identifier:" type="text">
<param name="identifier" label="Element identifier:" type="text" optional="false">
<sanitizer invalid_char="">
<valid initial="string.ascii_letters,string.digits">
<add value="_" />
Expand Down Expand Up @@ -52,9 +52,9 @@ Description
The tool allows extracting datasets based on position (**The first dataset** and **Select by index** options) or name (**Select by element identifier** option). This tool effectively collapses the inner-most collection into a dataset. For nested collections (e.g. a list of lists of lists: outer:middle:inner, extracting the inner dataset element), a new list is created where the selected element takes the position of the inner-most collection (so outer:middle, where middle is not a collection but the inner dataset element).
.. class:: warningmark
.. class:: warningmark
**Note**: Dataset index (numbering) begins with 0 (zero).
**Note**: Dataset index (numbering) begins with 0 (zero).
.. class:: infomark
Expand Down
23 changes: 21 additions & 2 deletions lib/galaxy_test/api/test_tools.py
Original file line number Diff line number Diff line change
Expand Up @@ -701,23 +701,42 @@ def test_database_operation_tool_with_pending_inputs(self):
hdca1_id = self.dataset_collection_populator.create_list_in_history(
history_id, contents=["a\nb\nc\nd", "e\nf\ng\nh"], wait=True
).json()["outputs"][0]["id"]
self.dataset_populator.run_tool(
run_response = self.dataset_populator.run_tool(
tool_id="cat_data_and_sleep",
inputs={
"sleep_time": 15,
"input1": {"batch": True, "values": [{"src": "hdca", "id": hdca1_id}]},
},
history_id=history_id,
)
output_hdca_id = run_response["implicit_collections"][0]["id"]
run_response = self.dataset_populator.run_tool(
tool_id="__EXTRACT_DATASET__",
inputs={
"data_collection": {"src": "hdca", "id": hdca1_id},
"data_collection": {"src": "hdca", "id": output_hdca_id},
},
history_id=history_id,
)
assert run_response["outputs"][0]["state"] != "ok"

@skip_without_tool("__EXTRACT_DATASET__")
def test_extract_dataset_invalid_element_identifier(self):
with self.dataset_populator.test_history(require_new=False) as history_id:
hdca1_id = self.dataset_collection_populator.create_list_in_history(
history_id, contents=["a\nb\nc\nd", "e\nf\ng\nh"], wait=True
).json()["outputs"][0]["id"]
run_response = self.dataset_populator.run_tool_raw(
tool_id="__EXTRACT_DATASET__",
inputs={
"data_collection": {"src": "hdca", "id": hdca1_id},
"which": {"which_dataset": "by_index", "index": 100},
},
history_id=history_id,
input_format="21.01",
)
assert run_response.status_code == 400
assert run_response.json()["err_msg"] == "Dataset collection has no element_index with key 100."

@skip_without_tool("__FILTER_FAILED_DATASETS__")
def test_filter_failed_list(self):
with self.dataset_populator.test_history(require_new=False) as history_id:
Expand Down

0 comments on commit acec4f6

Please sign in to comment.