From 355446f1579a29c17270baa85829ea79b6aa401b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jos=C3=A9=20Manuel=20Dom=C3=ADnguez?= Date: Fri, 28 Jun 2024 12:31:26 +0200 Subject: [PATCH] Support using a table in any database supported by SQLAlchemy as mapping for interactive tools Replace the class `InteractiveToolSqlite` in lib/galaxy/managers/interactivetool.py with a new class `InteractiveToolPropagatorSQLAlchemy`. The new class implements a SQLAlchemy "propagator" for `InteractiveToolManager` (on the same file). This propagator writes the mappings to the table named after the value of `DATABASE_TABLE_NAME`, in the database specified by the SQLAlchemy database url passed to its constructor. Change the constructor of `InteractiveToolManager` so that it uses `InteractiveToolPropagatorSQLAlchemy`. Change the method `_process_config` of `galaxy.config.GalaxyAppConfiguration` so that it converts the value of `interactivetools_map` to a SQLAlchemy database url if it is a path. Update documentation to reflect these changes. --- config/galaxy.yml.interactivetools | 2 + doc/source/admin/galaxy_options.rst | 9 +- .../admin/special_topics/interactivetools.rst | 2 + lib/galaxy/config/__init__.py | 9 +- lib/galaxy/config/sample/galaxy.yml.sample | 4 +- lib/galaxy/config/schemas/config_schema.yml | 6 +- lib/galaxy/managers/interactivetool.py | 197 +++++++++--------- 7 files changed, 124 insertions(+), 105 deletions(-) diff --git a/config/galaxy.yml.interactivetools b/config/galaxy.yml.interactivetools index add807ec9e5d..7504ab5b5002 100644 --- a/config/galaxy.yml.interactivetools +++ b/config/galaxy.yml.interactivetools @@ -12,6 +12,8 @@ gravity: galaxy: interactivetools_enable: true + # either a path to a SQLite database file or a SQLAlchemy database URL, in both cases the table "gxitproxy" on + # the target database is used interactivetools_map: database/interactivetools_map.sqlite # outputs_to_working_directory will provide you with a better level of isolation. It is highly recommended to set diff --git a/doc/source/admin/galaxy_options.rst b/doc/source/admin/galaxy_options.rst index cdf82ab688fd..8d77718b2f81 100644 --- a/doc/source/admin/galaxy_options.rst +++ b/doc/source/admin/galaxy_options.rst @@ -2128,9 +2128,12 @@ ~~~~~~~~~~~~~~~~~~~~~~~~ :Description: - Map for interactivetool proxy. - The value of this option will be resolved with respect to - . + Map for interactivetool proxy. It may be either a path to a SQLite + database or a SQLAlchemy database URL (see + https://docs.sqlalchemy.org/en/20/core/engines.html#database-urls). + In either case, mappings will be written to the table "gxitproxy" within the + database. If it is a path, the value of this option will be resolved with + respect to . :Default: ``interactivetools_map.sqlite`` :Type: str diff --git a/doc/source/admin/special_topics/interactivetools.rst b/doc/source/admin/special_topics/interactivetools.rst index 698c2d1d3d73..73fd0c00731c 100644 --- a/doc/source/admin/special_topics/interactivetools.rst +++ b/doc/source/admin/special_topics/interactivetools.rst @@ -80,6 +80,8 @@ Set these values in ``galaxy.yml``: galaxy: interactivetools_enable: true + # either a path to a SQLite database file or a SQLAlchemy database URL, in both cases the table "gxitproxy" on the + # target database is used interactivetools_map: database/interactivetools_map.sqlite # outputs_to_working_directory will provide you with a better level of isolation. It is highly recommended to set diff --git a/lib/galaxy/config/__init__.py b/lib/galaxy/config/__init__.py index 554018472dc9..a501ab790c9c 100644 --- a/lib/galaxy/config/__init__.py +++ b/lib/galaxy/config/__init__.py @@ -1103,10 +1103,15 @@ def _process_config(self, kwargs: Dict[str, Any]) -> None: self.proxy_session_map = self.dynamic_proxy_session_map self.manage_dynamic_proxy = self.dynamic_proxy_manage # Set to false if being launched externally - # InteractiveTools propagator mapping file - self.interactivetools_map = self._in_root_dir( + # InteractiveTools propagator mapping + interactivetools_map = urlparse( kwargs.get("interactivetools_map", self._in_data_dir("interactivetools_map.sqlite")) ) + self.interactivetools_map = ( + interactivetools_map.geturl() + if interactivetools_map.scheme else + "sqlite:///" + self._in_root_dir(interactivetools_map.geturl()) + ) # Compliance/Policy variables self.redact_username_during_deletion = False diff --git a/lib/galaxy/config/sample/galaxy.yml.sample b/lib/galaxy/config/sample/galaxy.yml.sample index bb4c6fc32d4f..80ca62bdcc1d 100644 --- a/lib/galaxy/config/sample/galaxy.yml.sample +++ b/lib/galaxy/config/sample/galaxy.yml.sample @@ -189,8 +189,8 @@ gravity: # Public-facing port of the proxy # port: 4002 - # Routes file to monitor. - # Should be set to the same path as ``interactivetools_map`` in the ``galaxy:`` section. This is ignored if + # Database to monitor. + # Should be set to the same value as ``interactivetools_map`` in the ``galaxy:`` section. This is ignored if # ``interactivetools_map is set``. # sessions: database/interactivetools_map.sqlite diff --git a/lib/galaxy/config/schemas/config_schema.yml b/lib/galaxy/config/schemas/config_schema.yml index e18dc2aa28e8..b27179d8bb5c 100644 --- a/lib/galaxy/config/schemas/config_schema.yml +++ b/lib/galaxy/config/schemas/config_schema.yml @@ -1518,9 +1518,11 @@ mapping: interactivetools_map: type: str default: interactivetools_map.sqlite - path_resolves_to: data_dir + path_resolves_to: data_dir # does not apply to SQLAlchemy database URLs desc: | - Map for interactivetool proxy. + Map for interactivetool proxy. It may be either a path to a SQLite database or a SQLALchemy database URL (see + https://docs.sqlalchemy.org/en/20/core/engines.html#database-urls). In either case, mappings will be written + to the table "gxitproxy" within the database. interactivetools_prefix: type: str diff --git a/lib/galaxy/managers/interactivetool.py b/lib/galaxy/managers/interactivetool.py index 8cec876ba561..fda678b133a0 100644 --- a/lib/galaxy/managers/interactivetool.py +++ b/lib/galaxy/managers/interactivetool.py @@ -1,14 +1,15 @@ import json import logging -import sqlite3 from urllib.parse import ( urlsplit, urlunsplit, ) from sqlalchemy import ( + create_engine, or_, select, + text, ) from galaxy import exceptions @@ -18,94 +19,96 @@ ) from galaxy.model.base import transaction from galaxy.security.idencoding import IdAsLowercaseAlphanumEncodingHelper -from galaxy.util.filelock import FileLock log = logging.getLogger(__name__) DATABASE_TABLE_NAME = "gxitproxy" -class InteractiveToolSqlite: - def __init__(self, sqlite_filename, encode_id): - self.sqlite_filename = sqlite_filename - self.encode_id = encode_id +class InteractiveToolPropagatorSQLAlchemy: + """ + Propagator for InteractiveToolManager implemented using SQLAlchemy. + """ + + def __init__(self, database_url, encode_id): + """ + Constructor that sets up the propagator using a SQLAlchemy database URL. + + :param database_url: SQLAlchemy database URL, read more on the SQLAlchemy documentation + https://docs.sqlalchemy.org/en/20/core/engines.html#database-urls. + :param encode_id: A helper class that can encode ids as lowercase alphanumeric strings and vice versa. + """ + self._engine = create_engine(database_url) + self._encode_id = encode_id def get(self, key, key_type): - with FileLock(self.sqlite_filename): - conn = sqlite3.connect(self.sqlite_filename) - try: - c = conn.cursor() - select = f"""SELECT token, host, port, info - FROM {DATABASE_TABLE_NAME} - WHERE key=? and key_type=?""" - c.execute( - select, - ( - key, - key_type, - ), - ) - try: - token, host, port, info = c.fetchone() - except TypeError: - log.warning("get(): invalid key: %s key_type %s", key, key_type) - return None - return dict(key=key, key_type=key_type, token=token, host=host, port=port, info=info) - finally: - conn.close() + with self._engine.connect() as conn: + query = text(f""" + SELECT token, host, port, info + FROM {DATABASE_TABLE_NAME} WHERE key=:key AND key_type=:key_type + """) + parameters = dict( + key=key, + key_type=key_type, + ) + result = conn.execute(query, parameters).fetchone() + return None if result is None else dict( + key=key, + key_type=key_type, + token=result[0], + host=result[1], + port=result[2], + info=result[3], + ) def save(self, key, key_type, token, host, port, info=None): """ - Writeout a key, key_type, token, value store that is can be used for coordinating - with external resources. + Write out a key, key_type, token, value store that is can be used for coordinating with external resources. """ assert key, ValueError("A non-zero length key is required.") assert key_type, ValueError("A non-zero length key_type is required.") assert token, ValueError("A non-zero length token is required.") - with FileLock(self.sqlite_filename): - conn = sqlite3.connect(self.sqlite_filename) - try: - c = conn.cursor() - try: - # Create table - c.execute( - f"""CREATE TABLE {DATABASE_TABLE_NAME} - (key text, - key_type text, - token text, - host text, - port integer, - info text, - PRIMARY KEY (key, key_type) - )""" - ) - except Exception: - pass - delete = f"""DELETE FROM {DATABASE_TABLE_NAME} WHERE key=? and key_type=?""" - c.execute( - delete, - ( - key, - key_type, - ), - ) - insert = f"""INSERT INTO {DATABASE_TABLE_NAME} - (key, key_type, token, host, port, info) - VALUES (?, ?, ?, ?, ?, ?)""" - c.execute( - insert, - ( - key, - key_type, - token, - host, - port, - info, - ), - ) - conn.commit() - finally: - conn.close() + with self._engine.connect() as conn: + # create gx-it-proxy table if not exists + query = text(f""" + CREATE TABLE IF NOT EXISTS {DATABASE_TABLE_NAME} ( + key TEXT, + key_type TEXT, + token TEXT, + host TEXT, + port INTEGER, + info TEXT, + PRIMARY KEY (key, key_type) + ) + """) + conn.execute(query) + + # delete existing data with same key + query = text(f""" + DELETE FROM {DATABASE_TABLE_NAME} WHERE key=:key AND key_type=:key_type + """) + parameters = dict( + key=key, + key_type=key_type, + ) + conn.execute(query, parameters) + + # save data + query = text(f""" + INSERT INTO {DATABASE_TABLE_NAME} (key, key_type, token, host, port, info) + VALUES (:key, :key_type, :token, :host, :port, :info) + """) + parameters = dict( + key=key, + key_type=key_type, + token=token, + host=host, + port=port, + info=info, + ) + conn.execute(query, parameters) + + conn.commit() def remove(self, **kwd): """ @@ -113,30 +116,32 @@ def remove(self, **kwd): with external resources. Remove entries that match all provided key=values """ assert kwd, ValueError("You must provide some values to key upon") - delete = f"DELETE FROM {DATABASE_TABLE_NAME} WHERE" - value_list = [] - for i, (key, value) in enumerate(kwd.items()): - if i != 0: - delete += " and" - delete += f" {key}=?" - value_list.append(value) - with FileLock(self.sqlite_filename): - conn = sqlite3.connect(self.sqlite_filename) - try: - c = conn.cursor() - try: - # Delete entry - c.execute(delete, tuple(value_list)) - except Exception as e: - log.debug("Error removing entry (%s): %s", delete, e) - conn.commit() - finally: - conn.close() + with self._engine.connect() as conn: + query = ( + f"DELETE FROM {DATABASE_TABLE_NAME} WHERE {{conditions}}" + ) + conditions = ( + "{key}=:{value}".format( + key=key, + value=f"value_{i}", + ) + for i, key in enumerate(kwd) + ) + query = query.format( + conditions=" AND ".join(conditions) + ) + query = text(query) + parameters = { + f"value_{i}": value + for i, value in enumerate(kwd.values()) + } + conn.execute(query, parameters) + conn.commit() def save_entry_point(self, entry_point): """Convenience method to easily save an entry_point.""" return self.save( - self.encode_id(entry_point.id), + self._encode_id(entry_point.id), entry_point.__class__.__name__.lower(), entry_point.token, entry_point.host, @@ -151,7 +156,7 @@ def save_entry_point(self, entry_point): def remove_entry_point(self, entry_point): """Convenience method to easily remove an entry_point.""" - return self.remove(key=self.encode_id(entry_point.id), key_type=entry_point.__class__.__name__.lower()) + return self.remove(key=self._encode_id(entry_point.id), key_type=entry_point.__class__.__name__.lower()) class InteractiveToolManager: @@ -166,7 +171,7 @@ def __init__(self, app): self.sa_session = app.model.context self.job_manager = app.job_manager self.encoder = IdAsLowercaseAlphanumEncodingHelper(app.security) - self.propagator = InteractiveToolSqlite(app.config.interactivetools_map, self.encoder.encode_id) + self.propagator = InteractiveToolPropagatorSQLAlchemy(app.config.interactivetools_map, self.encoder.encode_id) def create_entry_points(self, job, tool, entry_points=None, flush=True): entry_points = entry_points or tool.ports