diff --git a/.mailmap b/.mailmap index 71a84fdefc..7bbf47d237 100644 --- a/.mailmap +++ b/.mailmap @@ -57,3 +57,4 @@ Utheri Wagura <36386988+uwagura@users.noreply.github.com> github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> github-actions[bot] GitHub Action Diquan Jabbour <165976689+Diquan-BOM@users.noreply.github.com> +Maxime Rio diff --git a/tests/integration/test_job_runner_mgr.py b/tests/integration/test_job_runner_mgr.py new file mode 100644 index 0000000000..93663aec89 --- /dev/null +++ b/tests/integration/test_job_runner_mgr.py @@ -0,0 +1,85 @@ +# THIS FILE IS PART OF THE CYLC WORKFLOW ENGINE. +# Copyright (C) NIWA & British Crown (Met Office) & Contributors. +# +# This program is free software: you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation, either version 3 of the License, or +# (at your option) any later version. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with this program. If not, see . + +import errno +import logging +from pathlib import Path +import re +from textwrap import dedent + +from cylc.flow.job_runner_mgr import JobRunnerManager +from cylc.flow.pathutil import get_workflow_run_job_dir +from cylc.flow.task_state import TASK_STATUS_RUNNING +from cylc.flow.subprocctx import SubProcContext + + +async def test_kill_error(one, start, test_dir, capsys, log_filter): + """It should report the failure to kill a job.""" + async with start(one) as log: + # make it look like the task is running + itask = one.pool.get_tasks()[0] + itask.submit_num += 1 + itask.state_reset(TASK_STATUS_RUNNING) + + # fake job details + workflow_job_log_dir = Path(get_workflow_run_job_dir(one.workflow)) + job_id = itask.tokens.duplicate(job='01').relative_id + job_log_dir = Path(workflow_job_log_dir, job_id) + + # create job status file (give it a fake pid) + job_log_dir.mkdir(parents=True) + (job_log_dir / 'job.status').write_text(dedent(''' + CYLC_JOB_RUNNER_NAME=background + CYLC_JOB_ID=99999999 + CYLC_JOB_PID=99999999 + ''')) + + # attempt to kill the job using the jobs-kill script + # (note this is normally run via a subprocess) + capsys.readouterr() + JobRunnerManager().jobs_kill(str(workflow_job_log_dir), [job_id]) + + # the kill should fail, the failure should be written to stdout + # (the jobs-kill callback will read this in and handle it) + out, err = capsys.readouterr() + assert re.search( + # # NOTE: ESRCH = no such process + rf'TASK JOB ERROR.*{job_id}.*Errno {errno.ESRCH}', + out, + ) + + # feed this jobs-kill output into the scheduler + # (as if we had run the jobs-kill script as a subprocess) + one.task_job_mgr._kill_task_jobs_callback( + # mock the subprocess + SubProcContext( + one.task_job_mgr.JOBS_KILL, + ['mock-cmd'], + # provide it with the out/err the script produced + out=out, + err=err, + ), + one.workflow, + [itask], + ) + + # a warning should be logged + assert log_filter( + log, + regex=r'1/one/01:running.*job kill failed', + level=logging.WARNING, + ) + assert itask.state(TASK_STATUS_RUNNING)