Source code for pyjob.slurm

# MIT License
#
# Copyright (c) 2017-18 Felix Simkovic
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.

# Module metadata: author name and version string of this module.
__author__ = 'Felix Simkovic'
__version__ = '1.0'

import logging
import uuid

from pyjob.cexec import cexec
from pyjob.exception import PyJobExecutableNotFoundError, PyJobError
from pyjob.script import Script
from pyjob.task import ClusterTask

# Module-level logger, named after this module via ``__name__``.
logger = logging.getLogger(__name__)


class SlurmTask(ClusterTask):
    """Slurm executable :obj:`~pyjob.task.Task`

    The task is submitted with ``sbatch``, queried with ``squeue`` and
    cancelled with ``scancel``. When more than one script is attached to the
    task, the scripts are submitted together as a single Slurm job array.

    """

    # Environment variable referenced for the index of the current array task
    JOB_ARRAY_INDEX = '$SLURM_ARRAY_TASK_ID'
    # Prefix that marks a line of the submission script as a scheduler option
    SCRIPT_DIRECTIVE = '#SBATCH'

    @property
    def info(self):
        """:obj:`~pyjob.slurm.SlurmTask` information

        Returns
        -------
        dict
           Empty if the task has no job id yet or if the ``squeue`` call
           fails for any reason; otherwise a dictionary with the keys
           ``job_number`` and ``status``.

        Notes
        -----
        The output of ``squeue`` is not parsed: the status is reported as
        ``'Running'`` whenever the call itself succeeds.

        """
        if self.pid is None:
            return {}
        try:
            cexec(['squeue', '-j', str(self.pid)])
        except (PyJobExecutableNotFoundError, Exception):
            # Best-effort query: any failure means "no information available"
            return {}
        else:
            return {'job_number': self.pid, 'status': 'Running'}

    def kill(self):
        """Immediately terminate the :obj:`~pyjob.slurm.SlurmTask`

        Nothing is done when the task has no job id (``pid`` is ``None``).
        Otherwise ``scancel`` is invoked for the job id; errors raised by
        that call are not caught here.

        """
        if self.pid is None:
            return
        cexec(['scancel', str(self.pid)])
        logger.debug("Terminated task: %d", self.pid)

    def _check_requirements(self):
        """Check if the requirements for task execution are met

        Only the availability of the ``squeue`` executable is checked.

        """
        self._ensure_exec_available('squeue')

    def _run(self):
        """Method to initialise :obj:`~pyjob.slurm.SlurmTask` execution

        Creates the submission script, writes it, submits it with ``sbatch``
        from the task directory and stores the resulting job id in ``pid``.

        """
        self.runscript = self._create_runscript()
        self.runscript.write()
        stdout = cexec(['sbatch', self.runscript.path], cwd=self.directory)
        # The job id is taken to be the last whitespace-separated token of
        # the sbatch output, e.g. "Submitted batch job 123"
        self.pid = int(stdout.strip().split()[-1])
        logger.debug('%s [%d] submission script is %s', self.__class__.__name__, self.pid, self.runscript.path)

    def _create_runscript(self):
        """Utility method to create runscript

        Returns
        -------
        :obj:`~pyjob.script.Script`
           The submission script holding the scheduler directives followed
           by the command(s) to execute.

        Notes
        -----
        When the task holds more than one script, a ``.jobs`` file listing
        all scripts (one per line) is written next to the submission script
        as a side effect, and the submission is set up as a job array.

        """
        runscript = Script(directory=self.directory, prefix='slurm_', suffix='.script', stem=str(uuid.uuid1().int))
        directive = self.__class__.SCRIPT_DIRECTIVE

        def add_directive(option):
            # Every scheduler option goes on its own "#SBATCH <option>" line
            runscript.append(directive + ' ' + option)

        add_directive('--export=ALL')
        add_directive('--job-name={}'.format(self.name))
        if self.dependency:
            add_directive('--depend=afterok:{}'.format(':'.join(map(str, self.dependency))))
        if self.queue:
            add_directive('-p {}'.format(self.queue))
        if self.nprocesses:
            add_directive('-n {}'.format(self.nprocesses))
        if self.directory:
            # The short form is used on purpose: the long name of this option
            # is --workdir in older Slurm releases and --chdir in newer ones
            # (which reject --workdir), whereas -D is accepted by both.
            add_directive('-D {}'.format(self.directory))
        if self.runtime:
            add_directive('-t {}'.format(self.get_time(self.runtime)))
        if self.extra:
            add_directive(' '.join(map(str, self.extra)))

        if len(self.script) > 1:
            # Several scripts: submit them as one job array driven by a file
            # that lists one script path per line
            logf = runscript.path.replace('.script', '.log')
            jobsf = runscript.path.replace('.script', '.jobs')
            with open(jobsf, 'w') as f_out:
                f_out.write('\n'.join(self.script))
            add_directive('--array={}-{}%{}'.format(1, len(self.script), self.max_array_size))
            add_directive('-o {}'.format(logf))
            runscript.extend(self.get_array_bash_extension(jobsf, 0))
        else:
            # Single script: log to the task's first log file and run it directly
            add_directive('-o {}'.format(self.log[0]))
            runscript.append(self.script[0])
        return runscript