4 from pathlib
import Path
9 Describes an HPC job script including
10 + reading a configuration
11 + generating the script
12 + submitting the script
14 Each HPC job submission system (e.g., PBSPro on Cheyenne)
15 will have its own derived class that defines
16 the job header and submission command
17 generic config elements:
18 required config parameter(s):
19 basescript (required) - either a list of str's containing individual lines of the script
20 or a str giving the location of the script
22 optional config parameter(s):
23 env - linux environment of the script (e.g., csh, bash, sh, tcsh)
25 nppernode - processors per node
26 nnode - number of nodes
28 olog - output log name
33 self.
namename = conf.get(
'name',
'PyJobScript')
34 self.
nppernodenppernode = conf.get(
'nppernode',1)
35 self.
nnodennode = conf.get(
'nnode',1)
36 self.
walltimewalltime = conf.get(
'walltime',
'01:00:00')
37 self.
ologolog = conf.get(
'olog',
'log.job.out')
38 self.
elogelog = conf.get(
'elog',
'log.job.err')
41 self.
envenv = conf.get(
'env',
'csh')
43 assert (isinstance(self.
basescriptbasescript,list)
or isinstance(self.
basescriptbasescript,str)), \
44 "JobScriptBase : basescript must either be a list or a string"
45 self.
jobpathjobpath = Path(conf.get(
'path',
'./'))
53 joblines = [
'#!/bin/'+self.
envenv+
'\n']
56 for line
in self.
headerheader: joblines.append(line+
'\n')
61 for line
in self.
basescriptbasescript: joblines.append(line)
63 elif isinstance(self.
basescriptbasescript,str):
66 for line
in bs: joblines.append(line)
70 self.
jobpathjobpath.mkdir(parents=
True, exist_ok=
True)
74 if os.path.exists(script):
77 js.writelines(joblines)
79 os.system(
'chmod 744 '+script)
85 os.chdir(str(self.
jobpathjobpath))
86 print(command+
" in "+os.getcwd())
93 PBSPro job script on Cheyenne
94 unique config elements compared to base class:
95 account - cheyenne account for charging
96 queue - name of job submission queue (see qavail)
97 memory - amount of memory requested per node (see mavail)
99 NOTE: Cheyenne has a maximum of 36 processors available per node
101 qavail = [
'economy',
'regular',
'premium']
109 self.
accountaccount = conf.get(
'account',
'NMMM0043')
110 self.
queuequeue = conf.get(
'queue',
'regular')
111 assert self.
queuequeue
in self.
qavailqavail, (
"ERROR: PBSProCheyenne requires queue to be any of ",self.
qavailqavail)
112 self.
memorymemory = conf.get(
'memory',109)
113 assert self.
memorymemory
in self.
mavailmavail, (
"ERROR: PBSProCheyenne requires memory (in GB) to be any of", self.
mavailmavail)
117 '#PBS -N '+self.
namename,
118 '#PBS -A '+self.
accountaccount,
119 '#PBS -q '+self.
queuequeue,
120 '#PBS -l select='+str(self.
nnodennode)+
':ncpus='+str(self.
nppernodenppernode)+
':mpiprocs='+str(self.
nppernodenppernode)+
':mem='+str(self.
memorymemory)+
'GB',
121 '#PBS -l walltime='+self.
walltimewalltime,
124 '#PBS -o '+self.
ologolog,
125 '#PBS -e '+self.
elogelog,
133 SLURM job script on Casper
134 unique config elements compared to base class:
135 account - casper account for charging
136 partition - name of casper partition (see pavail)
137 memory - amount of memory requested per node (see maxmemory)
139 NOTE: Casper has a maximum of 36 processors available per node
149 self.
accountaccount = conf.get(
'account',
'NMMM0015')
150 self.
partitionpartition = conf.get(
'partition',
'dav')
151 assert self.
partitionpartition
in self.
pavailpavail, (
"ERROR: SLURMCasper requires partition to be any of ",self.
pavailpavail)
152 self.
memorymemory = conf.get(
'memory',300)
153 assert self.
memorymemory <= self.
maxmemorymaxmemory, (
"ERROR: SLURMCasper requires memory (in GB) to be <= ", self.
maxmemorymaxmemory)
158 '#SBATCH --job-name='+self.
namename,
159 '#SBATCH --account='+self.
accountaccount,
160 '#SBATCH --ntasks='+str(self.
nnodennode),
161 '#SBATCH --cpus-per-task='+str(self.
nppernodenppernode),
162 '#SBATCH --mem='+str(self.
memorymemory)+
'G',
163 '#SBATCH --time='+self.
walltimewalltime,
164 '#SBATCH --partition='+self.
partitionpartition,
165 '#SBATCH --output='+self.
ologolog,
173 'cheyenne': PBSProCheyenne,
175 'chadmin': PBSProCheyenne,
177 'casper': SLURMCasper
183 conf[
'sysname'] = subprocess.run([
'uname',
'-n'],
184 stdout=subprocess.PIPE).stdout.decode(
'utf-8')
187 for key, jobclass
in JobScriptDict.items():
188 if key
in conf[
'sysname']:
189 return jobclass(conf)
env
submission descriptors
def JobScriptFactory(conf)