2 # dqsub submits jobs using qsub with better options
3 # and is released under the terms of the GNU GPL version 3, or any
4 # later version, at your option. See the file README and COPYING for
6 # Copyright 2014 by Don Armstrong <don@donarmstrong.com>.
17 dqsub - submits jobs using qsub with better options
24 --queue, -q Queue to use
25 --interactive, -I call qsub interactively
27 --array array mode (one of 'chdir' or 'xargs' or '')
28 --array-from file to read arrays from (default STDIN)
29 --array-per-job number of array items to handle in each job (default 1)
30 --array-all-in-one-job Run all of the array items in one job
31 --ppn processors per node to use
32 --mem memory to request
33 --dir Directory to run the script in (default current directory)
34 --name, -N Name of the job
35 --debug, -d debugging level (Default 0)
36 --help, -h display this help
37 --man, -m display manual
45 This describes how dqsub will generate array jobs.
47 If no B<--array> is given, then the command and any additional
48 arguments given will be run using qsub.
50 If B<--array> is C<chdir>, then each line of the input given in
51 B<--array-from> will be used as a directory and the command and any
52 additional arguments given will run in each directory.
54 If B<--array> is C<xargs>, then each line of the input given will be
55 considered to be an additional argument which will be given to the
56 command run in the current directory.
60 File to read array arguments from. If not provided, and B<--array> is
61 given, arguments will be read from STDIN.
65 Debug verbosity. (Default 0)
69 Display brief usage information.
84 use Cwd qw(getcwd abs_path);
86 use List::Util qw(min);
# Default values for the command-line options; one node is requested
# unless the caller overrides it.
89 my %options = (nodes => 1,
# NOTE(review): the strings below look like Getopt::Long option
# specifications (name|alias, then =s string / =i integer / ! negatable /
# + incrementing); the call that consumes them is not visible here -- confirm.
# Array-job controls: where the items come from, how many items each job
# handles, an optional slot limit, and the "everything in one job" switch.
104 'array_from|array-from=s',
105 'array_per_job|array-per-job=i',
106 'array_slot_limit|array-slot-limit=i',
107 'array_all_in_one_job|array-all-in-one-job!',
# Processors per node; stored under the key "ppn".
108 'ppn|processors-per-node=i',
112 'debug|d+','help|h|?','man|m');
114 # pod2usage() if $options{help};
115 # pod2usage({verbose=>2}) if $options{man};
# Validate the parsed options.  Every problem found is appended to
# @USAGE_ERRORS so that all of them are reported together before exiting.
#
# Canonicalise --array first: lower-case it and treat an empty string as
# "not given".  Later code compares the value with exact strings such as
# 'chdir' and tests it with defined(), so it must be normalised even when
# the validity check below passes.
$options{array} = (defined($options{array}) && length($options{array})) ? lc($options{array}) : undef;
117 $DEBUG = $options{debug};
# A command is required unless an interactive session was requested.
120 if (not @ARGV and not $options{interactive}) {
121 push @USAGE_ERRORS,"You must provide a command to run";
123 if (defined $options{array} and $options{array} !~ /^(?:|chdir|xargs)$/i) {
124 push @USAGE_ERRORS,"--array must be one of chdir, xargs or '' if provided";
125 $options{array} = lc($options{array});
126 if ($options{array} eq '') {
127 $options{array} = undef;
# An interactive session takes no command.
130 if ($options{interactive} and @ARGV) {
131 push @USAGE_ERRORS,"Don't provide commands when you're asking for an interactive shell";
134 # pod2usage(join("\n",@USAGE_ERRORS)) if @USAGE_ERRORS;
# Report all errors, newline-terminated, and always exit non-zero; the
# exit must not depend on whether the print itself succeeded.
135 if (@USAGE_ERRORS) { print STDERR join("\n",@USAGE_ERRORS)."\n"; exit 1; }
137 # OK. Generate the options to qsub which we'll be using
138 my @qsub_options = generate_qsub_options(\%options,\@ARGV);
# Interactive mode: this process is replaced by qsub, so no job script is
# generated.
140 if ($options{interactive}) {
141 print STDERR 'running: qsub '.join(' ',@qsub_options)."\n" if $DEBUG;
# exec only returns when it failed; report that instead of silently
# carrying on into the batch-submission code.
142 exec('qsub',@qsub_options) or die "Unable to exec qsub: $!";
145 if ($options{array}) {
146 @array = read_array_options(\%options);
147 # the -t option gives the range of elements for an array job
148 if ($options{array_all_in_one_job}) {
149 $options{array_per_job} = scalar @array;
# One array element per group of array_per_job items, rounded up.
151 push @qsub_options,'-t','1-'. ceil(scalar @array / $options{array_per_job});
# An optional slot limit is appended to the -t range as "%N".
152 if ($options{array_slot_limit}) {
153 $qsub_options[$#qsub_options] .= '%'.$options{array_slot_limit};
# Generate the job script and hand it, with the collected switches, to qsub.
157 call_qsub(\@qsub_options,write_qsub_script(\%options,\@ARGV,\@array));
# Build the list of command-line switches passed to qsub.
#   $options - hashref of parsed options (queue, dir, nodes, ppn, mem,
#              interactive and name are read in the lines shown)
#   $args    - arrayref of the command words; in the lines shown it is
#              used only to derive a job name
160 sub generate_qsub_options{
161 my ($options,$args) = @_;
# -q is added only when a non-empty queue was given.
163 if (defined $options->{queue} and length $options->{queue}) {
164 push @qo,'-q',$options->{queue};
# -d: the directory option resolved to an absolute path ...
166 if (defined $options->{dir}) {
167 push @qo,'-d',abs_path($options->{dir});
# ... or the current working directory.
169 push @qo,'-d',getcwd;
171 ## handle the -l options
173 push @l, 'nodes='.$options->{nodes};
# ppn is attached to the nodes entry itself (nodes=N:ppn=M) rather than
# being a separate resource.
174 if (defined $options->{ppn}) {
175 $l[$#l] .= ':ppn='.$options->{ppn};
177 if ($options->{mem}) {
178 push @l,'mem='.$options->{mem};
# All resource requests go into a single comma-separated -l switch.
180 push @qo,'-l',join(',',@l) if @l;
181 if ($options->{interactive}) {
# An explicitly given name is used as the job name.
184 if ($options->{name}) {
185 push @qo,'-N',$options->{name};
# Name built from the first three (or fewer) command words joined by '_'.
187 push @qo,'-N',join('_',@{$args}[0..min($#{$args},2)]);
# Obtain the input for an array job.  When the array_from option names a
# file, that file is opened for reading; failure to open it is fatal.
# NOTE(review): the remainder of this sub is outside this view.
192 sub read_array_options{
195 if (defined $options->{array_from}) {
# Open the named file itself.  The explicit 'r' mode makes IO::File treat
# the first argument purely as a file name, so special characters in it
# are not interpreted as open() mode characters.
196 $fh = IO::File->new($options->{array_from},'r') or
197 die "Unable to open $options->{array_from} for reading: $!";
# Arguments: an arrayref of qsub switches and the text of the job script.
208 my ($qsub_options,$script) = @_;
# Start qsub with the given switches followed by '-' and open a pipe to
# its standard input.  This is the list form of a piped open, so the
# arguments are passed to qsub directly without going through a shell.
# NOTE(review): the trailing '-' presumably makes qsub read the script
# from standard input -- confirm against the qsub in use.
210 open $qsub_fh,'|-','qsub',@{$qsub_options},'-' or
211 die "Unable to start qsub: $!";
# Send the script text down the pipe; a failed write is fatal.
212 print {$qsub_fh} $script or
213 die "Unable to print to qsub: $!";
215 die "Unable to close qsub filehandle: $!";
# Generate the text of the bash script that is submitted to qsub.
#   $opt   - hashref of parsed options (array and array_per_job are read
#            in the lines shown)
#   $arg   - arrayref holding the command and its arguments
#   $array - arrayref of array items
218 sub write_qsub_script {
219 my ($opt,$arg,$array) = @_;
221 my $script = "#!/bin/bash\n";
# Single-quote every word for the shell.  An embedded single quote is
# emitted as '\'' (close the quote, add an escaped quote, reopen), so an
# argument containing quotes cannot end the quoting early.  The word is
# copied first so the caller's array is not modified through $_.
222 my $command = join(' ',map {(my $word = $_) =~ s/'/'\\''/g; qq('$word')} @{$arg});
224 # this script was written by dqsub
226 if (defined $opt->{array}) {
# Array mode: the items are joined one per line, and their count is kept
# as the upper bound for the job-number check in the generated script.
227 my @subshell = ('','');
228 my $array_opt = join("\n",@{$array});
229 my $max_array = scalar @{$array};
230 my $apjm1 = $opt->{array_per_job} - 1;
231 if ($opt->{array_per_job} > 1) {
232 # we will use subshells if there are more than one array
234 @subshell = ('(',')');
236 for i in \$(seq 1 $opt->{array_per_job}); do
237 # in some cases, the jobs aren't going to come out evenly. Handle that.
238 JOBNUM=\$(( \${PBS_ARRAYID:=1} * $opt->{array_per_job} + \$i - $opt->{array_per_job} ))
239 if [ \$JOBNUM -le $max_array ]; then
240 OPT=\$(sed -n -e "\$JOBNUM p"<<'_HERE_DOC_END_'
244 OPT=\$(sed -n -e "\${PBS_ARRAYID:=1} p"<<'_HERE_DOC_END_'
252 if ($opt->{array} eq 'chdir') {
262 exec ${command} "\$OPT";
266 if ($opt->{array_per_job} > 1) {
274 # there's no array, so just executing the command with arguments