Module: CodeRunner::Moab

Included in:
Edison, Franklin, Hector, Iridis
Defined in:
lib/coderunner/system_modules/moab.rb

Class Method Summary collapse

Instance Method Summary collapse

Class Method Details

.configure_environment ⇒ Object



4
5
6
7
8
9
10
11
12
13
# File 'lib/coderunner/system_modules/moab.rb', line 4

# Sets up the shell environment used for building and running codes.
#
# Announces itself through +eputs+, then passes a small bash snippet to
# +Kernel.change_environment_with_shell_script+. The snippet swaps the
# PrgEnv-pgi module for PrgEnv-gnu, loads fftw/3.2.2, exports
# XTPE_LINK_TYPE=dynamic and prepends the GNU xt-libsci directory to
# LD_LIBRARY_PATH.
#
# Returns whatever +Kernel.change_environment_with_shell_script+ returns.
def self.configure_environment
  eputs "Configuring Hector"
  # Single-quoted on purpose: the backticks and $LD_LIBRARY_PATH are meant for
  # the shell that evaluates the snippet, not for Ruby.
  shell_commands = [
    'eval `modulecmd bash swap PrgEnv-pgi PrgEnv-gnu`',
    'eval `modulecmd bash load fftw/3.2.2`',
    'export XTPE_LINK_TYPE=dynamic',
    'export LD_LIBRARY_PATH=/opt/xt-libsci/10.4.1/gnu/lib/44:$LD_LIBRARY_PATH'
  ]
  # Every command, including the last one, is newline-terminated.
  Kernel.change_environment_with_shell_script(shell_commands.map { |cmd| "#{cmd}\n" }.join)
end

Instance Method Details

#batch_script ⇒ Object



71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
# File 'lib/coderunner/system_modules/moab.rb', line 71

# Builds the PBS header (everything up to, but not including, the run command)
# of the job script that is submitted with qsub.
#
# Reads:
#   @nprocs    - String of the form "<nodes>x<cores per node>"; when the
#                "x<cores per node>" part is missing, +max_ppn+ is used.
#   @wall_mins - wall time in minutes (may be nil, in which case no walltime
#                directive is emitted).
#   @project   - budget/project name (may be nil, in which case no "-A"
#                directive is emitted).
#
# Emits warnings through +eputs+ for non-recommended node counts / wall times
# and for under-populated nodes.
#
# Returns the header as a String.
# Raises RuntimeError when more cores per node are requested than +max_ppn+.
def batch_script
  nodes, ppn = @nprocs.split(/x/)
  # Apply the default BEFORE validating: otherwise a missing ppn is treated as
  # 0 and triggers a spurious "Underuse of nodes" warning.
  ppn ||= max_ppn

  unless [8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096].include?(nodes.to_i)
    eputs "Warning: number of nodes is not recommended (8, 16, 32, 64, 128, 256, 512, 1024, 2048 or 4096 recommended)"
    sleep 0.2
  end
  # The wall time is optional, so only comment on it when one was given.
  if @wall_mins && ![20, 60, 180, 360, 720].include?(@wall_mins.to_i)
    eputs "Warning: number of wall mins is not recommended (20, 60, 180, 360, 720 recomended)"
    sleep 0.2
  end
  eputs "Warning: Underuse of nodes (#{ppn} cores per node instead of #{max_ppn})" if ppn.to_i < max_ppn
  raise "Error: cores per node cannot excede #{max_ppn}" if ppn.to_i > max_ppn
#   raise "Error: project (i.e. budget) not specified" unless @project

  walltime_line = ""
  if @wall_mins
    ep @wall_mins
    hours = (@wall_mins / 60).floor
    mins = @wall_mins.to_i % 60
    # A fractional number of minutes becomes the seconds field.
    secs = ((@wall_mins - @wall_mins.to_i) * 60).to_i
    walltime = format("%02d:%02d:%02d", hours, mins, secs)
    # Formatting nil hours/mins/secs would raise, so this message is only
    # printed when a wall time exists.
    eputs "Allotted wall time is " + walltime
    walltime_line = "#PBS -l walltime=#{walltime}"
  end
  project_line = @project ? "#PBS -A #{@project}" : ""
  total_procs = nodes.to_i * ppn.to_i

  # The values are interpolated for real here; with escaped "\#{...}"
  # placeholders the header would contain the placeholder text verbatim.
  # Trailing spaces on some lines are kept as in the original template.
  [
    "#!/bin/bash --login ",
    "#PBS -N #{executable_name}.#{job_identifier}",
    "#PBS -l mppwidth=#{total_procs}",
    "#PBS -l mppnppn=#{ppn}",
    walltime_line,
    project_line,
    "",
    "### start of jobscript ",
    "cd $PBS_O_WORKDIR ",
    "echo \"workdir: $PBS_O_WORKDIR\" ",
    "#{code_run_environment}",
    "",
    "echo \"Submitting #{nodes}x#{ppn} job on #{CodeRunner::SYS} for project #{@project}...\"",
    "",
    ""
  ].join("\n") + "\n"
end

#batch_script_file ⇒ Object



63
64
65
# File 'lib/coderunner/system_modules/moab.rb', line 63

# Name of the shell script that holds the batch job:
# "<executable_name>_<job_identifier>.sh".
def batch_script_file
  format("%s_%s.sh", executable_name, job_identifier)
end

#cancel_job ⇒ Object



108
109
110
111
112
113
114
115
# File 'lib/coderunner/system_modules/moab.rb', line 108

# Cancels the job belonging to this run.
#
# Without a launcher (CODE_RUNNER_LAUNCHER unset or empty) this shells out to
# "qdel <@job_no>" and returns the command's output. With a launcher it
# creates "<launcher_directory>/<pid of this process>.stop" containing a
# single newline and returns nil.
def cancel_job
  return `qdel #{@job_no}` if ENV['CODE_RUNNER_LAUNCHER'].to_s.empty?

  stop_request = "#{CodeRunner.launcher_directory}/#{$$}.stop"
  # A bare puts writes exactly one newline.
  File.open(stop_request, 'w') { |io| io.puts }
end

#error_file ⇒ Object



117
118
119
120
121
122
123
# File 'lib/coderunner/system_modules/moab.rb', line 117

# Name of the file that receives the job's standard error.
#
# With a launcher (CODE_RUNNER_LAUNCHER non-empty) the name is
# "<executable_name>.<job_identifier>.e"; otherwise @job_no is appended to
# that name.
def error_file
  stem = "#{executable_name}.#{job_identifier}.e"
  ENV['CODE_RUNNER_LAUNCHER'].to_s.empty? ? "#{stem}#{@job_no}" : stem
end

#execute ⇒ Object



48
49
50
51
52
53
54
55
56
57
58
59
60
61
# File 'lib/coderunner/system_modules/moab.rb', line 48

# Starts the run and returns an integer identifying it.
#
# Without a launcher (CODE_RUNNER_LAUNCHER unset or empty): writes
# +batch_script+ followed by +run_command+ to +batch_script_file+, submits it
# with qsub and returns qsub's output converted with to_i.
#
# With a launcher: writes a "<launcher_directory>/<epoch seconds><pid>.start"
# file containing "cd <cwd>;<run_command>", polls every 2 seconds until a
# matching ".pid" file exists, then reads the pid from it, deletes the file
# and returns the pid. The wait has no timeout.
def execute
  if ENV['CODE_RUNNER_LAUNCHER'].to_s.empty?
    # The script is assembled inside the block, i.e. after the file has been
    # opened for writing.
    File.open(batch_script_file, 'w') { |script| script.puts "#{batch_script}#{run_command}\n" }
    return %x[qsub #{batch_script_file}].to_i
  end

  request = "#{CodeRunner.launcher_directory}/#{Time.now.to_i}#{$$}"
  pid_file = "#{request}.pid"
  File.open("#{request}.start", 'w') { |io| io.print "cd #{Dir.pwd};", run_command, "\n" }
  # Presumably the launcher picks up the .start file and answers with the
  # .pid file -- that side is not visible here.
  sleep 2 until FileTest.exist?(pid_file)
  launched_pid = File.read(pid_file).to_i
  FileUtils.rm pid_file
  launched_pid
end

#get_run_status(job_no, current_status) ⇒ Object



133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
# File 'lib/coderunner/system_modules/moab.rb', line 133

# Works out the status of job +job_no+ from the text +current_status+.
#
# job_no         - job identifier; its to_s is used as a regular expression.
# current_status - queue listing text to search.
#
# With a launcher (CODE_RUNNER_LAUNCHER non-empty) the job counts as running
# exactly when +current_status+ matches the job number; @running is set
# accordingly and :Running or :Unknown is returned.
#
# Otherwise the first line mentioning the job is inspected for a
# whitespace-delimited state letter (presumably qstat state codes), checked in
# this order: Q -> :Queueing, R -> :Running, H -> :Queueing, C -> :Unknown.
# No matching line at all gives :Unknown.
#
# Raises RuntimeError when the line carries none of those letters.
def get_run_status(job_no, current_status)
  job_pattern = Regexp.new(job_no.to_s)

  unless ENV['CODE_RUNNER_LAUNCHER'].to_s.empty?
    @running = !(current_status =~ job_pattern).nil?
    return @running ? :Running : :Unknown
  end

  job_line = current_status.split(/\n/).find { |entry| entry =~ job_pattern }
  return :Unknown unless job_line

  case job_line
  when /\sQ\s/ then :Queueing
  when /\sR\s/ then :Running
  when /\sH\s/ then :Queueing
  when /\sC\s/ then :Unknown
  else
    ep 'line', job_line
    raise 'Could not get run status'
  end
end

#max_ppn ⇒ Object



67
68
69
# File 'lib/coderunner/system_modules/moab.rb', line 67

# Maximum number of cores per node. This version always raises; judging by
# the message, each system is expected to supply its own definition.
#
# Raises RuntimeError unconditionally.
def max_ppn
  raise RuntimeError, "Please define max_ppn for your system"
end

#mpi_prog ⇒ Object



24
25
26
# File 'lib/coderunner/system_modules/moab.rb', line 24

# The aprun prefix for the run command: "-n" is given +nprocstot+ and "-N"
# is given +ppn+.
def mpi_prog
  format("aprun -n %s -N %s", nprocstot, ppn)
end

#nprocstot ⇒ Object



32
33
34
35
36
# File 'lib/coderunner/system_modules/moab.rb', line 32

# Total number of processes: the product of the first two "x"-separated
# fields of @nprocs, each converted with to_i (a missing field counts as 0).
def nprocstot
  @nprocs.split(/x/).values_at(0, 1).map(&:to_i).inject(:*)
end

#output_file ⇒ Object



125
126
127
128
129
130
131
# File 'lib/coderunner/system_modules/moab.rb', line 125

# Name of the file that receives the job's standard output.
#
# The name is "<executable_name>.<job_identifier>.o", with @job_no appended
# unless a launcher is in use (CODE_RUNNER_LAUNCHER non-empty).
def output_file
  job_suffix = ENV['CODE_RUNNER_LAUNCHER'].to_s.empty? ? @job_no : nil
  "#{executable_name}.#{job_identifier}.o#{job_suffix}"
end

#ppn ⇒ Object



28
29
30
31
# File 'lib/coderunner/system_modules/moab.rb', line 28

# Cores per node as written in @nprocs: the second "x"-separated field,
# returned as a String, or nil when @nprocs has no such field.
def ppn
  @nprocs.split(/x/)[1]
end

#queue_status ⇒ Object



15
16
17
18
19
20
21
22
# File 'lib/coderunner/system_modules/moab.rb', line 15

# Returns the text describing the queue.
#
# Without a launcher (CODE_RUNNER_LAUNCHER unset or empty) this is the output
# of "qstat | grep $USER". With a launcher it is the concatenation of the
# lines containing "sh" from queue_status.txt and queue_status2.txt in
# CodeRunner.launcher_directory.
def queue_status
  return %x[qstat | grep $USER] if ENV['CODE_RUNNER_LAUNCHER'].to_s.empty?

  %w[queue_status.txt queue_status2.txt].map do |status_file|
    %x[cat #{CodeRunner.launcher_directory}/#{status_file} | grep sh]
  end.join
end

#run_command ⇒ Object



37
38
39
40
41
42
43
44
45
46
# File 'lib/coderunner/system_modules/moab.rb', line 37

# Builds the command line that actually starts the executable.
#
# With a launcher (CODE_RUNNER_LAUNCHER non-empty) stdout and stderr are
# redirected to +output_file+ and +error_file+. Otherwise the bare command is
# returned so it can be appended to the batch script (note the two spaces
# after the MPI prefix in that form, kept as in the original).
#
# The node/core layout is supplied entirely by +mpi_prog+; this method does
# not parse @nprocs itself.
#
# Returns the command as a String.
def run_command
  invocation = "#{executable_location}/#{executable_name} #{parameter_string}"
  if ENV['CODE_RUNNER_LAUNCHER'].to_s.empty?
    "#{mpi_prog}  #{invocation}"
  else
    "#{mpi_prog} #{invocation} > #{output_file} 2> #{error_file}"
  end
end