Module: CodeRunner::Moab

Included in:
Edison, Franklin, Hector, Iridis
Defined in:
lib/coderunner/system_modules/moab.rb

Class Method Summary collapse

Instance Method Summary collapse

Class Method Details

.configure_environment ⇒ Object



4
5
6
7
8
9
10
11
12
13
# File 'lib/coderunner/system_modules/moab.rb', line 4

# Announces the configuration step and hands a fixed shell snippet to
# Kernel.change_environment_with_shell_script.
#
# The snippet swaps the PrgEnv-pgi module for PrgEnv-gnu, loads fftw/3.2.2,
# sets XTPE_LINK_TYPE to dynamic and prepends the xt-libsci GNU library
# directory to LD_LIBRARY_PATH.
#
# NOTE(review): the helper presumably applies the resulting environment to
# the current process -- confirm against its definition.
def self.configure_environment
	eputs "Configuring Hector"
	Kernel.change_environment_with_shell_script(<<SHELL_SETUP)
eval `modulecmd bash swap PrgEnv-pgi PrgEnv-gnu`
eval `modulecmd bash load fftw/3.2.2`
export XTPE_LINK_TYPE=dynamic
export LD_LIBRARY_PATH=/opt/xt-libsci/10.4.1/gnu/lib/44:$LD_LIBRARY_PATH
SHELL_SETUP
end

Instance Method Details

#batch_script ⇒ Object



71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
# File 'lib/coderunner/system_modules/moab.rb', line 71

# Builds the header of the PBS batch script as a String.
#
# Reads @nprocs (a "<nodes>x<cores per node>" spec; the cores part may be
# omitted, in which case max_ppn is used), @wall_mins (wall time in minutes,
# may be nil or fractional) and @project (optional budget code).
#
# Emits warnings through eputs for node counts / wall times outside the
# recommended lists and for using fewer cores per node than max_ppn.
#
# Raises RuntimeError when the requested cores per node exceed max_ppn.
def batch_script
	nodes, ppn = @nprocs.split(/x/)
	# Default the cores-per-node BEFORE validating it; otherwise a spec without
	# an "x" part is reported as under-using the nodes with an empty count.
	ppn ||= max_ppn
	unless [8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096].include? nodes.to_i
		eputs "Warning: number of nodes is not recommended (8, 16, 32, 64, 128, 256, 512, 1024, 2048 or 4096 recommended)"
		sleep 0.2
	end
	# Only judge the wall time when one was actually requested.
	if @wall_mins && ![20, 60, 180, 360, 720].include?(@wall_mins.to_i)
		eputs "Warning: number of wall mins is not recommended (20, 60, 180, 360, 720 recomended)"
		sleep 0.2
	end
	eputs "Warning: Underuse of nodes (#{ppn} cores per node instead of #{max_ppn})" if ppn.to_i < max_ppn
	raise "Error: cores per node cannot excede #{max_ppn}" if ppn.to_i > max_ppn
#		raise "Error: project (i.e. budget) not specified" unless @project
	walltime = nil
	if @wall_mins
		ep @wall_mins
		hours = (@wall_mins / 60).floor
		mins = @wall_mins.to_i % 60
		# The fractional part of the minutes becomes whole seconds.
		secs = ((@wall_mins - @wall_mins.to_i) * 60).to_i
		walltime = sprintf("%02d:%02d:%02d", hours, mins, secs)
		# Formatting nil components would raise TypeError, so the message is
		# only printed when a wall time exists.
		eputs "Allotted wall time is " + walltime
	end
	total_procs = nodes.to_i * ppn.to_i
<<EOF
#!/bin/bash --login 
#PBS -N #{executable_name}.#{job_identifier}
#PBS -l mppwidth=#{total_procs}
#PBS -l mppnppn=#{ppn}
#{walltime ? "#PBS -l walltime=#{walltime}" : ""}
#{@project ? "#PBS -A #@project" : ""}

### start of jobscript 
cd $PBS_O_WORKDIR 
echo "workdir: $PBS_O_WORKDIR" 
#{code_run_environment}

echo "Submitting #{nodes}x#{ppn} job on #{CodeRunner::SYS} for project #@project..."


EOF

end

#batch_script_file ⇒ Object



63
64
65
# File 'lib/coderunner/system_modules/moab.rb', line 63

# Name of the batch script file: "<executable_name>_<job_identifier>.sh".
def batch_script_file
	sprintf("%s_%s.sh", executable_name, job_identifier)
end

#cancel_job ⇒ Object



108
109
110
111
112
113
114
115
# File 'lib/coderunner/system_modules/moab.rb', line 108

# Requests cancellation of the job.
#
# When the CODE_RUNNER_LAUNCHER environment variable is set and non-empty, a
# "<pid of this process>.stop" file containing a single newline is written
# into CodeRunner.launcher_directory. Otherwise `qdel` is run on @job_no.
def cancel_job
	launcher = ENV['CODE_RUNNER_LAUNCHER']
	if launcher && !launcher.empty?
		stop_name = "/#{$$}.stop"
		stop_path = CodeRunner.launcher_directory + stop_name
		File.open(stop_path, 'w') do |handle|
			handle.puts "\n"
		end
	else
		`qdel #{@job_no}`
	end
end

#error_file ⇒ Object



117
118
119
120
121
122
123
# File 'lib/coderunner/system_modules/moab.rb', line 117

# Name of the file holding the job's standard error.
#
# With a non-empty CODE_RUNNER_LAUNCHER the name ends in ".e"; otherwise
# @job_no is appended to that suffix.
def error_file
	launcher = ENV['CODE_RUNNER_LAUNCHER']
	suffix = (launcher && launcher.size > 0) ? "e" : "e#@job_no"
	"#{executable_name}.#{job_identifier}.#{suffix}"
end

#execute ⇒ Object



48
49
50
51
52
53
54
55
56
57
58
59
60
61
# File 'lib/coderunner/system_modules/moab.rb', line 48

# Starts the run and returns an Integer identifying it.
#
# Batch mode (CODE_RUNNER_LAUNCHER unset or empty): writes batch_script
# followed by run_command to batch_script_file, submits it with `qsub` and
# returns the leading integer of qsub's output.
#
# Launcher mode: writes a "<epoch seconds><pid>.start" file into
# CodeRunner.launcher_directory containing "cd <cwd>;<run_command>", polls
# every 2 seconds until the matching ".pid" file exists, then reads the pid
# from it, deletes the file and returns the pid.
def execute
	launcher = ENV['CODE_RUNNER_LAUNCHER']
	unless launcher && launcher.size > 0
		File.open(batch_script_file, 'w') do |script|
			script.puts batch_script + run_command + "\n"
		end
		return %x[qsub #{batch_script_file}].to_i
	end

	token = "#{Time.now.to_i}#{$$}"
	base_path = "#{CodeRunner.launcher_directory}/#{token}"
	start_path = base_path + '.start'
	pid_path = base_path + '.pid'
	File.open(start_path, 'w') do |request|
		request.print "cd #{Dir.pwd};", run_command, "\n"
	end
	# No timeout: this waits for as long as it takes the pid file to appear.
	sleep 2 until FileTest.exist? pid_path
	launched_pid = File.read(pid_path).to_i
	FileUtils.rm pid_path
	launched_pid
end

#get_run_status(job_no, current_status) ⇒ Object



133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
# File 'lib/coderunner/system_modules/moab.rb', line 133

# Works out the state of job +job_no+ from +current_status+, the text of a
# queue listing.
#
# job_no::         job identifier; converted with to_s and matched literally.
# current_status:: multi-line String to search.
#
# Launcher mode (CODE_RUNNER_LAUNCHER set and non-empty): returns :Running
# and sets @running to true when the identifier occurs anywhere in the
# listing, otherwise sets @running to false and returns :Unknown.
#
# Batch mode: takes the first line mentioning the identifier and maps its
# state column: Q and H give :Queueing, R gives :Running, C gives :Unknown.
# A job that is not listed gives :Unknown.
#
# Raises RuntimeError when the line carries none of those state letters.
def get_run_status(job_no, current_status)
	# Match the identifier literally and only as a complete number, so that
	# job 123 does not pick up the entry for job 1234.
	job_pattern = /(?<!\d)#{Regexp.escape(job_no.to_s)}(?!\d)/
	launcher = ENV['CODE_RUNNER_LAUNCHER']
	if launcher && !launcher.empty?
		@running = !(current_status =~ job_pattern).nil?
		return @running ? :Running : :Unknown
	end
	line = current_status.split(/\n/).grep(job_pattern)[0]
	return :Unknown unless line
	# The order of the checks is significant when a line contains more than
	# one isolated state letter.
	case line
	when /\sQ\s/ then :Queueing
	when /\sR\s/ then :Running
	when /\sH\s/ then :Queueing
	when /\sC\s/ then :Unknown
	else
		ep 'line', line
		raise 'Could not get run status'
	end
end

#max_ppn ⇒ Object



67
68
69
# File 'lib/coderunner/system_modules/moab.rb', line 67

# Placeholder for the maximum number of cores per node.
#
# Always raises RuntimeError; the message asks for max_ppn to be defined for
# the system in use.
def max_ppn
	raise RuntimeError, "Please define max_ppn for your system"
end

#mpi_prog ⇒ Object



24
25
26
# File 'lib/coderunner/system_modules/moab.rb', line 24

# The aprun launch prefix: "-n" receives nprocstot and "-N" receives ppn.
def mpi_prog
	total = nprocstot
	per_node = ppn
	"aprun -n #{total} -N #{per_node}"
end

#nprocstot ⇒ Object



32
33
34
35
36
# File 'lib/coderunner/system_modules/moab.rb', line 32

# Total process count: the first two "x"-separated fields of @nprocs
# multiplied together as integers. A missing second field counts as 0.
def nprocstot
	node_count, cores_per_node = @nprocs.split(/x/)
	node_count.to_i * cores_per_node.to_i
end

#output_file ⇒ Object



125
126
127
128
129
130
131
# File 'lib/coderunner/system_modules/moab.rb', line 125

# Name of the file holding the job's standard output.
#
# With a non-empty CODE_RUNNER_LAUNCHER the name ends in ".o"; otherwise
# @job_no is appended to that suffix.
def output_file
	launcher = ENV['CODE_RUNNER_LAUNCHER']
	suffix = (launcher && launcher.size > 0) ? "o" : "o#@job_no"
	"#{executable_name}.#{job_identifier}.#{suffix}"
end

#ppn ⇒ Object



28
29
30
31
# File 'lib/coderunner/system_modules/moab.rb', line 28

# The second "x"-separated field of @nprocs as a String, or nil when @nprocs
# contains no such field.
def ppn
	@nprocs.split(/x/)[1]
end

#queue_status ⇒ Object



15
16
17
18
19
20
21
22
# File 'lib/coderunner/system_modules/moab.rb', line 15

# Returns the raw queue listing as a String.
#
# Batch mode (CODE_RUNNER_LAUNCHER unset or empty): the output of
# `qstat | grep $USER`.
#
# Launcher mode: the lines containing "sh" from queue_status.txt followed by
# those from queue_status2.txt, both read from CodeRunner.launcher_directory.
def queue_status
	launcher = ENV['CODE_RUNNER_LAUNCHER']
	return %x[qstat | grep $USER] unless launcher && launcher.size > 0

	first_listing = %x[cat #{CodeRunner.launcher_directory}/queue_status.txt | grep sh]
	second_listing = %x[cat #{CodeRunner.launcher_directory}/queue_status2.txt | grep sh]
	first_listing + second_listing
end

#run_command ⇒ Object



37
38
39
40
41
42
43
44
45
46
# File 'lib/coderunner/system_modules/moab.rb', line 37

# Returns the shell command that starts the executable.
#
# Both forms consist of mpi_prog, the executable path
# (executable_location/executable_name) and parameter_string. In launcher
# mode (CODE_RUNNER_LAUNCHER set and non-empty) stdout and stderr are also
# redirected to output_file and error_file.
def run_command
	launcher = ENV['CODE_RUNNER_LAUNCHER']
	if launcher && !launcher.empty?
		%[#{mpi_prog} #{executable_location}/#{executable_name} #{parameter_string} > #{output_file} 2> #{error_file}]
	else
		# The process counts come from mpi_prog; nothing here needs to parse
		# @nprocs again. The double space after mpi_prog is kept as it was.
		"#{mpi_prog}  #{executable_location}/#{executable_name} #{parameter_string}"
	end
end