forked from provakar1994/jlab-HPC
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsubmit-simc-g4sbs-digi-replay-jobs.sh
executable file
·310 lines (272 loc) · 13.1 KB
/
submit-simc-g4sbs-digi-replay-jobs.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
#!/bin/bash
# ------------------------------------------------------------------------- #
# This script runs SIMC events on ifarm and then uses the output ROOT files #
# to submit corresponding g4sbs, sbsdig, and replay jobs to the batch farm. #
# There is a flag that can be set to run all the jobs on ifarm as well. #
# --------- #
# P. Datta <[email protected]> CREATED 04-19-2023 #
# --------- #
# ** Do not tamper with this sticker! Log any updates to the script below. #
# --------- #
# S. Seeds <[email protected]> Added version control machinery #
# ------------------------------------------------------------------------- #
# ------------------- Notes and Instructions (READ BEFORE EXECUTION) -------------------- #
# --------------------------------------------------------------------------------------- #
# 1. This script takes 5 arguments: #
# a. SIMC infile w/o file extention. Must be located at $SIMC/infiles directory. #
# b. SBS configuration (Valid options: GMN4,GMN7,GMN11,GMN14,GMN8,GMN9,GEN2,GEN3,GEN4) #
# c. First job id. #
# d. Total no. of jobs to submit. #
# e. Flag to force all jobs to run on ifarm. (1=>YES) Very useful for debugging. #
# 2. Total no. of events applies to both SIMC and g4sbs for consistency. #
# 3. Be sure to edit "workflowname" variable appropriately before executing script. #
# 4. Be sure to edit "outdirpath" variable appropriately before executing script. #
# 5. After all the SIMC jobs are finished a summary CSV file, $infile_summary.csv get #
# created and kept in $outdirpath/simcoutdir, which contain the important #
# normalization factors for all jobs. #
# 6. List of interdependencies: utility.py, run-g4sbs-w-simc.sh, run-sbsdig.sh, run- #
# simc.sh, run-digi-replay.sh | All these scripts must be present in the $SCRIPT_DIR #
# --------------------------------------------------------------------------------------- #
# Setting necessary environments via setenv.sh
source setenv.sh
# Set path to version information
USER_VERSION_PATH="$SCRIPT_DIR/misc/version_control/user_env_version.conf"
# Check to verify information is at location and update as necessary
$SCRIPT_DIR/misc/version_control/check_and_update_versions.sh
# ------ Variables needed to be set properly for successful execution ------ #
# -------------------------------------------------------------------------- #
# SIMC input file (don't add file extension). Must be located at $SIMC/infiles.
# G4SBS macro should have same name as SIMC input file just with different
# file extention and should be located at $G4SBS/scripts.
infile=$1
sbsconfig=$2 # SBS configuration (Valid options: 4,7,11,14,8,9
nevents=$3 # No. of SIMC (and g4sbs) events to generate
fjobid=$4 # first job id
njobs=$5 # total no. of jobs to submit
run_on_ifarm=$6 # 1=>Yes (If true, runs all jobs on ifarm)
# ----/\---- Above variables are taken as arguments to this script ---/\---- #
# Workflow name
workflowname=
# Specify a directory on volatile to store simc, g4sbs, sbsdig, & replayed outfiles.
# Working on a single directory is convenient & safe for the above mentioned
# four processes to run coherently without any error.
outdirpath=
# -------------------------------------------------------------------------- #
# ------ Variables to allocate time and memory for each type of jobs ------ #
# -------------------------------------------------------------------------- #
# SIMC jobs
SIMCJOBram='100MB'
SIMCJOBdisk='250MB'
SIMCJOBtime='6h'
# g4sbs jobs
G4SBSJOBram='1200MB'
G4SBSJOBdisk='1GB'
G4SBSJOBtime='24h'
# sbsdig jobs
SBSDIGJOBram='1200MB'
SBSDIGJOBdisk='100MB'
SBSDIGJOBtime='6h'
# replay jobs
REPLAYJOBram='1200MB'
REPLAYJOBdisk='1GB'
REPLAYJOBtime='6h'
# -------------------------------------------------------------------------- #
# Sanity check 0: Checking the environments
if [[ ! -d $SCRIPT_DIR ]]; then
echo -e '\nERROR!! Please set "SCRIPT_DIR" path properly in setenv.sh script!\n'; exit;
elif [[ ! -d $SIMC ]]; then
echo -e '\nERROR!! Please set "SIMC" path properly in setenv.sh script!\n'; exit;
elif [[ ! -d $G4SBS ]]; then
echo -e '\nERROR!! Please set "G4SBS" path properly in setenv.sh script!\n'; exit;
elif [[ ! -d $LIBSBSDIG ]]; then
echo -e '\nERROR!! Please set "LIBSBSDIG" path properly in setenv.sh script!\n'; exit;
elif [[ (! -d $ANALYZER) && ($useJLABENV -eq 1) ]]; then
echo -e '\nERROR!! Please set "ANALYZER" path properly in setenv.sh script!\n'; exit;
elif [[ ! -d $SBSOFFLINE ]]; then
echo -e '\nERROR!! Please set "SBSOFFLINE" path properly in setenv.sh script!\n'; exit;
elif [[ ! -d $SBS_REPLAY ]]; then
echo -e '\nERROR!! Please set "SBS_REPLAY" path properly in setenv.sh script!\n'; exit;
fi
# Sanity check 1: Validating the number of arguments provided
if [[ "$#" -ne 6 ]]; then
echo -e " \n --!!--\n ERROR! Illegal number of arguments!! \n ------"
echo -e " This script takes 6 arguments: <infile> <sbsconfig> <fjobid> <njobs> <run_on_ifarm>"
echo -e " 1. <infile> : SIMC infile w/o file extention. Must be located at SIMC/infiles directory."
echo -e " 2. <sbsconfig> : SBS configuration (Valid options: GMN4,GMN7,GMN11,GMN14,GMN8,GMN9,GEN2,GEN3,GEN4)."
echo -e " 3. <nevents> : No. of SIMC (and g4sbs) events to generate per job."
echo -e " 4. <fjobid> : First job id."
echo -e " 5. <njobs> : Total no. of jobs to submit."
echo -e " 6. <run_on_ifarm> : 1=>Yes (If true, runs all jobs on ifarm)"
echo -e " ------"
echo -e ' ** Make sure "workflowname" & "outdirpath" variables are set properly in the script.'
echo -e ' ** Read the "Notes and Instructions" block at the top of script for more information.\n'
exit;
else
echo -e '\n------'
echo -e ' Check the following variable(s):'
if [[ $run_on_ifarm -ne 1 ]]; then
echo -e ' "workflowname" : '$workflowname''
fi
echo -e ' "outdirpath" : '$outdirpath' \n------'
while true; do
read -p "Do they look good? [y/n] " yn
echo -e ""
case $yn in
[Yy]*)
break; ;;
[Nn]*)
if [[ $run_on_ifarm -ne 1 ]]; then
read -p "Enter desired workflowname : " temp1
workflowname=$temp1
fi
read -p "Enter desired outdirpath : " temp2
outdirpath=$temp2
break; ;;
esac
done
fi
# Sanity check 2: Create the output directory if necessary
if [[ ! -d $outdirpath ]]; then
{ #try
mkdir $outdirpath
} || { #catch
echo -e "\n!!!!!!!! ERROR !!!!!!!!!"
echo -e $outdirpath "doesn't exist and cannot be created!\n"
exit;
}
fi
# Sanity check 3: Check for the existance of SIMC infile
simcmacro=$SIMC'/infiles/'$infile'.inp'
if [[ ! -f $simcmacro ]]; then
echo -e "\n!!!!!!!! ERROR !!!!!!!!!"
echo -e "SIMC infile, $simcmacro, doesn't exist! Aborting!\n"
exit;
fi
# Sanity check 4: Finding matching G4SBS preinit macro for SIMC infile
g4sbsmacro=$G4SBS'/scripts/'$infile'.mac'
if [[ ! -f $g4sbsmacro ]]; then
echo -e "\n!!!!!!!! ERROR !!!!!!!!!"
echo -e "G4SBS preinit macro, $g4sbsmacro, doesn't exist! Aborting!\n"
exit;
fi
# Sanity check 5: Check SIMC input file character count
charcount=$(echo -n $infile | wc -c)
if [[ $charcount -gt 100 ]]; then
echo -e "\n!!!!!!!! ERROR !!!!!!!!!"
echo -e "SIMC infile name must have < 100 characters.."
echo -e "Given infile, $infile, has $charcount characters!"
echo -e "Aborting.."
exit;
fi
# Creating a sub-directory (simcout) to keep all the SIMC outputs in one place
export simcoutdir=$outdirpath'/simcout'
if [[ ! -d $simcoutdir ]]; then
mkdir $simcoutdir
fi
# # Creating a CSV file to write a summary table of normalization factors by job
# simcnormtable=$simcoutdir'/'$infile'_summary.csv'
# Reading SIMC infile ("ngen" flag) to determine no. of g4sbs events to generate
#nevents=$(python3 $SCRIPT_DIR'/'utility.py 'grab_simc_param_value' $simcmacro 'ngen')
if [[ $nevents -lt 0 ]]; then
echo -e "\n!!!!!!!! ERROR !!!!!!!!!"
echo -e "Illegal no. of events! nevents = $nevents | Aborting!\n"
exit;
else
echo -e "\n ** $nevents SIMC (and g4sbs) events will be generated per job!"
fi
# Creating the workflow
if [[ $run_on_ifarm -ne 1 ]]; then
swif2 create $workflowname
else
echo -e "\nRunning all jobs on ifarm!\n"
fi
# Choosing the right GEM config for digitization
gemconfig=0
if [[ ($sbsconfig == GMN4) || ($sbsconfig == GMN7) ]]; then
gemconfig=12
elif [[ $sbsconfig == GMN11 ]]; then
gemconfig=10
elif [[ ($sbsconfig == GMN14) || ($sbsconfig == GMN8) || ($sbsconfig == GMN9) || ($sbsconfig == GEN2) || ($sbsconfig == GEN3) || ($sbsconfig == GEN4) ]]; then
gemconfig=8
else
echo -e "Enter valid SBS config! Valid options: GMN4,GMN7,GMN11,GMN14,GMN8,GMN9,GEN2,GEN3,GEN4"
exit;
fi
# Loop to create jobs
for ((i=$fjobid; i<$((fjobid+njobs)); i++))
do
# submitting SIMC jobs
simcjobname=$infile'_simc_job_'$i
randomseed=$(od -An -N3 -i /dev/urandom)
simcscript=$SCRIPT_DIR'/run-simc.sh'' '$infile' '$nevents' '$randomseed' '$i' '$simcoutdir' '$run_on_ifarm' '$SIMC' '$SCRIPT_DIR' '$ANAVER' '$useJLABENV' '$JLABENV
if [[ $run_on_ifarm -ne 1 ]]; then
swif2 add-job -workflow $workflowname -partition production -name $simcjobname -cores 1 -disk $SIMCJOBdisk -ram $SIMCJOBram -time $SIMCJOBtime $simcscript
else
$simcscript
fi
simcoutfile=$simcoutdir'/'$infile'_job_'$i'.root'
# submitting g4sbs jobs using SIMC outfiles
outfilebase=$infile'_job_'$i
postscript=$infile'_job_'$i'.mac'
g4sbsjobname=$infile'_g4sbs_job_'$i
g4sbsscript=$SCRIPT_DIR'/run-g4sbs-w-simc.sh'' '$infile' '$postscript' '$nevents' '$outfilebase' '$outdirpath' '$simcoutfile' '$run_on_ifarm' '$G4SBS' '$ANAVER' '$useJLABENV' '$JLABENV
if [[ $run_on_ifarm -ne 1 ]]; then
swif2 add-job -workflow $workflowname -antecedent $simcjobname -partition production -name $g4sbsjobname -cores 1 -disk $G4SBSJOBdisk -ram $G4SBSJOBram -time $G4SBSJOBtime $g4sbsscript
else
$g4sbsscript
fi
# now, it's time for digitization
txtfile=$infile'_job_'$i'.txt'
sbsdigjobname=$infile'_digi_job_'$i
sbsdiginfile=$outdirpath'/'$outfilebase'.root'
sbsdigscript=$SCRIPT_DIR'/run-sbsdig.sh'' '$txtfile' '$sbsdiginfile' '$gemconfig' '$run_on_ifarm' '$G4SBS' '$LIBSBSDIG' '$ANAVER' '$useJLABENV' '$JLABENV
if [[ $run_on_ifarm -ne 1 ]]; then
swif2 add-job -workflow $workflowname -antecedent $g4sbsjobname -partition production -name $sbsdigjobname -cores 1 -disk $SBSDIGJOBdisk -ram $SBSDIGJOBram -time $SBSDIGJOBtime $sbsdigscript
else
$sbsdigscript
fi
# finally, lets replay the digitized data
digireplayinfile=$infile'_job_'$i
digireplayjobname=$infile'_digi_replay_job_'$i
digireplayscript=$SCRIPT_DIR'/run-digi-replay.sh'' '$digireplayinfile' '$sbsconfig' '-1' '$outdirpath' '$run_on_ifarm' '$ANALYZER' '$SBSOFFLINE' '$SBS_REPLAY' '$ANAVER' '$useJLABENV' '$JLABENV
if [[ $run_on_ifarm -ne 1 ]]; then
swif2 add-job -workflow $workflowname -antecedent $sbsdigjobname -partition production -name $digireplayjobname -cores 1 -disk $REPLAYJOBdisk -ram $REPLAYJOBram -time $REPLAYJOBtime $digireplayscript
else
$digireplayscript
fi
done
# # keep a copy of SIMC job summary file in the $outdirpath as well
# cp $simcnormtable $outdirpath
# add a copy of the version control to simcout for traceability
# Define the path for the version file within the output directory
VERSION_FILE="$simcoutdir/${infile}_version.txt"
# Function to append version information to the file
append_version_info() {
# Add the date and time of creation to the version file
echo "# Version file created on $(date '+%Y-%m-%d %H:%M:%S')" >> "$VERSION_FILE"
# Add the configured run range to the version file
ljobid=$((fjobid + njobs))
echo "# This run range from $fjobid to $ljobid" >> "$VERSION_FILE"
# Append the contents of last_update.conf to the version file
echo "" >> "$VERSION_FILE" # Add an empty line for readability
cat "$USER_VERSION_PATH" >> "$VERSION_FILE"
echo "" >> "$VERSION_FILE" # Add an empty line for readability
}
# Check if the VERSION_FILE already exists
if [ -f "$VERSION_FILE" ]; then
# VERSION_FILE exists, append new version information
echo "Appending version information to existing $VERSION_FILE"
append_version_info
else
# VERSION_FILE does not exist, create it and add version information
echo "Creating new $VERSION_FILE and adding version information"
touch "$VERSION_FILE" # Ensure the file exists before appending
append_version_info
fi
echo "Version information has been saved to $VERSION_FILE"
# run the workflow and then print status
if [[ $run_on_ifarm -ne 1 ]]; then
swif2 run $workflowname
echo -e "\n Getting workflow status.. [may take a few minutes!] \n"
swif2 status $workflowname
fi