-
Notifications
You must be signed in to change notification settings - Fork 14
/
Copy pathcondor_resubmit.py
78 lines (64 loc) · 3.18 KB
/
condor_resubmit.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
import os
"""Condor resubmit script.
# Three steps to submit condor script
1. Set input information
2. `grep` the **search string** ("preselected entries from root:") from the log files.
1. If it is not present it means jobs failed.
2. \todo check any other signature of the failed jobs and add it.
3. Make list of failed jobs log file.
3. Get the initial 7 lines from the main jdl file on which original jobs was submitted.
1. \todo number 7 in the previous statement is hard-coded. Make it flexible.
4. Add the above 7 lines into new jdl file.
5. To add the failed jobs information in the new jdl file, do following:
1. From the log files check the name of root files that failed.
2. Search the same root file from the main jdl file and grep the corresponding
necessary lines from the main jdl file and add it to the new jdl file.
"""
"""path of log file directory"""
#path = "condor_logs/Run2017_v6_DataReDoJEC/200726_173958/"
#path = "condor_logs/Run2016_v6_DataReDoJEC/200727_064518/"
#path = "condor_logs/Run2018_v6_DataReDoJEC/200730_103313/"
path = "condor_logs/Run2017_v7_5Aug20200/200805_032620/"
"""Name of main condor jdl/sh file name"""
#condor_file_name = "submit_condor_jobs_lnujj_Run2017_v6_DataReDoJEC"
#condor_file_name = "submit_condor_jobs_lnujj_Run2016_v6_DataReDoJEC"
#condor_file_name = "submit_condor_jobs_lnujj_Run2018_v6_DataReDoJEC"
condor_file_name = "submit_condor_jobs_lnujj_Run2017_v7_5Aug20200"
"""This variable `Resubmit_no` is going to append in the new jdl file.
New jdl file name is the main jdl file + _resubmit_ + Resubmit_no
New JDL FILE name : condor_file_name + "_resubmit_" + Resubmit_no
"""
Resubmit_no = "2"
"""This string is going to be searched in the log files.
If this string is not present in the log file this means the jobs are failed.
"""
string_to_search = "preselected entries from root:"
grepCommand = 'grep -L "'+string_to_search+'" '+ path + os.sep +'*_1.stdout'
grepCommand = grepCommand.replace('//','/')
print 'grep command: ',grepCommand
output = os.popen(grepCommand).read()
print('output:')
outjdl_file = open(condor_file_name+'_resubmit_'+Resubmit_no+".jdl","w")
with open(condor_file_name+".jdl") as myfile:
head = [next(myfile) for x in xrange(7)]
for lines in head:
outjdl_file.write(lines)
for lines in output.split():
print "==> ",lines.strip()
# print "==> ",lines.strip().split('/')[-1].replace('.stdout','')
if lines.strip().split('/')[-1].replace('.stdout','').split('_')[-2] == "resubmit":
OldRefFile = lines.strip().split('/')[-1].replace('.stdout','').split('_')[-4]
else:
OldRefFile = lines.strip().split('/')[-1].replace('.stdout','').split('_')[-1]
# print "====> ",OldRefFile
grep_output = os.popen('grep -E "Running.*root" '+lines.strip()).read()
# print grep_output
root_file = grep_output.split()[5].split('/')[-1]
grepCommand_GetJdlInfo = 'grep -A1 -B3 "'+root_file+'" '+condor_file_name+'.jdl'
# print grepCommand_GetJdlInfo
grep_condor_jdl_part = os.popen(grepCommand_GetJdlInfo).read()
updateString = grep_condor_jdl_part.replace('$(Process)',OldRefFile+'_$(Process)'+ '_resubmit_' +Resubmit_no)
# print updateString
outjdl_file.write(updateString)
outjdl_file.close()
print "===> ",outjdl_file