forked from ram1123/nanoAOD_skim
-
Notifications
You must be signed in to change notification settings - Fork 0
/
condor_setup.py
171 lines (155 loc) · 8.33 KB
/
condor_setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
import subprocess
import os
import sys
sys.path.append("Utils/python_utils/.")
from color_style import style
# Variables to be changed by user
#StringToChange = "Run2016_v6_15June2020_MatteoWJetBinned"
#StringToChange = "Run2018_v6_DataReDoJEC"
StringToChange = "Run2017_v7_18Aug2020_Hadd"
customEOS = False
customEOS_cmd = 'eos root://cmseos.fnal.gov find -name "*.root" /store/group/lnujj/VVjj_aQGC/custom_nanoAOD'
#InputFileFromWhereReadDASNames = 'sample_list_v6_2016_campaign.dat'
#InputFileFromWhereReadDASNames = 'sample_list_v6_2017_campaign.dat'
#InputFileFromWhereReadDASNames = 'sample_list_v6_2018_campaign.dat'
#InputFileFromWhereReadDASNames = 'sample_list_v7_2016_campaign.dat'
#InputFileFromWhereReadDASNames = 'sample_list_v7_2017_eos_custom.dat'
InputFileFromWhereReadDASNames = 'sample_list_v7_2017_campaign.dat'
Initial_path = '/eos/uscms/store/user/lnujj/VVjj_aQGC/nanoAOD_skim/'
Initial_path += StringToChange
condor_file_name = 'submit_condor_jobs_lnujj_'+StringToChange
# Create log files
import infoCreaterGit
SumamryOfCurrentSubmission = raw_input("\n\nWrite summary for current job submission: ")
infoLogFiles = infoCreaterGit.BasicInfoCreater('summary.dat',SumamryOfCurrentSubmission)
infoLogFiles.GenerateGitPatchAndLog()
# Get CMSSW directory path and name
cmsswDirPath = os.environ['CMSSW_BASE']
CMSSWRel = cmsswDirPath.split("/")[-1]
# Create directories for storing log files and output files at EOS.
import fileshelper
dirsToCreate = fileshelper.FileHelper('condor_logs/'+StringToChange, Initial_path)
output_log_path = dirsToCreate.CreateLogDirWithDate()
storeDir = dirsToCreate.CreateSotreArea(Initial_path)
dirName = dirsToCreate.dirName
# create tarball of present working CMSSW base directory
os.system('rm -f CMSSW*.tgz')
import makeTarFile
makeTarFile.make_tarfile(cmsswDirPath, CMSSWRel+".tgz")
print "copying the "+CMSSWRel+".tgz file to eos path: "+storeDir+"\n"
os.system('xrdcp -f ' + CMSSWRel+".tgz" + ' root://cmseos.fnal.gov/'+storeDir+'/' + CMSSWRel+".tgz")
post_proc_to_run = "post_proc.py"
command = "python "+post_proc_to_run
Transfer_Input_Files = ("Cert_271036-284044_13TeV_PromptReco_Collisions16_JSON.txt, " +
"Cert_294927-306462_13TeV_PromptReco_Collisions17_JSON.txt, " +
"Cert_314472-325175_13TeV_PromptReco_Collisions18_JSON.txt, " +
"keep_and_drop_data.txt")
#with open('input_data_Files/sample_list_v6_2017_campaign.dat') as in_file:
with open('input_data_Files/'+InputFileFromWhereReadDASNames) as in_file:
outjdl_file = open(condor_file_name+".jdl","w")
outjdl_file.write("Executable = "+condor_file_name+".sh\n")
outjdl_file.write("Universe = vanilla\n")
outjdl_file.write("Notification = ERROR\n")
outjdl_file.write("Should_Transfer_Files = YES\n")
outjdl_file.write("WhenToTransferOutput = ON_EXIT\n")
outjdl_file.write("Transfer_Input_Files = "+Transfer_Input_Files + ", " + post_proc_to_run+"\n")
outjdl_file.write("x509userproxy = $ENV(X509_USER_PROXY)\n")
count = 0
count_jobs = 0
for lines in in_file:
if lines[0] == "#": continue
count = count +1
#if count > 1: break
print(style.RED +"="*51+style.RESET+"\n")
print "==> Sample : ",count
sample_name = lines.split('/')[1]
campaign = lines.split('/')[2].split('-')[0]
print "==> sample_name = ",sample_name
print "==> campaign = ",campaign
########################################
#
# Create output directory
#
########################################
if sample_name.find("SingleMuon") != -1 or sample_name.find("SingleElectron") != -1 or sample_name.find("EGamma") != -1 or sample_name.find("DoubleMuon") != -1 or sample_name.find("MuonEG") != -1 or sample_name.find("DoubleEG") != -1:
output_string = sample_name + os.sep + campaign + os.sep + dirName
output_path = Initial_path + os.sep + output_string
os.system("xrdfs root://cmseos.fnal.gov/ mkdir "+Initial_path + os.sep + sample_name)
os.system("xrdfs root://cmseos.fnal.gov/ mkdir "+Initial_path + os.sep + sample_name + os.sep + campaign)
os.system("xrdfs root://cmseos.fnal.gov/ mkdir "+ Initial_path + os.sep + sample_name + os.sep + campaign + os.sep + dirName)
infoLogFiles.SendGitLogAndPatchToEos(Initial_path + os.sep + sample_name + os.sep + campaign + os.sep + dirName)
else:
output_string = sample_name+os.sep+dirName
output_path = Initial_path+ os.sep + output_string
os.system("xrdfs root://cmseos.fnal.gov/ mkdir "+Initial_path + os.sep + sample_name)
os.system("xrdfs root://cmseos.fnal.gov/ mkdir "+Initial_path + os.sep + sample_name+os.sep+dirName)
infoLogFiles.SendGitLogAndPatchToEos(Initial_path + os.sep + sample_name + os.sep + dirName)
print "==> output_path = ",output_path
########################################
#print 'dasgoclient --query="file dataset='+lines.strip()+'"'
#print "..."
if customEOS:
xrd_redirector = 'root://cmseos.fnal.gov/'
output = os.popen(customEOS_cmd + lines.strip()).read()
else:
xrd_redirector = 'root://cms-xrd-global.cern.ch/'
output = os.popen('dasgoclient --query="file dataset='+lines.strip()+'"').read()
count_root_files = 0
for root_file in output.split():
#print "=> ",root_file
count_root_files+=1
count_jobs += 1
outjdl_file.write("Output = "+output_log_path+"/"+sample_name+"_$(Process).stdout\n")
outjdl_file.write("Error = "+output_log_path+"/"+sample_name+"_$(Process).stdout\n")
outjdl_file.write("Log = "+output_log_path+"/"+sample_name+"_$(Process).log\n")
outjdl_file.write("Arguments = "+(xrd_redirector+root_file).replace('/','\/')+" "+output_path+" "+Initial_path+"\n")
outjdl_file.write("Queue \n")
print "Number of files: ",count_root_files
print "Number of jobs (till now): ",count_jobs
outjdl_file.close();
outScript = open(condor_file_name+".sh","w");
outScript.write('#!/bin/bash');
outScript.write("\n"+'echo "Starting job on " `date`');
outScript.write("\n"+'echo "Running on: `uname -a`"');
outScript.write("\n"+'echo "System software: `cat /etc/redhat-release`"');
outScript.write("\n"+'source /cvmfs/cms.cern.ch/cmsset_default.sh');
outScript.write("\n"+'echo "copy cmssw tar file from store area"');
outScript.write("\n"+'xrdcp -s root://cmseos.fnal.gov/${3}/'+CMSSWRel +'.tgz .');
outScript.write("\n"+'tar -xf '+ CMSSWRel +'.tgz' );
outScript.write("\n"+'rm '+ CMSSWRel +'.tgz' );
outScript.write("\n"+'cd ' + CMSSWRel + '/src/PhysicsTools/NanoAODTools/python/postprocessing/analysis/nanoAOD_vvVBS/' );
#outScript.write("\n"+'echo "====> List files : " ');
#outScript.write("\n"+'ls -alh');
outScript.write("\n"+'rm *.root');
outScript.write("\n"+'scramv1 b ProjectRename');
outScript.write("\n"+'eval `scram runtime -sh`');
outScript.write("\n"+'sed -i "s/testfile = .*/testfile = \\"${1}\\"/g" '+post_proc_to_run);
outScript.write("\n"+'echo "========================================="');
outScript.write("\n"+'echo "cat post_proc.py"');
outScript.write("\n"+'echo "..."');
outScript.write("\n"+'cat post_proc.py');
outScript.write("\n"+'echo "..."');
outScript.write("\n"+'echo "========================================="');
outScript.write("\n"+command);
outScript.write("\n"+'echo "====> List root files : " ');
outScript.write("\n"+'ls *.root');
outScript.write("\n"+'echo "====> copying *.root file to stores area..." ');
outScript.write("\n"+'if ls *Hadd.root 1> /dev/null 2>&1; then');
outScript.write("\n"+' echo "File *Hadd.root exists. Copy this."');
outScript.write("\n"+' echo "xrdcp -f *Hadd.root root://cmseos.fnal.gov/${2}"');
outScript.write("\n"+' xrdcp -f *Hadd.root root://cmseos.fnal.gov/${2}');
outScript.write("\n"+'else');
outScript.write("\n"+' echo "file *Hadd.root does not exists, so copy *.root file."');
outScript.write("\n"+' echo "xrdcp -f *.root root://cmseos.fnal.gov/${2}"');
outScript.write("\n"+' xrdcp -f *.root root://cmseos.fnal.gov/${2}');
outScript.write("\n"+'fi');
outScript.write("\n"+'rm *.root');
outScript.write("\n"+'cd ${_CONDOR_SCRATCH_DIR}');
outScript.write("\n"+'rm -rf ' + CMSSWRel);
outScript.write("\n");
outScript.close();
os.system("chmod 777 "+condor_file_name+".sh");
print "===> Set Proxy Using:";
print "\tvoms-proxy-init --voms cms --valid 168:00";
print "\"condor_submit "+condor_file_name+".jdl\" to submit";
#os.system("condor_submit "+condor_file_name+".jdl")