-
Notifications
You must be signed in to change notification settings - Fork 9
/
Copy pathsubmitCondor_genToDESY.py
executable file
·139 lines (112 loc) · 5.84 KB
/
submitCondor_genToDESY.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
#### python -u submitCondor_gen.py 200PU >& submit.log &
import os,datetime,time,subprocess
runDir=os.getcwd()
os.system('xrdcp -f root://cmseos.fnal.gov//store/user/snowmass/DelphesSubmissionLPCcondor/scripts/EOSSafeUtils.py '+runDir)
execfile(runDir+'/EOSSafeUtils.py')
start_time = time.time()
#IO directories must be full paths
pileup = str(sys.argv[1])
##outputDir='/store/user/snowmass/noreplica/YR_Delphes/Delphes342pre15/'
## outputDir='/store/group/upgrade/delphes_output/YR_Delphes/Delphes342pre14/' ## For CERN condor
outputDir='/store/group/upgrade/delphes_output/YR_Delphes/Delphes342pre14/' ## For DESY (gfal prefix??? See line 52)
condorDir='/uscms/home/jmanagan/nobackup/YR_Delphes/Delphes342pre15_logs/' # Change username, helps to match log directory to the ROOT file directory, adding "_logs" (for compatibility with error checker)
cTime=datetime.datetime.now()
maxEvtsPerJob = 50000 ## -1 --> do not make splitting (1 job per file)
# maxEvtsPerJob = -1 ## -1 --> do not make splitting (1 job per file)
print 'Getting proxy'
proxyPath=os.popen('voms-proxy-info -path')
proxyPath=proxyPath.readline().strip()
print 'Starting submission'
count=0
fileList = [ # CHOOSE SAMPLES, you MUST have listed the file names with listFiles.py
#'ZJetsToNuNu_HT-400To600_14TeV-madgraph.txt',
#'ZZTo4L_14TeV_powheg_pythia8.txt',
]
for sample in fileList:
rootlist = open('fileLists/'+sample)
rootfiles = []
rootfiles_bare = []
for line in rootlist:
rootfiles.append('root://cmsxrootd.fnal.gov/'+line.strip()) ## Can change to whatever is normal for running @ CERN
rootfiles_bare.append(line.strip())
# OPTIONAL: use a more exact accessor for certain samples at CERN:
#if(sample != 'WprimeToWZToWhadZinv_narrow_M-600_13TeV-madgraph.txt'): rootfiles.append('root://eoscms.cern.ch/'+line.strip())
#else: rootfiles.append('root://cmsxrootd.fnal.gov/'+line.strip())
rootlist.close()
relPath = sample.replace('.txt','')
## os.system('eos root://cmseos.fnal.gov/ mkdir -p '+outputDir+relPath+'_'+pileup)
## os.system('eos root://eoscms.cern.ch/ mkdir -p '+outputDir+relPath+'_'+pileup) # For running @ CERN
os.system('gfal-mkdir -p srm://dcache-se-cms.desy.de/pnfs/desy.de/cms/tier2'+outputDir+relPath+'_'+pileup) ## DESY???
os.system('mkdir -p '+condorDir+relPath+'_'+pileup)
tempcount = 0;
for ifile, file in enumerate(rootfiles):
infile = file
tempcount+=1
#if tempcount > 296: continue # OPTIONAL to submit a test job or control submission groups
#if tempcount <= 296: continue
fname_bare = rootfiles_bare[ifile]
n_jobs = 1
if maxEvtsPerJob > -1: ## just query DAS if necessary
command = '/cvmfs/cms.cern.ch/common/dasgoclient --query="file='+fname_bare+' | grep file.nevents" '
proc = subprocess.Popen(command, shell=True, stdout=subprocess.PIPE)
(out, err) = proc.communicate()
try: nevents = int(out.split('\n')[0])
except:
try: nevents = int(out.split('\n')[1])
except: print 'ERROR: couldnt isolate the number of events'
n_jobs = int(nevents) / int(maxEvtsPerJob)
if int(nevents) % int(maxEvtsPerJob) > 0:
n_jobs += 1 ## and extra one to account for the remainder
print relPath+'_'+str(tempcount),'=',n_jobs,'jobs'
### split based on the number of events
for i_split in range(n_jobs):
count+=1
### usual submitter if no splitting
if not maxEvtsPerJob > -1:
outfile = relPath+'_'+str(tempcount)
dict={'RUNDIR':runDir, 'RELPATH':relPath, 'PILEUP':pileup, 'FILEIN':infile, 'FILEOUT':outfile, 'PROXY':proxyPath, 'OUTPUTDIR':outputDir}
jdfName=condorDir+'/%(RELPATH)s_%(PILEUP)s/%(FILEOUT)s.jdl'%dict
# print jdfName
jdf=open(jdfName,'w')
jdf.write(
"""x509userproxy = %(PROXY)s
universe = vanilla
Executable = %(RUNDIR)s/GENtoDelphesDESY.sh
Should_Transfer_Files = YES
WhenToTransferOutput = ON_EXIT
Output = %(FILEOUT)s.out
Error = %(FILEOUT)s.err
Log = %(FILEOUT)s.log
Requirements = (TotalCpus == 8)
Notification = Never
Arguments = %(FILEIN)s %(OUTPUTDIR)s/%(RELPATH)s_%(PILEUP)s %(FILEOUT)s.root %(PILEUP)s
Queue 1"""%dict)
else:
outfile = relPath+'_'+str(tempcount)+'_'+str(i_split)
maxEvents = int(maxEvtsPerJob)
skipEvents = int(maxEvtsPerJob*i_split)
if i_split == n_jobs-1:
maxEvents = nevents - maxEvtsPerJob*(n_jobs-1) ## up to the last event
dict={'RUNDIR':runDir, 'RELPATH':relPath, 'PILEUP':pileup, 'FILEIN':infile, 'FILEOUT':outfile, 'PROXY':proxyPath, 'OUTPUTDIR':outputDir, 'SKIPEVENTS':str(skipEvents), 'MAXEVENTS':str(maxEvents), 'ISPLIT':str(i_split)}
jdfName=condorDir+'/%(RELPATH)s_%(PILEUP)s/%(FILEOUT)s.jdl'%dict ## note: i_split is contained in FILEOUT
jdf=open(jdfName,'w')
jdf.write(
"""x509userproxy = %(PROXY)s
universe = vanilla
Executable = %(RUNDIR)s/GENtoDelphesDESY.sh
Should_Transfer_Files = YES
WhenToTransferOutput = ON_EXIT
Output = %(FILEOUT)s.out
Error = %(FILEOUT)s.err
Log = %(FILEOUT)s.log
Requirements = (TotalCpus == 8)
Notification = Never
Arguments = %(FILEIN)s %(OUTPUTDIR)s/%(RELPATH)s_%(PILEUP)s %(FILEOUT)s.root %(PILEUP)s %(SKIPEVENTS)s %(MAXEVENTS)s
Queue 1"""%dict)
jdf.close()
os.chdir('%s/%s_%s'%(condorDir,relPath,pileup))
os.system('condor_submit %(FILEOUT)s.jdl'%dict)
os.system('sleep 0.5')
os.chdir('%s'%(runDir))
print str(count), "jobs submitted!!!"
print("--- %s minutes ---" % (round(time.time() - start_time, 2)/60))