-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmergeCommandFromCrabDir.py
executable file
·75 lines (62 loc) · 2.87 KB
/
mergeCommandFromCrabDir.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
#!/usr/bin/env python2
import argparse
import re
import getpass
import crabInfo
from crabInfo import myMatch
def getInfoFromDir( crabDir ):
if crabDir[-1] != "/": crabDir += "/"
with open( crabDir+"crab.log" ) as f:
lines = f.readlines()
infos = {"crabDir":crabDir}
for line in lines:
for m in myMatch("config.Data.outLFNDirBase = '(.*)'", line ):
infos["lfn"] = m.group(1)
for m in myMatch( ".*Task name:.*\s([\d_]+):.*_crab_(.*)", line ):
infos["time"] = m.group(1)
for m in myMatch( "config.Data.outputDatasetTag = '(.*)'", line ):
infos["outputDatasetTag"] = m.group(1)
for m in myMatch( "config.Data.inputDataset = '(.*)'", line ):
infos["inputDataset"] = m.group(1)
infos["primaryDataset"], infos["processedDataset"], infos["format"] = infos["inputDataset"].split("/")[1:]
if "'schedd'" in line:
infos.update(eval( line.split("\t")[-1] ))
return infos
def getOutFileName( infos ):
user = getpass.getuser()
if user == "kiesel":
name = infos["primaryDataset"]
for mm in myMatch( '/.*/[^-]*-(.*)-[^-]*/USER', infos["inputDataset"] ):
name = mm.group(1)
if "Run201" in infos["processedDataset"]:
name = "_".join([infos["primaryDataset"],infos["processedDataset"]])
shortDset = crabInfo.modifyDatasetName(name)
return "/user/kiesel/nTuples/{}/{}_nTuple.root".format(infos["outputDatasetTag"],shortDset )
if user == "jschulz":
outFileName=infos["crabDir"][:-1]
outFileName=crabInfo.modifyDatasetName(outFileName.replace("crab_",""))
return "/user/jschulz/2016/data/run2/dl/"+outFileName+".root"
if user == "swuchterl":
n ame = infos["primaryDataset"]
for mm in myMatch( '/.*/[^-]*-(.*)-[^-]*/USER', infos["inputDataset"] ):
name = mm.group(1)
if "Run201" in infos["processedDataset"]:
name = "_".join([infos["primaryDataset"],infos["processedDataset"]])
shortDset = crabInfo.modifyDatasetName(name)
return "/user/swuchterl/nTuples/{}/{}_nTuple.root".format(infos["outputDatasetTag"],shortDset )
return "test.root"
def getSrmInput( infos ):
return "srm://grid-srm.physik.rwth-aachen.de:8443/srm/managerv2?SFN=/pnfs/physik.rwth-aachen.de/cms{lfn}/{primaryDataset}/{outputDatasetTag}/{time}/".format( **infos )
def getMergeCommand( crabDir ):
infos = getInfoFromDir( crabDir )
outFile = getOutFileName( infos )
srmSrc = getSrmInput( infos )
return "./mergeTier2Files.py {} {}".format(outFile,srmSrc)
def main():
parser = argparse.ArgumentParser(description="List merge command based on crab directory.")
parser.add_argument("crabDirs", nargs="+" )
args = parser.parse_args()
for crabDir in args.crabDirs:
print getMergeCommand( crabDir )
if __name__ == "__main__":
main()