-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrunGof.py
158 lines (141 loc) · 7.02 KB
/
runGof.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
from os import path, chmod, makedirs
import subprocess as sp
from optparse import OptionParser
from glob import glob
import shlex
from modelNames import getModelNames, getGoodModelNames
from condorFactory import *
from forcelink import force_symlink
####
# prepares a bunch of scripts and jdl files
# for running goodness-of-fit tests
# John Hakala 1/27/2017
####
def getDcardName(category, modelName, outDir):
return "%s/datacard_%s_%s.txt" % (outDir, category, modelName)
def makeOneDatacard(inFile, dcardTemplate, category, modelName, outDir):
dcardTemplate.seek(0)
outDcard = open(getDcardName(category, modelName, outDir), "w")
for line in dcardTemplate:
if "shapes background" in line:
outDcard.write(line.replace("backgroundRootFile", inFile).replace("backgroundPdf", modelName))
else:
outDcard.write(line)
outDcard.close()
print " > made datacard for model %s: %s" % (modelName, outDcard.name)
def doFit(category, inFile):
for modelName in getGoodModelNames(category):
bkgFileName = "cat-%s_model-%s.root" % (category, modelName)
dataLinkName = "w_data_%s.root" % options.category
dataFile = TFile(dataLinkName)
dataWS = dataFile.Get("Vg")
dataRooHist = dataWS.data("data_obs")
inTfile = TFile(inFile)
dump = inTfile.Get("Vg")
bkgPdfDict = getPdfFromDump(category, dump, modelName, False, dataRooHist, "gof", True)
outBkgFile = TFile("%s/%s" % (outDir, bkgFileName), "RECREATE")
bkgPdfDict["rooWS"].Write()
outBkgFile.Close()
def makeDatacards(category, inFile, outDir, fit):
print "Will make datacards for all models specified in modelNames.py"
if not path.exists(outDir):
makedirs(outDir)
dcardTemplate = open("datacard_template_%s.txt" % category, "r")
if not path.exists(path.join(outDir, "w_data_%s.root" % category)):
force_symlink(path.join("..", "w_data_%s.root" % category), path.join(outDir, "w_data_%s.root" % category))
if not path.exists(path.join(outDir, "w_signal_780.root")):
force_symlink(path.join("..", "..", "Vg", "signalFits_%s" % category, "w_signal_780.root"), path.join(outDir, "w_signal_780.root"))
if fit:
doFit(category, inFile)
for modelName in getGoodModelNames(category):
makeOneDatacard("cat-%s_model-%s.root" % (category, modelName), dcardTemplate, category, modelName, outDir)
def checkForDatacard(outDir, dcardName):
txtFiles = glob("%s/*.txt" % outDir)
if not dcardName in txtFiles:
print "Error: did not find datacard %s in working directory." % dcardName
exit(1)
def makeGOFscripts(category, method, nToys, seed, outDir):
for modelName in getGoodModelNames(category):
dcardName = getDcardName(category, modelName, outDir)
checkForDatacard(outDir, dcardName)
print "Will prepare gofCondor scripts to run GOF test with datacard %s using method %s" % (dcardName, method)
incantation = "combine -M GoodnessOfFit %s -t %i -s %i --algo=%s --fixedSignalStrength=0" % (
getDcardName(category, modelName, outDir).replace("%s/" % outDir,"") ,
nToys ,
seed ,
method
)
pName = "cat-%s_meth-%s_model-%s_nToys-%i_seed-%i"%(category, method, modelName, nToys, seed)
if options.useToysFile:
toysFileName = "../Vg/toys_%s/higgsCombineBiasTest_%s_%s.GenerateOnly.mH1337.246802.root" % (category, category, modelName) # HERE make sure this is the right file
incantation += " --toysFile=%s" % toysFileName
pName += "_vgToys"
scriptName = "%s/gof_%s.sh" % (outDir, pName)
jdlName = "%s/jdl_%s.jdl" % (outDir, pName)
script = open(scriptName, "w")
script.write(simpleScript(incantation, "%s/%s" % (path.dirname(path.realpath(__file__)), outDir)))
chmod(script.name, 0o777)
jdl = open(jdlName, "w")
jdl.write(simpleJdl(script.name.replace("%s/" % outDir,"")))
if not path.exists(path.join(outDir, "condorLogs")):
makedirs(path.join(outDir, "condorLogs"))
if __name__ == "__main__":
parser = OptionParser()
parser.add_option("-c", "--category" , dest="category",
help = "either 'btag' or 'antibtag'" )
parser.add_option("-i", "--inFile" , dest="inFile",
help = "the input rootFile containing a workspace %s" %
"with all pdfs [default=bkg_pdfs.root]", default="bkg_pdfs.root" )
parser.add_option("-m", action="store_false", dest="makeDatacards",
help = "toggle making datacards [default=True]", default=True )
parser.add_option("-g", "--doGOFtest" , dest="doGOFtest",
help = "perform GOF test on all models specified in %s" %
"modelNames.py using method 'saturated' or 'KS'" )
parser.add_option("-t", "--nToys" , dest="nToys", type="int",
help = "the number of toys to use in the GOF test. [default=25]" )
parser.add_option("-f", action="store_true", dest="fit",
help = "toggle fitting the backgrounds [default=False]", default=False )
parser.add_option("-v", action="store_true", dest="useToysFile",
help = "use toys file from Vg bias studies [default=False]", default=False )
parser.add_option("-s", "--seed" , dest="seed", type="int",
help = "the random number seed to use in the GOF test. [default=501337]" )
(options, args) = parser.parse_args()
outDir = "gof_%s_%s" % (options.doGOFtest, options.category)
if options.useToysFile:
outDir += "_vgToys"
if options.category is None:
parser.error("please specify 'btag' or 'antibtag' as the -c option")
if not options.doGOFtest in [None, "saturated", "KS"]:
parser.error("invalid GOF test specified: must be either 'saturated' or 'KS'")
if options.doGOFtest is None:
if options.nToys is not None:
print "error: -t or --nToys was specified, but not running GOF test."
exit(1)
if options.seed is not None:
print "error: -s or --seed was specified, but not running GOF test."
exit(1)
elif not options.makeDatacards:
if not options.fit:
print "neither making datacards nor running GOF test, nor fitting... which means this does nothing."
exit(2)
elif options.fit:
print "just doing background fits."
else:
print "error: something is funny with the options requested:"
print options
exit(2)
else:
if options.nToys is None:
options.nToys = 25
if options.seed is None:
options.seed = 501337
from ROOT import *
from getBkgFromDump import getPdfFromDump
if options.makeDatacards:
makeDatacards(options.category, options.inFile, outDir, options.fit)
elif options.fit:
doFit(options.category, options.inFile)
if options.doGOFtest is None:
print "Done making datacards. Will not perform GOF test."
if options.doGOFtest is not None:
makeGOFscripts(options.category, options.doGOFtest, options.nToys, options.seed, outDir)