eff_plots.py 30 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741
  1. #!/usr/bin/env python
  2. from itertools import product
  3. from argparse import ArgumentParser
  4. import numpy as np
  5. import matplotlib.pyplot as plt
  6. from uproot import open as root_open
  7. from matplottery.utils import Hist1D, Hist2D, to_html_table
  8. from matplottery.plotter import set_defaults, plot_2d
  9. import matplotboard as mpb
  10. matching_cuts = {
  11. 'new-extra-narrow': [
  12. dict(
  13. dPhiMaxHighEt=0.025,
  14. dPhiMaxHighEtThres=20.0,
  15. dPhiMaxLowEtGrad=-0.002,
  16. dRzMaxHighEt=9999.0,
  17. dRzMaxHighEtThres=0.0,
  18. dRzMaxLowEtGrad=0.0,
  19. ),
  20. dict(
  21. dPhiMaxHighEt=0.0015,
  22. dPhiMaxHighEtThres=0.0,
  23. dPhiMaxLowEtGrad=0.0,
  24. dRzMaxHighEt=0.025,
  25. dRzMaxHighEtThres=30.0,
  26. dRzMaxLowEtGrad=-0.002,
  27. ),
  28. dict(
  29. dPhiMaxHighEt=0.0015,
  30. dPhiMaxHighEtThres=0.0,
  31. dPhiMaxLowEtGrad=0.0,
  32. dRzMaxHighEt=0.025,
  33. dRzMaxHighEtThres=30.0,
  34. dRzMaxLowEtGrad=-0.002,
  35. )
  36. ],
  37. 'new-default': [
  38. dict(
  39. dPhiMaxHighEt=0.05,
  40. dPhiMaxHighEtThres=20.0,
  41. dPhiMaxLowEtGrad=-0.002,
  42. dRzMaxHighEt=9999.0,
  43. dRzMaxHighEtThres=0.0,
  44. dRzMaxLowEtGrad=0.0,
  45. ),
  46. dict(
  47. dPhiMaxHighEt=0.003,
  48. dPhiMaxHighEtThres=0.0,
  49. dPhiMaxLowEtGrad=0.0,
  50. dRzMaxHighEt=0.05,
  51. dRzMaxHighEtThres=30.0,
  52. dRzMaxLowEtGrad=-0.002,
  53. ),
  54. dict(
  55. dPhiMaxHighEt=0.003,
  56. dPhiMaxHighEtThres=0.0,
  57. dPhiMaxLowEtGrad=0.0,
  58. dRzMaxHighEt=0.05,
  59. dRzMaxHighEtThres=30.0,
  60. dRzMaxLowEtGrad=-0.002,
  61. )
  62. ],
  63. 'new-wide': [
  64. dict(
  65. dPhiMaxHighEt=0.10,
  66. dPhiMaxHighEtThres=20.0,
  67. dPhiMaxLowEtGrad=-0.002,
  68. dRzMaxHighEt=9999.0,
  69. dRzMaxHighEtThres=0.0,
  70. dRzMaxLowEtGrad=0.0,
  71. ),
  72. dict(
  73. dPhiMaxHighEt=0.006,
  74. dPhiMaxHighEtThres=0.0,
  75. dPhiMaxLowEtGrad=0.0,
  76. dRzMaxHighEt=0.10,
  77. dRzMaxHighEtThres=30.0,
  78. dRzMaxLowEtGrad=-0.002,
  79. ),
  80. dict(
  81. dPhiMaxHighEt=0.006,
  82. dPhiMaxHighEtThres=0.0,
  83. dPhiMaxLowEtGrad=0.0,
  84. dRzMaxHighEt=0.10,
  85. dRzMaxHighEtThres=30.0,
  86. dRzMaxLowEtGrad=-0.002,
  87. )
  88. ],
  89. 'new-extra-wide': [
  90. dict(
  91. dPhiMaxHighEt=0.15,
  92. dPhiMaxHighEtThres=20.0,
  93. dPhiMaxLowEtGrad=-0.002,
  94. dRzMaxHighEt=9999.0,
  95. dRzMaxHighEtThres=0.0,
  96. dRzMaxLowEtGrad=0.0,
  97. ),
  98. dict(
  99. dPhiMaxHighEt=0.009,
  100. dPhiMaxHighEtThres=0.0,
  101. dPhiMaxLowEtGrad=0.0,
  102. dRzMaxHighEt=0.15,
  103. dRzMaxHighEtThres=30.0,
  104. dRzMaxLowEtGrad=-0.002,
  105. ),
  106. dict(
  107. dPhiMaxHighEt=0.009,
  108. dPhiMaxHighEtThres=0.0,
  109. dPhiMaxLowEtGrad=0.0,
  110. dRzMaxHighEt=0.15,
  111. dRzMaxHighEtThres=30.0,
  112. dRzMaxLowEtGrad=-0.002,
  113. )
  114. ],
  115. }
  116. samples = None
  117. def load_samples():
  118. global samples
  119. if samples is None:
  120. print("loading samples")
  121. samples = {}
  122. for proc, wp, config in product(procs, wps, configs):
  123. samples[(proc, wp, config)] = root_open(f'../hists/{proc}-{wp}-{config}.root')
  124. # if 'old' in wp:
  125. # samples[(proc, wp)] = root_open(f'../hists/with_skipping/{proc}-{wp}.root')
  126. # elif 'noskip' in wp:
  127. # wpkey = wp.replace('-noskip', '')
  128. # samples[(proc, wp)] = root_open(f'../hists/no_skipping/{proc}-{wpkey}.root')
  129. # elif 'skip' in wp:
  130. # wpkey = wp.replace('-skip', '')
  131. # samples[(proc, wp)] = root_open(f'../hists/with_skipping/{proc}-{wpkey}.root')
  132. return samples
  133. def calc_window(et, eta, hit, variable, cut_sel):
  134. idx = min(hit-1, 2)
  135. cut_sel = cut_sel.replace('-skip', '').replace('-noskip', '')
  136. cuts = matching_cuts[cut_sel][idx]
  137. if 'etaBins' in cuts:
  138. for eta_idx, bin_high in enumerate(cuts['etaBins']):
  139. if eta < bin_high:
  140. high_et = cuts[f'{variable}MaxHighEt'][eta_idx]
  141. high_et_thres = cuts[f'{variable}MaxHighEtThres'][eta_idx]
  142. low_et_grad = cuts[f'{variable}MaxLowEtGrad'][eta_idx]
  143. break
  144. else: # highest bin
  145. high_et = cuts[f'{variable}MaxHighEt'][-1]
  146. high_et_thres = cuts[f'{variable}MaxHighEtThres'][-1]
  147. low_et_grad = cuts[f'{variable}MaxLowEtGrad'][-1]
  148. else:
  149. high_et = cuts[f'{variable}MaxHighEt']
  150. high_et_thres = cuts[f'{variable}MaxHighEtThres']
  151. low_et_grad = cuts[f'{variable}MaxLowEtGrad']
  152. return high_et + min(0, et-high_et_thres)*low_et_grad
  153. def hist_integral_ratio(num, den):
  154. num_int = num.integral
  155. den_int = den.integral
  156. ratio = num_int / den_int
  157. error = np.sqrt(den_int) / den_int # TODO: Check this definition of error
  158. return ratio, error
  159. def center_text(x, y, txt, **kwargs):
  160. plt.text(x, y, txt,
  161. horizontalalignment='center', verticalalignment='center',
  162. transform=plt.gca().transAxes, size=24, **kwargs)
  163. def hist_plot(h: Hist1D, *args, include_errors=False, line_width=1, **kwargs):
  164. """ Plots a 1D ROOT histogram object using matplotlib """
  165. counts = h.counts
  166. edges = h.edges
  167. left, right = edges[:-1], edges[1:]
  168. x = np.array([left, right]).T.flatten()
  169. y = np.array([counts, counts]).T.flatten()
  170. plt.plot(x, y, *args, linewidth=line_width, **kwargs)
  171. if include_errors:
  172. if h.errors_up is not None:
  173. errors = np.vstack((h.errors_down, h.errors_up))
  174. else:
  175. errors = h.errors
  176. plt.errorbar(h.bin_centers, h.counts, yerr=errors,
  177. color='k', marker=None, linestyle='None',
  178. barsabove=True, elinewidth=.7, capsize=1)
  179. def hist2d_percent_contour(h: Hist1D, percent: float, axis: str):
  180. values = h.counts
  181. try:
  182. axis = axis.lower()
  183. axis_idx = {'x': 1, 'y': 0}[axis]
  184. except KeyError:
  185. raise ValueError('axis must be \'x\' or \'y\'')
  186. if percent < 0 or percent > 1:
  187. raise ValueError('percent must be in [0,1]')
  188. with np.warnings.catch_warnings():
  189. np.warnings.filterwarnings('ignore', 'invalid value encountered in true_divide')
  190. values = values / np.sum(values, axis=axis_idx, keepdims=True)
  191. np.nan_to_num(values, copy=False)
  192. values = np.cumsum(values, axis=axis_idx)
  193. idxs = np.argmax(values > percent, axis=axis_idx)
  194. x_centers, y_centers = h.bin_centers
  195. if axis == 'x':
  196. return x_centers[idxs], y_centers
  197. else:
  198. return x_centers, y_centers[idxs]
  199. @mpb.decl_fig
  200. def plot_residuals(sample, layer, hit, variable, subdet):
  201. load_samples()
  202. proc, wp = sample
  203. track_matched = samples[sample][f'{variable}_{subdet}_L{layer}_H{hit}_v_Et_TrackMatched']
  204. # no_match = samples[sample][f'{variable}_{subdet}_L{layer}_H{hit}_v_Et_NoMatch']
  205. h_real = Hist2D(track_matched)
  206. # h_fake = Hist2D(no_match)
  207. def do_plot(h):
  208. plot_2d(h, cmap='viridis')
  209. xs, ys = hist2d_percent_contour(h, .90, 'x')
  210. plt.plot(xs, ys, color='green', label='90\% contour')
  211. xs, ys = hist2d_percent_contour(h, .995, 'x')
  212. plt.plot(xs, ys, color='darkgreen', label='99.5\% contour')
  213. ets = h.edges[1]
  214. cuts = [calc_window(et, 0, hit, variable, wp) for et in ets]
  215. plt.plot(cuts, ets, color='red', label='Cut Value')
  216. plt.xlabel({'dPhi': r'$\delta \phi$ (rads)',
  217. 'dRz': r'$\delta R/z$ (cm)'}[variable])
  218. # plt.sca(plt.subplot(1, 2, 1))
  219. do_plot(h_real)
  220. plt.title('Truth-Matched Seeds')
  221. plt.ylabel('$E_T$ (GeV)')
  222. # plt.sca(plt.subplot(1, 2, 2))
  223. # do_plot(h_fake)
  224. # plt.title('Not Truth-Matched Seeds')
  225. plt.legend(loc='upper right')
  226. @mpb.decl_fig
  227. def plot_residuals_eta(sample, hit, variable):
  228. load_samples()
  229. h = Hist2D(samples[sample][f'{variable}_residuals_v_eta_H{hit}'])
  230. plot_2d(h)
  231. xs, ys = hist2d_percent_contour(h, .90, 'x')
  232. plt.plot(xs, ys, color='green', label='90\% contour')
  233. xs, ys = hist2d_percent_contour(h, .995, 'x')
  234. plt.plot(xs, ys, color='darkgreen', label='99.5\% contour')
  235. plt.xlabel({'dPhi': r'$\delta \phi$ (rads)',
  236. 'dRz': r'$\delta R/z$ (cm)'}[variable])
  237. plt.ylabel(r'$|\eta|$')
  238. @mpb.decl_fig
  239. def plot_hit_vs_layer(sample, region):
  240. load_samples()
  241. if region == 'BPIX':
  242. region = 'barrel'
  243. if region == 'FPIX':
  244. region = 'forward'
  245. h = Hist2D(samples[sample][f'hit_vs_layer_{region}'])
  246. plot_2d(h, colz_fmt='2.0f')
  247. plt.xlabel('Layer #')
  248. plt.ylabel('Hit #')
  249. @mpb.decl_fig
  250. def plot_roc_curve(pfx, ext=''):
  251. load_samples()
  252. show_fr = pfx == "tracking"
  253. def get_num_den(sample, basename):
  254. num = Hist1D(sample[f'{basename}_num'])
  255. den = Hist1D(sample[f'{basename}_den'])
  256. return hist_integral_ratio(num, den)
  257. rows = []
  258. row_labels = []
  259. for i, proc in enumerate(procs):
  260. plt.subplot(len(procs), 1, i+1)
  261. row_labels.append(procs[proc])
  262. row_labels.extend(['']*(len(wps)-1))
  263. for wp, config in product(wps, configs):
  264. sample = samples[(proc, wp, config)]
  265. sample_name = f'{proc}-{wp}-{config}'
  266. eff, eff_err = get_num_den(sample, f'{pfx}_eff_v_phi{ext}')
  267. pur, pur_err = get_num_den(sample, f'{pfx}_pur_v_phi{ext}')
  268. if show_fr:
  269. fr, fr_err = get_num_den(sample, f'fake_rate_no_e_match_v_phi')
  270. rows.append([wp,
  271. rf'${eff*100:0.2f}\pm{eff_err*100:0.2f}\%$',
  272. rf'${pur*100:0.2f}\pm{pur_err*100:0.2f}\%$',
  273. rf'${fr*100:0.2f}\pm{fr_err*100:0.2f}\%$'])
  274. if config == 'skip-pileup':
  275. marker = 'o'
  276. elif config == 'noskip':
  277. marker = '*'
  278. else:
  279. marker = '^'
  280. # plt.errorbar([pur], [eff], xerr=[pur_err], yerr=[eff_err],
  281. # label=sample_name, marker=marker, color=color(proc, wp))
  282. plt.scatter([pur], [eff], label=sample_name, marker=marker, color=color(proc, wp))
  283. # center_text(0.3, 0.3, r'$p_T>20$ and $|\eta|<2.5$')
  284. # plt.axis('equal')
  285. # plt.xlim((0.5, 1.02))
  286. # plt.ylim((0.5, 1.02))
  287. plt.xlim((0, 1.02))
  288. plt.ylim((0.7, 1.02))
  289. plt.ylabel('Efficiency')
  290. plt.grid()
  291. plt.legend(loc='lower right', ncol=2, fancybox=True, numpoints=1)
  292. plt.xlabel('Purity')
  293. col_labels = ['Sample', 'Working Point', 'Efficiency', 'Purity']
  294. if show_fr:
  295. col_labels.append("Fake Rate")
  296. return to_html_table(rows, col_labels, row_labels, 'table-condensed')
  297. @mpb.decl_fig
  298. def plot_kinematic_eff(pref, ext='', ylim=(None, None), norm=None, label_pfx='', incl_sel=True,
  299. bins_pt=None, bins_eta=None, bins_phi=None, bins_PU=None,
  300. xlim_pt=(None, None), xlim_eta=(None, None), xlim_phi=(None, None),
  301. is_ratio=False, config=None):
  302. load_samples()
  303. # Figure out if this one has v_PU
  304. has_PU = f'{pref}_v_PU{ext}' in list(samples.values())[0]
  305. ax_pt = plt.subplot(221)
  306. ax_eta = plt.subplot(222)
  307. ax_phi = plt.subplot(223)
  308. if has_PU:
  309. ax_PU = plt.subplot(224)
  310. errors = True
  311. for (proc, wp, config_), sample in samples.items():
  312. if config is not None and config_ != config:
  313. continue
  314. sample_name = f'{proc}-{wp}-{config_}'
  315. l = sample_name
  316. c = color(proc, wp)
  317. def do_plot(ax, name, bins):
  318. plt.sca(ax)
  319. if is_ratio:
  320. num = Hist1D(sample[name+"_num"], no_overflow=True)
  321. den = Hist1D(sample[name+"_den"], no_overflow=True)
  322. if bins:
  323. num.rebin(bins)
  324. den.rebin(bins)
  325. h = num // den
  326. else:
  327. h = Hist1D(sample[name], no_overflow=True)
  328. if norm:
  329. h = h / (norm*h.integral)
  330. if bins:
  331. h.rebin(bins)
  332. hist_plot(h, include_errors=errors, label=l, color=c, linestyle=style(config_))
  333. do_plot(ax_pt, f'{pref}_v_pt{ext}', bins_pt)
  334. do_plot(ax_eta, f'{pref}_v_eta{ext}', bins_eta)
  335. do_plot(ax_phi, f'{pref}_v_phi{ext}', bins_phi)
  336. if has_PU:
  337. do_plot(ax_PU, f'{pref}_v_PU{ext}', [-0.5, 20, 30, 40, 50, 60, 70, 80, 100.5])
  338. plt.sca(ax_pt)
  339. if not incl_sel: center_text(0.5, 0.15, r'$|\eta|<2.5$')
  340. plt.xlabel(fr"{label_pfx} $p_T$")
  341. plt.ylim(ylim)
  342. plt.xlim(xlim_pt)
  343. plt.sca(ax_eta)
  344. if not incl_sel: center_text(0.5, 0.15, r'$p_T>20$')
  345. plt.xlabel(fr"{label_pfx} $\eta$")
  346. plt.ylim(ylim)
  347. plt.xlim(xlim_eta)
  348. plt.sca(ax_phi)
  349. if not incl_sel: center_text(0.5, 0.15, r'$p_T>20$ and $|\eta|<2.5$')
  350. plt.xlabel(fr"{label_pfx} $\phi$")
  351. plt.ylim(ylim)
  352. plt.xlim(xlim_phi)
  353. if has_PU:
  354. plt.sca(ax_PU)
  355. if not incl_sel: center_text(0.5, 0.15, r'$p_T>20$ and $|\eta|<2.5$')
  356. plt.xlabel("# Pile-up Interactions")
  357. plt.ylim(ylim)
  358. plt.tight_layout()
  359. plt.sca(ax_eta)
  360. plt.legend(loc='best', prop={'size': 10})
  361. else:
  362. plt.tight_layout()
  363. plt.legend(loc='upper left', bbox_to_anchor=(0.6, 0.45), bbox_transform=plt.gcf().transFigure,
  364. prop={'size': 20})
  365. @mpb.decl_fig
  366. def plot_ecal_rel_res():
  367. load_samples()
  368. for sample_name, sample in samples.items():
  369. h = Hist1D(sample['ecal_energy_resolution'])
  370. try:
  371. h = h / h.integral
  372. hist_plot(h, label=sample_name)
  373. except ZeroDivisionError:
  374. pass
  375. plt.xlabel(r"ECAL $E_T$ relative error")
  376. plt.legend()
  377. @mpb.decl_fig
  378. def plot_res_contour(proc, hit_number, var, layers, ext='_TrackMatched'):
  379. load_samples()
  380. _, axs = plt.subplots(1, 2, sharey=True)
  381. def do_plot(ax, sample):
  382. plt.sca(ax)
  383. wp = sample[1]
  384. plt.title(wp)
  385. h = None
  386. for subdet, layer in layers:
  387. h = Hist2D(samples[sample][f'{var}_{subdet}_L{layer}_H{hit_number}_v_Et{ext}'])
  388. xs, ys = hist2d_percent_contour(h, .99, 'x')
  389. plt.plot(xs, ys, label=f'{subdet} - L{layer}')
  390. ets = h.edges[1]
  391. cuts = [calc_window(et, 0, hit_number, var, wp) for et in ets]
  392. plt.plot(cuts, ets, color='k', label='Cut Value')
  393. for ax, wp in zip(axs, ['new-default-noskip', 'new-wide-noskip']):
  394. do_plot(ax, (proc, wp))
  395. plt.sca(axs[-1])
  396. plt.legend(loc='upper right')
  397. @mpb.decl_fig
  398. def simple_dist(hist_name, rebin=(), norm=1, xlabel="", ylabel="", xlim=None, ylim=None, line_width=1):
  399. load_samples()
  400. for (proc, wp, config), sample in samples.items():
  401. sample_name = f'{proc}-{wp}-{config}'
  402. h = Hist1D(sample[hist_name])
  403. if rebin:
  404. h.rebin(*rebin)
  405. mean = np.sum(h.counts * h.bin_centers) / h.integral
  406. try:
  407. if norm is not None:
  408. h = h * (norm / h.integral)
  409. hist_plot(h, label=f'{sample_name} ($\\mu={mean:.2f}$)',
  410. color=color(proc, wp), line_width=line_width)
  411. except ZeroDivisionError:
  412. pass
  413. if xlim:
  414. plt.xlim(xlim)
  415. if ylim:
  416. plt.ylim(ylim)
  417. plt.xlabel(xlabel)
  418. plt.ylabel(ylabel)
  419. plt.legend()
  420. @mpb.decl_fig
  421. def simple_dist2d(hist_name, proc, wp, config, norm=None, colz_fmt='g', clear_zero=False, **kwargs):
  422. load_samples()
  423. sample = samples[(proc, wp, config)]
  424. h = Hist2D(sample[hist_name])
  425. if norm is not None:
  426. h = h * (norm / h.integral)
  427. if clear_zero:
  428. h.counts[0, 0] = 0
  429. plot_2d(h, colz_fmt=colz_fmt, cmap='viridis', **kwargs)
  430. def all_cut_plots(build=True, publish=False):
  431. figures = {
  432. 'tracking_roc_curve': plot_roc_curve('tracking'),
  433. 'tracking_roc_curve_dR': plot_roc_curve('tracking', ext='_dR'),
  434. 'seeding_roc_curve': plot_roc_curve('seed'),
  435. # 'number_of_seeds': simple_dist('n_seeds', xlabel='Number of Seeds', rebin=(50, -0.5, 200.5)),
  436. # 'number_of_good_seeds': simple_dist('n_good_seeds', xlabel='Number of Seeds', rebin=(50, -0.5, 200.5)),
  437. # 'number_of_scls': simple_dist('n_scl', xlabel='Number of Super-Clusters', xlim=(-0.5, 25.5)),
  438. # 'number_of_good_scls': simple_dist('n_good_scl', xlabel='Number of Super-Clusters', xlim=(-0.5, 25.5)),
  439. #
  440. # 'number_of_sim_els': simple_dist('n_good_sim', xlabel='Number of prompt(ish) electrons', xlim=(-0.5, 20.5)),
  441. # 'number_of_gsf_tracks': simple_dist('n_gsf_track', xlabel='Number of reco electrons', xlim=(-0.5, 20.5)),
  442. #
  443. # 'number_of_prompt': simple_dist('n_prompt', xlabel='Number of prompt electrons', xlim=(-0.5, 20.5)),
  444. # 'number_of_nonprompt': simple_dist('n_nonprompt', xlabel='Number of nonprompt electrons', xlim=(-0.5, 20.5)),
  445. #
  446. # 'number_of_matched': simple_dist('n_matched', xlabel='Number of matched electrons',
  447. # xlim=(-0.5, 10.5), line_width=4),
  448. # 'number_of_merged': simple_dist('n_merged', xlabel='Number of merged electrons',
  449. # xlim=(-0.5, 10.5), line_width=4),
  450. # 'number_of_lost': simple_dist('n_lost', xlabel='Number of lost electrons',
  451. # xlim=(-0.5, 10.5), line_width=4),
  452. # 'number_of_split': simple_dist('n_split', xlabel='Number of split electrons',
  453. # xlim=(-0.5, 10.5), line_width=4),
  454. # 'number_of_faked': simple_dist('n_faked', xlabel='Number of faked electrons',
  455. # xlim=(-0.5, 10.5), line_width=4),
  456. # 'number_of_flipped': simple_dist('n_flipped', xlabel='Number of flipped electrons',
  457. # xlim=(-0.5, 10.5), line_width=4),
  458. # 'matched_dR': simple_dist('matched_dR', xlabel='dR between sim and reco'),
  459. # 'matched_dpT': simple_dist('matched_dpT', xlabel='dpT between sim and reco'),
  460. #
  461. #
  462. # 'number_of_matched_dR': simple_dist('n_matched_dR', xlabel='Number of matched electrons - dR Matched',
  463. # xlim=(-0.5, 10.5), line_width=4),
  464. # 'number_of_merged_dR': simple_dist('n_merged_dR', xlabel='Number of merged electrons - dR Matched',
  465. # xlim=(-0.5, 10.5), line_width=4),
  466. # 'number_of_lost_dR': simple_dist('n_lost_dR', xlabel='Number of lost electrons - dR Matched',
  467. # xlim=(-0.5, 10.5), line_width=4),
  468. # 'number_of_split_dR': simple_dist('n_split_dR', xlabel='Number of split electrons - dR Matched',
  469. # xlim=(-0.5, 10.5), line_width=4),
  470. # 'number_of_faked_dR': simple_dist('n_faked_dR', xlabel='Number of faked electrons - dR Matched',
  471. # xlim=(-0.5, 10.5), line_width=4),
  472. # 'number_of_flipped_dR': simple_dist('n_flipped_dR', xlabel='Number of flipped electrons - dR Matched',
  473. # xlim=(-0.5, 10.5), line_width=4),
  474. # 'matched_dR_dR': simple_dist('matched_dR_dR', xlabel='dR between sim and reco - dR Matched'),
  475. # 'matched_dpT_dR': simple_dist('matched_dpT_dR', xlabel='dpT between sim and reco - dR Matched'),
  476. #
  477. # # 'tm_corr': simple_dist2d('tm_corr', 'dy', 'old-default', xlabel='Seed Matched', ylabel='Track Matched', norm=1),
  478. #
  479. # 'ecal_rel_res': plot_ecal_rel_res(),
  480. # # 'hit_v_layer_BPIX_new-default_dy': plot_hit_vs_layer(('dy', 'new-default-skip'), 'barrel'),
  481. # # 'hit_v_layer_FPIX_new-default_dy': plot_hit_vs_layer(('dy', 'new-default-skip'), 'forward'),
  482. # # 'hit_v_layer_BPIX_new-default_tt': plot_hit_vs_layer(('tt', 'new-default-skip'), 'barrel'),
  483. # # 'hit_v_layer_FPIX_new-default_tt': plot_hit_vs_layer(('tt', 'new-default-skip'), 'forward'),
  484. # # 'hit_v_layer_BPIX_new-wide_dy': plot_hit_vs_layer(('dy', 'new-wide-skip'), 'barrel'),
  485. # # 'hit_v_layer_FPIX_new-wide_dy': plot_hit_vs_layer(('dy', 'new-wide-skip'), 'forward'),
  486. # # 'hit_v_layer_BPIX_new-wide_tt': plot_hit_vs_layer(('tt', 'new-wide-skip'), 'barrel'),
  487. # # 'hit_v_layer_FPIX_new-wide_tt': plot_hit_vs_layer(('tt', 'new-wide-skip'), 'forward'),
  488. #
  489. #
  490. # 'seed_kinem': plot_kinematic_eff('seed', norm=1, ylim=(0, None), bins_eta=30, bins_phi=30),
  491. # 'scl_kinem': plot_kinematic_eff('scl', norm=1, ylim=(0, None), bins_eta=30, bins_phi=30),
  492. # 'prompt_kinem': plot_kinematic_eff('prompt', norm=1, ylim=(0, None), bins_pt=30, bins_eta=30, bins_phi=30),
  493. # 'nonprompt_kinem': plot_kinematic_eff('nonprompt', norm=1, ylim=(0, None), xlim_pt=(0, 5),
  494. # bins_eta=30, bins_phi=30),
  495. }
  496. for config in configs:
  497. figures[f'good_sim_kinem_{config}'] = plot_kinematic_eff('good_sim', norm=1, ylim=(0, None),
  498. bins_eta=30, bins_phi=30, config=config)
  499. figures[f'gsf_track_kinem_{config}'] = plot_kinematic_eff('gsf_track', norm=1, ylim=(0, None),
  500. bins_eta=30, bins_phi=30, config=config)
  501. # for proc, wp, region in product(procs, wps, ('BPIX', 'FPIX')):
  502. # figures[f'hit_v_layer_{region}_{wp}_{proc}'] = plot_hit_vs_layer((proc, wp), region)
  503. def add_num_den(key, func, args, kwargs):
  504. base_ext = kwargs.get('ext', '')
  505. bins_pt_ = [0, 10, 20, 30, 40, 50, 60, 70, 80, 90, 100, 150, 200, 300]
  506. kwargs['bins_pt'] = kwargs.get('bins_pt', bins_pt_)
  507. kwargs['bins_eta'] = kwargs.get('bins_eta', 15)
  508. kwargs['bins_phi'] = kwargs.get('bins_phi', 15)
  509. figures[key] = func(*args, ylim=(0, 1.1), is_ratio=True, **kwargs)
  510. kwargs_ = kwargs.copy()
  511. kwargs_['ext'] = base_ext+'_num'
  512. figures[key+'_num'] = func(*args, **kwargs_)
  513. kwargs_ = kwargs.copy()
  514. kwargs_['ext'] = base_ext+'_den'
  515. figures[key+'_den'] = func(*args, **kwargs_)
  516. # add_num_den('tracking_eff', plot_kinematic_eff, ('tracking_eff',), dict(incl_sel=False))
  517. # add_num_den('tracking_pur', plot_kinematic_eff, ('tracking_pur',), dict(incl_sel=False))
  518. add_num_den('tracking_eff_dR', plot_kinematic_eff, ('tracking_eff',), dict(ext='_dR', incl_sel=False))
  519. add_num_den('tracking_pur_dR', plot_kinematic_eff, ('tracking_pur',), dict(ext='_dR', incl_sel=False))
  520. # add_num_den('prompt_eff', plot_kinematic_eff, ('prompt_eff',), dict(incl_sel=False))
  521. # add_num_den('prompt_pur', plot_kinematic_eff, ('prompt_pur',), dict(incl_sel=False))
  522. add_num_den('prompt_eff_dR', plot_kinematic_eff, ('prompt_eff',), dict(ext='_dR', incl_sel=False))
  523. add_num_den('prompt_pur_dR', plot_kinematic_eff, ('prompt_pur',), dict(ext='_dR', incl_sel=False))
  524. # add_num_den('nonprompt_eff', plot_kinematic_eff, ('nonprompt_eff',), dict(incl_sel=False))
  525. # add_num_den('nonprompt_pur', plot_kinematic_eff, ('nonprompt_pur',), dict(incl_sel=False))
  526. add_num_den('nonprompt_eff_dR', plot_kinematic_eff, ('nonprompt_eff',), dict(ext='_dR', incl_sel=False))
  527. add_num_den('nonprompt_pur_dR', plot_kinematic_eff, ('nonprompt_pur',), dict(ext='_dR', incl_sel=False))
  528. add_num_den('seeding_eff', plot_kinematic_eff, ('seed_eff',), dict(incl_sel=False))
  529. add_num_den('seeding_pur', plot_kinematic_eff, ('seed_pur',), dict(incl_sel=False))
  530. #
  531. # add_num_den('fake_rate_incl', plot_kinematic_eff, ('fake_rate_incl',), {})
  532. # add_num_den('fake_rate_no_e_match_incl', plot_kinematic_eff, ('fake_rate_no_e_match_incl',), {})
  533. # add_num_den('partial_fake_rate_incl', plot_kinematic_eff, ('partial_fake_rate_incl',), {})
  534. # add_num_den('full_fake_rate_incl', plot_kinematic_eff, ('full_fake_rate_incl',), {})
  535. # add_num_den('clean_fake_rate_incl', plot_kinematic_eff, ('clean_fake_rate_incl',), {})
  536. #
  537. # add_num_den('fake_rate', plot_kinematic_eff, ('fake_rate',), dict(incl_sel=False))
  538. # add_num_den('fake_rate_no_e_match', plot_kinematic_eff, ('fake_rate_no_e_match',), dict(incl_sel=False))
  539. # add_num_den('partial_fake_rate', plot_kinematic_eff, ('partial_fake_rate',), dict(incl_sel=False))
  540. # add_num_den('full_fake_rate', plot_kinematic_eff, ('full_fake_rate',), dict(incl_sel=False))
  541. # add_num_den('clean_fake_rate', plot_kinematic_eff, ('clean_fake_rate',), dict(incl_sel=False))
  542. #
  543. # # hit_layers = [(1, 1), (1, 2), (2, 2), (2, 3), (3, 3), (3, 4)]
  544. # # for proc, wp, (hit, layer), var, subdet in product(['dy', 'tt'], ['new-default-noskip', 'new-wide-noskip'],
  545. # # hit_layers, ['dPhi', 'dRz'], ['BPIX', 'FPIX']):
  546. # # figures[f'res_{subdet}_L{layer}_H{hit}_{var}_{proc}_{wp}'] = plot_residuals((proc, wp), layer, hit, var, subdet)
  547. #
  548. # # rel_layers = {1: [('BPIX', 1), ('BPIX', 2), ('FPIX', 1), ('FPIX', 2)],
  549. # # 2: [('BPIX', 2), ('BPIX', 3), ('FPIX', 2), ('FPIX', 3)],
  550. # # 3: [('BPIX', 3), ('BPIX', 4), ('FPIX', 3)], }
  551. # # for proc, hit, var in product(['dy', 'tt'], [1, 2, 3], ['dPhi', 'dRz']):
  552. # # figures[f'resall_H{hit}_{var}_{proc}'] = plot_res_contour(proc, hit, var, rel_layers[hit])
  553. #
  554. # # for proc, wp, hit, var in product(['dy', 'tt'], ['new-default-noskip', 'new-wide-noskip'], [1, 2, 3], ['dPhi', 'dRz']):
  555. # # figures[f'res_v_eta_H{hit}_{var}_{proc}_{wp}'] = plot_residuals_eta((proc, wp), hit, var)
  556. #
  557. # # figures = {}
  558. #
  559. def add_simple_plot(proc, wp, config, plot_name, xlabel, ylabel, is2d=False, xlim=None, ylim=None, clear_zero=False):
  560. if is2d:
  561. figures[f'{plot_name}_{proc}_{wp}_{config}'] = \
  562. simple_dist2d(plot_name, proc, wp, config, colz_fmt='', xlabel=xlabel, ylabel=ylabel, do_profile=True,
  563. xlim=xlim, ylim=ylim, clear_zero=clear_zero)
  564. else:
  565. figures[f'{plot_name}_{proc}_{wp}_{config}'] = \
  566. simple_dist(plot_name, proc, wp, config, xlabel=xlabel, ylabel=ylabel, xlim=xlim, ylim=ylim)
  567. for proc, wp, config, in product(procs, wps, configs):
  568. # add_simple_plot(proc, wp, 'n_pileup')
  569. add_simple_plot(proc, wp, config, 'n_initseeds_v_PU', '# Initial Seeds', '# In-Time Pileup', True)
  570. add_simple_plot(proc, wp, config, 'n_seeds_v_PU', '# Seeds', '# In-Time Pileup', True)
  571. add_simple_plot(proc, wp, config, 'n_good_seeds_v_PU', '# Seeds', '# In-Time Pileup', True, xlim=(-0.5, 40.5))
  572. add_simple_plot(proc, wp, config, 'n_tracks_v_PU', '# GSF Tracks', '# In-Time Pileup', True, xlim=(-0.5, 20.5))
  573. # add_simple_plot(proc, wp, config, 'n_pv_v_PU', '# PV', '# In-Time Pileup', True, xlim=(-0.5, 50.5)) # garbage
  574. # add_simple_plot(proc, wp, config, 'n_seeds_v_tPU', '# Seeds', '# True Pileup', True)
  575. # add_simple_plot(proc, wp, config, 'n_good_seeds_v_tPU', '# Seeds', '# True Pileup', True, xlim=(-0.5, 40.5))
  576. # add_simple_plot(proc, wp, config, 'n_tracks_v_tPU', '# GSF Tracks', '# True Pileup', True, xlim=(-0.5, 20.5))
  577. # add_simple_plot(proc, wp, config, 'n_pv_v_tPU', '# PV', '# True Pileup', True, xlim=(-0.5, 50.5))
  578. # add_simple_plot(proc, wp, config, 'n_seeds_v_n_scl', '# Seeds', '# Super Clusters', True,
  579. # xlim=(-0.5, 20.5), ylim=(-0.5, 20.5), clear_zero=False)
  580. add_simple_plot(proc, wp, config, 'n_good_seeds_v_n_scl', '# Good Seeds', '# Super Clusters', True,
  581. xlim=(-0.5, 20.5), ylim=(-0.5, 20.5), clear_zero=False)
  582. # add_simple_plot(proc, wp, config, 'n_good_seeds_v_n_good_scl', '# Good Seeds', '# Good Super Clusters', True,
  583. # xlim=(-0.5, 20.5), ylim=(-0.5, 20.5), clear_zero=False)
  584. # add_simple_plot(proc, wp, config, 'n_initseeds_v_PU', '# Initial Seeds', '# In-Time Pileup', True,
  585. # xlim=None, ylim=None, clear_zero=False)
  586. # add_simple_plot(proc, wp, config, 'n_initseeds_v_tPU', '# Initial Seeds', '# True Pileup', True,
  587. # xlim=None, ylim=None, clear_zero=False)
  588. mpb.render(figures, build=build)
  589. mpb.generate_report(figures, 'Electron Seeding Studies',
  590. output=f'hists.html',
  591. source=__file__)
  592. # mpb.generate_report(figures, 'Fixing Hit Skipping',
  593. # output='report.html',
  594. # body='../docs/reports/report_2018_08_16.md')
  595. if publish:
  596. mpb.publish()
  597. def color(proc, wp):
  598. from matplotlib.colors import XKCD_COLORS
  599. def f(name):
  600. return XKCD_COLORS['xkcd:'+name]
  601. wp = wp.replace('-skip', '')
  602. wp = wp.replace('-noskip', '')
  603. wp = wp.replace('-pileup', '')
  604. return {
  605. ('dy', 'new-extra-narrow'): f('indigo'),
  606. ('tt', 'new-extra-narrow'): f('bright purple'),
  607. ('dy', 'new-default'): f('red'),
  608. ('tt', 'new-default'): f('pink'),
  609. ('dy', 'new-wide'): f('strong blue'),
  610. ('tt', 'new-wide'): f('bright blue'),
  611. ('dy', 'new-extra-wide'): f('kelly green'),
  612. ('tt', 'new-extra-wide'): f('green'),
  613. ('dy', 'old-default'): f('black'),
  614. ('tt', 'old-default'): f('blue grey'),
  615. }[(proc, wp)]
  616. def style(config):
  617. return {
  618. 'noskip': '-',
  619. 'skip': '--',
  620. 'skip-pileup': '-.',
  621. }[config]
  622. if __name__ == '__main__':
  623. parser = ArgumentParser('Electron Seeding Efficiency Plot Maker')
  624. parser.add_argument('--build', action='store_true')
  625. parser.add_argument('--publish', action='store_true')
  626. args = parser.parse_args()
  627. set_defaults()
  628. mpb.configure(output_dir='seeding_studies',
  629. multiprocess=True,
  630. publish_remote="caleb@fangmeier.tech",
  631. publish_dir="/var/www/eg",
  632. publish_url="eg.fangmeier.tech",
  633. early_abort=True,
  634. )
  635. procs = {
  636. 'dy': r'Drell-Yan',
  637. 'tt': r'$t\bar{t}$'
  638. }
  639. configs = [
  640. 'noskip',
  641. 'skip',
  642. 'skip-pileup',
  643. ]
  644. wps = {
  645. 'old-default': 'Old-Method Seeding',
  646. # 'new-narrow': 'HLT Settings',
  647. 'new-default': 'HLT Settings',
  648. 'new-wide': 'Wide Settings',
  649. # 'new-extra-wide': 'Extra Wide Settings',
  650. }
  651. all_cut_plots(build=args.build, publish=args.publish)