main.tex 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307
  1. % rubber: module pdftex
  2. \documentclass[english,aspectratio=43,8pt]{beamer}
  3. \usepackage{graphicx}
  4. \usepackage{amssymb}
  5. \usepackage{booktabs}
  6. \usepackage{siunitx}
  7. \usepackage{subcaption}
  8. \usepackage{marvosym}
  9. \usepackage{verbatim}
  10. \usepackage[normalem]{ulem} % Needed for /sout
  11. \newcommand{\pb}{\si{\pico\barn}}% picobarn, typeset through siunitx
  12. \newcommand{\fb}{\si{\femto\barn}}% femtobarn, typeset through siunitx
  13. \newcommand{\invfb}{\si{\per\femto\barn}} % inverse femtobarn
  14. \newcommand{\GeV}{\si{\giga\electronvolt}} % gigaelectronvolt
  15. \hypersetup{colorlinks=true,urlcolor=blue}
  16. \usetheme[]{bjeldbak}
  17. \newcounter{finalframe}% allocated once in the preamble: \newcounter errors if the counter already exists, so it must not run on every \backupbegin call
  18. \newcommand{\backupbegin}{% save the current frame number so \backupend can restore it after the backup frames
  19. \setcounter{finalframe}{\value{framenumber}}%
  20. }
  21. \newcommand{\backupend}{% reset framenumber to the value stored in finalframe, so frames after \backupbegin do not add to the frame count
  22. \setcounter{framenumber}{\value{finalframe}}
  23. }
  24. \begin{document}
  25. \title[$e$ Seeding Validation]{Offline Electron Seeding Validation \-- Update}
  26. \author[C. Fangmeier]{\textbf{Caleb Fangmeier} \\ Ilya Kravchenko, Greg Snow}
  27. \institute[UNL]{University of Nebraska \-- Lincoln}
  28. \date{EGM general meeting \textbf{CMS week} | April 18, 2018}
  29. \titlegraphic{%
  30. \begin{figure}
  31. \includegraphics[width=1in]{CMSlogo.png}\hspace{0.75in}\includegraphics[width=1in]{nebraska-n.png}
  32. \end{figure}
  33. }
  34. \begin{frame}[plain]
  35. \titlepage%
  36. \end{frame}
  37. \begin{frame}{Introduction}
  38. \begin{itemize}
  39. \item Our goal is to study \textbf{seeding} for the \textbf{offline} GSF tracking with the \textbf{new pixel detector}.
  40. \item Specifically, we want to optimize the new pixel-matching scheme from HLT for use in offline reconstruction.
  41. \item This Talk:
  42. \begin{itemize}
  43. \item Show performance comparison between the old seeding and two working points of the new seeding in a fake-rich environment
  44. \begin{itemize}
  45. \item New Seeding working points: \texttt{narrow} (HLT default settings), and \texttt{wide} (double window sizes with respect to \texttt{narrow})
  46. \end{itemize}
  47. \item Show alternative efficiency/purity measurements using $\Delta R$ truth-matching between \texttt{SimTracks} and \texttt{GSFTracks}
  48. \end{itemize}
  49. \end{itemize}
  50. \end{frame}
  51. \begin{frame}{N-Hit Electron Seeding}
  52. \begin{columns}
  53. \begin{column}{0.5\textwidth}
  54. {\small
  55. \begin{enumerate}
  56. \item Using the beam spot, the SC position, and SC energy, propagate a path through the pixels.
  57. \item Require the first hit to be within a $\delta\phi$ and $\delta z$ window. ($\delta\phi$ and $\delta R$ for FPIX)
  58. \item $\delta z$ window for first hit is huge as SC and beam spot positions give very little information about $z$.
  59. \item Forget the SC position, and propagate a new track based on the vertex and first hit positions, and the SC energy.
  60. \item Progress one-by-one through the remaining hits in the seed and require each one to fit within a specified window around the track.
  61. \item Quit when all hits are matched, or a hit falls outside the window. No skipping is allowed.
  62. \end{enumerate}
  63. }
  64. \end{column}
  65. \begin{column}{0.5\textwidth}
  66. \begin{figure}
  67. \includegraphics[width=0.9\textwidth]{../common/diagrams/seeding_step2.png}
  68. \end{figure}
  69. \begin{figure}
  70. \includegraphics[width=0.9\textwidth]{../common/diagrams/seeding_step3.png}
  71. \end{figure}
  72. \end{column}
  73. \end{columns}
  74. \end{frame}
  75. \begin{frame}{Definitions}
  76. \begin{itemize}
  77. \item \textbf{Sim-Track \--} A track from a simulated electron originating from the luminous region of CMS (beam-spot $\pm 5\sigma$)
  78. \item \textbf{ECAL-Driven Seed \--} A seed created via a matching procedure between Super-Clusters and General Tracking Seeds (Either from \texttt{ElectronSeedProducer} or \texttt{ElectronNHitSeedProducer})
  79. \item \textbf{GSF Track \--} A track from GSF-Tracking resulting from an \textbf{ECAL-Driven Seed}
  80. % \item \textbf{Seeding Efficiency \--} The fraction of \textbf{Sim-Tracks} that have a matching \textbf{ECAL-Driven Seed} (based on simhit-rechit linkage or $\Delta R$ matching)
  81. \item \textbf{GSF Tracking Efficiency \--} The fraction of \textbf{Sim-Tracks} that have a matching \textbf{GSF Track} (again, based on simhit-rechit linkage or $\Delta R$ matching)
  82. % \item \textbf{ECAL-Driven Seed Purity \--} The fraction of \textbf{ECAL-Driven Seeds} that have a matching \textbf{Sim-Track}
  83. \item \textbf{GSF Tracking Purity \--} The fraction of \textbf{GSF Tracks} that have a matching \textbf{Sim-Track}
  84. \end{itemize}
  85. \end{frame}
  86. \begin{frame}{Previous status-quo}
  87. \begin{columns}
  88. \begin{column}{0.45\textwidth}
  89. {\small
  90. \begin{itemize}
  91. \item In a previous presentation\footnotemark, I showed efficiency vs. purity for
  92. \begin{itemize}
  93. \item Old pair-match seeding (\texttt{ElectronSeedProducer})
  94. \item New triplet seeding (\texttt{ElectronNHitSeedProducer}) for several choices of matching windows.
  95. \end{itemize}
  96. \item Performance of new seeding at the \texttt{wide} working point was comparable to old seeding in low-fake ($Z\rightarrow e^+e^-$) environment
  97. \item Needed to validate performance in a high-fake environment.
  98. \end{itemize}
  99. }
  100. \end{column}
  101. \begin{column}{0.55\textwidth}
  102. \begin{figure}
  103. \includegraphics[width=0.9\textwidth]{../common/figures/tracking_roc_curves_linear_plus_old_hoe.png}
  104. \end{figure}
  105. \end{column}
  106. \end{columns}
  107. \footnotetext[1]{\tiny \url{https://indico.cern.ch/event/697077/contributions/2936039/attachments/1618649/2573874/main.pdf}}
  108. \end{frame}
  109. \begin{frame}{Relative Performance - GSF Tracking Efficiency}
  110. \begin{columns}
  111. \begin{column}{0.5\textwidth}
  112. \begin{itemize}
  113. \item Figure shows GSF Tracking efficiency vs kinematic variables of the electron \texttt{SimTrack}
  114. \item Efficiency is more or less the same for both DY and $t\bar{t}$ environments and for both algorithms and working points.
  115. \item Largest (statistically significant) differences appear at low $p_T$ and in the barrel/endcap transition region.
  116. \end{itemize}
  117. \end{column}
  118. \begin{column}{0.5\textwidth}
  119. \begin{figure}
  120. GSF Tracking Efficiency
  121. \includegraphics[width=1.0\textwidth]{live_figures/tracking_eff_all.png}
  122. \end{figure}
  123. \end{column}
  124. \end{columns}
  125. \end{frame}
  126. \begin{frame}{Relative Performance - GSF Track Purity}
  127. \begin{columns}
  128. \begin{column}{0.5\textwidth}
  129. \begin{itemize}
  130. \item Figure shows GSF Tracking purity vs kinematic variables of the \texttt{GSFTrack}
  131. \item Clearly purity is affected by the higher fake environment in the $t\bar{t}$ sample.
  132. \item Note how the \texttt{narrow} working point of the new seeding (green) has significantly better purity than the \texttt{wide} working point or the old seeding.
  133. \item Purity loss at high $p_T$ is a feature of the shared-hits matching between \texttt{SimTracks} and \texttt{GSFTracks}.
  134. \end{itemize}
  135. \end{column}
  136. \begin{column}{0.5\textwidth}
  137. \begin{figure}
  138. GSF Tracking Purity
  139. \includegraphics[width=1.0\textwidth]{live_figures/tracking_pur_all.png}
  140. \end{figure}
  141. \end{column}
  142. \end{columns}
  143. \end{frame}
  144. \begin{frame}{$\Delta R$ Matching}
  145. \begin{columns}
  146. \begin{column}{0.5\textwidth}
  147. \begin{figure}
  148. GSF Tracking Efficiency ($\Delta R$ Matched)
  149. \includegraphics[width=1.0\textwidth]{live_figures/tracking_eff_all_dR.png}
  150. \end{figure}
  151. \end{column}
  152. \begin{column}{0.5\textwidth}
  153. \begin{figure}
  154. GSF Tracking Purity ($\Delta R$ Matched)
  155. \includegraphics[width=1.0\textwidth]{live_figures/tracking_pur_all_dR.png}
  156. \end{figure}
  157. \end{column}
  158. \end{columns}
  159. \begin{itemize}
  160. \item Previous efficiency/purity definitions based on shared tracker hits between \texttt{SimTracks} and \texttt{GSFTracks}.
  161. \item An alternative is to use simple $\Delta R<0.2$ matching.
  162. \item Overall numbers improve and purity no longer drops at high $p_T$.
  163. \end{itemize}
  164. \end{frame}
  165. \begin{frame}{Overall Performance}
  166. \begin{center}
  167. Integrating over all tracks with $p_T>\SI{20}{\giga\electronvolt}$ and $|\eta|<2.4$ yields the performance numbers below.
  168. \begin{table}[]
  169. \centering
  170. \begin{tabular}{@{}llrr@{}} \toprule
  171. Sample & Algo & Efficiency ($\Delta R$ Matched) & Purity ($\Delta R$ Matched) \\ \midrule
  172. $Z\rightarrow ee$ & \texttt{old-seeding} & $96.08\pm0.28\%$ & $99.54\pm0.29\%$ \\
  173. & \texttt{narrow} & $94.49\pm0.28\%$ & $99.72\pm0.29\%$ \\
  174. & \texttt{wide} & $96.00\pm0.28\%$ & $99.60\pm0.29\%$ \\
  175. $t\bar{t}$ & \texttt{old-seeding} & $94.84\pm0.77\%$ & $57.49\pm0.60\%$ \\
  176. & \texttt{narrow} & $93.54\pm0.79\%$ & $65.84\pm0.67\%$ \\
  177. & \texttt{wide} & $95.06\pm0.77\%$ & $59.52\pm0.61\%$ \\ \bottomrule
  178. \end{tabular}
  179. \end{table}
  180. \begin{itemize}
  181. \item The HLT default settings (\texttt{narrow}) of the new pixel matching
  182. scheme yield non-trivially better purity at the cost of some efficiency
  183. with respect to both the old seeding and the \texttt{wide} working point.
  184. \item The \texttt{wide} working point of the new seeding matches the
  185. \texttt{old-seeding} within errors, except that purity is $\approx 2$\%
  186. better in the $t\bar{t}$ sample.
  187. \end{itemize}
  188. \end{center}
  189. \end{frame}
  190. \begin{frame}{Conclusions \& Outlook}
  191. \begin{itemize}
  192. \item The new seeding algorithm has been verified to perform as well as,
  193. and in some cases better than, the current pair seeding, based on MC
  194. studies in both low- and high-purity environments.
  195. \item Now the question is which working point (\texttt{wide} or \texttt{narrow}) is preferable?
  196. \item Unless there are objections, we propose to move forward with implementing the new algorithm as the default in the next available CMSSW release.
  197. \end{itemize}
  198. \end{frame}
  199. \appendix
  200. \backupbegin
  201. \begin{frame}
  202. \begin{center}
  203. {\Huge BACKUP}
  204. \end{center}
  205. \end{frame}
  206. \begin{frame}{Overall Performance}
  207. \begin{columns}
  208. \begin{column}{0.5\textwidth}
  209. \begin{figure}
  210. GSF Tracking Performance (Hit Matched)
  211. \includegraphics[width=1.0\textwidth]{live_figures/tracking_roc_curve.png}
  212. \end{figure}
  213. \end{column}
  214. \begin{column}{0.5\textwidth}
  215. \begin{figure}
  216. GSF Tracking Performance ($\Delta R$ Matched)
  217. \includegraphics[width=1.0\textwidth]{live_figures/tracking_roc_curve_dR.png}
  218. \end{figure}
  219. \end{column}
  220. \end{columns}
  221. \end{frame}
  222. \begin{frame}{Matching Window Parameters}
  223. \begin{table}[]
  224. \centering
  225. \begin{tabular}{@{}llrrrr@{}}
  226. \toprule
  227. & & \textbf{extra-narrow} & \textbf{narrow(HLT)} & \textbf{wide} & \textbf{extra-wide} \\ \midrule
  228. Hit 1 & dPhiMaxHighEt & \textbf{0.025} & \textbf{0.05} & \textbf{0.1} & \textbf{0.15} \\
  229. & dPhiMaxHighEtThres & 20.0 & 20.0 & 20.0 & 20.0 \\
  230. & dPhiMaxLowEtGrad & -0.002 & -0.002 & -0.002 & -0.002 \\
  231. & dRzMaxHighEt & 9999.0 & 9999.0 & 9999.0 & 9999.0 \\
  232. & dRzMaxHighEtThres & 0.0 & 0.0 & 0.0 & 0.0 \\
  233. & dRzMaxLowEtGrad & 0.0 & 0.0 & 0.0 & 0.0 \\ \midrule
  234. Hit 2 & dPhiMaxHighEt & \textbf{0.0015} & \textbf{0.003} & \textbf{0.006} & \textbf{0.009} \\
  235. & dPhiMaxHighEtThres & 0.0 & 0.0 & 0.0 & 0.0 \\
  236. & dPhiMaxLowEtGrad & 0.0 & 0.0 & 0.0 & 0.0 \\
  237. & dRzMaxHighEt & \textbf{0.025} & \textbf{0.05} & \textbf{0.1} & \textbf{0.15} \\
  238. & dRzMaxHighEtThres & 30.0 & 30.0 & 30.0 & 30.0 \\
  239. & dRzMaxLowEtGrad & -0.002 & -0.002 & -0.002 & -0.002 \\ \midrule
  240. Hit 3+ & dPhiMaxHighEt & \textbf{0.0015} & \textbf{0.003} & \textbf{0.006} & \textbf{0.009} \\
  241. & dPhiMaxHighEtThres & 0.0 & 0.0 & 0.0 & 0.0 \\
  242. & dPhiMaxLowEtGrad & 0.0 & 0.0 & 0.0 & 0.0 \\
  243. & dRzMaxHighEt & \textbf{0.025} & \textbf{0.05} & \textbf{0.1} & \textbf{0.15} \\
  244. & dRzMaxHighEtThres & 30.0 & 30.0 & 30.0 & 30.0 \\
  245. & dRzMaxLowEtGrad & -0.002 & -0.002 & -0.002 & -0.002 \\ \bottomrule
  246. \end{tabular}
  247. \end{table}
  248. \centering
  249. \texttt{NHit} Seeding window parameters. Bold designates modified values.
  250. \end{frame}
  251. \begin{frame}{Overall Performance - Hit-Matching}
  252. \begin{center}
  253. Integrating over all tracks with $p_T>\SI{20}{\giga\electronvolt}$ and $|\eta|<2.4$ yields the performance numbers below.
  254. \begin{table}[]
  255. \centering
  256. \begin{tabular}{@{}llrr@{}} \toprule
  257. Sample & Algo & Efficiency (Hit Matched) & Purity (Hit Matched) \\ \midrule
  258. $Z\rightarrow ee$ & \texttt{old-seeding} & $88.05\pm0.28\%$ & $90.30\pm0.29\%$ \\
  259. & \texttt{narrow} & $86.63\pm0.28\%$ & $90.69\pm0.29\%$ \\
  260. & \texttt{wide} & $88.01\pm0.28\%$ & $90.43\pm0.29\%$ \\
  261. $t\bar{t}$ & \texttt{old-seeding} & $88.06\pm0.77\%$ & $52.35\pm0.60\%$ \\
  262. & \texttt{narrow} & $86.89\pm0.79\%$ & $60.56\pm0.67\%$ \\
  263. & \texttt{wide} & $88.30\pm0.77\%$ & $54.38\pm0.61\%$ \\ \bottomrule
  264. \end{tabular}
  265. \end{table}
  266. Note that the \texttt{wide} working point of the new seeding matches the \texttt{old-seeding} within errors, except that purity is $\approx 2$\% better in the $t\bar{t}$ sample.
  267. \end{center}
  268. \end{frame}
  269. \begin{frame}{Samples}
  270. \begin{itemize}
  271. \item {\tiny /ZToEE\_NNPDF30\_13TeV-powheg\_M\_120\_200/RunIISummer17DRStdmix-NZSFlatPU28to62\_92X\_upgrade2017\_realistic\_v10-v1}
  272. \item {\tiny /TT\_TuneCUETP8M2T4\_13TeV-powheg-pythia8/RunIISummer17DRStdmix-NZSFlatPU28to62\_92X\_upgrade2017\_realistic\_v10-v2}
  273. \end{itemize}
  274. \end{frame}
  275. \backupend
  276. \end{document}