@phdthesis{10.7907/bqsn-sp82, author = {Cerri, Olmo}, title = {New Physics Tools for Discovery, a New Era of Timing Detector, and Lepton Flavor Universality Test at CMS}, school = {California Institute of Technology}, year = {2023}, doi = {10.7907/bqsn-sp82}, url = {https://resolver.caltech.edu/CaltechTHESIS:09132022-001004681}, abstract = {

The field of particle and fundamental physics finds itself now in a peculiar situation. The established Standard Model accurately predicts most of the observations, but several compelling reasons motivate a need for an extension of the current theory. In this thesis, I focus my research on facing the current situation of the field in a diversified threefold manner.

First, I develop methods based on physics-driven machine learning algorithms, with a particular focus on developing a model-independent tagger for unexpected events using artificial neural networks. This study shows how model-independent new physics triggers, possibly trained on real data, can select a low rate stream of events able to explore new physics processes up to a 10-100 pb cross section and can create a special dataset of rare unexpected events. Other important results from this body of work include the first application of the proposed anomaly detection strategy to real data, the use of graph neural networks to improve current pileup mitigation algorithms, the development of jet taggers based on the interaction network, and analysis-specific fast simulation.

Second, I focus on the methodological and hardware development of the MIP Timing Layer that is expected to upgrade CMS in preparation for HL-LHC. My seminal study demonstrates the possibility of using time-of-flight information to perform particle identification, which has a significant impact on heavy stable charged particle searches. This work introduces how to measure time-of-flight at CMS, a strategy for particle identification, and an algorithm to locate vertices in space and time. I also participated in the sensor testing and test beam operation. In particular, I conducted a study about the design and prototype of the detector modules’ thermal behavior that shows how different geometries could lead to cooling differences of a few K.

Last, I direct my attention towards CMS’s first lepton flavor universality tests with B meson decays. Using a dataset acquired thanks to a custom design trigger, I independently develop the measurement of the R(D*) ratio, a parameter whose tensions between the predictions and observation have drawn remarkable attentions. I oversaw the complete mature state of the analysis, from the Monte Carlo simulation to the fitting procedure. Further collaboration-wide efforts are still required, but I demonstrate the expected sensitivity of about 15% using an Asimov dataset.

}, address = {1200 East California Boulevard, Pasadena, California 91125}, advisor = {Spiropulu, Maria}, } @phdthesis{10.7907/tmt4-nq20, author = {Dutta, Irene}, title = {Rare Higgs Processes at CMS and Precision Timing Detector Studies for HL-LHC CMS Upgrade}, school = {California Institute of Technology}, year = {2023}, doi = {10.7907/tmt4-nq20}, url = {https://resolver.caltech.edu/CaltechTHESIS:09252022-195535688}, abstract = {

This thesis describes the search for two rare Higgs processes. The first analysis describes the CMS Run 2 search for H → µµ decays, with 137.3 fb-1 of data at √s = 13 TeV. The analysis targeted four different Higgs production modes: the gluon fusion (ggH), the vector boson fusion (VBF), the Higgs-strahlung process (VH), and the production in association with a pair of top quarks (ttH). Each category used a dedicated machine learning based classifier to separate the signal from the background processes. A combined fit from all these categories saw a slight excess in the data corresponding to 3.0 standard deviations at MH = 125.38 GeV, and gave the first evidence for the Higgs boson decay to second-generation fermions. The best-fit signal strength and the corresponding 68% CL interval was found to be µ^ =1.19 +0.41-0.39 (stat) +0.17-0.16 (syst) at MH = 125.38 GeV.

The second analysis describes the CMS Run 2 search for HH → bb̅bb̅ with highly boosted Higgs bosons. This analysis used a dedicated jet identification algorithm based on graph neural networks (ParticleNet) to identify boosted H → bb jets. This search targeted the gluon fusion and the vector boson fusion HH production modes, and put constraints on the allowed values of the various Higgs couplings as: κλ ∈ [-9.9,16.9] when κν = 1, κ= 1; κν ∈ [-1.17,-0.79] ∪ [0.81,1.18] when κλ = 1, κ = 1; κ ∈ [0.62,1.41] when κλ = 1, κν = 1. A scenario with κ = 0 was excluded with a significance of 6.3 standard deviations for the first time, when other H couplings are fixed to their SM values. The combined observed (expected) 95% upper limit on the HH production cross section was found to be 9.9 (5.1) x SM.

Finally, this thesis also discusses the planned MIP Timing Detector (MTD) upgrade for CMS at the HL-LHC. The MTD will be a time-of-flight (TOF) detector, designed to provide a precision timing information for charged particles using SiPMs + LYSO scintillating crystals, with a time resolution of ~30 ps. This thesis describes several R&D tests that have been performed for characterizing the sensor properties (time resolution, light yield, etc.) and optimizing the sensor design geometry. This thesis also contains a description of mock test setups for cooling the sensors, since it is known to be an effective way of mitigating the increased dark current rates in the sensors due to radiation damage.

}, address = {1200 East California Boulevard, Pasadena, California 91125}, advisor = {Spiropulu, Maria}, } @phdthesis{10.7907/knfz-q495, author = {Nguyen, Thong Quang}, title = {Searches for Nonresonant Higgs Boson Pair Production and Long-Lived Particles at the LHC and Machine-Learning Solutions for the High-Luminosity LHC Era}, school = {California Institute of Technology}, year = {2022}, doi = {10.7907/knfz-q495}, url = {https://resolver.caltech.edu/CaltechTHESIS:10012021-210141406}, abstract = {

This thesis presents two physics analyses using 137 fb−1 proton-proton collision data collected by the CMS experiment at √s = 13 TeV, along with a series of machine-learning solutions to extend the physics program at the LHC and to address the computational challenges in the High-Luminosity LHC era. The first analysis searches for nonresonant Higgs boson pair production in final states with two photons and two bottom quarks, with no significant deviation from the background-only hypothesis observed. The observed (expected) upper limit on the product of the Higgs boson pair production cross section and branching fraction into bb̅γγ is 0.67 (0.45) fb, corresponding to 7.7 (5.2) times the Standard Model prediction. The modifier of the Higgs trilinear self-coupling is constrained within the range -3.3 < κλ < 8.5. The modifier for coupling between a pair of Higgs bosons and a pair of vector bosons, along with the 2-dimensional constraint of the modifiers of Higgs self-coupling and Yukawa coupling, are also reported. A graph-based algorithm to identify boosted H → bb̅ jets to improve future Higgs search is presented. The second analysis searches for long-lived supersymmetry particles decaying to photons and gravitinos in the context of gauge-mediated supersymmetry breaking model. Results are presented in terms of 95% confidence level expected exclusion limits on the masses and proper decay lengths of the neutralino, which exceed the limits from the previous searches by up to 100 GeV for the neutralino mass and by five times for the neutralino proper decay length. A strategy for model-independent new physics searches is presented with an anomaly trigger based on unsupervised learning algorithms that can be deployed in both the high-level trigger and the Level-1 trigger in CMS. Three other machine-learning solutions are presented to address the computational challenges in the HL-LHC era: a layer based on multi-modal deep neural networks that can reduce the false-positive events selected by the trigger by over one order of magnitude while retaining 99% of signal events, a full-event simulation algorithm based on recurrent generative adversarial networks that has potential to replace traditional simulation method while being five orders of magnitude faster, and a fast simulation algorithm for specific analyses based on encoder-decoder architecture that would result in about an order-of-magnitude reduction in computing and storage requirements for the collision simulation workflow.

}, address = {1200 East California Boulevard, Pasadena, California 91125}, advisor = {Spiropulu, Maria}, } @phdthesis{10.7907/BHGN-VY70, author = {Anderson, Dustin James}, title = {Inclusive Searches for Supersymmetry at √s = 13 TeV Using Razor Kinematic Variables, and Data Scouting Using the CMS Trigger System}, school = {California Institute of Technology}, year = {2018}, doi = {10.7907/BHGN-VY70}, url = {https://resolver.caltech.edu/CaltechTHESIS:05162018-153827333}, abstract = {

We present two searches for supersymmetric particles using proton-proton collision data collected by the CMS experiment at √s = 13 TeV. The searches use razor kinematic variables for signal discrimination and target the pair production of heavy gluinos and squarks in R-parity conserving supersymmetry. The first search is performed on 2.3 fb−1 of data collected by CMS in 2015. Two complete, independent background predictions are made: one based on fits using a parameterized functional form, and the other based on Monte Carlo simulation corrected via control samples in data. The second search is an expanded version of the first search, and is performed using the Monte Carlo-based background prediction method on 35.9 fb−1 of data collected in 2016. Both searches obtain results compatible with standard model background expectations. The null results are interpreted as limits on the masses and cross sections of gluinos, squarks, and higgsinos in the context of simplified models of supersymmetry. We discuss the outlook for the fit-based search strategy and explore how the technique of gaussian process regression may be useful as a tool to combat the challenges of this analysis methodology.

We also describe a new paradigm for trigger-level collider data analysis, which we refer to as data scouting. In this paradigm, searches for new physics are performed using event information reconstructed within the experiment’s trigger software. This circumvents traditional event rate constraints, such as disk space and the latency of offline reconstruction. We provide details on the implementation of a framework for data scouting in the CMS High-Level Trigger system and its successful use in Run II of the LHC. We discuss the impact of scouting on the physics program of CMS and demonstrate that it enables searches for new physics that would not otherwise be possible due to trigger constraints, such as hadronic resonance searches at low mass and searches for leptonic decays of dark photons.

}, address = {1200 East California Boulevard, Pasadena, California 91125}, advisor = {Spiropulu, Maria}, } @phdthesis{10.7907/Z9GX48JV, author = {Duarte, Javier Mauricio Gonzalez}, title = {Naturalness Confronts Nature: Searches for Supersymmetry with the CMS Detector in pp Collisions at √s = 8 and 13 TeV}, school = {California Institute of Technology}, year = {2017}, doi = {10.7907/Z9GX48JV}, url = {https://resolver.caltech.edu/CaltechTHESIS:08232016-112522351}, abstract = {In this thesis, we present two inclusive searches for supersymmetric particles at 8 and 13 TeV using the razor variables and guided by the principle of naturalness. We build a framework to explore the natural supersymmetry parameter space of gluino and top squark masses and branching ratios, which is a unique attempt to cover this parameter space in a more complete way than ever before using LHC data. With this approach, the production of top squarks and gluinos are excluded below 700 GeV and 1.6 TeV, respectively, independent of the branching ratios, constituting one of the tightest constraints on natural supersymmetry from the LHC. Motivated by the need to mitigate the effects of multiple interactions per bunch crossing (pileup), an essential feature of present and future hadron colliders, in this thesis we also study the precision timing capabilities of a LYSO-based sampling calorimeter, and achieve a time resolution of 30 ps in electron test beam measurements. The achieved resolution corresponds to the precision needed to significantly reduce the inclusion of pileup particles in the reconstruction of the event of interest. This study is foundational in building an R and D program on precision timing for the high-luminosity LHC and other future hadron colliders. We also propose alternative simplified models to study Higgs-plus-jets events at the LHC, and reinterpret an excess observed at 8 TeV in the context of these models. Finally, we discuss a search for narrow resonances in the dijet mass spectrum at 13 TeV using the data-scouting technique at CMS, which records a smaller event format to increase the maximum recordable rate. For the benchmark models with a vector or axial-vector mediator that couples to quarks and dark matter particles, the dijet search excludes mediator masses from 0.5 TeV up to 2.7 TeV largely independent of the dark matter particle mass, which constitutes a larger exclusion than traditional mono-X searches at the LHC. In the plane of the dark matter-nucleon interaction cross section versus dark matter mass, the dijet search is also more sensitive than direct detection experiments for spin-dependent cross sections.}, address = {1200 East California Boulevard, Pasadena, California 91125}, advisor = {Spiropulu, Maria}, } @phdthesis{10.7907/Z9MK69Z6, author = {Peña Herrera, Cristián}, title = {Searches for New Physics at the Compact Muon Solenoid Experiment and Precision Timing Calorimetry}, school = {California Institute of Technology}, year = {2017}, doi = {10.7907/Z9MK69Z6}, url = {https://resolver.caltech.edu/CaltechTHESIS:05192017-195511866}, abstract = {

In this thesis, we present several searches for beyond the standard model physics in proton-proton collisions recorded by the Compact Muon Solenoid Experiment at center-of-mass energy of 8 and 13. We search for particle dark matter in events with two or more jets and missing transverse momentum at $\sqrt{s} = 8$ TeV, in this search we use the razor variables to discriminate signal from background events and thus improve the overall sensitivity of the analysis. We observe agreement between the observation and the background estimation. The interpretation of the results is carried out in the context of an effective field theory that couples the standard model quarks to the dark matter candidate. A search for anomalous production of Higgs bosons using 15.3 fb − 1 of proton-proton collisions at $\sqrt{s} = 13$ TeV is also presented; this search selects events with a Higgs boson in association with jets, where the Higgs candidate decays into two photons. We also employ the razor variables (MR, R2) to discriminate signal from background. We observe an excess of events in one of the search bins with relatively high values of MR and R2. The interpretation of this analysis is pair production of bottom squarks in the context of supersymmetry, this model is also presented in one of the appendices of this thesis. In the other appendix of this thesis, we present a search for new phenomena in high-mass diphoton events using 12.9 fb − 1 of proton-proton collisions at $\sqrt{s} = 13$ TeV. This search observed a significant excess (3.4 standard deviations, local) with 2015 data at a diphoton invariant mass of 750 GeV, equivalent to 20% of the current dataset. By repeating the search with the larger dataset collected in 2016, we found that the aforementioned excess has been greatly disfavored. Additionally, in order to confirm the robustness and correctness of the data analysis techniques used in this search, we have carried out a second – completely independent – analysis, which confirms the absence of an excess at a diphoton invariant mass of 750 GeV.

We also present detector research and developments studies of electromagnetic calorimeters equipped with precision timing capabilities. We present several calorimeter prototypes that were tested at the Fermilab Test Beam Facility. These prototypes include LYSO-based calorimeters, tungsten-LYSO “shashlik” sampling calorimeters, micro-channel-plate sampling calorimeters, and silicon-based sampling calorimeters. The results of these studies indicate that time resolutions of the order of 30 ps are readily available when measuring electromagnetic showers. A discussion about the applications of precision timing in high energy physics experiments is also presented, with a particular interest in pileup rejection in the context of the high-luminosity upgrade of the Large Hadron Collider foreseen to start in 2025.

}, address = {1200 East California Boulevard, Pasadena, California 91125}, advisor = {Spiropulu, Maria}, } @phdthesis{10.7907/VT37-HT20, author = {Chen, Yi}, title = {Extraction of CP Properties of the H(125) Boson Discovered in Proton-Proton Collisions at sqrt(s) = 7 and 8 TeV with the CMS Detector at the LHC}, school = {California Institute of Technology}, year = {2015}, doi = {10.7907/VT37-HT20}, url = {https://resolver.caltech.edu/CaltechTHESIS:12012014-145657884}, abstract = {In this thesis we build a novel analysis framework to perform the direct extraction of all possible effective Higgs boson couplings to the neutral electroweak gauge bosons in the H → ZZ(*) → 4l channel also referred to as the golden channel. We use analytic expressions of the full decay differential cross sections for the H → VV’ → 4l process, and the dominant irreducible standard model qq ̄ → 4l background where 4l = 2e2μ,4e,4μ. Detector effects are included through an explicit convolution of these analytic expressions with transfer functions that model the detector responses as well as acceptance and efficiency effects. Using the full set of decay observables, we construct an unbinned 8-dimensional detector level likelihood function which is con- tinuous in the effective couplings, and includes systematics. All potential anomalous couplings of HVV’ where V = Z,γ are considered, allowing for general CP even/odd admixtures and any possible phases. We measure the CP-odd mixing between the tree-level HZZ coupling and higher order CP-odd couplings to be compatible with zero, and in the range [−0.40, 0.43], and the mixing between HZZ tree-level coupling and higher order CP -even coupling to be in the ranges [−0.66, −0.57] ∪ [−0.15, 1.00]; namely compatible with a standard model Higgs. We discuss the expected precision in determining the various HVV’ couplings in future LHC runs. A powerful and at first glance surprising prediction of the analysis is that with 100-400 fb-1, the golden channel will be able to start probing the couplings of the Higgs boson to diphotons in the 4l channel. We discuss the implications and further optimization of the methods for the next LHC runs.}, address = {1200 East California Boulevard, Pasadena, California 91125}, advisor = {Spiropulu, Maria}, } @phdthesis{10.7907/Z9XK8CHR, author = {Mott, Alexander Robert}, title = {Search for Higgs Boson Production Beyond the Standard Model Using the Razor Kinematic Variables in pp Collisions at √s=8 TeV and Optimization of Higgs Boson Identification Using a Quantum Annealer}, school = {California Institute of Technology}, year = {2015}, doi = {10.7907/Z9XK8CHR}, url = {https://resolver.caltech.edu/CaltechTHESIS:05052015-155442785}, abstract = {

In the first part of this thesis we search for beyond the Standard Model physics through the search for anomalous production of the Higgs boson using the razor kinematic variables. We search for anomalous Higgs boson production using proton-proton collisions at center of mass energy √s=8 TeV collected by the Compact Muon Solenoid experiment at the Large Hadron Collider corresponding to an integrated luminosity of 19.8 fb-1.

In the second part we present a novel method for using a quantum annealer to train a classifier to recognize events containing a Higgs boson decaying to two photons. We train that classifier using simulated proton-proton collisions at √s=8 TeV producing either a Standard Model Higgs boson decaying to two photons or a non-resonant Standard Model process that produces a two photon final state.

The production mechanisms of the Higgs boson are precisely predicted by the Standard Model based on its association with the mechanism of electroweak symmetry breaking. We measure the yield of Higgs bosons decaying to two photons in kinematic regions predicted to have very little contribution from a Standard Model Higgs boson and search for an excess of events, which would be evidence of either non-standard production or non-standard properties of the Higgs boson. We divide the events into disjoint categories based on kinematic properties and the presence of additional b-quarks produced in the collisions. In each of these disjoint categories, we use the razor kinematic variables to characterize events with topological configurations incompatible with typical configurations found from standard model production of the Higgs boson.

We observe an excess of events with di-photon invariant mass compatible with the Higgs boson mass and localized in a small region of the razor plane. We observe 5 events with a predicted background of 0.54 ± 0.28, which observation has a p-value of 10-3 and a local significance of 3.35σ. This background prediction comes from 0.48 predicted non-resonant background events and 0.07 predicted SM higgs boson events. We proceed to investigate the properties of this excess, finding that it provides a very compelling peak in the di-photon invariant mass distribution and is physically separated in the razor plane from predicted background. Using another method of measuring the background and significance of the excess, we find a 2.5σ deviation from the Standard Model hypothesis over a broader range of the razor plane.

In the second part of the thesis we transform the problem of training a classifier to distinguish events with a Higgs boson decaying to two photons from events with other sources of photon pairs into the Hamiltonian of a spin system, the ground state of which is the best classifier. We then use a quantum annealer to find the ground state of this Hamiltonian and train the classifier. We find that we are able to do this successfully in less than 400 annealing runs for a problem of median difficulty at the largest problem size considered. The networks trained in this manner exhibit good classification performance, competitive with the more complicated machine learning techniques, and are highly resistant to overtraining. We also find that the nature of the training gives access to additional solutions that can be used to improve the classification performance by up to 1.2% in some regions.

}, address = {1200 East California Boulevard, Pasadena, California 91125}, advisor = {Spiropulu, Maria}, } @phdthesis{10.7907/B0MD-F026, author = {Rogan, Christopher Sean}, title = {Searches for New Symmetries in pp Collisions with the Razor Kinematic Variables at √s = 7 TeV}, school = {California Institute of Technology}, year = {2013}, doi = {10.7907/B0MD-F026}, url = {https://resolver.caltech.edu/CaltechTHESIS:05072013-174540453}, abstract = {

The construction and LHC phenomenology of the razor variables MR, an event-by-event indicator of the heavy particle mass scale, and R, a dimensionless variable related to the transverse momentum imbalance of events and missing transverse energy, are presented.  The variables are used  in the analysis of the first proton-proton collisions dataset at CMS  (35 pb-1) in a search for superpartners of the quarks and gluons, targeting indirect hints of dark matter candidates in the context of supersymmetric theoretical frameworks. The analysis produced the highest sensitivity results for SUSY to date and extended the LHC reach far beyond the previous Tevatron results.  A generalized inclusive search is subsequently presented for new heavy particle pairs produced in √s = 7 TeV proton-proton collisions at the LHC using 4.7±0.1 fb-1 of integrated luminosity from the second LHC run of 2011.  The selected events are analyzed in the 2D razor-space of MR and R and the analysis is performed in 12 tiers of all-hadronic, single and double leptons final states in the presence and absence of b-quarks, probing the third generation sector using the event heavy-flavor content.   The search is sensitive to generic supersymmetry models with minimal assumptions about the superpartner decay chains. No excess is observed in the number or shape of event yields relative to Standard Model predictions. Exclusion limits are derived in the CMSSM framework with  gluino masses up to 800 GeV and squark masses up to 1.35 TeV excluded at 95% confidence level, depending on the model parameters. The results are also interpreted for a collection of simplified models, in which gluinos are excluded with masses as large as 1.1 TeV, for small neutralino masses, and the first-two generation squarks, stops and sbottoms are excluded for masses up to about 800, 425 and 400 GeV, respectively.

 

With the discovery of a new boson by the CMS and ATLAS experiments in the γ-γ and 4 lepton final states, the identity of the putative Higgs candidate must be established through the measurements of its properties. The spin and quantum numbers are of particular importance, and we describe a method for measuring the JPC of this particle using the observed signal events in the H to ZZ to 4 lepton channel developed before the discovery. Adaptations of the razor kinematic variables are introduced for the H to WW to 2 lepton/2 neutrino channel, improving the resonance mass resolution and increasing the discovery significance. The prospects for incorporating this channel in an examination of the new boson JPC is discussed, with indications that this it could provide complementary information to the H to ZZ* to 4 lepton final state, particularly for measuring CP-violation in these decays.

}, address = {1200 East California Boulevard, Pasadena, California 91125}, advisor = {Spiropulu, Maria}, }