We develop, discuss, and compare several inference techniques to constrain
theory parameters in collider experiments. By harnessing the latent-space
structure of particle physics processes, we extract extra information from the
simulator. This augmented data can be used to train neural networks that
precisely estimate the likelihood ratio. The new methods scale well to many
observables and high-dimensional parameter spaces, do not require any
approximations of the parton shower and detector response, and can be evaluated
in microseconds. Using weak-boson-fusion Higgs production as an example
process, we compare the performance of several techniques. The best results are
found for likelihood ratio estimators trained with extra information about the
score, the gradient of the log likelihood function with respect to the theory
parameters. The score also provides sufficient statistics that contain all the
information needed for inference in the neighborhood of the Standard Model.
These methods enable us to put significantly stronger bounds on effective
dimension-six operators than the traditional approach based on histograms. They
also outperform generic machine learning methods that do not make use of the
particle physics structure, demonstrating their potential to substantially
improve the new physics reach of the LHC legacy results.
%0 Journal Article
%1 Brehmer2018Guide
%A Brehmer, Johann
%A Cranmer, Kyle
%A Louppe, Gilles
%A Pavez, Juan
%D 2018
%J Physical Review D
%K statistics
%N 5
%R 10.1103/physrevd.98.052004
%T A Guide to Constraining Effective Field Theories with Machine Learning
%U http://dx.doi.org/10.1103/physrevd.98.052004
%V 98
%X We develop, discuss, and compare several inference techniques to constrain
theory parameters in collider experiments. By harnessing the latent-space
structure of particle physics processes, we extract extra information from the
simulator. This augmented data can be used to train neural networks that
precisely estimate the likelihood ratio. The new methods scale well to many
observables and high-dimensional parameter spaces, do not require any
approximations of the parton shower and detector response, and can be evaluated
in microseconds. Using weak-boson-fusion Higgs production as an example
process, we compare the performance of several techniques. The best results are
found for likelihood ratio estimators trained with extra information about the
score, the gradient of the log likelihood function with respect to the theory
parameters. The score also provides sufficient statistics that contain all the
information needed for inference in the neighborhood of the Standard Model.
These methods enable us to put significantly stronger bounds on effective
dimension-six operators than the traditional approach based on histograms. They
also outperform generic machine learning methods that do not make use of the
particle physics structure, demonstrating their potential to substantially
improve the new physics reach of the LHC legacy results.
@article{Brehmer2018Guide,
abstract = {{ We develop, discuss, and compare several inference techniques to constrain
theory parameters in collider experiments. By harnessing the latent-space
structure of particle physics processes, we extract extra information from the
simulator. This augmented data can be used to train neural networks that
precisely estimate the likelihood ratio. The new methods scale well to many
observables and high-dimensional parameter spaces, do not require any
approximations of the parton shower and detector response, and can be evaluated
in microseconds. Using weak-boson-fusion Higgs production as an example
process, we compare the performance of several techniques. The best results are
found for likelihood ratio estimators trained with extra information about the
score, the gradient of the log likelihood function with respect to the theory
parameters. The score also provides sufficient statistics that contain all the
information needed for inference in the neighborhood of the Standard Model.
These methods enable us to put significantly stronger bounds on effective
dimension-six operators than the traditional approach based on histograms. They
also outperform generic machine learning methods that do not make use of the
particle physics structure, demonstrating their potential to substantially
improve the new physics reach of the LHC legacy results.}},
added-at = {2019-02-23T22:09:48.000+0100},
archiveprefix = {arXiv},
author = {Brehmer, Johann and Cranmer, Kyle and Louppe, Gilles and Pavez, Juan},
biburl = {https://www.bibsonomy.org/bibtex/2b4d2f3619c04f1fc146e22579b7135a6/cmcneile},
citeulike-article-id = {14579394},
citeulike-linkout-0 = {http://arxiv.org/abs/1805.00020},
citeulike-linkout-1 = {http://arxiv.org/pdf/1805.00020},
citeulike-linkout-2 = {http://dx.doi.org/10.1103/physrevd.98.052004},
day = 26,
doi = {10.1103/physrevd.98.052004},
eprint = {1805.00020},
interhash = {d628ae6e6ee9138f1758de1413927c7d},
intrahash = {b4d2f3619c04f1fc146e22579b7135a6},
issn = {2470-0010},
journal = {Physical Review D},
keywords = {statistics},
month = jul,
number = 5,
posted-at = {2018-05-02 08:41:49},
priority = {2},
timestamp = {2019-02-23T22:15:27.000+0100},
title = {{A Guide to Constraining Effective Field Theories with Machine Learning}},
url = {http://dx.doi.org/10.1103/physrevd.98.052004},
volume = 98,
year = 2018
}