@article{3071678, title = "Benchmark data and model independent event classification for the large hadron collider", author = "Aarrestad, T. and van Beekveld, M. and Bona, M. and Boveia, A. and Caron, S. and Davies, J. and De Simone, A. and Doglioni, C. and Duarte, J.M. and Farbin, A. and Gupta, H. and Hendriks, L. and Heinrich, L. and Howarth, J. and Jawahar, P. and Jueid, A. and Lastow, J. and Leinweber, A. and Mamuzic, J. and Merényi, E. and Morandini, A. and Moskvitina, P. and Nellist, C. and Ngadiuba, J. and Ostdiek, B. and Pierini, M. and Ravina, B. and de Austri, R.R. and Sekmen, S. and Touranakou, M. and Vaškevičiūte, M. and Vilalta, R. and Vlimant, J.-R. and Verheyen, R. and White, M. and Wulff, E. and Wallin, E. and Wozniak, K.A. and Zhang, Z.", journal = "SciPost Physics", year = "2022", volume = "12", number = "1", publisher = "SciPost Foundation", doi = "10.21468/SCIPOSTPHYS.12.1.043", abstract = "We describe the outcome of a data challenge conducted as part of the Dark Machines (https://www.darkmachines.org) initiative and the Les Houches 2019 workshop on Physics at TeV colliders. The challenged aims to detect signals of new physics at the Large Hadron Collider (LHC) using unsupervised machine learning algorithms. First, we propose how an anomaly score could be implemented to define model-independent signal regions in LHC searches. We define and describe a large benchmark dataset, consisting of > 1 billion simulated LHC events corresponding to 10 fb−1 of proton-proton collisions at a center-of-mass energy of 13 TeV. We then review a wide range of anomaly detection and density estimation algorithms, developed in the context of the data challenge, and we measure their performance in a set of realistic analysis environments. We draw a number of useful conclusions that will aid the development of unsupervised new physics searches during the third run of the LHC, and provide our benchmark dataset for future studies at https://www.phenoMLdata.org. Code to reproduce the analysis is provided at https://github.com/bostdiek/DarkMachines-UnsupervisedChallenge. Copyright © T. Aarrestad et al." }