@article{6282839591304f8daf447a5d60656808,
title = "FAIR AI models in high energy physics",
abstract = "The findable, accessible, interoperable, and reusable (FAIR) data principles provide a framework for examining, evaluating, and improving how data is shared to facilitate scientific discovery. Generalizing these principles to research software and other digital products is an active area of research. Machine learning models—algorithms that have been trained on data without being explicitly programmed—and more generally, artificial intelligence (AI) models, are an important target for this because of the ever-increasing pace with which AI is transforming scientific domains, such as experimental high energy physics (HEP). In this paper, we propose a practical definition of FAIR principles for AI models in HEP and describe a template for the application of these principles. We demonstrate the template{\textquoteright}s use with an example AI model applied to HEP, in which a graph neural network is used to identify Higgs bosons decaying to two bottom quarks. We report on the robustness of this FAIR AI model, its portability across hardware architectures and software frameworks, and its interpretability.",
keywords = "AI, FAIR, Higgs boson, high energy physics, ML",
author = "Javier Duarte and Haoyang Li and Avik Roy and Ruike Zhu and Huerta, {E. A.} and Daniel Diaz and Philip Harris and Raghav Kansal and Katz, {Daniel S.} and Kavoori, {Ishaan H.} and Kindratenko, {Volodymyr V.} and Farouk Mokhtar and Neubauer, {Mark S.} and {Eon Park}, Sang and Melissa Quinnan and Roger Rusack and Zhizhen Zhao",
note = "This research is supported by DE-SC0021258, DE-SC0021395, DE-SC0021225 and DE-SC0021396 from the Office of Advanced Scientific Computing Research (ASCR) within US Department of Energy (DOE) Office of Science, by the FAIR Data Program of the DOE, Office of Science, ASCR, under Contract Number DE-AC02-06CH11357, and by Laboratory Directed Research and Development funding from Argonne National Laboratory, provided by the Director, Office of Science, of the DOE under Contract No. DE-AC02-06CH11357. It used resources of the Argonne Leadership Computing Facility, which is a DOE Office of Science User Facility supported under Contract DE-AC02-06CH11357, and resources supported by the US National Science Foundation{\textquoteright}s Major Research Instrumentation program, Grant #1725729, as well as the University of Illinois at Urbana-Champaign. We thank Nikil Ravi, Pranshu Chaturvedi, and Huihuo Zheng for expert support creating and deploying ONNX and TensorRT engines, and Apptainer containers in the ThetaGPU supercomputer.",
year = "2023",
month = dec,
day = "1",
doi = "10.1088/2632-2153/ad12e3",
language = "English (US)",
volume = "4",
journal = "Machine Learning: Science and Technology",
issn = "2632-2153",
publisher = "Institute of Physics Publishing",
number = "4",
}