<?xml version='1.0' encoding='UTF-8'?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="en" article-type="review-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">exposome</journal-id>
<journal-title-group>
<journal-title>Exposome</journal-title></journal-title-group>
<issn pub-type="epub">2635-2265</issn>
<publisher>
<publisher-name>Oxford University Press</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.1093/exposome/osaf017</article-id>
<article-id pub-id-type="publisher-id">osaf017</article-id>
<article-categories>
<subj-group subj-group-type="category-toc-heading">
<subject>Review</subject>
</subj-group>
<subj-group subj-group-type="category-taxonomy-collection"><subject>AcademicSubjects/MED00305</subject>
<subject>AcademicSubjects/MED00860</subject>
<subject>AcademicSubjects/SCI01040</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>High resolution mass spectrometry to investigate the human exposome: Where are We?</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-3430-9255</contrib-id>
<name><surname>Talavera Andújar</surname><given-names>Begoña</given-names></name><degrees>PhD</degrees>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization" degree-contribution="equal">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation" degree-contribution="lead">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis" degree-contribution="equal">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation" degree-contribution="equal">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology" degree-contribution="equal">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software" degree-contribution="equal">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation" degree-contribution="equal">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization" degree-contribution="lead">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Writing - original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft" degree-contribution="lead">Writing - original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Writing - review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing" degree-contribution="equal">Writing - review &amp; editing</role>
<xref ref-type="corresp" rid="osaf017-cor1"/>
<aff><institution>Luxembourg Centre for Systems Biomedicine (LCSB), University of Luxembourg</institution>, Belvaux, <country country="LU">Luxembourg</country></aff>
<email xlink:type="simple">begona.talavera@uni.lu</email>
</contrib>
<contrib contrib-type="author" corresp="yes">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-6868-8145</contrib-id>
<name><surname>Schymanski</surname><given-names>Emma L</given-names></name><degrees>Dr. rer. nat</degrees>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization" degree-contribution="equal">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation" degree-contribution="equal">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis" degree-contribution="equal">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition" degree-contribution="lead">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation" degree-contribution="equal">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology" degree-contribution="equal">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration" degree-contribution="lead">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources" degree-contribution="lead">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software" degree-contribution="equal">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision" degree-contribution="lead">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation" degree-contribution="equal">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization" degree-contribution="equal">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Writing - original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft" degree-contribution="equal">Writing - original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org" vocab-term="Writing - review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing" degree-contribution="equal">Writing - review &amp; editing</role>
<xref ref-type="corresp" rid="osaf017-cor1"/>
<aff><institution>Luxembourg Centre for Systems Biomedicine (LCSB), University of Luxembourg</institution>, Belvaux, <country country="LU">Luxembourg</country></aff>
<email xlink:type="simple">emma.schymanski@uni.lu</email></contrib>
</contrib-group>
<author-notes>
<corresp id="osaf017-cor1">Corresponding authors: Begoña Talavera Andújar, PhD, Luxembourg Centre for Systems Biomedicine (LCSB), University of Luxembourg, Belvaux, Luxembourg (<email>begona.talavera@uni.lu</email>) and Emma L. Schymanski, Dr. rer. nat., Luxembourg Centre for Systems Biomedicine (LCSB), University of Luxembourg, Belvaux, Luxembourg (<email>emma.schymanski@uni.lu</email>)</corresp>
</author-notes>
<pub-date pub-type="cover"><year>2026</year></pub-date>
<pub-date pub-type="collection" iso-8601-date="2026-01-15"><day>15</day><month>01</month><year>2026</year></pub-date>
<pub-date pub-type="epub" iso-8601-date="2025-12-22"><day>22</day><month>12</month><year>2025</year></pub-date>
<volume>6</volume><issue>1</issue>
<elocation-id>osaf017</elocation-id>
<history>
<date date-type="received"><day>28</day><month>09</month><year>2025</year></date>
<date date-type="rev-recd"><day>04</day><month>12</month><year>2025</year></date>
<date date-type="accepted"><day>10</day><month>12</month><year>2025</year></date>
<date date-type="corrected-typeset"><day>15</day><month>01</month><year>2026</year></date>
</history>
<permissions>
<copyright-statement>© The Author(s) 2025. Published by Oxford University Press.</copyright-statement>
<copyright-year>2025</copyright-year>
<license license-type="cc-by" xlink:href="https://creativecommons.org/licenses/by/4.0/">
<license-p>This is an Open Access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted reuse, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
</license>
</permissions>
<self-uri xlink:href="osaf017.pdf"/>
<abstract abstract-type="abstract"><title>Abstract</title>
<p>Despite the significant role of the environment in health and disease, the accurate assessment of environmental exposures remains underdeveloped compared to genetic factors. To address this, the concept of the exposome was introduced in 2005 as a complement to the genome. High-resolution mass-spectrometry (HRMS) has emerged as a key technology for the comprehensive assessment of the chemical exposome. However, non-target HRMS based exposomics still faces numerous challenges, with the majority of features detected by HRMS (the “dark matter” of the chemical exposome) remaining unannotated. The lack of standardized workflows across the field often results in poorly comparable studies. Nevertheless, many positive developments have arisen in recent years, with open data revealing interesting trends in HRMS coverage. This review will examine and discuss the entire non-target HRMS exposomics workflow, from experimental design (study design and sample preparation) to the computational analysis and biological interpretation. It will also delve into key concepts, including the sometimes blurred distinction between the metabolome and the chemical exposome and the importance of exposomics within the “omics cascade”. Visualizations are used to support this discussion, including a detailed look at the chemical coverage of key categories of open exposomics resources. The review ends by exploring current challenges and strategies to advance towards harmonized exposomics studies, which are essential for greater biological insights and personalized medicine goals.</p>
</abstract>
<kwd-group><kwd>exposomics</kwd><kwd>non-target screening</kwd><kwd>high-resolution mass-spectrometry (HRMS)</kwd><kwd>liquid chromatography (LC)</kwd><kwd>cheminformatics</kwd>
</kwd-group>
<funding-group>
<award-group award-type="grant">
<funding-source><institution-wrap><institution>Microbiomes in One Health</institution></institution-wrap></funding-source>
</award-group>
<award-group award-type="grant">
<funding-source><institution-wrap><institution>PRIDE doctoral research funding</institution></institution-wrap></funding-source>
<award-id>PRIDE/11823097</award-id>
</award-group>
<award-group award-type="grant">
<funding-source><institution-wrap><institution>Luxembourg National Research Fund (FNR)</institution><institution-id institution-id-type="DOI">10.13039/501100001866</institution-id></institution-wrap></funding-source>
</award-group>
<award-group award-type="grant">
<funding-source><institution-wrap><institution>Luxembourg National Research Fund (FNR)</institution><institution-id institution-id-type="DOI">10.13039/501100001866</institution-id></institution-wrap></funding-source>
<award-id>A18/BM/12341006</award-id>
</award-group>
</funding-group>
<counts>
<page-count count="22"/>
</counts>
</article-meta>
</front>
<body><sec sec-type="intro"><title>Introduction</title>
<p>The phenotype of an individual arises from the interplay between genes and environment. Since only a small proportion of chronic diseases can be attributed solely to genetic factors, it is now hypothesized that the majority (70% - 90%) are influenced by environmental factors, many of which remain unknown.<xref ref-type="bibr" rid="osaf017-B1"><sup>1</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref> Despite the significant role of the environment in health and disease, the accurate assessment of many environmental exposures remains underdeveloped compared to genetic factors.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref> Christopher Wild proposed the concept of the exposome in 2005 as a complement of the genome, defining it as “all life-course exposures (including risk factors), from the prenatal period onwards”.<xref ref-type="bibr" rid="osaf017-B3"><sup>3</sup></xref> This concept was extended in 2014 by Miller and Jones to: “the cumulative measure of environmental influences and associated biological responses throughout the lifespan, including exposures from the environment, diet, behavior, and endogenous processes”.<xref ref-type="bibr" rid="osaf017-B4"><sup>4</sup></xref> Recent collaborative discussions in 2024 and 2025 resulted in further revised definitions of the exposome and its research goals, to foster a common understanding in the field.<xref ref-type="bibr" rid="osaf017-B5 osaf017-B6 osaf017-B7"><sup>5-7</sup></xref></p>
<p><xref ref-type="fig" rid="osaf017-F1">Figure 1</xref> shows the three different research domains that have been described within the exposome.<xref ref-type="bibr" rid="osaf017-B8"><sup>8</sup></xref> The <italic>internal exposome</italic> comprises the internal biological processes as a result of an exposure such as oxidative stress, metabolism, and microbiome changes.<xref ref-type="bibr" rid="osaf017-B8 osaf017-B9 osaf017-B10"><sup>8-10</sup></xref> The internal chemical exposome also includes environmentally derived chemicals plus their transformation products found in cells, tissues, organs or organisms.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref> The <italic>general external exposome</italic> includes social, economic, and environmental factors, while the <italic>specific external exposome</italic> encompasses the individual’s immediate local environment (such as diet, alcohol, infectious agents, pollutants).<xref ref-type="bibr" rid="osaf017-B8 osaf017-B9 osaf017-B10"><sup>8-10</sup></xref></p>
<fig id="osaf017-F1"><label>Figure 1.</label><caption><p>The exposome concept and how the specific external, general external and internal exposome contribute towards health impacts. Modified from.<xref ref-type="bibr" rid="osaf017-B9"><sup>9</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B10"><sup>10</sup></xref></p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f1.png"/></fig>
<p>Unlike the genome, which remains relatively stable over time, the exposome varies on different timescales, requiring complex study designs.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref> The integration of different “omics” layers, known as multi-omics analysis, can offer a more comprehensive understanding of a biological system’s state.<xref ref-type="bibr" rid="osaf017-B11"><sup>11</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B12"><sup>12</sup></xref> Among these “omics” (see <xref ref-type="fig" rid="osaf017-F2">Figure 2A</xref>), metabolomics and exposomics emerge as the terminal downstream outcomes of the genome, reflecting the phenotype of a cell, tissue or organism, in response to diverse genetic or environmental influences over life.<xref ref-type="bibr" rid="osaf017-B13"><sup>13</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B14"><sup>14</sup></xref> Metabolomics and exposomics aim to investigate small molecules, typically ranging between 50 and 1200 Da,<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref> although this boundary can also be constrained by analytical reality such as instrument range of <italic>eg</italic>, <italic>m/z </italic>= 1000 or 2000.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref> Given the shared analytical scope, metabolomics and exposomics can be conceptually grouped as “small molecule omics.” Some of these small molecules are closely related with the genome and proteome, leading some to call them the “canaries of the genome”.<xref ref-type="bibr" rid="osaf017-B16"><sup>16</sup></xref> This metaphor underscores that even minor alterations, such as a single base change in a gene (especially in a metabolic enzyme), can potentially lead to a 10 000 fold-change in concentrations of specific small molecules.<xref ref-type="bibr" rid="osaf017-B16"><sup>16</sup></xref></p>
<fig id="osaf017-F2"><label>Figure 2.</label><caption><p>(A) The omics cascade from genome onwards, adapted from.<xref ref-type="bibr" rid="osaf017-B11"><sup>11</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B12"><sup>12</sup></xref> (B) The differences in chemical complexity of the different omics, adapted from.<xref ref-type="bibr" rid="osaf017-B16"><sup>16</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B17"><sup>17</sup></xref> Note that the colours represent the different “omes” (genes, proteins, metabolites).</p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f2.png"/></fig>
<p>The disparity in complexity in the different “omics” layers is shown in <xref ref-type="fig" rid="osaf017-F2">Figure 2B</xref>, which helps explain why genomics and transcriptomics are the most mature omics, followed by proteomics, then small molecule omics.<xref ref-type="bibr" rid="osaf017-B17"><sup>17</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B18"><sup>18</sup></xref> Current automated high-throughput techniques are able to (almost) completely cover the genome and proteome.<xref ref-type="bibr" rid="osaf017-B17"><sup>17</sup></xref> Gene sequencing requires a DNA sequencer, while protein characterization can be performed on a single type of high-resolution mass spectrometer.<xref ref-type="bibr" rid="osaf017-B16"><sup>16</sup></xref> In contrast, a wide range of analytical instrumentation is required to capture small molecules, explored further in section 2.4 below.</p>
<p>Since the border between the metabolome and exposome is not always clear-cut,<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B19"><sup>19</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B20"><sup>20</sup></xref> a distinction can be made between environmental exposure and the resulting biological response<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref> (see <xref ref-type="fig" rid="osaf017-F3">Figure 3</xref>). The metabolome refers to the complete set of small molecules (ie, metabolites) present within a biological sample such as a cell, tissue, organ or organism at a given time.<xref ref-type="bibr" rid="osaf017-B17"><sup>17</sup></xref> As these metabolites arise from both endogenous and exogenous sources, the metabolome is considered a key measure for exposome research.<xref ref-type="bibr" rid="osaf017-B19"><sup>19</sup></xref> In this context, the metabolome can be considered as a subset of the exposome, often referred to as the internal chemical exposome.<xref ref-type="bibr" rid="osaf017-B20"><sup>20</sup></xref> Thus, while all metabolites found in a biological sample can be considered part of the exposome, not all chemicals within the exposome belong to the metabolome. In contrast, the exposome is a broader concept that encompasses not only chemicals but also all physical, biological, and psychosocial influences that may impact health, as described above and illustrated in <xref ref-type="fig" rid="osaf017-F1">Figure 1</xref>.</p>
<fig id="osaf017-F3"><label>Figure 3.</label><caption><p>The chemicals part of the metabolome, exposome and the overlap. Adapted from.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B20"><sup>20</sup></xref> Note that gut microbiota is illustrated as a major microbial contributor to metabolic processes, however other microbiota such as saliva, nasal and skin, among others, can also contribute.</p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f3.png"/></fig>
<p>This review will specifically delve into common workflows for measuring the <italic>chemical exposome</italic>, with a particular focus on non-target high-resolution mass spectrometry (HRMS) coupled to liquid chromatography (LC). Although standardized workflows remain an area of active research (discussed further in<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B20"><sup>20</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref>) they can be divided into three main components (<xref ref-type="fig" rid="osaf017-F4">Figure 4</xref>), which have be used to construct the subsequent sections of this article: (1) <italic>experimental workflow</italic>, which encompasses experimental design, sample collection, sample preparation and data acquisition; (2) <italic>computational workflow</italic>, which includes data pre-processing and compound annotation; and (3) <italic>statistical analysis</italic> and <italic>biological interpretation</italic>.</p>
<fig id="osaf017-F4"><label>Figure 4.</label><caption><p>Common workflow steps to investigate the human chemical exposome.</p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f4.png"/></fig>
<p>A recent and extensive exposomics review was published in 2024 by Lai et al.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> however the present review has a different focus. Specifically, this manuscript emphasizes the conceptual, and often blurred, distinctions between the metabolome and the exposome, as well as the analytical and computational workflows employed in non-target HRMS-based exposomics studies. These workflows are illustrated with visualizations to facilitate understanding, and the manuscript also discusses key challenges and strategies to advance towards harmonized studies. This review and the references provided are intended for readers entering the exposomics field, such as PhD students and early-career researchers but will be also helpful to any researcher investigating the human exposome.</p>
</sec>
<sec><title>Experimental workflows</title>
<sec><title>Experimental design</title>
<p>Individuals may encounter millions of chemical exposures throughout their lifetime, where some exposures may exert lifelong consequences, while childhood exposures may increase the risk of developing disease later in life.<xref ref-type="bibr" rid="osaf017-B19"><sup>19</sup></xref> The design of prospective longitudinal studies (<xref ref-type="fig" rid="osaf017-F5">Figure 5</xref>), which collect samples at various life stages including perinatal, childhood, and adulthood, holds inherent advantages over those that gather single samples from individuals who have already developed the disease.<xref ref-type="bibr" rid="osaf017-B19"><sup>19</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B22"><sup>22</sup></xref> Although challenging, promising initiatives are currently underway to provide such longitudinal data, such as All of Us<xref ref-type="bibr" rid="osaf017-B23"><sup>23</sup></xref> and HELIX.<xref ref-type="bibr" rid="osaf017-B24"><sup>24</sup></xref> While all exposomics studies should undergo independent validation to ensure the reproducibility, this poses significant challenges due to variations in exposures across populations.<xref ref-type="bibr" rid="osaf017-B22"><sup>22</sup></xref> To ensure robust scientific conclusions, several key factors must be considered, such as the number of samples, the types of samples (matrix selection) and their storage conditions.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref></p>
<fig id="osaf017-F5"><label>Figure 5.</label><caption><p>Human life timeline (top) and proposed longitudinal study for an exposomics study where both environmental and biological samples are collected. AD; Alzheimer’s disease, MCI; Mild Cognitive Impairment, PD; Parkinson’s disease, RBD; REM- sleep behavior disorder. Note that while neurodegenerative diseases were chosen for illustrative purposes, this conceptual framework can be applied to other diseases such as cancer.</p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f5.png"/></fig>
<p>The number of samples required for an small molecule omics experiment depends on the biological variability of the studied system and the analytical variability of the technology employed.<xref ref-type="bibr" rid="osaf017-B25"><sup>25</sup></xref> Generally, hundreds or thousands of subjects need to be investigated to obtain robust results, although sample numbers of 3-20 per group can be suitable for generating preliminary and/or pilot data.<xref ref-type="bibr" rid="osaf017-B25"><sup>25</sup></xref> Such preliminary data can then be used to estimate the number of samples needed to achieve certain statistical power (eg, 0.8), using open tools such as G*Power,<xref ref-type="bibr" rid="osaf017-B26"><sup>26</sup></xref> MetaboAnalyst<xref ref-type="bibr" rid="osaf017-B27"><sup>27</sup></xref> and MultiPower,<xref ref-type="bibr" rid="osaf017-B28"><sup>28</sup></xref> which estimates sample sizes for multi-omics studies.</p>
</sec>
<sec><title>Sample collection</title>
<p>The matrix selection is a critical aspect of the study design, affected by multiple factors including the cost of storage and collection devices, research question, technical feasibility and expected presence of specific chemicals, as some chemicals accumulate specifically in some tissues.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B29"><sup>29</sup></xref> To date, blood (plasma or serum) and urine are the most studied matrices.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B22"><sup>22</sup></xref> While biological samples can provide insights into potential biological responses (ie, endogenous compounds) to toxicants or pollutants (ie, exogenous compounds), these exogenous compounds are typically present at trace levels compared to the endogenous ones and thus stretch the dynamic range of current instrumentation,<xref ref-type="bibr" rid="osaf017-B30"><sup>30</sup></xref> as detailed below. Consequently, it may be advantageous to also incorporate non-target screening of environmental samples such as dust to first build a picture of potential contaminants, before analysing biological samples.</p>
<p>The collection and storage of many biological samples (at −80°C) for long-term longitudinal studies (<xref ref-type="fig" rid="osaf017-F5">Figure 5</xref>) can be costly. Dried Blood Spot (DBS) samples are compact, easy to collect and can be shipped at ambient temperature. However, the analysis of DBS is not as standardized as for plasma or serum, and it is not yet clear if there is sufficient sample material for non-target analysis.<xref ref-type="bibr" rid="osaf017-B31"><sup>31</sup></xref> Urine is a well-studied matrix, easily accessible and less invasive than blood,<xref ref-type="bibr" rid="osaf017-B22"><sup>22</sup></xref> while fecal analysis can yield valuable insights into gut microbiota metabolites, with relatively easy sample collection. Although cerebrospinal fluid (CSF) provides valuable information on brain metabolism, the collection of CSF samples is invasive, and the recruitment of healthy volunteers is more difficult, such that studies with large sample sizes involve significant commitments and dedication. The concentrations of exogenous chemicals in this matrix are typically very low compared with other biological samples such as blood. Other sample types that can be collected to answer specific questions include hair, teeth and nails, which can help to understand historical exposures, although determining the timing of exposure can be laborious.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref> The study of the specific external exposome can be done by collecting household dust samples with a vacuum cleaner,<xref ref-type="bibr" rid="osaf017-B32"><sup>32</sup></xref> although these samples are prone to variability. Passive samplers such as silicone wristbands allow a more individual assessment of the exposure to chemicals, although the silicone used in wristbands can lead to analytical interferences if they are not properly cleaned before use and the sample preparation may be more tedious compared to household dust.<xref ref-type="bibr" rid="osaf017-B33"><sup>33</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B34"><sup>34</sup></xref></p>
<p>Depending on the aim, two different approaches can be used when analysing the chemical exposome: (1) <italic>target or targeted</italic> studies, which focus on identifying a limited number of specific chemicals (hypothesis driven) and (2) <italic>non-target or untargeted</italic> studies, which are hypothesis generating and aim to identify as many compounds as possible.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B35"><sup>35</sup></xref> Typically, non-target studies are <italic>semiquantitative</italic>, which use peak height or area as direct readouts or estimate the concentrations relative to quantifiable compounds such as internal standards spiked at known concentrations. In contrast, target studies frequently employ <italic>absolute quantitation</italic>, which involves calculating the exact concentration via calibration curves.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> The sections below focus on non-target HRMS studies, which can be used to generate hypotheses and insights for designing subsequent quantitative targeted studies.</p>
</sec>
<sec><title>Sample preparation</title>
<p>Sample preparation (or pretreatment) prior to instrumental analysis aims to reduce interferences, separate and concentrate analytes.<xref ref-type="bibr" rid="osaf017-B36"><sup>36</sup></xref> Due to the chemical diversity of the exposome, there is no universal method that captures all chemicals present in a sample<xref ref-type="bibr" rid="osaf017-B25"><sup>25</sup></xref> and a combination of different sample preparation approaches can cover a broader range of the chemical space.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> However, this is limited by increased costs in resources and time.</p>
<p>Sample preparation methods for non-target analysis of biological/environmental samples should be:<xref ref-type="bibr" rid="osaf017-B37"><sup>37</sup></xref> (1) unselective (to cover a wide range of chemicals), (2) simple and fast (to prevent chemical loss/degradation during preparation), (3) reproducible, and, for biological samples, (4) incorporate a quenching step. The rapid stopping or quenching of metabolism is an essential step to produce a stable extract that reflects the endogenous metabolite levels present in the original biological system.<xref ref-type="bibr" rid="osaf017-B37"><sup>37</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B38"><sup>38</sup></xref> The sample preparation method is highly dependent on the matrix (eg, cells, plasma, or tissues), and analytical platform employed. For instance, although protein precipitation is the first step for plasma samples, tissues must be homogenized first.<xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref> Furthermore, while Gas Chromatography coupled with MS (GC-MS) often requires a derivatization step to make the compounds sufficiently volatile for the analysis,<xref ref-type="bibr" rid="osaf017-B40"><sup>40</sup></xref> the sample preparation for Liquid Chromatography coupled with MS (LC-MS) analysis is simpler and typically does not require this step.<xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref></p>
<p>Liquid-liquid extraction (LLE), often including a protein precipitation step, and dilute and shoot (DNS) are frequently employed sample pretreatment methods in exposomics studies. Other sample preparation methods include solid-phase extraction (SPE) and dispersive solid-phase extraction, such as QuEChERS.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B36"><sup>36</sup></xref> While LLE and DNS offer broad analytical coverage, they are susceptible to matrix effects and interferences, which can limit reproducibility and sensitivity. In contrast, SPE and QuEChERS typically enhance sensitivity and reproducibility, albeit often at the cost of reduced chemical coverage.<xref ref-type="bibr" rid="osaf017-B36"><sup>36</sup></xref> Further information can be found in the NORMAN guidance for non-target screening<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref> and other publications on sample preparation for metabolomics<xref ref-type="bibr" rid="osaf017-B25"><sup>25</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B37"><sup>37</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref> and exposomics.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B36"><sup>36</sup></xref></p>
</sec>
<sec><title>Data acquisition</title>
<p>While HRMS has emerged as the leading technique to investigate the chemical exposome, there is no “one size fits all” analytical method and a combination of different separation and ionization platforms is needed to capture the relevant chemical space (<xref ref-type="fig" rid="osaf017-F6">Figure 6</xref>).<xref ref-type="bibr" rid="osaf017-B35"><sup>35</sup></xref> Flow-injection is very fast, but cannot separate any isobars, while chromatographic separation introduces analytes slowly into the mass spectrometer, separating more isobars and reducing the risk of ion suppression, source fouling and coelution. A mobile phase, either liquid or gas, transports the analytes through a stationary phase-fixed system<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> (see top part of <xref ref-type="fig" rid="osaf017-F6">Figure 6</xref>).</p>
<fig id="osaf017-F6"><label>Figure 6.</label><caption><p>Separation analytical methods and their applicability range based on the polarity of the chemicals are displayed on the top part of the figure, while the different ionization techniques and their applicability range are displayed on the bottom. Examples of potentially endogenous (blue) and exogenous (gray) compounds are displayed. Adapted from Zeki et al.<xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref> and Hollender et al.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref> Abbreviations: GC, gas chromatography; HILIC, Hydrophilic interaction chromatography; LC, liquid chromatography; RP, Reversed Phase; EI, electron ionization; ESI, electrospray ionization; APCI, atmospheric pressure chemical ionization; APPI, atmospheric pressure photoionization; VOCs, Volatile Organic Compounds; PFAS, Perfluoroalkyl and Polyfluoroalkyl Substances; PAHs, Polycyclic Aromatic Hydrocarbons; IC, Ion Exchange; CE, Capillary Electrophoresis.</p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f6.png"/></fig>
<p>GC is frequently used for the analysis of volatile and thermally stable compounds such as fatty acids, and organic compounds (see left part of <xref ref-type="fig" rid="osaf017-F6">Figure 6</xref> for examples). Due to the high temperatures, a derivatization step is often required before the analysis, which may result in compound loss<xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B41"><sup>41</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B42"><sup>42</sup></xref> and changes the resulting mass spectra. The most common ionization technique applied in GC is Electron Ionization (EI), which provides robust, and highly reproducible fragmentation patterns.<xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref></p>
<p>Currently, LC coupled with an electrospray ionisation (ESI) source is probably the most used HRMS-based platform for non-target studies due to the soft ionization process, high dynamic range and versatility.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref> LC-HRMS does not typically require derivatization and is highly applicable to the analysis of a broad range of medium to very polar compounds,<xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B41"><sup>41</sup></xref> with several examples shown in the right part of <xref ref-type="fig" rid="osaf017-F6">Figure 6</xref> Using both positive (+) and negative (−) ionization modes increases the coverage. Reversed Phase (RP) columns are widely employed to separate polar and medium polar compounds, providing relatively reliable, robust and reproducible results. Hydrophilic Interaction Liquid Chromatography (HILIC) columns improve the separation of very polar compounds minimally retained by RP,<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B42"><sup>42</sup></xref> but can be less reproducible. Alternative ionisation techniques such as Atmospheric Pressure Photoionization (APPI) and Atmospheric Pressure Chemical Ionization (APCI) can extend the LC range almost into the GC range (<xref ref-type="fig" rid="osaf017-F6">Figure 6</xref>).</p>
<p>Despite recent progress, current analytical platforms still lack the dynamic range to simultaneously detect trace-level exogenous compounds and high-abundance endogenous metabolites (see <xref ref-type="fig" rid="osaf017-F7">Figure 7</xref> for an example based on LC-ESI-HRMS). The integration of Ion Mobility Spectrometry (IMS) into HRMS workflows has been gaining more attention as it can improve the dynamic range and throughput of the analysis.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B18"><sup>18</sup></xref> Coupling IMS with HRMS offers the ability to resolve isomers or isobars that are difficult to distinguish using only HRMS, and adds Collison Cross Section (CCS) information to the retention time, MS1 and MS2 data, providing complementary information for compound identification and/or annotation.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B35"><sup>35</sup></xref> Depending on the instrument, including IMS also reduces the complexity in the MS1 and MS2 spectra,<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> but comes at a cost of sensitivity and more difficult data analysis.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B43"><sup>43</sup></xref> Typical commercial IMS instruments do not yet offer sufficient resolution to resolve isomers within measurement and prediction errors.<xref ref-type="bibr" rid="osaf017-B44"><sup>44</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B45"><sup>45</sup></xref></p>
<fig id="osaf017-F7"><label>Figure 7.</label><caption><p>Concentration range of the different components of the human metabolome and internal chemical exposome as well as coverage by LC-ESI-HRMS. Adapted from.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B17"><sup>17</sup></xref></p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f7.png"/></fig>
<p>Quadrupole Time-of-Flight (Q-TOF) and Orbitrap are the most commonly used mass analyzers in non-target studies, as they provide high resolution.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B42"><sup>42</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B46"><sup>46</sup></xref> A Q-TOF analyzer maintains the selectivity of the quadrupole and provides a mass resolution of approximately 40 000-60 000. Orbitrap analyzers reach resolutions between 250 000 to even 1 000 000 for ions with <italic>m/z</italic> below 300.<xref ref-type="bibr" rid="osaf017-B46"><sup>46</sup></xref> Triple Quadrupole (QQQ) analyzers are often used for targeted analysis to confirm potential biomarkers due to high sensitivity and selectivity,<xref ref-type="bibr" rid="osaf017-B41"><sup>41</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B42"><sup>42</sup></xref> but are not suitable for non-target studies due to their low resolution.<xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref></p>
<p>Two acquisition methods are often used in non-target HRMS studies: Data-Dependent Acquisition (DDA), and Data-Independent Acquisition (DIA). DDA is typically more common, since MS2 spectra can be associated with a specific precursor,<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B48"><sup>48</sup></xref> resulting in simpler processing compared with DIA.<xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B49"><sup>49</sup></xref> While low intensity features may not be selected for fragmentation, this can be alleviated with the creation of inclusion lists, supported by either open software solutions such as iterative exclusion lists from IE-Omics,<xref ref-type="bibr" rid="osaf017-B50"><sup>50</sup></xref> or instrument software such as AcquireX from ThermoFisher. DIA mode operates in a less-selective manner, as the instrument selects all the peaks within the isolation window, regardless of the peak intensity.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref> Thus, the MS2 spectra are information-rich collections including fragments from low intensity ions, but they lack the precursor-fragment information<xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref> and require deconvolution to link the specific precursor to the MS2 spectra.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B48"><sup>48</sup></xref> This can be performed by open software such as MS-DIAL.<xref ref-type="bibr" rid="osaf017-B51"><sup>51</sup></xref> All-Ion Fragmentation (AIF), and Sequential Window Acquisition of all Theoretical Fragmention Spectra (SWATH) are two commonly employed DIA methods.</p>
<p>In practice, method selection depends strongly on the research question, instrument availability and analytical expertise, among others. While LC-MS (eg, QQQ) remains the preferred option for the quantification of a specific and small number of compounds (target studies), LC-HRMS and GC-HRMS (eg, Orbitrap) are employed for non-target exposomics studies generating larger and more complex datasets that make the data preprocessing steps more challenging. Therefore, the analytical considerations detailed above, together with the references provided, can serve as practical guidance for selecting the most appropriate analytical platform and acquisition mode for a given a study.</p>
</sec>
</sec>
<sec><title>Computational workflows</title>
<sec><title>Non-target HRMS data pre-processing</title>
<p>The main objective of data pre-processing (or feature detection) is to transform the raw data files into a format that simplifies the access to the distinct characteristics of every observed feature in each sample analyzed, ie, a feature list.<xref ref-type="bibr" rid="osaf017-B52"><sup>52</sup></xref> A “feature” does not necessarily refer to a specific chemical, but rather it typically refers to a peak (or signal) identified at a specific retention time, and <italic>m/z</italic>, containing spectral information such as MS1 and/or MS2.<xref ref-type="bibr" rid="osaf017-B35"><sup>35</sup></xref> Features are also called “<italic>m/z</italic> features”, “ion features” or “ion peaks”.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> The resulting feature list (<xref ref-type="fig" rid="osaf017-F8">Figure 8</xref>, bottom right) can be then employed for various purposes, including feature prioritization, compound annotation, and statistics and typically contain the retention time, <italic>m/z</italic>, and peak area and/or intensity of each feature from each raw data file.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B52 osaf017-B53 osaf017-B54"><sup>52-54</sup></xref></p>
<fig id="osaf017-F8"><label>Figure 8.</label><caption><p>Data preprocessing steps for LC-HRMS raw data. First, data is centroided and noise is removed. Next, EICs are generated and a peak-picking algorithm is applied to detect true peaks. Finally, peaks are grouped across samples, and retention time alignment is performed. After that, a gap filling step can be performed to reduce the number of missing values. Adapted from.<xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B60"><sup>60</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B66"><sup>66</sup></xref> Abbreviations: RT, Retention Time; <italic>m/z</italic>, mass-to-charge ratio.</p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f8.png"/></fig>
<p>Data pre-processing steps include data conversion (if vendor software is not used), centroiding, filtering step for noise removal, generation of Extracted Ion Chromatograms (EICs), peak picking, peak grouping across samples, and retention time alignment (<xref ref-type="fig" rid="osaf017-F8">Figure 8</xref>).<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref> Software approaches include vendor software such as Compound Discoverer (ThermoFisher), MassHunter Profinder (Agilent), MetaboScape (Bruker) and Progenesis QI (Waters), as well as open software including MS-DIAL,<xref ref-type="bibr" rid="osaf017-B51"><sup>51</sup></xref> MZmine,<xref ref-type="bibr" rid="osaf017-B55"><sup>55</sup></xref> OpenMS,<xref ref-type="bibr" rid="osaf017-B56"><sup>56</sup></xref> XCMS,<xref ref-type="bibr" rid="osaf017-B57"><sup>57</sup></xref> and patRoon.<xref ref-type="bibr" rid="osaf017-B58"><sup>58</sup></xref> Recent reviews provide a comprehensive overview of the start of the art of data pre-processing software.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B20"><sup>20</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B59"><sup>59</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B60"><sup>60</sup></xref> Since different instrument vendors use different formats, conversion of the raw data files into an open format such as mzML or mzXML<xref ref-type="bibr" rid="osaf017-B53"><sup>53</sup></xref> is required for open approaches, typically using ProteoWizard,<xref ref-type="bibr" rid="osaf017-B61"><sup>61</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B62"><sup>62</sup></xref> although some software now embed this conversion, including MS-DIAL<xref ref-type="bibr" rid="osaf017-B51"><sup>51</sup></xref> and patRoon.<xref ref-type="bibr" rid="osaf017-B58"><sup>58</sup></xref> Data acquisition can be done in either profile or centroid mode; the centroiding of profile data is an important data reduction step (see top part of <xref ref-type="fig" rid="osaf017-F8">Figure 8</xref>),<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref> often performed together with the data conversion using ProteoWizard.<xref ref-type="bibr" rid="osaf017-B61"><sup>61</sup></xref> While ProteoWizard offers both vendor-specific or general algorithms, the use of vendor-specific algorithms is recommended<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref> The quality of the conversion using ProteoWizard hinges on the vendor type—while the ThermoFisher conversion yields high quality results, this is not the case for Waters.<xref ref-type="bibr" rid="osaf017-B63"><sup>63</sup></xref></p>
<p>Once data is centroided, a filtering step is applied to suppress or reduce the random analytical noise, which is always present in the acquired MS data.<xref ref-type="bibr" rid="osaf017-B53"><sup>53</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B64"><sup>64</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B65"><sup>65</sup></xref> Noise is often removed via smoothing.<xref ref-type="bibr" rid="osaf017-B64"><sup>64</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B66"><sup>66</sup></xref> Methods include linear weighted moving average,<xref ref-type="bibr" rid="osaf017-B51"><sup>51</sup></xref> Savitzky-Golay smoothing,<xref ref-type="bibr" rid="osaf017-B67"><sup>67</sup></xref> moving average,<xref ref-type="bibr" rid="osaf017-B67"><sup>67</sup></xref> and binomial filter.<xref ref-type="bibr" rid="osaf017-B68"><sup>68</sup></xref> MS-DIAL uses the linear weighted moving average by default, although it supports all the aforementioned approaches.<xref ref-type="bibr" rid="osaf017-B51"><sup>51</sup></xref> After the EIC generation, peak picking is performed to determine the area under the peak.<xref ref-type="bibr" rid="osaf017-B52"><sup>52</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B53"><sup>53</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B66"><sup>66</sup></xref> This requires the establishment of criteria (ie, parameters) to distinguish true peaks from noise<xref ref-type="bibr" rid="osaf017-B64"><sup>64</sup></xref> such as setting a minimum intensity threshold and an estimated chromatographic peak width, establishing a maximum <italic>m/z</italic> error (eg, 0.001 Da for a Q-TOF instrument and 5 ppm for an Orbitrap), and ensuring that identified peaks are present in a significant proportion of the samples.<xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B64"><sup>64</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B65"><sup>65</sup></xref> Next, the selected peaks are grouped across samples,<xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref> and an alignment step is needed to correct retention time differences between runs (samples).<xref ref-type="bibr" rid="osaf017-B53"><sup>53</sup></xref> The alignment algorithm often requires a reference sample (eg, pooled Quality Control [QC] sample) to correct the retention time differences, and this choice can have a significant impact on the results.<xref ref-type="bibr" rid="osaf017-B53"><sup>53</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B65"><sup>65</sup></xref></p>
<p>The selection of parameters for data preprocessing is a critical step in the exposomics analysis,<xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref> as inadequate parameter selection can lead to biased results. Since exposomics seeks to identify highly abundant endogenous compounds along with exogenous small molecules that are often present at trace levels (see <xref ref-type="fig" rid="osaf017-F7">Figure 7</xref>), there are no universal parameters that can effectively capture the chemical complexity of the human exposome currently.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> While approaches such as IPO<xref ref-type="bibr" rid="osaf017-B69"><sup>69</sup></xref> can be used to assist in parameter selection, they should be employed with a degree of caution, as they tend to discard low abundant or rare peaks, which may be trace level exogenous molecules of relevance for the exposomics question. Recently proposed quality assurance/quality control (QA/QC) guidelines support the exposomics community in their data preprocessing choices,<xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref> see further details in Section 5.</p>
</sec>
<sec><title>Compound annotation</title>
<p>The annotation of small molecules remains a major challenge in non-target HRMS based metabolomics and exposomics studies, as the majority of features detected (around 80%) remain unknown,<xref ref-type="bibr" rid="osaf017-B70"><sup>70</sup></xref> although experts continue to debate the fraction. High abundant peaks, with MS2 available, usually represent &lt;10% of the detected features by non-target HRMS, while the majority (60%-70%) are low abundant peaks without fragmentation information.<xref ref-type="bibr" rid="osaf017-B71"><sup>71</sup></xref> <italic>Annotation</italic> involves associating an identified MS feature with a specific chemical identity, while <italic>identification</italic> is the process of verifying that the annotated compound corresponds to the proposed chemical (ie, confirming the annotation with the reference standard).<xref ref-type="bibr" rid="osaf017-B72"><sup>72</sup></xref> However, the lack of availability of chemical reference standards for given molecules of interest represents a major bottleneck in exposomics/metabolomics studies, complicating biological interpretations.<xref ref-type="bibr" rid="osaf017-B73"><sup>73</sup></xref></p>
<p>The large number of unannotated features in non-target studies is a common subject of debate. Recently, Giera et al.<xref ref-type="bibr" rid="osaf017-B74"><sup>74</sup></xref> suggested that most (&gt;70%) of the unannotated features in non-target LC-HRMS experiments are in-source fragments (ISFs), concluding that the dark metabolome may be smaller than previously thought. However, the results were based on a 931 K compound library that is not publicly disclosed, while the formation and recognition of ISFs is highly dependent on multiple parameters including source voltages, instrument design, matrix type, extraction methods, analyte concentration and data preprocessing workflow.<xref ref-type="bibr" rid="osaf017-B75"><sup>75</sup></xref> Moreover, many of the ISFs observed in highly concentrated synthetic chemical standard mixes may not be detected in complex biological samples. Previous studies, in contrast, have reported that ISFs entail ∼2%-25% of all detected ions.<xref ref-type="bibr" rid="osaf017-B75 osaf017-B76 osaf017-B77"><sup>75-77</sup></xref> While ISFs can be problematic, they can also be intentionally enhanced to improve annotation confidence<xref ref-type="bibr" rid="osaf017-B78"><sup>78</sup></xref> and modern workflows are increasingly accounting for them.<xref ref-type="bibr" rid="osaf017-B75"><sup>75</sup></xref> These different estimates highlight the current lack of consensus and harmonization in the field. While high prevalence of ISFs would imply that the dark metabolome is smaller than previously thought, assuming that most of the features identified are known, lower estimates would indicate that although ISFs remain relevant, they may represent a relatively small subset of detected features.</p>
<p>Non-target HRMS studies generate vast amounts of data, necessitating various computational strategies such as suspect screening and non-target screening (top part of <xref ref-type="fig" rid="osaf017-F9">Figure 9A</xref>). While suspect screening approaches use lists of chemicals that could potentially be present in the samples (ie, suspect lists of certain chemical classes or organisms/matrices) for more efficient discovery, non-target screening approaches aim to identify as many compounds as possible via tandem mass spectral libraries or database search (eg, via in silico fragmentation software), as shown in the bottom part of <xref ref-type="fig" rid="osaf017-F9">Figure 9A</xref>. A detailed glossary of terms can be found in the 2023 NORMAN guidance.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref></p>
<fig id="osaf017-F9"><label>Figure 9.</label><caption><p>(A) Generic computational workflow for target and non-target exposomics studies.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B35"><sup>35</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B79"><sup>79</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B80"><sup>80</sup></xref> (B) Identification confidence levels by Schymanski et al.<xref ref-type="bibr" rid="osaf017-B81"><sup>81</sup></xref> (left), and proposed minimum data requirements for level 2a and 3a annotations using MS-DIAL and patRoon software (right). Similar approaches could be done with other software such as <bold>MZmine</bold><xref ref-type="bibr" rid="osaf017-B55"><sup>55</sup></xref> <bold>and LipidMatch</bold>.<xref ref-type="bibr" rid="osaf017-B82"><sup>82</sup></xref></p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f9.png"/></fig>
<p>Compound annotation is a fundamental step to convert raw HRMS data into meaningful biological information.<xref ref-type="bibr" rid="osaf017-B35"><sup>35</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B71"><sup>71</sup></xref> Since the amount of information available for identification varies, it is essential that the confidence assignment of each feature is transparent.<xref ref-type="bibr" rid="osaf017-B35"><sup>35</sup></xref> Several confidence level schemes exist, including the 2007 Metabolomics Standards Initiative (MSI),<xref ref-type="bibr" rid="osaf017-B83"><sup>83</sup></xref> the 2014 guidelines for HRMS data with an environmental focus<xref ref-type="bibr" rid="osaf017-B81"><sup>81</sup></xref> (left part of <xref ref-type="fig" rid="osaf017-F9">Figure 9B</xref>), 2020 guidelines for IMS<xref ref-type="bibr" rid="osaf017-B84"><sup>84</sup></xref> and 2022 guidelines for PFAS<xref ref-type="bibr" rid="osaf017-B85"><sup>85</sup></xref> and GC-HRMS.<xref ref-type="bibr" rid="osaf017-B86"><sup>86</sup></xref> The 2014 levels shown in <xref ref-type="fig" rid="osaf017-F9">Figure 9B</xref> range from Level 1 (confirmed structure with reference standard), to Level 5 (only a <italic>m/z</italic> is known).<xref ref-type="bibr" rid="osaf017-B87"><sup>87</sup></xref> According to metabolomics terminology conventions, only Level 1 can be considered identifications, while the rest (Level 2-5) are annotations. In downstream analyses, it is recommended to base biological interpretations primarily on Level 1 identifications, however, this is often hampered by the limited availability of chemical standards. Consequently, Level 2 annotations are frequently used as the next most reliable basis for interpretation, whereas Level 3-5 should be interpreted with caution, serving mainly for prioritization for future validation efforts.</p>
<p>Several criteria are used to assign the identification level of each feature, including the MS1, retention time, fragmentation pattern (MS2), CCS (if available) and experimental data.<xref ref-type="bibr" rid="osaf017-B71"><sup>71</sup></xref> However, although different classification systems have been proposed,<xref ref-type="bibr" rid="osaf017-B38"><sup>38</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B81"><sup>81</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B83"><sup>83</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B88"><sup>88</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B89"><sup>89</sup></xref> currently there is no standardized system for compound annotation integrated in the processing workflows, making the comparison of results between studies challenging.<xref ref-type="bibr" rid="osaf017-B71"><sup>71</sup></xref> This necessitates a degree of “translation” between software outputs (see <italic>eg</italic>, <xref ref-type="fig" rid="osaf017-F9">Figure 9B</xref>, right). While the use of False Discovery Rates (FDR), as done in other omics fields, has been proposed, estimating total FDR for compound identification in small molecule omics is still a nascent challenge in the field.<xref ref-type="bibr" rid="osaf017-B90"><sup>90</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B91"><sup>91</sup></xref> The use of identification probability was proposed recently as an alternative to the identification levels.<xref ref-type="bibr" rid="osaf017-B91"><sup>91</sup></xref> However, the probability depends on the reference library size and treats all candidates equally, such that smaller reference libraries can artificially lead to high identification probabilities, while larger libraries (such as those more applicable to exposomics) will potentially yield too many apparently equally-valid candidates with very low probabilities to support meaningful outcomes. Identification levels can be assigned automatically in some patRoon workflows,<xref ref-type="bibr" rid="osaf017-B58"><sup>58</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B92"><sup>92</sup></xref> while the NORMAN Network also trialled an automated assignment system<xref ref-type="bibr" rid="osaf017-B93"><sup>93</sup></xref> and Boatman et al. recently published a checklist to facilitate automation for PFAS identification with IMS.<xref ref-type="bibr" rid="osaf017-B94"><sup>94</sup></xref></p>
<sec><title>Compound annotation via tandem mass spectral libraries search</title>
<p>The fastest and most accurate (and thus most common) strategy for compound annotation is to compare the experimental mass spectra (MS2), with standard mass spectral libraries.<xref ref-type="bibr" rid="osaf017-B35"><sup>35</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B70"><sup>70</sup></xref> Compound annotation via spectral library searching is based on the premise that molecules generate a reproducible “fingerprint” under specific fragmentation conditions<xref ref-type="bibr" rid="osaf017-B72"><sup>72</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B95"><sup>95</sup></xref> (see <xref ref-type="fig" rid="osaf017-F10">Figure 10</xref>). Good matches between the experimental and the library MS2 spectra can lead to Level 2a annotations.<xref ref-type="bibr" rid="osaf017-B72"><sup>72</sup></xref> If the MS2 library is created <italic>in-house</italic>, ie, the experimental and library spectra are acquired under the same conditions, this can lead to Level 1 annotations when the retention times also match. Commonly used spectral libraries include MassBank,<xref ref-type="bibr" rid="osaf017-B96"><sup>96</sup></xref> MassBank of North America (MoNA),<xref ref-type="bibr" rid="osaf017-B97"><sup>97</sup></xref> GNPS,<xref ref-type="bibr" rid="osaf017-B98"><sup>98</sup></xref> mzCloud,<xref ref-type="bibr" rid="osaf017-B99"><sup>99</sup></xref> METLIN,<xref ref-type="bibr" rid="osaf017-B100"><sup>100</sup></xref> and NIST.<xref ref-type="bibr" rid="osaf017-B101"><sup>101</sup></xref> While GC-EI mass spectra have been standardized for over 60 years, LC-MS spectra are less standardized due to instrument variability and differences in acquisition parameters such as collision energy. As a result, MS2 libraries often contain multiple entries for each compound.<xref ref-type="bibr" rid="osaf017-B72"><sup>72</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B91"><sup>91</sup></xref></p>
<fig id="osaf017-F10"><label>Figure 10.</label><caption><p>Exemplified workflow of MS2 library search software.<xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref> For a given experimental MS1, first the precursor filter is applied to remove all the candidates outside the tolerance window (eg, 0.01 Da). Subsequently, the similarity algorithm ranks the experimental MS2 spectra against the remaining library spectra candidates (four in this example) and calculates a similarity score. Note that the adducts shown ([M + H]+ and [M + Na]+) are illustrative examples and other adducts (eg, [M + K]+, [M + NH4]+ in positive mode, [M − H]−, [M + Cl]− in negative mode) can occur based on the matrix and acquisition settings, among others. Abbreviations: RT, retention time; <italic>m/z</italic>, mass-to-charge ratio.</p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f10.png"/></fig>
<p>Tandem mass spectral libraries are typically generated by the analysis of chemical reference standards.<xref ref-type="bibr" rid="osaf017-B72"><sup>72</sup></xref> Therefore, compound annotation by this approach is hampered by the limited availability of mass spectra data due to lack of standards, and/or lack of open data. Of the 122 million compounds in PubChem (September 2025), only 36 242, or 0.03% have open LC-MS/MS data available.<xref ref-type="bibr" rid="osaf017-B102"><sup>102</sup></xref> Nonetheless, there has been substantial progress in the quality and quantity of mass spectral libraries in recent years. Automated spectral library searching and matching can be performed using various open and commercial software with different algorithms. Typically, these software tools work in a two-step procedure: (1) MS1 filter, (eg, 0.01 Da) which can remove up to 99% of false candidates and speeds up searching, and (2) similarity algorithm, which ranks the experimental MS2 spectra against the remaining library spectra and calculates a similarity score, see bottom part of <xref ref-type="fig" rid="osaf017-F9">Figure 9</xref>.<xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref> Ideally, scores should be able to distinguish true and false positive matches.<xref ref-type="bibr" rid="osaf017-B72"><sup>72</sup></xref></p>
<p>The most common spectral match score is the cosine score, which converts two MS2 spectra (observed and reference) into two equally size vectors through mass peak binning, and then calculates the dot product which ranges from 0 to 999 (or 0 to 0.999).<xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B73"><sup>73</sup></xref> A score of 999 indicates a perfect match between the two spectra, while a score of 0 indicates no match.<xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref> Newer scoring approaches include the Entropy score<xref ref-type="bibr" rid="osaf017-B103"><sup>103</sup></xref> and a range of new machine learning algorithms.<xref ref-type="bibr" rid="osaf017-B73"><sup>73</sup></xref> The right part of <xref ref-type="fig" rid="osaf017-F9">Figure 9B</xref> shows how these scores can be applied to annotate compounds using different software. Several open software approaches support spectral library search, including MS-DIAL,<xref ref-type="bibr" rid="osaf017-B51"><sup>51</sup></xref> MZmine,<xref ref-type="bibr" rid="osaf017-B55"><sup>55</sup></xref> openMS,<xref ref-type="bibr" rid="osaf017-B56"><sup>56</sup></xref> and XCMS,<xref ref-type="bibr" rid="osaf017-B57"><sup>57</sup></xref> while commercial examples include Progenesis QI (Waters) and MetaboScape (Bruker). The in silico fragmentation software MetFrag also integrates a library search and calculates an Exact Spectral Similarity score (also known as “MoNA score”).<xref ref-type="bibr" rid="osaf017-B104"><sup>104</sup></xref> However, the variability in output results, including similarity scores, across different software can make the identification levels obtained poorly comparable. For instance, MS-DIAL and patRoon provide similarity scores, dot product and MoNA scores, respectively, with a proposed minimum data requirements for annotation shown in <xref ref-type="fig" rid="osaf017-F9">Figure 9B</xref>. Importantly, even when the spectral similarity score is high (&gt;0.9), the identity of the compound must be confirmed with a chemical reference standard to classify it as Level 1.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> Otherwise, the match should be considered an annotation rather than an identification (Level 2 or below), since several isomers can have very similar spectra such that only retention time or other orthogonal parameters can distinguish between them.</p>
</sec>
<sec><title>In silico approaches for compound annotation</title>
<p>In silico fragmentation software supports compound annotation of candidates beyond those in mass spectral databases. These methods typically involve matching the experimental spectra against a selection of candidates obtained from known compound databases (discussed in the next section). Approaches such as MetFrag,<xref ref-type="bibr" rid="osaf017-B104"><sup>104</sup></xref> Mass Frontier, MS-FINDER<xref ref-type="bibr" rid="osaf017-B105"><sup>105</sup></xref> and CFM-ID<xref ref-type="bibr" rid="osaf017-B106"><sup>106</sup></xref> fragment the candidates and match the resulting spectra with the experimental spectrum, while approaches such as CSI: FingerID<xref ref-type="bibr" rid="osaf017-B107"><sup>107</sup></xref> and SIRIUS use the experimental spectrum to generate fingerprints, which are matched with the fingerprints of the candidates to rank the structure candidates.<xref ref-type="bibr" rid="osaf017-B70"><sup>70</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B108"><sup>108</sup></xref> MetFrag uses a bond dissociation approach to generate fragments for each candidate, which are compared with the experimental spectra to determine which are the best candidates.<xref ref-type="bibr" rid="osaf017-B104"><sup>104</sup></xref> Mass Frontier (Thermo) uses rule-based fragmentation prediction, complementary to the bond disconnection approach. CFM-ID<xref ref-type="bibr" rid="osaf017-B106"><sup>106</sup></xref> is a machine learning-based approach that can predict fragments and intensities, and thus can be used to generate in silico libraries of the given spectrum type used during the training.<xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref></p>
<p>In silico spectral libraries can help to overcome the limited number spectra in MS2 libraries and avoid the need for “on the fly” calculations in each workflow. In silico spectral libraries can be generated via <italic>eg</italic>, quantum chemistry, machine learning, heuristic-based, and chemical reaction-based methods. Heuristic approaches are best applied to compounds with consistent fragmentation patterns such as lipids.<xref ref-type="bibr" rid="osaf017-B47"><sup>47</sup></xref> LipidBlast,<xref ref-type="bibr" rid="osaf017-B109"><sup>109</sup></xref> integrated within MS-DIAL<xref ref-type="bibr" rid="osaf017-B51"><sup>51</sup></xref> and LipidMatch,<xref ref-type="bibr" rid="osaf017-B82"><sup>82</sup></xref> is an in silico library containing more than 200 000 spectra generated using a heuristic approach. LipidMatch<xref ref-type="bibr" rid="osaf017-B82"><sup>82</sup></xref> is a rule-based software that incorporates various libraries to facilitate the lipid annotation. CFM-ID<xref ref-type="bibr" rid="osaf017-B106"><sup>106</sup></xref> has been used to <italic>eg</italic>, generate in silico EI-MS and MS/MS spectra of small molecules in HMDB.<xref ref-type="bibr" rid="osaf017-B110"><sup>110</sup></xref> In general, predictions should only be used for compounds within or close to the domain of the training set/rule sets used.</p>
<p>In silico approaches for compound annotation typically yield Level 3 annotations or below, but they can be upgraded to Level 2 with the support of a good tandem mass spectral library match, such as the combined approach with MoNA used in MetFrag. In silico annotations often serve an important early role in the elucidation process, guiding subsequent activities such as the interpretation, prioritization and even acquisition of reference standards.<xref ref-type="bibr" rid="osaf017-B73"><sup>73</sup></xref></p>
</sec>
<sec><title>Compound databases for compound annotation</title>
<p>Due to the extreme chemical diversity of the chemical exposome, the database selection plays a critical role in the annotation process. This aims to reduce both false positives (ie, incorrect annotations) and false negatives (absence of the correct structure in the database). While the Chemical Abstract Service (CAS)<xref ref-type="bibr" rid="osaf017-B111"><sup>111</sup></xref> database is the largest chemical registry containing over 290 million organic substances (September 2025),<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref> it is not freely available or compatible with open software approaches. ChemSpider<xref ref-type="bibr" rid="osaf017-B112"><sup>112</sup></xref> and PubChem<xref ref-type="bibr" rid="osaf017-B113"><sup>113</sup></xref> contain over 128 and 122 million chemicals respectively (September 2025), making them the two largest freely available chemical databases. However, due to user quota limitations on ChemSpider, PubChem currently emerges as the most feasible large chemical database for integration into open software workflows.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref></p>
<p>The use of smaller subsets of chemicals helps in the annotation process as these contain known molecules specific to certain domains. For example, PubChemLite for Exposomics (PCL), a subset of PubChem containing 442 379 chemicals (version 2.0.0)<xref ref-type="bibr" rid="osaf017-B87"><sup>87</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B114"><sup>114</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B115"><sup>115</sup></xref> and the Blood Exposome Database<xref ref-type="bibr" rid="osaf017-B116"><sup>116</sup></xref> (67 291 compounds) aid exposomics researchers in identifying relevant chemicals. Metabolite discovery in humans is facilitated by the HMDB,<xref ref-type="bibr" rid="osaf017-B110"><sup>110</sup></xref> while KEGG<xref ref-type="bibr" rid="osaf017-B117"><sup>117</sup></xref> and MetaCyc<xref ref-type="bibr" rid="osaf017-B118"><sup>118</sup></xref> establish connections with proteomics and transcriptomics disciplines.<xref ref-type="bibr" rid="osaf017-B70"><sup>70</sup></xref> Lipidomics studies are supported by LIPID MAPS Structure Database (LMSD),<xref ref-type="bibr" rid="osaf017-B119"><sup>119</sup></xref> which contains 49 790 unique lipid structures (July 2025), which is thus the largest public lipid-specific database. The Human Microbial Metabolome Database (MiMeDB) facilitates the study of small molecules produced by the human microbiome,<xref ref-type="bibr" rid="osaf017-B120"><sup>120</sup></xref> while the CompTox Chemicals Dashboard is a collection of 1 254 895 chemicals relevant for computational toxicity efforts.<xref ref-type="bibr" rid="osaf017-B121"><sup>121</sup></xref> The coverage of HMDB, PCL, CompTox and the Blood Exposome database is explored in <xref ref-type="fig" rid="osaf017-F11">Figure 11A</xref>, which shows the small, polar focus of the Blood Exposome database Versus the wider range of chemicals in HMDB (including lipid-based molecules) and the even wider range in CompTox and PCL that may not be detectable in humans, but may still influence health outcomes.</p>
<fig id="osaf017-F11"><label>Figure 11.</label><caption><p>(A) Overlaid dot plot showing the coverage of the Blood Exposome Database, CompTox, the Human Metabolome Database (HMDB) and PubChemLite for Exposomics (PCL). B) Overlaid dot plot of PubChemLite (PCL) displaying the coverage of the compounds with LC-MS, GC-MS as well as CCS information. C) Overlaid plot of PCL displaying the compounds with Pathway information (Biopathway), associated disorders and diseases (DisorderDisease), agrochemical information and drug and medication information (DrugMedicInfo). R code for data visualization can be found in the GitLab repository (<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://gitlab.com/uniluxembourg/lcsb/eci/exposomics-plots">https://gitlab.com/uniluxembourg/lcsb/eci/exposomics-plots</ext-link>).<xref ref-type="bibr" rid="osaf017-B122"><sup>122</sup></xref></p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f11.png"/></fig>
<p>As discussed above (see section 2.4 and <xref ref-type="fig" rid="osaf017-F6">Figure 6</xref>), a combination of analytical techniques is necessary to capture the chemical exposome. <xref ref-type="fig" rid="osaf017-F11">Figure 11B</xref> displays the chemicals within PCL that contain LC-MS and GC-MS spectral information, as well as CCS records in PubChem. This highlights the complementarity of the techniques, while GC-MS effectively identifies part of the non-polar side of the exposome, LC-MS covers a wider range of polar compounds. Notably, there are still many areas of the exposome that have no spectral information available, including very lipophilic molecules (middle and right top of the plot) and highly polar compounds (bottom right of the plot). Interestingly, CCS values are available for a good number of small molecules, providing an additional parameter to support compound annotation and identification in non-target HRMS. Several classes have been highlighted in <xref ref-type="fig" rid="osaf017-F11">Figure 11B</xref>, showing that both endogenous (triglycerides and nucleotides, in blue) as well as exogenous (perfluorooctanesulfonate [PFOS] and pesticides, in grey) can be captured with both LC-MS and GC-MS.</p>
<p><xref ref-type="fig" rid="osaf017-F11">Figure 11C</xref> shows the overlaid plot of PCL along with four of the major PCL categories. Interestingly, the chemical space covered by the Biopathway category (<xref ref-type="fig" rid="osaf017-F11">Figure 11C</xref>) and HMDB (<xref ref-type="fig" rid="osaf017-F11">Figure 11A</xref>) are very similar, although both contain patches with little experimental data in PubChem (mass ∼750-1750, XlogP 20-30). The Disorder and Disease category also overlaps more with the DrugMedicInfo category than perhaps expected, indicating that a large portion of this section may indicate drug availability and not additional disease insights. The Agrochemical information and DrugMedicInfo categories (<xref ref-type="fig" rid="osaf017-F11">Figure 11C</xref>) cluster in the left part of the plot, representing low molecular weight molecules with medium polarity, similar to the patterns observed in the Blood Exposome Database (<xref ref-type="fig" rid="osaf017-F11">Figure 11A</xref>).</p>
<p>One important fraction of the chemical exposome are transformation products, which are often overlooked.<xref ref-type="bibr" rid="osaf017-B123"><sup>123</sup></xref> These products, derived from biotic or abiotic reactions, can have toxicity and persistence profiles that differ significantly from their parent compounds and may even be more toxic in some cases.<xref ref-type="bibr" rid="osaf017-B124"><sup>124</sup></xref> Currently, structural elucidation of transformation products is typically performed by a combination of experimental and in silico approaches.<xref ref-type="bibr" rid="osaf017-B123"><sup>123</sup></xref> The “Transformations” section in PubChem, which contains documented parent-transformation product relationships from ChEMBL and the NORMAN Suspect List Exchange (NORMAN-SLE)<xref ref-type="bibr" rid="osaf017-B125"><sup>125</sup></xref> is included in PubChemLite,<xref ref-type="bibr" rid="osaf017-B87"><sup>87</sup></xref> while software such as patRoon can aid in identifying transformation products from databases or by in silico prediction.<xref ref-type="bibr" rid="osaf017-B126"><sup>126</sup></xref> Open source software such as BioTransformer<xref ref-type="bibr" rid="osaf017-B127"><sup>127</sup></xref> or ShinyTPs<xref ref-type="bibr" rid="osaf017-B124"><sup>124</sup></xref> help generate transformation product databases or suspect lists via in silico prediction and text mining, respectively.</p>
<p>Suspect screening approaches can be used to search for compounds of interest that are expected (“suspected”) to be in the samples, facilitated through the use of suspect lists. This can be considered a form of prioritization, as it reduces the number of compounds to be investigated and assists in discovering potentially relevant results. Although this approach was initially employed in environmental and toxicology sciences to expedite non-targe screening, it has been increasingly applied in metabolomics and exposomics studies.<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> Different platforms exist to exchange suspect lists, such as the NORMAN-SLE<xref ref-type="bibr" rid="osaf017-B125"><sup>125</sup></xref> and the CompTox Chemicals Dashboard.<xref ref-type="bibr" rid="osaf017-B128"><sup>128</sup></xref> Furthermore, specific lists of chemicals can be generated in PubChem by literature mining.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref> Suspect screening can be facilitated by software such as patRoon,<xref ref-type="bibr" rid="osaf017-B58"><sup>58</sup></xref> which performs the automatic annotation of “suspects” based on pre-defined rules. The automatic assignment of identification levels is a key feature of patRoon, enhancing the reproducibility and leading to more transparent and comparable results.<xref ref-type="bibr" rid="osaf017-B58"><sup>58</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B126"><sup>126</sup></xref> Other software options allowing suspect screening include MZmine,<xref ref-type="bibr" rid="osaf017-B55"><sup>55</sup></xref> and Compound Discoverer (ThermoFisher). However, there is a risk in focusing too narrowly on distinct suspect classes in exposomics, depending on the study context, since recent studies have shown that significant chemicals for disease penetrance arise from many different information categories and suspect lists.<xref ref-type="bibr" rid="osaf017-B32"><sup>32</sup></xref></p>
</sec>
</sec>
</sec>
<sec><title>Statistics &amp; biological interpretation</title>
<p>Non-target HRMS exposomics studies generate a large amount of data, necessitating a combination of univariate and multivariate statistical analysis to identify significant differences between groups.<xref ref-type="bibr" rid="osaf017-B129"><sup>129</sup></xref> Data pre-treatment (eg, normalization, scaling) is essential before applying statistics, as detailed in the next subsection.</p>
<sec><title>Data pre-treatment</title>
<p>Data pre-treatment consists of transforming the HRMS feature list into a suitable state for subsequent statistical analysis.<xref ref-type="bibr" rid="osaf017-B83"><sup>83</sup></xref> This process aims to reduce the effects of technical and measurement errors while enhancing relevant biological variations.<xref ref-type="bibr" rid="osaf017-B130"><sup>130</sup></xref> Common pre-treatment methods include normalization, centering, scaling (eg, Pareto scaling), and transformations (eg, log and power).<xref ref-type="bibr" rid="osaf017-B52"><sup>52</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B131"><sup>131</sup></xref> Multifunctional open tools such as MetaboAnalyst,<xref ref-type="bibr" rid="osaf017-B27"><sup>27</sup></xref> XCMS online,<xref ref-type="bibr" rid="osaf017-B57"><sup>57</sup></xref> and MS-DIAL<xref ref-type="bibr" rid="osaf017-B51"><sup>51</sup></xref> implement some pre-treatment steps, while various statistical packages are available for data pre-treatment in C/C++, Java, R, and Python.<xref ref-type="bibr" rid="osaf017-B132"><sup>132</sup></xref></p>
<p>Normalization strategies are used to remove or correct unwanted systematic variations between samples, making them more comparable.<xref ref-type="bibr" rid="osaf017-B53"><sup>53</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B83"><sup>83</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B130"><sup>130</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B133"><sup>133</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B134"><sup>134</sup></xref> Normalization in metabolomics and exposomics is more challenging compared to genomics and proteomics, due to the vast complexity of the chemical space.<xref ref-type="bibr" rid="osaf017-B134"><sup>134</sup></xref> For instance, there is no standard method to measure the total amount of chemicals in a sample to normalize in the way total protein amount is used in proteomics.<xref ref-type="bibr" rid="osaf017-B66"><sup>66</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B133"><sup>133</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B134"><sup>134</sup></xref> Normalization can be performed either pre-acquisition or post-acquisition of HRMS data and is generally divided into sample-based and data-based approaches, reviewed recently elsewhere.<xref ref-type="bibr" rid="osaf017-B133"><sup>133</sup></xref></p>
</sec>
<sec><title>Univariate and multivariate statistical analysis</title>
<p>Univariate statistical tests aim to identify changes in individual molecules and work on the assumption of statistical independence.<xref ref-type="bibr" rid="osaf017-B129"><sup>129</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B135"><sup>135</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B136"><sup>136</sup></xref> These approaches are commonly used to initially assess the potential relationships between exposures and disease phenotypes.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> Different tests are available to investigate differences across groups (or changes over time) and the choice depends on the data distribution and the experimental design (number of groups and type, ie, matched or unmatched).<xref ref-type="bibr" rid="osaf017-B66"><sup>66</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B137"><sup>137</sup></xref> Univariate analysis can also be employed to investigate the association between specific small molecules of interest and other variables, such as known clinical parameters, environmental exposures, or microbial species, among others. For this purpose, various similarity tests, including Pearson’s correlation (parametric test) and Spearman’s correlation (non-parametric test) can be used.<xref ref-type="bibr" rid="osaf017-B138"><sup>138</sup></xref> Univariate statistics are also widely used within Exposome-Wide Association Studies (ExWAS).<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref> In an ExWAS, a large number of exposures are successively and independently tested for their association with a specific health outcome, using statistical approach analogous to Genome-wide association studies (GWAS).<xref ref-type="bibr" rid="osaf017-B139"><sup>139</sup></xref> However, although univariate statistics are widely employed to test individual chemicals, non-target exposomics studies do not generate univariate data, as chemicals are not independent of each other, necessitating the use of multivariate statistics.<xref ref-type="bibr" rid="osaf017-B135"><sup>135</sup></xref></p>
<p>Multivariate statistical methods encompass both supervised and unsupervised methods.<xref ref-type="bibr" rid="osaf017-B83"><sup>83</sup></xref> Unsupervised methods are generally exploratory in nature, used to find patterns and generate hypotheses, while supervised methods are more confirmatory (hypothesis testing), widely used for biomarker identification, classification, and prediction.<xref ref-type="bibr" rid="osaf017-B132"><sup>132</sup></xref> Unsupervised methods are an effective approach to explore and visualize the structure of the dataset. Principal Component Analysis (PCA)<xref ref-type="bibr" rid="osaf017-B66"><sup>66</sup></xref> stands out as one of the most widely employed methods, used to reduce the number of dimensions in the data, facilitating data exploration and visualization. It is often employed as a pre-processing step, to check the data quality, before applying a supervised method.<xref ref-type="bibr" rid="osaf017-B52"><sup>52</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref> Pooled QC samples that cluster tightly, ideally at the origin of the scores plot, are indicative of high-quality data<xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref> (<xref ref-type="fig" rid="osaf017-F12">Figure 12A</xref>).</p>
<fig id="osaf017-F12"><label>Figure 12.</label><caption><p>Multivariate statistical approaches applied in exposomics studies. (A) PCA scores plot of where all QC samples cluster tightly near the origin, which is indicative of quality data, affirming that the instrument variation was effectively corrected. PCA is widely used as a QA/QC tool to detect outliers and assess batch effects. (B) PLS-DA scores plot of the same dataset, included here to illustrate how supervised methods maximize the differences between predefined groups. Unlike PCA, PLS-DA is not used for QA/QC but is applied in downstream analyses such as classification, biomarker discovery, and hypothesis testing. Further details regarding QA/QC measures are discussed in Broadhurst et al.<xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref></p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f12.png"/></fig>
<p>Supervised methods are used to identify the independent variables (molecules) that best discriminate the groups under study (dependent variables). PLS-DA and orthogonal-PLS-DA (oPLS-DA) are some of the most commonly used methods. As shown in <xref ref-type="fig" rid="osaf017-F12">Figure 12B</xref>, they maximize the differences between groups. However, the main drawback of these supervised methods is their susceptibility to overfitting. Therefore, it is highly recommended to perform validation analysis to avoid finding false relationships and misinterpretation of the data.<xref ref-type="bibr" rid="osaf017-B129"><sup>129</sup></xref> Ideally, these classification models require splitting the dataset into training set, validation set, and test set. Thus, individual models are tested and evaluated on unique datasets and then applied to the entire dataset and/or to other datasets.<xref ref-type="bibr" rid="osaf017-B129"><sup>129</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B135"><sup>135</sup></xref> This approach, however, is often limited when working with small sample sizes or cases such as rare diseases or mutations, which may prevent the dataset from being split effectively.</p>
</sec>
<sec><title>Special statistical considerations for exposomics studies</title>
<p>Missing data pose a particular challenge in exposomics studies, where exposures are often analysed jointly. As the number of included exposures (such as chemicals identified by HRMS) increases, the number of complete cases can decline rapidly. This issue is further exacerbated in longitudinal exposomics studies where participant numbers are typically highest at baseline, but dropouts accumulate over time, leading to progressively fewer observations and a greater <italic>proportion</italic> of missing data at later time points. Therefore, the use of imputation techniques, such as multiple imputation is recommended, as detailed by Santos et al.<xref ref-type="bibr" rid="osaf017-B139"><sup>139</sup></xref></p>
<p>Exposomics studies often involve analyzing samples collected at different time points and therefore processed in different analytical batches. This can introduce batch effects, which occur when quantitative measurements differ systematically between batches due to irrelevant factors.<xref ref-type="bibr" rid="osaf017-B141"><sup>141</sup></xref> Batch effects can be caused by multiple sources at any step of the experimental workflow (<xref ref-type="fig" rid="osaf017-F4">Figure 4</xref>), from sample collection to sample preparation and data acquisition by the analytical platform (eg, LC-HRMS), which is often the primary source of variation.<xref ref-type="bibr" rid="osaf017-B141"><sup>141</sup></xref> These batch effects are almost unavoidable when working with HRMS platforms. Thus, it is very important to identify the unwanted variations (eg, via PCA, as shown above in <xref ref-type="fig" rid="osaf017-F12">Figure 12A</xref>) and correct them. Although several strategies have been proposed to correct batch effects (eg, using ISs or pooled QC samples), it remains an active area of research with no standardized approach.<xref ref-type="bibr" rid="osaf017-B141"><sup>141</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B142"><sup>142</sup></xref> A recent review discusses potential sources of batch effects in multiomics studies as well as different batch effect correction algorithms (BECAs).<xref ref-type="bibr" rid="osaf017-B143"><sup>143</sup></xref></p>
<p>Exposomics data typically contains many covariates such as confounders (<italic>eg</italic>, age, sex, medication), which must be accounted in the statistical analyses. For this purpose, linear models can be employed to identify potential chemicals associated with a particular outcome (eg, Parkinson’s disease or diabetes), while accounting for any number of covariates.<xref ref-type="bibr" rid="osaf017-B144"><sup>144</sup></xref></p>
<p>Network based approaches can help interpret the behaviour of chemicals or diseases that are related, and to provide insights into their mechanisms. Specifically, in exposomics, network approaches allow the identification of correlated exposures and potential biological changes associated with multiple exposures and health effects.<xref ref-type="bibr" rid="osaf017-B139"><sup>139</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B144"><sup>144</sup></xref></p>
<p>Mendelian randomization (MR) has become a valuable method in exposomics for assessing causal relationships between exposures and health outcomes. MR uses genetic variants, such as single nucleotide polymorphisms (SNPs), as instrumental variables to estimate the causal effect of a modifiable exposure on an outcome.<xref ref-type="bibr" rid="osaf017-B144"><sup>144</sup></xref> MR relies on the assumptions that genetic variants are strongly associated with the exposure, are not associated with confounders, and influence the outcome only through the exposure.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B144"><sup>144</sup></xref> Recent studies<xref ref-type="bibr" rid="osaf017-B145 osaf017-B146 osaf017-B147 osaf017-B148"><sup>145-148</sup></xref> have successfully applied this approach in various exposomics contexts.</p>
<p>Since chemical exposures typically occur in complex mixtures rather than individually, various statistical methods can be applied to account for multiple exposures and their potential combined effects.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B149"><sup>149</sup></xref> These include, mixture analysis approaches, dimension reduction techniques or Bayesian model averaging. Further details can be found in Maitre et al.<xref ref-type="bibr" rid="osaf017-B149"><sup>149</sup></xref> In addition, machine learning approaches such as random forest, support vector machine, and gradient boosting can be used for biomarker selection, classification, and predictive modelling.<xref ref-type="bibr" rid="osaf017-B21"><sup>21</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B144"><sup>144</sup></xref></p>
</sec>
<sec><title>Biological interpretation</title>
<p>Biological interpretation of exposomics data is still a major challenge.<xref ref-type="bibr" rid="osaf017-B150"><sup>150</sup></xref> This is primarily due to the fact that the majority of the detected features by non-target HRMS remain unknown or, if annotated, little additional information is available. Another key challenge is distinguishing between exogenous and endogenous chemicals that reflect the biological response to the exposure,<xref ref-type="bibr" rid="osaf017-B20"><sup>20</sup></xref> where it is increasingly plausible that some detected chemicals originate from both exogenous and endogenous sources. Therefore, a multi-faceted approach is essential for interpreting small molecule omics data, encompassing different computational methods for statistical analysis, functional analysis, chemical classification, data integration, and data visualization, among others.<xref ref-type="bibr" rid="osaf017-B135"><sup>135</sup></xref></p>
<p>Network modelling and pathway mapping are key approaches for providing biological context to the data by enhancing the understanding of relationships between small molecules.<xref ref-type="bibr" rid="osaf017-B151"><sup>151</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B152"><sup>152</sup></xref> MetaboAnalyst<xref ref-type="bibr" rid="osaf017-B27"><sup>27</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B138"><sup>138</sup></xref> is a widely employed platform allowing data processing and interpretation through various functionality, including pathway, enrichment and network analysis. These approaches are valuable for data exploration and hypothesis generation, but the results require further validation. Pathway mapping is often limited by incomplete and manually curated pathway databases, leading to variability in results across different databases (eg, KEGG and MetaCyc),<xref ref-type="bibr" rid="osaf017-B135"><sup>135</sup></xref> while various metabolites can belong to different pathways. This analysis also excludes exogenous chemicals (ie, the chemical exposome). An alternative approach is ChemRICH,<xref ref-type="bibr" rid="osaf017-B150"><sup>150</sup></xref> which uses MeSH and Tanimoto substructure chemical similarity coefficients to cluster small molecules into non-overlapping chemical groups. In contrast with pathways analysis, ChemRICH sets have a self-contained size (based on the chemicals found in a particular study), therefore <italic>P</italic>-values do not rely on the size of a background database, such as KEGG. Furthermore, the analysis can also place exposome chemicals into metabolite sets. However, results from ChemRICH cannot yet be directly integrated with genomics or proteomics results.<xref ref-type="bibr" rid="osaf017-B135"><sup>135</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B150"><sup>150</sup></xref> Another strategy that does not require compound identification is mummichog.<xref ref-type="bibr" rid="osaf017-B153"><sup>153</sup></xref> This method uses as input peak lists, which are queried against a database to identify all the potential matches to metabolic pathways and networks.<xref ref-type="bibr" rid="osaf017-B152"><sup>152</sup></xref> Linear models are useful for complex exposomics studies as they can account for covariates like age, sex, and occupation, helping to identify chemicals associated with specific metadata of interest. A recent review summarizes different computational methods including linear models with covariate adjustment, dimensionality reduction, and neural networks, among others, that support exposomics data analysis and interpretation.<xref ref-type="bibr" rid="osaf017-B144"><sup>144</sup></xref></p>
<p>Multi-omics approaches offer a more comprehensive understanding of the biological system by integrating small molecule omics with other omics data acquired from the same samples. Currently, there is a wide array of tools available for the integration of multi-omics data, such as mixOmics.<xref ref-type="bibr" rid="osaf017-B154"><sup>154</sup></xref> For instance, combining metabolomics with metagenomics can help elucidate the role of bacteria derived metabolites.<xref ref-type="bibr" rid="osaf017-B151"><sup>151</sup></xref> In this context, tools like microbeMASST can help identifying the potential microbial origin of annotated chemicals by mapping known and unknown MS2 spectra to potential microbial producers.<xref ref-type="bibr" rid="osaf017-B155"><sup>155</sup></xref></p>
</sec>
</sec>
<sec><title>From history to harmonization: Addressing challenges between the metabolome and exposome</title>
<p>Currently, the lack of harmonization not only in the annotation process but also throughout the entire non-target HRMS workflow leads to poorly comparable metabolomics and exposomics studies. As shown in <xref ref-type="fig" rid="osaf017-F13">Figure 13</xref>, metabolomics and exposomics are still young and rapidly growing fields of research, where workflow standardization is an ongoing task. To address this need, several initiatives have emerged separately for each discipline. In 2005, the MSI was formed,<xref ref-type="bibr" rid="osaf017-B156"><sup>156</sup></xref> proposing a series of minimum reporting standards for data analysis in metabolomics two years later.<xref ref-type="bibr" rid="osaf017-B52"><sup>52</sup></xref> A network of global metabolomics repositories arose in 2015 (COordination of Standards in MetabOlomicS [COSMOS]).<xref ref-type="bibr" rid="osaf017-B157"><sup>157</sup></xref> Since exposomics is a newer field, there is no “Exposomics Standard Initiative” yet. However, in the last few years various European, American and international initiatives have been developed, including The Human Early-Life Exposome (HELIX),<xref ref-type="bibr" rid="osaf017-B24"><sup>24</sup></xref> EXPOsOMICS,<xref ref-type="bibr" rid="osaf017-B158"><sup>158</sup></xref> The European Human Exposome Network (EHEN)<xref ref-type="bibr" rid="osaf017-B159"><sup>159</sup></xref> the Network for EXposomics in the United States (NEXUS),<xref ref-type="bibr" rid="osaf017-B160"><sup>160</sup></xref> HERCULES,<xref ref-type="bibr" rid="osaf017-B161"><sup>161</sup></xref> Human Health Exposure Analysis Resource (HHEAR) network,<xref ref-type="bibr" rid="osaf017-B162"><sup>162</sup></xref> and the International Human Exposome Network (IHEN).<xref ref-type="bibr" rid="osaf017-B163"><sup>163</sup></xref></p>
<fig id="osaf017-F13"><label>Figure 13.</label><caption><p>The metabolome and exposome timeline. Only the peak heights of the Metabolome (1998), Exposome (2014) and last peak (?) are intentionally emphasized for significance. The sizes of the other peaks were adjusted for aesthetic reasons and do not reflect their importance. A representative selection of tools is displayed here for illustrative purposes, and the authors acknowledge the presence of many other numerous tools and initiatives that have emerged in recent years. Adapted from.<xref ref-type="bibr" rid="osaf017-B164"><sup>164</sup></xref> Abbreviations: Artificial Intelligence; AI.</p></caption><graphic xmlns:xlink="http://www.w3.org/1999/xlink" mimetype="image" xlink:href="osaf017f13.png"/></fig>
<p>QA/QC procedures should be implemented throughout the entire metabolomics and exposomics workflow, from sample preparation to data acquisition and data pre-processing, to ensure that the analysis is consistent, comparable, reproducible, precise and accurate. While well established QA/QC procedures in metabolomics serve as valuable benchmarks, such as the 2018 guidelines by Broadhurst et al.<xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref> (<xref ref-type="fig" rid="osaf017-F13">Figure 13</xref>), they may require adaptation for exposomics studies or research endeavours that integrate both metabolomics and exposomics. Notably, filtering features based on QC pooled samples may inadvertently exclude low-abundance small molecules, including exogenous compounds typically present at trace levels, which may be significant in certain groups or conditions. To address this issue, an alternative approach involves preparing tailored pooled QC samples for specific study groups, such as cases and controls.<xref ref-type="bibr" rid="osaf017-B165"><sup>165</sup></xref> Currently, the usage of QC pooled samples varies greatly across studies accompanied by inconsistencies in the reporting of their preparation methods, as recently highlighted by Broeckling et al.<xref ref-type="bibr" rid="osaf017-B166"><sup>166</sup></xref> Therefore, it would be beneficial to establish guidelines for the preparation, usage, and reporting of QC samples in metabolomics and exposomics studies. A minimum set of QC measures as well as a standardized method for reporting them should be required in future studies. <xref ref-type="table" rid="osaf017-T1">Table 1</xref> summarizes a structure summary of recommended QA/QC for each stage of the non-target HRMS metabolomics and exposomics workflow, offering a practical starting point for harmonized QA/QC reporting in future exposomics studies.</p>
<table-wrap id="osaf017-T1"><label>Table 1.</label><caption><p>Summary of some recommended QA/QC procedures for non-target-HRMS exposomics and metabolomics.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col valign="top" align="left"/>
<col valign="top" align="left"/>
</colgroup>
<thead>
<tr><th>Workflow step</th><th>QA/QC procedures</th>
</tr>
</thead>
<tbody>
<tr>
<td><bold>Sample collection</bold></td>
<td>
<list list-type="bullet">
<list-item><p>Develop detailed Standard Operational Protocols (SOPs) for sampling and storage.</p></list-item>
<list-item><p>Careful selection of appropriate sampling materials (eg, avoiding tubes with components such as phthalates and Polyethylene Glycol (PEG) that may interfere with the analysis).</p></list-item>
<list-item><p>Train personnel performing the sample collection.<xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B167"><sup>167</sup></xref></p></list-item>
<list-item><p>Define specific acceptance/rejection criteria for samples upon arrival at the laboratory.<xref ref-type="bibr" rid="osaf017-B167"><sup>167</sup></xref></p></list-item>
<list-item><p>Report collection method, storage temperature and number of freeze-thaw cycles, if applicable.</p></list-item>
</list></td>
</tr>
<tr>
<td><bold>Sample preparation</bold></td>
<td>
<list list-type="bullet">
<list-item><p>Use Internal Standards (IS). Ideally a mixture of multiple IS covering the range of the chemical space to be investigated should be added to each sample, at predetermined concentrations.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref></p></list-item>
<list-item><p>Use pooled QC samples, prepared by taking a small aliquot of each study sample and mixing it into homogenous pooled sample. Pooled QC samples are used to condition the analytical platform,<xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref> assess the analytical performance,<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref> correct batch effects,<xref ref-type="bibr" rid="osaf017-B2"><sup>2</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B166"><sup>166</sup></xref> support metabolite identification,<xref ref-type="bibr" rid="osaf017-B166"><sup>166</sup></xref> and filter low quality data,<xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref> although this may result in the loss of low abundant features such as pollutants. Thus, it is not recommended for exposomics studies, where low-abundant features may be relevant. Report how pooled samples were prepared and used.</p></list-item>
<list-item><p>Include blank samples to prevent false positives. Different blanks can be prepared such as extraction blanks (or process banks) and system suitability blanks (instrument blanks). Further details can be found in the 2023 NORMAN guidance.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref></p></list-item>
<list-item><p>Report sample preparation protocol including the reconstitution solvent and volume, IS employed and concentrations.<xref ref-type="bibr" rid="osaf017-B168"><sup>168</sup></xref></p></list-item>
</list></td>
</tr>
<tr>
<td><bold>Data acquisition</bold></td>
<td>
<list list-type="bullet">
<list-item><p>Ensure instrument is calibrated before starting the analysis.<xref ref-type="bibr" rid="osaf017-B168"><sup>168</sup></xref></p></list-item>
<list-item><p>Carefully plan the injection order to ensure the quality and precision of the analysis. A graphical example of a sequence is given in.<xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref> System suitability blanks (eg, MilliQ water) are injected to check that the instrument is working properly. System conditioning pooled QC samples can be injected to equilibrate the instrument before sample analysis. Injecting pooled QC samples throughout the sequence (eg, every 5 or 10 samples) helps measure the precision of the system (eg, stable retention times), correct for systematic bias, and support the later data pre-processing (eg, feature filtering).<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B140"><sup>140</sup></xref> Randomization of all the samples across the sequence reduces systematic errors due to carryover.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref></p></list-item>
<list-item><p>Report the instrument configuration including the LC system, ionization source (ESI, APPI…), and MS analyzer (eg, Orbitrap).</p></list-item>
<list-item><p>Report the LC-HRMS method details including mobile phase, gradient, flow rate, column temperature, sample volume injected, acquisition mode (eg, DDA), polarity (eg, positive), and <italic>m/z</italic> range, among others. Further details can be found in Viant et al.<xref ref-type="bibr" rid="osaf017-B168"><sup>168</sup></xref></p></list-item>
</list></td>
</tr>
<tr>
<td><bold>Data pre-processing</bold></td>
<td>
<list list-type="bullet">
<list-item><p>Following existing reporting guidelines for data pre-processing such as the MEtabolomics standaRds Initiative in Toxicology (MERIT)<xref ref-type="bibr" rid="osaf017-B168"><sup>168</sup></xref> and the Metabolomics Quality Assurance and Quality Control Consortium (mQACC).<xref ref-type="bibr" rid="osaf017-B169"><sup>169</sup></xref></p></list-item>
<list-item><p>Share raw data in public repositories (eg, MetaboLights<xref ref-type="bibr" rid="osaf017-B170"><sup>170</sup></xref> and GNPS<xref ref-type="bibr" rid="osaf017-B171"><sup>171</sup></xref>) to ensure data reproducibility and reusability.<xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref></p></list-item>
<list-item><p>Use open software computational workflows integrating data pre-processing, compound annotation, and statistical analysis, to enhance reproducibility by minimizing manual data curation.<xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref></p></list-item>
<list-item><p>Use benchmark datasets to evaluate pre-processing algorithms.<xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref> Packages such as IPO<xref ref-type="bibr" rid="osaf017-B69"><sup>69</sup></xref> and Meta-Clean<xref ref-type="bibr" rid="osaf017-B172"><sup>172</sup></xref> help optimize data pre-processing parameters.</p></list-item>
<list-item><p>Consider data pre-processing QA/QC guidelines proposed in.<xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref></p></list-item>
</list></td>
</tr>
<tr>
<td><bold>Compound Annotation</bold></td>
<td>
<list list-type="bullet">
<list-item><p>Assigning identification levels to the detected features is not trivial process and requires appropriate QA/QC procedures. Document the confidence level assigned to each feature and the annotation system employed.<xref ref-type="bibr" rid="osaf017-B72"><sup>72</sup></xref></p></list-item>
<list-item><p>Manual curation of all the annotations, coupled with the provision of evidence supporting the confidence level (eg, <italic>m/z</italic>, retention time, and MS2) is important for mitigating false positives and enhancing the reliability of the results.<xref ref-type="bibr" rid="osaf017-B173"><sup>173</sup></xref></p></list-item>
<list-item><p>Report software employed, and parameters (eg, mass tolerance) used for compound annotation. The mass spectral library, suspect lists, and/or chemical databases utilized should be clearly stated, along with their respective versions.<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref> Spectra included in MS2 libraries should be curated by filtering, noise removal, and recalibration to ensure the quality of the reference spectra.<xref ref-type="bibr" rid="osaf017-B72"><sup>72</sup></xref></p></list-item>
</list></td>
</tr>
<tr>
<td><bold>Statistical analysis</bold></td>
<td>
<list list-type="bullet">
<list-item><p>Report all statistical methods transparently; the use of open source-software are preferred.</p></list-item>
<list-item><p>In-house generated code, such as R scripts, should be shared in public repositories (eg, GitHub) fostering transparency and reproducibility.<xref ref-type="bibr" rid="osaf017-B168"><sup>168</sup></xref></p></list-item>
<list-item><p>Univariate statistics: report median and Relative Standard Deviation (RSD) of each feature across the pooled QC samples.</p></list-item>
<list-item><p>Multivariate statistics: performing and reporting PCA is recommended to confirm that the pooled QC samples cluster tightly, indicating high quality data.</p></list-item>
</list></td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The NORMAN network released their guidance on suspect and non-target screening for environmental monitoring in 2023,<xref ref-type="bibr" rid="osaf017-B15"><sup>15</sup></xref> which has many parallel applications in the exposomics community. This guidance offers recommendations for all steps in a non-target screening experiment, from sample preparation to HRMS and data analysis and reporting. Additionally, the PARC initiative (environmental and biomonitoring communities) proposed their harmonized QA/QC procedures for data pre-processing of non-target and suspect screening LC-HRMS data in 2024.<xref ref-type="bibr" rid="osaf017-B54"><sup>54</sup></xref> These are very good starting points to be followed by the exposomics community, and these efforts indicate that the field is moving towards standardized workflows, which will hopefully emerge in the coming years.</p>
<p>Finally, artificial intelligence (AI) approaches (grey area of <xref ref-type="fig" rid="osaf017-F13">Figure 13</xref>), including Machine Learning (ML) approaches, are increasingly integrated into metabolomics and exposomics fields. AI can support various steps of the non-target HRMS workflow, such as feature prioritization, compound annotation, prediction modelling and pathways analysis. Although some of these approaches are still in their early stages and not yet widely and readily integrated into small molecule omics workflows, they are key starting points for supporting the new era of omics research.<xref ref-type="bibr" rid="osaf017-B174"><sup>174</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B175"><sup>175</sup></xref> The shift from having most of the features unannotated to actively predicting the structure and biological impact of thousands of molecules is essential for translating exposomics research findings into precision medicine.</p>
</sec>
<sec><title>Conclusions and future perspectives</title>
<p>Genes only explain a small fraction of chronic diseases, highlighting the need for a broader approach to better understand health and disease etiology.<xref ref-type="bibr" rid="osaf017-B176"><sup>176</sup></xref> In this context, the significant global health burden of environmental factors, such as the 9 million premature deaths attributed to pollution in 2019,<xref ref-type="bibr" rid="osaf017-B177"><sup>177</sup></xref> underscores the critical role of environmental factors. Consequently, exposomics has emerged as a complementary field to genomics to study environmental drivers of disease. However, translating these omics insights into clinical practice requires overcoming several challenges including the large number of unannotated features, the lack of harmonization, poor reproducibility across studies, and ethical, legal and social issues related to human exposomics data.<xref ref-type="bibr" rid="osaf017-B175"><sup>175</sup></xref> To address these challenges, substantial investment in exposomics research and the establishment of large-scale international consortia are urgently needed. Recent initiatives such as NEXUS are pivotal in this regard, fostering collaboration among scientists, policymakers and funders to accelerate innovation and standardize practices.</p>
<p>The increasing availability of open data (<xref ref-type="fig" rid="osaf017-F11">Figure 11</xref>) on relevant environmental chemicals and the matrices in which they are detected, is crucial to assess the suitability of our current analytical approaches to capture the chemical exposome. This data will enable a critical evaluation of whether existing methods can effectively capture relevant chemicals and downstream biological processes or whether additional analytical techniques, such as supercritical fluid chromatography<xref ref-type="bibr" rid="osaf017-B178"><sup>178</sup></xref> or two-dimensional chromatography, will be needed for a comprehensive characterization of the human exposome. However, while open data is important it is not always possible, particularly for human datasets, where privacy and ethical constraints may limit open access. To address these challenges, tiered or control data access, embargo periods and data use agreements can be employed.</p>
<p>Over the last years, the field has evolved significantly, bringing the future of exposomics and metabolomics closer to the well-established omics fields such as genomics, transcriptomics, and proteomics. The exposomics field is currently moving from proof-of-concept studies, with low sample sizes, to ExWAS, which include thousands of participants and a broad range of environmental exposures and disease endpoints.<xref ref-type="bibr" rid="osaf017-B179"><sup>179</sup></xref> A key example is the HELIX study, which focuses on a cohort of more than 1000 mother-child pairs and demonstrated that early life exposures can lead to biological responses detectable through different omics layers.<xref ref-type="bibr" rid="osaf017-B24"><sup>24</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B180"><sup>180</sup></xref> These findings highlight that exposomics can identify early life biomarkers of exposure, which can improve our understanding of health and disease status and promote public health policies. Another recent ExWAS explored environmental exposures associated with aging in the UK Biobank.<xref ref-type="bibr" rid="osaf017-B181"><sup>181</sup></xref> Twenty-five independent exposures were associated with mortality and proteomic aging. Notably, this study revealed a greater impact of the exposome on variation in mortality than polygenic risk scores.<xref ref-type="bibr" rid="osaf017-B179"><sup>179</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B181"><sup>181</sup></xref> This progress is essential for a future where integrating data from different omics will allow for a more comprehensive assessment of an individual’s disease risk, thereby facilitating personalized medicine. In the long term, the findings from exposomics studies will be instrumental in guiding policymakers to implement measures that protect future generations from harmful environmental exposures.</p>
</sec>
<sec><title>Glossary</title>
<p><bold>Exposomics:</bold> Refers to the study of the exposome, ie, characterization of small molecules environmental derived and its transformation products within an entity (cell, tissue, or organism).</p>
<p><bold>Feature:</bold> Peak (or signal) identified at a specific retention time, and <italic>m/z</italic>, containing spectral information such as MS1 and/or MS2, and intensity.</p>
<p><bold>Metabolomics:</bold> Systematic and comprehensive study of low molecular weight molecules in a particular biological sample.<xref ref-type="bibr" rid="osaf017-B39"><sup>39</sup></xref><sup>,</sup><xref ref-type="bibr" rid="osaf017-B40"><sup>40</sup></xref></p>
<p><bold>MS1:</bold> In Mass Spectrometry refers to the full scan information of the precursor ion (also known as parent ion) including the information of adducts, isotopic pattern and in-source fragments.</p>
<p><bold>MS2:</bold> Also known as MS/MS refers to the fragmentation pattern of the precursor ion.</p>
<p><bold>Non-target:</bold> This can refer to non-target <italic>study</italic> or non-target <italic>compound</italic>. <italic>Non-target study</italic> also known as untarget or untargeted, refers to discovery-based studies aiming to identify as many compounds as possible (known and unknown), whereas <italic>non-target compound</italic> refers to a compound for which no target or suspect identity can be assigned readily. The term not-target screening refers to the computational strategy searching for a broad range of compounds via tandem mass spectral libraries or database search.</p>
<p><bold>Small molecule omics:</bold> Refers to the study of low molecule weight molecules in a particular biological or environmental sample. It encompasses metabolomics and exposomics.</p>
<p><bold>Suspect:</bold> Suspects can refer to known <italic>compounds</italic> that are expected to be in the sample but with insufficient standard information to be identified. Suspect <italic>screening</italic> refers to a computational strategy searching for known chemicals that are expected to be in the sample.</p>
<p><bold>Target:</bold> This can refer to target <italic>study</italic> or target <italic>compound</italic>. <italic>Target study</italic> also known as targeted, refers to validation-based studies focused on a limited number of known compounds. <italic>Target compound</italic> refers to known compound, preselected for the analysis, with reference standard data, including MS2 and retention time, available for the unequivocal identification.</p>
</sec>
</body>
<back><ack id="ack1"><title>Acknowledgments</title>
<p>The current and former members of the Environmental Cheminformatics (ECI) group at the LCB are acknowledged for their valuable inputs and discussion, some of which have guided and inspired the ideas discussed and figures presented in this manuscript. We wish to acknowledge that AI was used by BTA to assist with generating the code for a few visualizations (<xref ref-type="fig" rid="osaf017-F11">Figures 11</xref> and <xref ref-type="fig" rid="osaf017-F12">12</xref>), and for support to polish some writing and finding synonyms for contents of original text.</p>
</ack>
<sec><title>Author contributions</title>
<p>Begoña Talavera Andújar (Conceptualization [Equal], Data curation [Lead], Formal analysis [Equal], Investigation [Equal], Methodology [Equal], Software [Equal], Validation [Equal], Visualization [Lead], Writing—original draft [Lead], Writing—review &amp; editing [Equal]), Emma Schymanski (Conceptualization [Equal], Data curation [Equal], Formal analysis [Equal], Funding acquisition [Lead], Investigation [Equal], Methodology [Equal], Project administration [Lead], Resources [Lead], Software [Equal], Supervision [Lead], Validation [Equal], Visualization [Equal], Writing—original draft [Equal], Writing—review &amp; editing [Equal])</p>
</sec>
<sec><title>Funding</title>
<p>BTA acknowledges the support of the “Microbiomes in One Health” PhD training program, which is supported by the PRIDE doctoral research funding scheme (PRIDE/11823097) of the Luxembourg National Research Fund (FNR). ELS acknowledges funding support from the Luxembourg National Research Fund (FNR) for project A18/BM/12341006.</p>
</sec>
<sec><title>Conflict of interest</title>
<p>The authors have no conflict of interest. Emma Schymanski holds the position of Associate Editor and did not participate in the peer-review or make any editorial decisions for this manuscript..</p>
</sec>
<sec sec-type="data-availability"><title>Data availability</title>
<p>No new data were generated or analysed in support of this research. The code associated with <xref ref-type="fig" rid="osaf017-F11">Figure 11</xref> (which retrieves relevant data from open repositories) is available in the ECI GitLab repository (<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://gitlab.com/uniluxembourg/lcsb/eci/exposomics-plots">https://gitlab.com/uniluxembourg/lcsb/eci/exposomics-plots</ext-link>).</p>
</sec>
<sec><title>Disclosure</title>
<p>This manuscript is based on unpublished portions of the PhD thesis of Begoña Talavera Andújar, defended on July 2024 and publicly available at the University of Luxembourg repository ORBilu (<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://orbilu.uni.lu/handle/10993/61575">https://orbilu.uni.lu/handle/10993/61575</ext-link>).</p>
</sec>
<ref-list id="ref1"><title>References</title>
<ref id="osaf017-B1"><label>1</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Rappaport</surname><given-names>SM</given-names></string-name>, <string-name name-style="western"><surname>Smith</surname><given-names>MT.</given-names></string-name></person-group> <article-title>Environment and disease risks</article-title>. <source>Science</source>. <year>2010</year>;<volume>330</volume>:<fpage>460</fpage>-<lpage>461</lpage>. <pub-id pub-id-type="doi">10.1126/science.1192603</pub-id></mixed-citation></ref>
<ref id="osaf017-B2"><label>2</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>David</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Chaker</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Price</surname><given-names>EJ</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Towards a comprehensive characterisation of the human internal chemical exposome: challenges and perspectives</article-title>. <source>Environ Int</source>. <year>2021</year>;<volume>156</volume>:<fpage>106630</fpage>.<pub-id pub-id-type="doi">10.1016/j.envint.2021.106630</pub-id></mixed-citation></ref>
<ref id="osaf017-B3"><label>3</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wild</surname><given-names>CP.</given-names></string-name></person-group> <article-title>Complementing the genome with an “exposome”: the outstanding challenge of environmental exposure measurement in molecular epidemiology</article-title>. <source>Cancer Epidemiol Biomarkers Prev</source>. <year>2005</year>;<volume>14</volume>:<fpage>1847</fpage>-<lpage>1850</lpage>. <pub-id pub-id-type="doi">10.1158/5–9965.EPI-5–0456</pub-id></mixed-citation></ref>
<ref id="osaf017-B4"><label>4</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Miller</surname><given-names>GW</given-names></string-name>, <string-name name-style="western"><surname>Jones</surname><given-names>DP.</given-names></string-name></person-group> <article-title>The nature of nurture: refining the definition of the exposome</article-title>. <source>Toxicol Sci</source>. <year>2014</year>;<volume>137</volume>:<fpage>1</fpage>-<lpage>2</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kft251</pub-id></mixed-citation></ref>
<ref id="osaf017-B5"><label>5</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Miller</surname><given-names>GW</given-names></string-name></person-group>, <collab>Banbury Exposomics Consortium</collab>. <article-title>Integrating exposomics into biomedicine</article-title>. <source>Science</source>. <year>2025</year>;<volume>388</volume>:<fpage>356</fpage>-<lpage>358</lpage>. <pub-id pub-id-type="doi">10.1126/science.adr0544</pub-id></mixed-citation></ref>
<ref id="osaf017-B6"><label>6</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Safarlou</surname><given-names>CW</given-names></string-name>, <string-name name-style="western"><surname>Jongsma</surname><given-names>KR</given-names></string-name>, <string-name name-style="western"><surname>Vermeulen</surname><given-names>R.</given-names></string-name></person-group> <article-title>Reconceptualizing and defining exposomics within environmental health: expanding the scope of health research</article-title>. <source>Environ Health Perspect</source>. <year>2024</year>;<volume>132</volume>:<fpage>95001</fpage>. <pub-id pub-id-type="doi">10.1289/EHP14509</pub-id></mixed-citation></ref>
<ref id="osaf017-B7"><label>7</label><mixed-citation publication-type="other"><person-group person-group-type="author"><string-name name-style="western"><surname>Vermeulen</surname><given-names>R.</given-names></string-name></person-group> <article-title>Human exposome research: potential, limitations and public policy implications</article-title>. <publisher-name>Think Tank, European Parliament</publisher-name>, Accessed August 29, 2025. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://www.europarl.europa.eu/thinktank/en/document/EPRS_STU(2025)765791">https://www.europarl.europa.eu/thinktank/en/document/EPRS_STU(2025)765791</ext-link></mixed-citation></ref>
<ref id="osaf017-B8"><label>8</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wild</surname><given-names>CP.</given-names></string-name></person-group> <article-title>The exposome: from concept to utility</article-title>. <source>Int J Epidemiol</source>. <year>2012</year>;<volume>41</volume>:<fpage>24</fpage>-<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1093/ije/dyr236</pub-id></mixed-citation></ref>
<ref id="osaf017-B9"><label>9</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Vrijheid</surname><given-names>M.</given-names></string-name></person-group> <article-title>The exposome: a new paradigm to study the impact of environment on health</article-title>. <source>Thorax</source>. <year>2014</year>;<volume>69</volume>:<fpage>876</fpage>-<lpage>878</lpage>. <pub-id pub-id-type="doi">10.1136/thoraxjnl-3–204949</pub-id></mixed-citation></ref>
<ref id="osaf017-B10"><label>10</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Guillien</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Ghosh</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Gille</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Dumas</surname><given-names>O.</given-names></string-name></person-group> <article-title>The exposome concept: how has it changed our understanding of environmental causes of chronic respiratory diseases?</article-title> <source>Breathe (Sheff)</source>. <year>2023</year>;<volume>19</volume>:<fpage>230044</fpage>.<pub-id pub-id-type="doi">10.1183/20734735.4–2023</pub-id></mixed-citation></ref>
<ref id="osaf017-B11"><label>11</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>La Cognata</surname><given-names>V</given-names></string-name>, <string-name name-style="western"><surname>Morello</surname><given-names>G</given-names></string-name>, <string-name name-style="western"><surname>Cavallaro</surname><given-names>S.</given-names></string-name></person-group> <article-title>Omics data and their integrative analysis to support stratified medicine in neurodegenerative diseases</article-title>. <source>Int J Mol Sci</source>. <year>2021</year>;<volume>22</volume>:<fpage>4820</fpage>.<pub-id pub-id-type="doi">10.3390/ijms22094820</pub-id></mixed-citation></ref>
<ref id="osaf017-B12"><label>12</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Babu</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Snyder</surname><given-names>M.</given-names></string-name></person-group> <article-title>Multi-omics profiling for health</article-title>. <source>Mol Cell Proteom</source>. <year>2023</year>;<volume>22</volume>:<fpage>100561</fpage>.<pub-id pub-id-type="doi">10.1016/j.mcpro.2023.100561</pub-id></mixed-citation></ref>
<ref id="osaf017-B13"><label>13</label><mixed-citation publication-type="book"><person-group person-group-type="author"><string-name name-style="western"><surname>Botas</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Campbell</surname><given-names>HM</given-names></string-name>, <string-name name-style="western"><surname>Han</surname><given-names>X</given-names></string-name>, <string-name name-style="western"><surname>Maletic-Savatic</surname><given-names>M.</given-names></string-name></person-group> <chapter-title>Metabolomics of neurodegenerative diseases</chapter-title>. In: Hurley MJ (ed.) <source>International Review of Neurobiology</source>. <publisher-name>Elsevier</publisher-name>; <year>2015</year>:<fpage>53</fpage>-<lpage>80</lpage>.</mixed-citation></ref>
<ref id="osaf017-B14"><label>14</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Roberts</surname><given-names>LD</given-names></string-name>, <string-name name-style="western"><surname>Souza</surname><given-names>AL</given-names></string-name>, <string-name name-style="western"><surname>Gerszten</surname><given-names>RE</given-names></string-name>, <string-name name-style="western"><surname>Clish</surname><given-names>CB.</given-names></string-name></person-group> <article-title>Targeted metabolomics</article-title>. <source>Curr Protoc Mol Biol</source>. 2012;98:30.2.1-30.2.24. <pub-id pub-id-type="doi">10.1002/0471142727.mb3002s98</pub-id></mixed-citation></ref>
<ref id="osaf017-B15"><label>15</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Hollender</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Schymanski</surname><given-names>EL</given-names></string-name>, <string-name name-style="western"><surname>Ahrens</surname><given-names>L</given-names></string-name></person-group>, <etal>et al</etal> <article-title>NORMAN guidance on suspect and non-target screening in environmental monitoring</article-title>. <source>Environ Sci Eur</source>. <year>2023</year>;<volume>35</volume>:<fpage>75</fpage>.<pub-id pub-id-type="doi">10.1186/s12302-3–00779-4</pub-id></mixed-citation></ref>
<ref id="osaf017-B16"><label>16</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wishart</surname><given-names>DS.</given-names></string-name></person-group> <article-title>Metabolomics for investigating physiological and pathophysiological processes</article-title>. <source>Physiol Rev</source>. <year>2019</year>;<volume>99</volume>:<fpage>1819</fpage>-<lpage>1875</lpage>. <pub-id pub-id-type="doi">10.1152/physrev.00035.2018</pub-id></mixed-citation></ref>
<ref id="osaf017-B17"><label>17</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wishart</surname><given-names>DS.</given-names></string-name></person-group> <article-title>Advances in metabolite identification</article-title>. <source>Bioanalysis</source>. <year>2011</year>;<volume>3</volume>:<fpage>1769</fpage>-<lpage>1782</lpage>. <pub-id pub-id-type="doi">10.4155/bio.11.155</pub-id></mixed-citation></ref>
<ref id="osaf017-B18"><label>18</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Metz</surname><given-names>TO</given-names></string-name>, <string-name name-style="western"><surname>Baker</surname><given-names>ES</given-names></string-name>, <string-name name-style="western"><surname>Schymanski</surname><given-names>EL</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Integrating ion mobility spectrometry into mass spectrometry-based exposome measurements: what can it add and how far can it go?</article-title> <source>Bioanalysis</source>. <year>2017</year>;<volume>9</volume>:<fpage>81</fpage>-<lpage>98</lpage>. <pub-id pub-id-type="doi">10.4155/bio-2016-0244</pub-id></mixed-citation></ref>
<ref id="osaf017-B19"><label>19</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Walker</surname><given-names>DI</given-names></string-name>, <string-name name-style="western"><surname>Valvi</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Rothman</surname><given-names>N</given-names></string-name>, <string-name name-style="western"><surname>Lan</surname><given-names>Q</given-names></string-name>, <string-name name-style="western"><surname>Miller</surname><given-names>GW</given-names></string-name>, <string-name name-style="western"><surname>Jones</surname><given-names>DP.</given-names></string-name></person-group> <article-title>The metabolome: a key measure for exposome research in epidemiology</article-title>. <source>Curr Epidemiol Rep</source>. <year>2019</year>;<volume>6</volume>:<fpage>93</fpage>-<lpage>103</lpage>.</mixed-citation></ref>
<ref id="osaf017-B20"><label>20</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Balcells</surname><given-names>C</given-names></string-name>, <string-name name-style="western"><surname>Xu</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Gil-Solsona</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Maitre</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Gago-Ferrero</surname><given-names>P</given-names></string-name>, <string-name name-style="western"><surname>Keun</surname><given-names>HC.</given-names></string-name></person-group> <article-title>Blurred lines: crossing the boundaries between the chemical exposome and the metabolome</article-title>. <source>Curr Opin Chem Biol</source>. <year>2024</year>;<volume>78</volume>:<fpage>102407</fpage>.<pub-id pub-id-type="doi">10.1016/j.cbpa.2023.102407</pub-id></mixed-citation></ref>
<ref id="osaf017-B21"><label>21</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Lai</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Koelmel</surname><given-names>JP</given-names></string-name>, <string-name name-style="western"><surname>Walker</surname><given-names>DI</given-names></string-name></person-group>, <etal>et al</etal> <article-title>High-resolution mass spectrometry for human exposomics: expanding chemical space coverage</article-title>. <source>Environ Sci Technol</source>. <year>2024</year>;<volume>58</volume>:<fpage>12784</fpage>-<lpage>12822</lpage>. <pub-id pub-id-type="doi">10.1021/acs.est.4c01156</pub-id></mixed-citation></ref>
<ref id="osaf017-B22"><label>22</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Zhang</surname><given-names>P</given-names></string-name>, <string-name name-style="western"><surname>Carlsten</surname><given-names>C</given-names></string-name>, <string-name name-style="western"><surname>Chaleckis</surname><given-names>R</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Defining the scope of exposome studies and research needs from a multidisciplinary perspective</article-title>. <source>Environ Sci Technol Lett</source>. <year>2021</year>;<volume>8</volume>:<fpage>839</fpage>-<lpage>852</lpage>. <pub-id pub-id-type="doi">10.1021/acs.estlett.1c00648</pub-id></mixed-citation></ref>
<ref id="osaf017-B23"><label>23</label><mixed-citation publication-type="other">All of Us Research Program, National Institutes of Health (NIH). In: Us Res. Program NIH. Accessed May 10, 2024, <year>2020</year>. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://allofus.nih.gov/future-health-begins-all-us">https://allofus.nih.gov/future-health-begins-all-us</ext-link></mixed-citation></ref>
<ref id="osaf017-B24"><label>24</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Vrijheid</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Slama</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Robinson</surname><given-names>O</given-names></string-name></person-group>, <etal>et al</etal> <article-title>The human early-life exposome (HELIX): project rationale and design</article-title>. <source>Environ Health Perspect</source>. <year>2014</year>;<volume>122</volume>:<fpage>535</fpage>-<lpage>544</lpage>. <pub-id pub-id-type="doi">10.1289/ehp.1307204</pub-id></mixed-citation></ref>
<ref id="osaf017-B25"><label>25</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Barnes</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Benton</surname><given-names>HP</given-names></string-name>, <string-name name-style="western"><surname>Casazza</surname><given-names>K</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Training in metabolomics research. I. Designing the experiment, collecting and extracting samples and generating metabolomics data</article-title>. <source>J Mass Spectrom</source>. <year>2016</year>;<volume>51</volume>:<fpage>461</fpage>-<lpage>475</lpage>. <pub-id pub-id-type="doi">10.1002/jms.3782</pub-id></mixed-citation></ref>
<ref id="osaf017-B26"><label>26</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Faul</surname><given-names>F</given-names></string-name>, <string-name name-style="western"><surname>Erdfelder</surname><given-names>E</given-names></string-name>, <string-name name-style="western"><surname>Lang</surname><given-names>A-G</given-names></string-name>, <string-name name-style="western"><surname>Buchner</surname><given-names>A.</given-names></string-name></person-group> <article-title>G*Power 3: a flexible statistical power analysis program for the social, behavioral, and biomedical sciences</article-title>. <source>Behav Res Methods</source>. <year>2007</year>;<volume>39</volume>:<fpage>175</fpage>-<lpage>191</lpage>. <pub-id pub-id-type="doi">10.3758/BF03193146</pub-id></mixed-citation></ref>
<ref id="osaf017-B27"><label>27</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Pang</surname><given-names>Z</given-names></string-name>, <string-name name-style="western"><surname>Lu</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Zhou</surname><given-names>G</given-names></string-name></person-group>, <etal>et al</etal> <article-title>MetaboAnalyst 6.0: towards a unified platform for metabolomics data processing, analysis and interpretation</article-title>. <source>Nucleic Acids Res</source>. <year>2024</year>;<volume>52</volume>:<fpage>W398</fpage>-<lpage>W406</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkae253</pub-id></mixed-citation></ref>
<ref id="osaf017-B28"><label>28</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Tarazona</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Balzano-Nogueira</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Gómez-Cabrero</surname><given-names>D</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Harmonization of quality metrics and power calculation in multi-omic studies</article-title>. <source>Nat Commun</source>. <year>2020</year>;<volume>11</volume>:<fpage>3092</fpage>.<pub-id pub-id-type="doi">10.1038/s41467-020-16937-8</pub-id></mixed-citation></ref>
<ref id="osaf017-B29"><label>29</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Dennis</surname><given-names>KK</given-names></string-name>, <string-name name-style="western"><surname>Marder</surname><given-names>E</given-names></string-name>, <string-name name-style="western"><surname>Balshaw</surname><given-names>DM</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Biomonitoring in the era of the exposome</article-title>. <source>Environ Health Perspect</source>. <year>2017</year>;<volume>125</volume>:<fpage>502</fpage>-<lpage>510</lpage>. <pub-id pub-id-type="doi">10.1289/EHP474</pub-id></mixed-citation></ref>
<ref id="osaf017-B30"><label>30</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Rappaport</surname><given-names>SM</given-names></string-name>, <string-name name-style="western"><surname>Barupal</surname><given-names>DK</given-names></string-name>, <string-name name-style="western"><surname>Wishart</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Vineis</surname><given-names>P</given-names></string-name>, <string-name name-style="western"><surname>Scalbert</surname><given-names>A.</given-names></string-name></person-group> <article-title>The blood exposome and its role in discovering causes of disease</article-title>. <source>Environ Health Perspect</source>. <year>2014</year>;<volume>122</volume>:<fpage>769</fpage>-<lpage>774</lpage>. <pub-id pub-id-type="doi">10.1289/ehp.1308015</pub-id></mixed-citation></ref>
<ref id="osaf017-B31"><label>31</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Jacobson</surname><given-names>TA</given-names></string-name>, <string-name name-style="western"><surname>Kler</surname><given-names>JS</given-names></string-name>, <string-name name-style="western"><surname>Bae</surname><given-names>Y</given-names></string-name></person-group>, <etal>et al</etal> <article-title>A state-of-the-science review and guide for measuring environmental exposure biomarkers in dried blood spots</article-title>. <source>J Expo Sci Environ Epidemiol</source>. <year>2023</year>;<volume>33</volume>:<fpage>505</fpage>-<lpage>523</lpage>. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="http://10.1038/s41370-022-00460-7">10.1038/s41370-022-00460-7</ext-link></mixed-citation></ref>
<ref id="osaf017-B32"><label>32</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Talavera Andújar</surname><given-names>B</given-names></string-name>, <string-name name-style="western"><surname>Pereira</surname><given-names>SL</given-names></string-name>, <string-name name-style="western"><surname>Bhanu Busi</surname><given-names>S</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Exploring environmental modifiers of LRRK2-associated Parkinson’s disease penetrance: an exposomics and metagenomics pilot study on household dust</article-title>. <source>Environ Int</source>. <year>2024</year>;<volume>194</volume>:<fpage>109151</fpage>.<pub-id pub-id-type="doi">10.1016/j.envint.2024.109151</pub-id></mixed-citation></ref>
<ref id="osaf017-B33"><label>33</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Running</surname><given-names>LS</given-names></string-name>, <string-name name-style="western"><surname>Kordas</surname><given-names>K</given-names></string-name>, <string-name name-style="western"><surname>Aga</surname><given-names>DS.</given-names></string-name></person-group> <article-title>Use of wristbands to measure exposure to environmental pollutants in children: recent advances and future directions</article-title>. <source>Curr Opin Environ Sci Health</source>. <year>2023</year>;<volume>32</volume>:<fpage>100450</fpage>.<pub-id pub-id-type="doi">10.1016/j.coesh.2023.100450</pub-id></mixed-citation></ref>
<ref id="osaf017-B34"><label>34</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wacławik</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Rodzaj</surname><given-names>W</given-names></string-name>, <string-name name-style="western"><surname>Wielgomas</surname><given-names>B.</given-names></string-name></person-group> <article-title>Silicone wristbands in exposure assessment: analytical considerations and comparison with other approaches</article-title>. <source>Int J Environ Res Public Health</source>. <year>2022</year>;<volume>19</volume>:<fpage>1935</fpage>. <pub-id pub-id-type="doi">10.3390/ijerph19041935</pub-id></mixed-citation></ref>
<ref id="osaf017-B35"><label>35</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Schrimpe-Rutledge</surname><given-names>AC</given-names></string-name>, <string-name name-style="western"><surname>Codreanu</surname><given-names>SG</given-names></string-name>, <string-name name-style="western"><surname>Sherrod</surname><given-names>SD</given-names></string-name>, <string-name name-style="western"><surname>McLean</surname><given-names>JA.</given-names></string-name></person-group> <article-title>Untargeted metabolomics strategies—challenges and emerging directions</article-title>. <source>J Am Soc Mass Spectrom</source>. <year>2016</year>;<volume>27</volume>:<fpage>1897</fpage>-<lpage>1905</lpage>. <pub-id pub-id-type="doi">10.1007/s13361-6–1469-y</pub-id></mixed-citation></ref>
<ref id="osaf017-B36"><label>36</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Gu</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Peach</surname><given-names>JT</given-names></string-name>, <string-name name-style="western"><surname>Warth</surname><given-names>B.</given-names></string-name></person-group> <article-title>Sample preparation strategies for mass spectrometry analysis in human exposome research: current status and future perspectives</article-title>. <source>TrAC Trends Anal Chem</source>. <year>2023</year>;<volume>166</volume>:<fpage>117151</fpage>.<pub-id pub-id-type="doi">10.1016/j.trac.2023.117151</pub-id></mixed-citation></ref>
<ref id="osaf017-B37"><label>37</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Vuckovic</surname><given-names>D.</given-names></string-name></person-group> <article-title>Current trends and challenges in sample preparation for global metabolomics using liquid chromatography–mass spectrometry</article-title>. <source>Anal Bioanal Chem</source>. <year>2012</year>;<volume>403</volume>:<fpage>1523</fpage>-<lpage>1548</lpage>. <pub-id pub-id-type="doi">10.1007/s00216-2–6039-y</pub-id></mixed-citation></ref>
<ref id="osaf017-B38"><label>38</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Alseekh</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Aharoni</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Brotman</surname><given-names>Y</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Mass spectrometry-based metabolomics: a guide for annotation, quantification and best reporting practices</article-title>. <source>Nat Methods</source>. <year>2021</year>;<volume>18</volume>:<fpage>747</fpage>-<lpage>756</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-021-01197-1</pub-id></mixed-citation></ref>
<ref id="osaf017-B39"><label>39</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Zeki</surname><given-names>ÖC</given-names></string-name>, <string-name name-style="western"><surname>Eylem</surname><given-names>CC</given-names></string-name>, <string-name name-style="western"><surname>Reçber</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Kır</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Nemutlu</surname><given-names>E.</given-names></string-name></person-group> <article-title>Integration of GC–MS and LC–MS for untargeted metabolomics profiling</article-title>. <source>J Pharm Biomed Anal</source>. <year>2020</year>;<volume>190</volume>:<fpage>113509</fpage>.<pub-id pub-id-type="doi">10.1016/j.jpba.2020.113509</pub-id></mixed-citation></ref>
<ref id="osaf017-B40"><label>40</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Fiehn</surname><given-names>O.</given-names></string-name></person-group> <article-title>Metabolomics by gas chromatography–mass spectrometry: combined targeted and untargeted profiling</article-title>. <source>Curr Protoc Mol Biol</source>. <year>2016</year>;<volume>114</volume>:<fpage>30.4.1</fpage>-<lpage>30.4.32</lpage>. <pub-id pub-id-type="doi">10.1002/0471142727.mb3004s114</pub-id></mixed-citation></ref>
<ref id="osaf017-B41"><label>41</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Zhang</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Sun</surname><given-names>H</given-names></string-name>, <string-name name-style="western"><surname>Wang</surname><given-names>P</given-names></string-name>, <string-name name-style="western"><surname>Han</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Wang</surname><given-names>X.</given-names></string-name></person-group> <article-title>Modern analytical techniques in metabolomics analysis</article-title>. <source>Analyst</source>. <year>2012</year>;<volume>137</volume>:<fpage>293</fpage>-<lpage>300</lpage>. <pub-id pub-id-type="doi">10.1039/C1AN15605E</pub-id></mixed-citation></ref>
<ref id="osaf017-B42"><label>42</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wang</surname><given-names>JH</given-names></string-name>, <string-name name-style="western"><surname>Byun</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Pennathur</surname><given-names>S.</given-names></string-name></person-group> <article-title>Analytical approaches to metabolomics and applications to systems biology</article-title>. <source>Semin Nephrol</source>. <year>2010</year>;<volume>30</volume>:<fpage>500</fpage>-<lpage>511</lpage>. <pub-id pub-id-type="doi">10.1016/j.semnephrol.2010.07.007</pub-id></mixed-citation></ref>
<ref id="osaf017-B43"><label>43</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Zhang</surname><given-names>X</given-names></string-name>, <string-name name-style="western"><surname>Quinn</surname><given-names>K</given-names></string-name>, <string-name name-style="western"><surname>Cruickshank-Quinn</surname><given-names>C</given-names></string-name>, <string-name name-style="western"><surname>Reisdorph</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Reisdorph</surname><given-names>N.</given-names></string-name></person-group> <article-title>The application of ion mobility mass spectrometry to metabolomics</article-title>. <source>Curr Opin Chem Biol</source>. <year>2018</year>;<volume>42</volume>:<fpage>60</fpage>-<lpage>66</lpage>. <pub-id pub-id-type="doi">10.1016/j.cbpa.2017.11.001</pub-id></mixed-citation></ref>
<ref id="osaf017-B44"><label>44</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Izquierdo-Sandoval</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Fabregat-Safont</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Lacalle-Bergeron</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Sancho</surname><given-names>JV</given-names></string-name>, <string-name name-style="western"><surname>Hernández</surname><given-names>F</given-names></string-name>, <string-name name-style="western"><surname>Portoles</surname><given-names>T.</given-names></string-name></person-group> <article-title>Benefits of ion mobility separation in GC-APCI-HRMS screening: from the construction of a CCS library to the application to real-world samples</article-title>. <source>Anal Chem</source>. <year>2022</year>;<volume>94</volume>:<fpage>9040</fpage>-<lpage>9047</lpage>. <pub-id pub-id-type="doi">10.1021/acs.analchem.2c01118</pub-id></mixed-citation></ref>
<ref id="osaf017-B45"><label>45</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Ropartz</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Fanuel</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Ujma</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Palmer</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Giles</surname><given-names>K</given-names></string-name>, <string-name name-style="western"><surname>Rogniaux</surname><given-names>H.</given-names></string-name></person-group> <article-title>Structure determination of large isomeric oligosaccharides of natural origin through multipass and multistage cyclic traveling-wave ion mobility mass spectrometry</article-title>. <source>Anal Chem</source>. <year>2019</year>;<volume>91</volume>:<fpage>12030</fpage>-<lpage>12037</lpage>. <pub-id pub-id-type="doi">10.1021/acs.analchem.9b03036</pub-id></mixed-citation></ref>
<ref id="osaf017-B46"><label>46</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Collins</surname><given-names>SL</given-names></string-name>, <string-name name-style="western"><surname>Koo</surname><given-names>I</given-names></string-name>, <string-name name-style="western"><surname>Peters</surname><given-names>JM</given-names></string-name>, <string-name name-style="western"><surname>Smith</surname><given-names>PB</given-names></string-name>, <string-name name-style="western"><surname>Patterson</surname><given-names>AD.</given-names></string-name></person-group> <article-title>Current challenges and recent developments in mass spectrometry–based metabolomics</article-title>. <source>Annu Rev Anal Chem (Palo Alto Calif)</source>. <year>2021</year>;<volume>14</volume>:<fpage>467</fpage>-<lpage>487</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-anchem-091620-015205</pub-id></mixed-citation></ref>
<ref id="osaf017-B47"><label>47</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Kind</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Tsugawa</surname><given-names>H</given-names></string-name>, <string-name name-style="western"><surname>Cajka</surname><given-names>T</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Identification of small molecules using accurate mass MS/MS search</article-title>. <source>Mass Spectrom Rev</source>. <year>2018</year>;<volume>37</volume>:<fpage>513</fpage>-<lpage>532</lpage>. <pub-id pub-id-type="doi">10.1002/mas.21535</pub-id></mixed-citation></ref>
<ref id="osaf017-B48"><label>48</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Guo</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Huan</surname><given-names>T.</given-names></string-name></person-group> <article-title>Comparison of full-scan, data-dependent, and data-independent acquisition modes in liquid chromatography–mass spectrometry based untargeted metabolomics</article-title>. <source>Anal Chem</source>. <year>2020</year>;<volume>92</volume>:<fpage>8072</fpage>-<lpage>8080</lpage>. <pub-id pub-id-type="doi">10.1021/acs.analchem.9b05135</pub-id></mixed-citation></ref>
<ref id="osaf017-B49"><label>49</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Yang</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Yang</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Zheng</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Cao</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Liu</surname><given-names>G.</given-names></string-name></person-group> <article-title>Data acquisition methods for non-targeted screening in environmental analysis</article-title>. <source>TrAC Trends Anal Chem</source>. <year>2023</year>;<volume>160</volume>:<fpage>116966</fpage>.<pub-id pub-id-type="doi">10.1016/j.trac.2023.116966</pub-id></mixed-citation></ref>
<ref id="osaf017-B50"><label>50</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Koelmel</surname><given-names>JP</given-names></string-name>, <string-name name-style="western"><surname>Kroeger</surname><given-names>NM</given-names></string-name>, <string-name name-style="western"><surname>Gill</surname><given-names>EL</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Expanding lipidome coverage using LC-MS/MS data-dependent acquisition with automated exclusion list generation</article-title>. <source>J Am Soc Mass Spectrom</source>. <year>2017</year>;<volume>28</volume>:<fpage>908</fpage>-<lpage>917</lpage>. <pub-id pub-id-type="doi">10.1007/s13361-7–1608-0</pub-id></mixed-citation></ref>
<ref id="osaf017-B51"><label>51</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Tsugawa</surname><given-names>H</given-names></string-name>, <string-name name-style="western"><surname>Cajka</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Kind</surname><given-names>T</given-names></string-name></person-group>, <etal>et al</etal> <article-title>MS-DIAL: data-independent MS/MS deconvolution for comprehensive metabolome analysis</article-title>. <source>Nat Methods</source>. <year>2015</year>;<volume>12</volume>:<fpage>523</fpage>-<lpage>526</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.3393</pub-id></mixed-citation></ref>
<ref id="osaf017-B52"><label>52</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Goodacre</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Broadhurst</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Smilde</surname><given-names>AK</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Proposed minimum reporting standards for data analysis in metabolomics</article-title>. <source>Metabolomics</source>. <year>2007</year>;<volume>3</volume>:<fpage>231</fpage>-<lpage>241</lpage>. <pub-id pub-id-type="doi">10.1007/s11306-007-0081-3</pub-id></mixed-citation></ref>
<ref id="osaf017-B53"><label>53</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Katajamaa</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Orešič</surname><given-names>M.</given-names></string-name></person-group> <article-title>Data processing for mass spectrometry-based metabolomics</article-title>. <source>J Chromatogr A</source>. <year>2007</year>;<volume>1158</volume>:<fpage>318</fpage>-<lpage>328</lpage>. <pub-id pub-id-type="doi">10.1016/j.chroma.2007.04.021</pub-id></mixed-citation></ref>
<ref id="osaf017-B54"><label>54</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Lennon</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Chaker</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Price</surname><given-names>EJ</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Harmonized quality assurance/quality control provisions to assess completeness and robustness of MS1 data preprocessing for LC-HRMS-based suspect screening and non-targeted analysis</article-title>. <source>TrAC Trends Anal Chem</source>. <year>2024</year>;<volume>174</volume>:<fpage>117674</fpage>.<pub-id pub-id-type="doi">10.1016/j.trac.2024.117674</pub-id></mixed-citation></ref>
<ref id="osaf017-B55"><label>55</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Schmid</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Heuckeroth</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Korf</surname><given-names>A</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Integrative analysis of multimodal mass spectrometry data in MZmine 3</article-title>. <source>Nat Biotechnol</source>. <year>2023</year>;<volume>41</volume>:<fpage>447</fpage>-<lpage>449</lpage>. <pub-id pub-id-type="doi">10.1038/s41587-023-01690-2</pub-id></mixed-citation></ref>
<ref id="osaf017-B56"><label>56</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Sturm</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Bertsch</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Gröpl</surname><given-names>C</given-names></string-name></person-group>, <etal>et al</etal> <article-title>OpenMS—an open-source software framework for mass spectrometry</article-title>. <source>BMC Bioinformatics</source>. <year>2008</year>;<volume>9</volume>:<fpage>163</fpage>.<pub-id pub-id-type="doi">10.1186/1471-2105-9-163</pub-id></mixed-citation></ref>
<ref id="osaf017-B57"><label>57</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Tautenhahn</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Patti</surname><given-names>GJ</given-names></string-name>, <string-name name-style="western"><surname>Rinehart</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Siuzdak</surname><given-names>G.</given-names></string-name></person-group> <article-title>XCMS online: a web-based platform to process untargeted metabolomic data</article-title>. <source>Anal Chem</source>. <year>2012</year>;<volume>84</volume>:<fpage>5035</fpage>-<lpage>5039</lpage>. <pub-id pub-id-type="doi">10.1021/ac300698c</pub-id></mixed-citation></ref>
<ref id="osaf017-B58"><label>58</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Helmus</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Ter Laak</surname><given-names>TL</given-names></string-name>, <string-name name-style="western"><surname>Van Wezel</surname><given-names>AP</given-names></string-name>, <string-name name-style="western"><surname>De Voogt</surname><given-names>P</given-names></string-name>, <string-name name-style="western"><surname>Schymanski</surname><given-names>EL.</given-names></string-name></person-group> <article-title>patRoon: open source software platform for environmental mass spectrometry based non-target screening</article-title>. <source>J Cheminform</source>. <year>2021</year>;<volume>13</volume>:<fpage>1</fpage>.<pub-id pub-id-type="doi">10.1186/s13321-020-00477-w</pub-id></mixed-citation></ref>
<ref id="osaf017-B59"><label>59</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Misra</surname><given-names>BB.</given-names></string-name></person-group> <article-title>New software tools, databases, and resources in metabolomics: updates from 2020</article-title>. <source>Metabolomics</source>. <year>2021</year>;<volume>17</volume>:<fpage>49</fpage>.<pub-id pub-id-type="doi">10.1007/s11306-021-01796-1</pub-id></mixed-citation></ref>
<ref id="osaf017-B60"><label>60</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Renner</surname><given-names>G</given-names></string-name>, <string-name name-style="western"><surname>Reuschenbach</surname><given-names>M.</given-names></string-name></person-group> <article-title>Critical review on data processing algorithms in non-target screening: challenges and opportunities to improve result comparability</article-title>. <source>Anal Bioanal Chem</source>. <year>2023</year>;<volume>415</volume>:<fpage>4111</fpage>-<lpage>4123</lpage>. <pub-id pub-id-type="doi">10.1007/s00216-3–04776-7</pub-id></mixed-citation></ref>
<ref id="osaf017-B61"><label>61</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Chambers</surname><given-names>MC</given-names></string-name>, <string-name name-style="western"><surname>Maclean</surname><given-names>B</given-names></string-name>, <string-name name-style="western"><surname>Burke</surname><given-names>R</given-names></string-name></person-group>, <etal>et al</etal> <article-title>A cross-platform toolkit for mass spectrometry and proteomics</article-title>. <source>Nat Biotechnol</source>. <year>2012</year>;<volume>30</volume>:<fpage>918</fpage>-<lpage>920</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.2377</pub-id></mixed-citation></ref>
<ref id="osaf017-B62"><label>62</label><mixed-citation publication-type="other">ProteoWizard: Home. Accessed April 2, 2024, <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://proteowizard.sourceforge.io/index.html">https://proteowizard.sourceforge.io/index.html</ext-link></mixed-citation></ref>
<ref id="osaf017-B63"><label>63</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Holman</surname><given-names>JD</given-names></string-name>, <string-name name-style="western"><surname>Tabb</surname><given-names>DL</given-names></string-name>, <string-name name-style="western"><surname>Mallick</surname><given-names>P.</given-names></string-name></person-group> <article-title>Employing ProteoWizard to convert raw mass spectrometry data</article-title>. <source>Curr Protoc Bioinformatics</source>. <year>2014</year>;<volume>46</volume>:<fpage>13.24.1</fpage>-<lpage>13.24.9</lpage>. <pub-id pub-id-type="doi">10.1002/0471250953.bi1324s46</pub-id></mixed-citation></ref>
<ref id="osaf017-B64"><label>64</label><mixed-citation publication-type="book"><person-group person-group-type="author"><string-name name-style="western"><surname>Karaman</surname><given-names>I</given-names></string-name>, <string-name name-style="western"><surname>Climaco Pinto</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Graça</surname><given-names>G.</given-names></string-name></person-group> <chapter-title>Metabolomics data preprocessing: from raw data to features for statistical analysis</chapter-title>. In: <source>Comprehensive Analytical Chemistry</source>. <publisher-name>Elsevier</publisher-name>; <year>2018</year>:<fpage>197</fpage>-<lpage>225</lpage>.</mixed-citation></ref>
<ref id="osaf017-B65"><label>65</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Boccard</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Veuthey</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Rudaz</surname><given-names>S.</given-names></string-name></person-group> <article-title>Knowledge discovery in metabolomics: an overview of MS data handling</article-title>. <source>J Sep Sci</source>. <year>2010</year>;<volume>33</volume>:<fpage>290</fpage>-<lpage>304</lpage>. <pub-id pub-id-type="doi">10.1002/jssc.200900609</pub-id></mixed-citation></ref>
<ref id="osaf017-B66"><label>66</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Santamaria</surname><given-names>G</given-names></string-name>, <string-name name-style="western"><surname>Pinto</surname><given-names>FR.</given-names></string-name></person-group> <article-title>Bioinformatic analysis of metabolomic data: from raw spectra to biological insight</article-title>. <source>BioChem</source>. <year>2024</year>;<volume>4</volume>:<fpage>90</fpage>-<lpage>114</lpage>. <pub-id pub-id-type="doi">10.3390/biochem4020005</pub-id></mixed-citation></ref>
<ref id="osaf017-B67"><label>67</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Savitzky</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Golay</surname><given-names>MJE.</given-names></string-name></person-group> <article-title>Smoothing and differentiation of data by simplified least squares procedures</article-title>. <source>Anal Chem</source>. <year>1964</year>;<volume>36</volume>:<fpage>1627</fpage>-<lpage>1639</lpage>. <pub-id pub-id-type="doi">10.1021/ac60214a047</pub-id></mixed-citation></ref>
<ref id="osaf017-B68"><label>68</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Lommen</surname><given-names>A.</given-names></string-name></person-group> <article-title>MetAlign: interface-driven, versatile metabolomics tool for hyphenated full-scan mass spectrometry data preprocessing</article-title>. <source>Anal Chem</source>. <year>2009</year>;<volume>81</volume>:<fpage>3079</fpage>-<lpage>3086</lpage>. <pub-id pub-id-type="doi">10.1021/ac900036d</pub-id></mixed-citation></ref>
<ref id="osaf017-B69"><label>69</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Libiseller</surname><given-names>G</given-names></string-name>, <string-name name-style="western"><surname>Dvorzak</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Kleb</surname><given-names>U</given-names></string-name></person-group>, <etal>et al</etal> <article-title>IPO: a tool for automated optimization of XCMS parameters</article-title>. <source>BMC Bioinformatics</source>. <year>2015</year>;<volume>16</volume>:<fpage>118</fpage>.<pub-id pub-id-type="doi">10.1186/s12859-015-0562-8</pub-id></mixed-citation></ref>
<ref id="osaf017-B70"><label>70</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Blaženović</surname><given-names>I</given-names></string-name>, <string-name name-style="western"><surname>Kind</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Ji</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Fiehn</surname><given-names>O.</given-names></string-name></person-group> <article-title>Software tools and approaches for compound identification of LC-MS/MS data in metabolomics</article-title>. <source>Metabolites</source>. <year>2018</year>;<volume>8</volume>:<fpage>31</fpage>.<pub-id pub-id-type="doi">10.3390/metabo8020031</pub-id></mixed-citation></ref>
<ref id="osaf017-B71"><label>71</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Chaleckis</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Meister</surname><given-names>I</given-names></string-name>, <string-name name-style="western"><surname>Zhang</surname><given-names>P</given-names></string-name>, <string-name name-style="western"><surname>Wheelock</surname><given-names>CE.</given-names></string-name></person-group> <article-title>Challenges, progress and promises of metabolite annotation for LC–MS-based metabolomics</article-title>. <source>Curr Opin Biotechnol</source>. <year>2019</year>;<volume>55</volume>:<fpage>44</fpage>-<lpage>50</lpage>. <pub-id pub-id-type="doi">10.1016/j.copbio.2018.07.010</pub-id></mixed-citation></ref>
<ref id="osaf017-B72"><label>72</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Oberacher</surname><given-names>H</given-names></string-name>, <string-name name-style="western"><surname>Sasse</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Antignac</surname><given-names>J-P</given-names></string-name></person-group>, <etal>et al</etal> <article-title>A European proposal for quality control and quality assurance of tandem mass spectral libraries</article-title>. <source>Environ Sci Eur</source>. <year>2020</year>;<volume>32</volume>:<fpage>43</fpage>.<pub-id pub-id-type="doi">10.1186/s12302-020-00314-9</pub-id></mixed-citation></ref>
<ref id="osaf017-B73"><label>73</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>de Jonge</surname><given-names>NF</given-names></string-name>, <string-name name-style="western"><surname>Mildau</surname><given-names>K</given-names></string-name>, <string-name name-style="western"><surname>Meijer</surname><given-names>D</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Good practices and recommendations for using and benchmarking computational metabolomics metabolite annotation tools</article-title>. <source>Metabolomics</source>. <year>2022</year>;<volume>18</volume>:<fpage>103</fpage>.<pub-id pub-id-type="doi">10.1007/s11306-022-01963-y</pub-id></mixed-citation></ref>
<ref id="osaf017-B74"><label>74</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Giera</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Aisporna</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Uritboonthai</surname><given-names>W</given-names></string-name>, <string-name name-style="western"><surname>Siuzdak</surname><given-names>G.</given-names></string-name></person-group> <article-title>The hidden impact of in-source fragmentation in metabolic and chemical mass spectrometry data interpretation</article-title>. <source>Nat Metab</source>. <year>2024</year>;<volume>6</volume>:<fpage>1647</fpage>-<lpage>1648</lpage>. <pub-id pub-id-type="doi">10.1038/s42255-024-01076-x</pub-id></mixed-citation></ref>
<ref id="osaf017-B75"><label>75</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>El Abiead</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Rutz</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Zuffa</surname><given-names>S</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Discovery of metabolites prevails amid in-source fragmentation</article-title>. <source>Nat Metab</source>. <year>2025</year>;<volume>7</volume>:<fpage>435</fpage>-<lpage>437</lpage>. <pub-id pub-id-type="doi">10.1038/s42255-025-01239-4</pub-id></mixed-citation></ref>
<ref id="osaf017-B76"><label>76</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Schmid</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Petras</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Nothias</surname><given-names>L-F</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Ion identity molecular networking for mass spectrometry-based metabolomics in the GNPS environment</article-title>. <source>Nat Commun</source>. <year>2021</year>;<volume>12</volume>:<fpage>3832</fpage>.<pub-id pub-id-type="doi">10.1038/s41467-021-23953-9</pub-id></mixed-citation></ref>
<ref id="osaf017-B77"><label>77</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Xu</surname><given-names>Y-F</given-names></string-name>, <string-name name-style="western"><surname>Lu</surname><given-names>W</given-names></string-name>, <string-name name-style="western"><surname>Rabinowitz</surname><given-names>JD.</given-names></string-name></person-group> <article-title>Avoiding misannotation of in-source fragmentation products as cellular metabolites in liquid chromatography-mass spectrometry-based metabolomics</article-title>. <source>Anal Chem</source>. <year>2015</year>;<volume>87</volume>:<fpage>2273</fpage>-<lpage>2281</lpage>. <pub-id pub-id-type="doi">10.1021/ac504118y</pub-id></mixed-citation></ref>
<ref id="osaf017-B78"><label>78</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Xue</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Domingo-Almenara</surname><given-names>X</given-names></string-name>, <string-name name-style="western"><surname>Guijas</surname><given-names>C</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Enhanced in-source fragmentation annotation enables novel data independent acquisition and autonomous METLIN molecular identification</article-title>. <source>Anal Chem</source>. <year>2020</year>;<volume>92</volume>:<fpage>6051</fpage>-<lpage>6059</lpage>. <pub-id pub-id-type="doi">10.1021/acs.analchem.0c00409</pub-id></mixed-citation></ref>
<ref id="osaf017-B79"><label>79</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Krier</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Singh</surname><given-names>RR</given-names></string-name>, <string-name name-style="western"><surname>Kondić</surname><given-names>T</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Discovering pesticides and their TPs in Luxembourg waters using open cheminformatics approaches</article-title>. <source>Environ Int</source>. <year>2022</year>;<volume>158</volume>:<fpage>106885</fpage>.<pub-id pub-id-type="doi">10.1016/j.envint.2021.106885</pub-id></mixed-citation></ref>
<ref id="osaf017-B80"><label>80</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Hollender</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Bourgin</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Fenner</surname><given-names>KB</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Exploring the behaviour of emerging contaminants in the water cycle using the capabilities of high resolution mass spectrometry</article-title>. <source>Chimia (Aarau)</source>. <year>2014</year>;<volume>68</volume>:<fpage>793</fpage>-<lpage>798</lpage>. <pub-id pub-id-type="doi">10.2533/chimia.2014.793</pub-id></mixed-citation></ref>
<ref id="osaf017-B81"><label>81</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Schymanski</surname><given-names>EL</given-names></string-name>, <string-name name-style="western"><surname>Jeon</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Gulde</surname><given-names>R</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Identifying small molecules via high resolution mass spectrometry: communicating confidence</article-title>. <source>Environ Sci Technol</source>. <year>2014</year>;<volume>48</volume>:<fpage>2097</fpage>-<lpage>2098</lpage>. <pub-id pub-id-type="doi">10.1021/es5002105</pub-id></mixed-citation></ref>
<ref id="osaf017-B82"><label>82</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Koelmel</surname><given-names>JP</given-names></string-name>, <string-name name-style="western"><surname>Kroeger</surname><given-names>NM</given-names></string-name>, <string-name name-style="western"><surname>Ulmer</surname><given-names>CZ</given-names></string-name></person-group>, <etal>et al</etal> <article-title>LipidMatch: an automated workflow for rule-based lipid identification using untargeted high-resolution tandem mass spectrometry data</article-title>. <source>BMC Bioinformatics</source>. <year>2017</year>;<volume>18</volume>:<fpage>331</fpage>.<pub-id pub-id-type="doi">10.1186/s12859-017-1744-3</pub-id></mixed-citation></ref>
<ref id="osaf017-B83"><label>83</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Sumner</surname><given-names>LW</given-names></string-name>, <string-name name-style="western"><surname>Amberg</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Barrett</surname><given-names>D</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Proposed minimum reporting standards for chemical analysis</article-title>. <source>Metabolomics</source>. <year>2007</year>;<volume>3</volume>:<fpage>211</fpage>-<lpage>221</lpage>. <pub-id pub-id-type="doi">10.1007/s11306-7–0082-2</pub-id></mixed-citation></ref>
<ref id="osaf017-B84"><label>84</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Celma</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Sancho</surname><given-names>JV</given-names></string-name>, <string-name name-style="western"><surname>Schymanski</surname><given-names>EL</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Improving target and suspect screening high-resolution mass spectrometry workflows in environmental analysis by ion mobility separation</article-title>. <source>Environ Sci Technol</source>. <year>2020</year>;<volume>54</volume>:<fpage>15120</fpage>-<lpage>15131</lpage>. <pub-id pub-id-type="doi">10.1021/acs.est.0c05713</pub-id></mixed-citation></ref>
<ref id="osaf017-B85"><label>85</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Charbonnet</surname><given-names>JA</given-names></string-name>, <string-name name-style="western"><surname>McDonough</surname><given-names>CA</given-names></string-name>, <string-name name-style="western"><surname>Xiao</surname><given-names>F</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Communicating confidence of per- and polyfluoroalkyl substance identification via high-resolution mass spectrometry</article-title>. <source>Environ Sci Technol Lett</source>. <year>2022</year>;<volume>9</volume>:<fpage>473</fpage>-<lpage>481</lpage>. <pub-id pub-id-type="doi">10.1021/acs.estlett.2c00206</pub-id></mixed-citation></ref>
<ref id="osaf017-B86"><label>86</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Koelmel</surname><given-names>JP</given-names></string-name>, <string-name name-style="western"><surname>Xie</surname><given-names>H</given-names></string-name>, <string-name name-style="western"><surname>Price</surname><given-names>EJ</given-names></string-name></person-group>, <etal>et al</etal> <article-title>An actionable annotation scoring framework for gas chromatography-high-resolution mass spectrometry</article-title>. <source>Exposome</source>. <year>2022</year>;<volume>2</volume>:<fpage>osac007</fpage>.<pub-id pub-id-type="doi">10.1093/exposome/osac007</pub-id></mixed-citation></ref>
<ref id="osaf017-B87"><label>87</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Schymanski</surname><given-names>EL</given-names></string-name>, <string-name name-style="western"><surname>Kondić</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Neumann</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Thiessen</surname><given-names>PA</given-names></string-name>, <string-name name-style="western"><surname>Zhang</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Bolton</surname><given-names>EE.</given-names></string-name></person-group> <article-title>Empowering large chemical knowledge bases for exposomics: PubChemLite meets MetFrag</article-title>. <source>J Cheminform</source>. <year>2021</year>;<volume>13</volume>:<fpage>19</fpage>.<pub-id pub-id-type="doi">10.1186/s13321-021-00489-0</pub-id></mixed-citation></ref>
<ref id="osaf017-B88"><label>88</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Creek</surname><given-names>DJ</given-names></string-name>, <string-name name-style="western"><surname>Dunn</surname><given-names>WB</given-names></string-name>, <string-name name-style="western"><surname>Fiehn</surname><given-names>O</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Metabolite identification: are you sure? And how do your peers gauge your confidence?</article-title> <source>Metabolomics</source>. <year>2014</year>;<volume>10</volume>:<fpage>350</fpage>-<lpage>353</lpage>. <pub-id pub-id-type="doi">10.1007/s11306-014-0656-8</pub-id></mixed-citation></ref>
<ref id="osaf017-B89"><label>89</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Liebisch</surname><given-names>G</given-names></string-name>, <string-name name-style="western"><surname>Vizcaíno</surname><given-names>JA</given-names></string-name>, <string-name name-style="western"><surname>Köfeler</surname><given-names>H</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Shorthand notation for lipid structures derived from mass spectrometry</article-title>. <source>J Lipid Res</source>. <year>2013</year>;<volume>54</volume>:<fpage>1523</fpage>-<lpage>1530</lpage>. <pub-id pub-id-type="doi">10.1194/jlr.M033506</pub-id></mixed-citation></ref>
<ref id="osaf017-B90"><label>90</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Scheubert</surname><given-names>K</given-names></string-name>, <string-name name-style="western"><surname>Hufsky</surname><given-names>F</given-names></string-name>, <string-name name-style="western"><surname>Petras</surname><given-names>D</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Significance estimation for large scale metabolomics annotations by spectral matching</article-title>. <source>Nat Commun</source>. <year>2017</year>;<volume>8</volume>:<fpage>1494</fpage>.<pub-id pub-id-type="doi">10.1038/s41467-017-01318-5</pub-id></mixed-citation></ref>
<ref id="osaf017-B91"><label>91</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Metz</surname><given-names>TO</given-names></string-name>, <string-name name-style="western"><surname>Chang</surname><given-names>CH</given-names></string-name>, <string-name name-style="western"><surname>Gautam</surname><given-names>V</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Introducing “identification probability” for automated and transferable assessment of metabolite identification confidence in metabolomics and related studies</article-title>. <source>Anal Chem</source>. <year>2025</year>;<volume>97</volume>:<fpage>1</fpage>-<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1021/acs.analchem.4c04060</pub-id></mixed-citation></ref>
<ref id="osaf017-B92"><label>92</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Talavera Andújar</surname><given-names>B</given-names></string-name>, <string-name name-style="western"><surname>Aurich</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Aho</surname><given-names>VTE</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Studying the Parkinson’s disease metabolome and exposome in biological samples through different analytical and cheminformatics approaches: a pilot study</article-title>. <source>Anal Bioanal Chem</source>. <year>2022</year>;<volume>414</volume>:<fpage>7399</fpage>-<lpage>7419</lpage>. <pub-id pub-id-type="doi">10.1007/s00216-2–04207-z</pub-id></mixed-citation></ref>
<ref id="osaf017-B93"><label>93</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Alygizakis</surname><given-names>N</given-names></string-name>, <string-name name-style="western"><surname>Lestremau</surname><given-names>F</given-names></string-name>, <string-name name-style="western"><surname>Gago-Ferrero</surname><given-names>P</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Towards a harmonized identification scoring system in LC-HRMS/MS based non-target screening (NTS) of emerging contaminants</article-title>. <source>TrAC Trends Anal Chem</source>. <year>2023</year>;<volume>159</volume>:<fpage>116944</fpage>.<pub-id pub-id-type="doi">10.1016/j.trac.2023.116944</pub-id></mixed-citation></ref>
<ref id="osaf017-B94"><label>94</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Boatman</surname><given-names>AK</given-names></string-name>, <string-name name-style="western"><surname>Chappel</surname><given-names>JR</given-names></string-name>, <string-name name-style="western"><surname>Kirkwood-Donelson</surname><given-names>KI</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Updated guidance for communicating PFAS identification confidence with ion mobility spectrometry</article-title>. <source>Environ Sci Technol</source>. <year>2025</year>;<volume>59</volume>:<fpage>17711</fpage>-<lpage>17721</lpage>. <pub-id pub-id-type="doi">10.1021/acs.est.5c01354</pub-id></mixed-citation></ref>
<ref id="osaf017-B95"><label>95</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Bittremieux</surname><given-names>W</given-names></string-name>, <string-name name-style="western"><surname>Wang</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Dorrestein</surname><given-names>PC.</given-names></string-name></person-group> <article-title>The critical role that spectral libraries play in capturing the metabolomics community knowledge</article-title>. <source>Metabolomics</source>. <year>2022</year>;<volume>18</volume>:<fpage>94</fpage>.<pub-id pub-id-type="doi">10.1007/s11306-022-01947-y</pub-id></mixed-citation></ref>
<ref id="osaf017-B96"><label>96</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Horai</surname><given-names>H</given-names></string-name>, <string-name name-style="western"><surname>Arita</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Kanaya</surname><given-names>S</given-names></string-name></person-group>, <etal>et al</etal> <article-title>MassBank: a public repository for sharing mass spectral data for life sciences</article-title>. <source>J Mass Spectrom</source>. <year>2010</year>;<volume>45</volume>:<fpage>703</fpage>-<lpage>714</lpage>. <pub-id pub-id-type="doi">10.1002/jms.1777</pub-id></mixed-citation></ref>
<ref id="osaf017-B97"><label>97</label><mixed-citation publication-type="other">MassBank of North America. Accessed September 11, 2023. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://mona.fiehnlab.ucdavis.edu/">https://mona.fiehnlab.ucdavis.edu/</ext-link></mixed-citation></ref>
<ref id="osaf017-B98"><label>98</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wang</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Carver</surname><given-names>JJ</given-names></string-name>, <string-name name-style="western"><surname>Phelan</surname><given-names>VV</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Sharing and community curation of mass spectrometry data with Global Natural Products Social Molecular Networking</article-title>. <source>Nat Biotechnol</source>. <year>2016</year>;<volume>34</volume>:<fpage>828</fpage>-<lpage>837</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.3597</pub-id></mixed-citation></ref>
<ref id="osaf017-B99"><label>99</label><mixed-citation publication-type="other">mzCloud—Advanced Mass Spectral Database. Accessed April 28, 2024. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://www.mzcloud.org/">https://www.mzcloud.org/</ext-link></mixed-citation></ref>
<ref id="osaf017-B100"><label>100</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Guijas</surname><given-names>C</given-names></string-name>, <string-name name-style="western"><surname>Montenegro-Burke</surname><given-names>JR</given-names></string-name>, <string-name name-style="western"><surname>Domingo-Almenara</surname><given-names>X</given-names></string-name></person-group>, <etal>et al</etal> <article-title>METLIN: a technology platform for identifying knowns and unknowns</article-title>. <source>Anal Chem</source>. <year>2018</year>;<volume>90</volume>:<fpage>3156</fpage>-<lpage>3164</lpage>. <pub-id pub-id-type="doi">10.1021/acs.analchem.7b04424</pub-id></mixed-citation></ref>
<ref id="osaf017-B101"><label>101</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Stein</surname><given-names>SE</given-names></string-name>, <string-name name-style="western"><surname>Scott</surname><given-names>DR.</given-names></string-name></person-group> <article-title>Optimization and testing of mass spectral library search algorithms for compound identification</article-title>. <source>J Am Soc Mass Spectrom</source>. <year>1994</year>;<volume>5</volume>:<fpage>5:859</fpage>-<lpage>866</lpage>. <pub-id pub-id-type="doi">10.1016/1044(94)87009-8</pub-id></mixed-citation></ref>
<ref id="osaf017-B102"><label>102</label><mixed-citation publication-type="other">PubChem Classification Browser. Accessed May 19, 2024. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://pubchem.ncbi.nlm.nih.gov/classification/#hid=72">https://pubchem.ncbi.nlm.nih.gov/classification/#hid=72</ext-link></mixed-citation></ref>
<ref id="osaf017-B103"><label>103</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Li</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Kind</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Folz</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Vaniya</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Mehta</surname><given-names>SS</given-names></string-name>, <string-name name-style="western"><surname>Fiehn</surname><given-names>O.</given-names></string-name></person-group> <article-title>Spectral entropy outperforms MS/MS dot product similarity for small-molecule compound identification</article-title>. <source>Nat Methods</source>. <year>2021</year>;<volume>18</volume>:<fpage>1524</fpage>-<lpage>1531</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-021-01331-z</pub-id></mixed-citation></ref>
<ref id="osaf017-B104"><label>104</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Ruttkies</surname><given-names>C</given-names></string-name>, <string-name name-style="western"><surname>Schymanski</surname><given-names>EL</given-names></string-name>, <string-name name-style="western"><surname>Wolf</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Hollender</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Neumann</surname><given-names>S.</given-names></string-name></person-group> <article-title>MetFrag relaunched: incorporating strategies beyond in silico fragmentation</article-title>. <source>J Cheminform</source>. <year>2016</year>;<volume>8</volume>:<fpage>3</fpage>.<pub-id pub-id-type="doi">10.1186/s13321-016-0115-9</pub-id></mixed-citation></ref>
<ref id="osaf017-B105"><label>105</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Tsugawa</surname><given-names>H</given-names></string-name>, <string-name name-style="western"><surname>Kind</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Nakabayashi</surname><given-names>R</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Hydrogen rearrangement rules: computational MS/MS fragmentation and structure elucidation using MS-FINDER software</article-title>. <source>Anal Chem</source>. <year>2016</year>;<volume>88</volume>:<fpage>7946</fpage>-<lpage>7958</lpage>. <pub-id pub-id-type="doi">10.1021/acs.analchem.6b00770</pub-id></mixed-citation></ref>
<ref id="osaf017-B106"><label>106</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Allen</surname><given-names>F</given-names></string-name>, <string-name name-style="western"><surname>Pon</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Wilson</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Greiner</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Wishart</surname><given-names>D.</given-names></string-name></person-group> <article-title>CFM-ID: a web server for annotation, spectrum prediction and metabolite identification from tandem mass spectra</article-title>. <source>Nucleic Acids Res</source>. <year>2014</year>;<volume>42</volume>:<fpage>W94</fpage>-<lpage>W99</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gku436</pub-id></mixed-citation></ref>
<ref id="osaf017-B107"><label>107</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Dührkop</surname><given-names>K</given-names></string-name>, <string-name name-style="western"><surname>Shen</surname><given-names>H</given-names></string-name>, <string-name name-style="western"><surname>Meusel</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Rousu</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Böcker</surname><given-names>S.</given-names></string-name></person-group> <article-title>Searching molecular structure databases with tandem mass spectra using CSI: FingerID</article-title>. <source>Proc Natl Acad Sci U S A</source>. <year>2015</year>;<volume>112</volume>:<fpage>12580</fpage>-<lpage>12585</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1509788112</pub-id></mixed-citation></ref>
<ref id="osaf017-B108"><label>108</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Dührkop</surname><given-names>K</given-names></string-name>, <string-name name-style="western"><surname>Fleischauer</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Ludwig</surname><given-names>M</given-names></string-name></person-group>, <etal>et al</etal> <article-title>SIRIUS 4: a rapid tool for turning tandem mass spectra into metabolite structure information</article-title>. <source>Nat Methods</source>. <year>2019</year>;<volume>16</volume>:<fpage>299</fpage>-<lpage>302</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-019-0344-8</pub-id></mixed-citation></ref>
<ref id="osaf017-B109"><label>109</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Kind</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Liu</surname><given-names>K-H</given-names></string-name>, <string-name name-style="western"><surname>Lee</surname><given-names>DY</given-names></string-name>, <string-name name-style="western"><surname>DeFelice</surname><given-names>B</given-names></string-name>, <string-name name-style="western"><surname>Meissen</surname><given-names>JK</given-names></string-name>, <string-name name-style="western"><surname>Fiehn</surname><given-names>O.</given-names></string-name></person-group> <article-title>LipidBlast in silico tandem mass spectrometry database for lipid identification</article-title>. <source>Nat Methods</source>. <year>2013</year>;<volume>10</volume>:<fpage>755</fpage>-<lpage>758</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.2551</pub-id></mixed-citation></ref>
<ref id="osaf017-B110"><label>110</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wishart</surname><given-names>DS</given-names></string-name>, <string-name name-style="western"><surname>Feunang</surname><given-names>YD</given-names></string-name>, <string-name name-style="western"><surname>Marcu</surname><given-names>A</given-names></string-name></person-group>, <etal>et al</etal> <article-title>HMDB 4.0: the human metabolome database for 2018</article-title>. <source>Nucleic Acids Res</source>. <year>2018</year>;<volume>46</volume>:<fpage>D608</fpage>-<lpage>D617</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkx1089</pub-id></mixed-citation></ref>
<ref id="osaf017-B111"><label>111</label><mixed-citation publication-type="other">CAS REGISTRY, CAS. Accessed April 30, 2024. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://www.cas.org/cas-data/cas-registry">https://www.cas.org/cas-data/cas-registry</ext-link></mixed-citation></ref>
<ref id="osaf017-B112"><label>112</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Pence</surname><given-names>HE</given-names></string-name>, <string-name name-style="western"><surname>Williams</surname><given-names>A.</given-names></string-name></person-group> <article-title>ChemSpider: an online chemical information resource</article-title>. <source>J Chem Educ</source>. <year>2010</year>;<volume>87</volume>:<fpage>1123</fpage>-<lpage>1124</lpage>. <pub-id pub-id-type="doi">10.1021/ed100697w</pub-id></mixed-citation></ref>
<ref id="osaf017-B113"><label>113</label><mixed-citation publication-type="book"><person-group person-group-type="author"><string-name name-style="western"><surname>Bolton</surname><given-names>EE</given-names></string-name>, <string-name name-style="western"><surname>Wang</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Thiessen</surname><given-names>PA</given-names></string-name>, <string-name name-style="western"><surname>Bryant</surname><given-names>SH.</given-names></string-name></person-group> <chapter-title>Chapter 12 - PubChem: integrated platform of small molecules and biological activities</chapter-title>. In: <person-group person-group-type="editor"><string-name name-style="western"><surname>Wheeler</surname><given-names>RA</given-names></string-name>, <string-name name-style="western"><surname>Spellmeyer</surname><given-names>DC</given-names></string-name></person-group>, eds. <source>Annual Reports in Computational Chemistry</source>. <publisher-name>Elsevier</publisher-name>; <year>2008</year>:<fpage>217</fpage>-<lpage>241</lpage>.</mixed-citation></ref>
<ref id="osaf017-B114"><label>114</label><mixed-citation publication-type="other"><person-group person-group-type="author"><string-name name-style="western"><surname>Bolton</surname><given-names>E</given-names></string-name>, <string-name name-style="western"><surname>Schymanski</surname><given-names>E</given-names></string-name>, <string-name name-style="western"><surname>Kondic</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Thiessen</surname><given-names>P</given-names></string-name>, <string-name name-style="western"><surname>Zhang</surname><given-names>J.</given-names></string-name></person-group> PubChemLite for Exposomics. <year>2020</year>.</mixed-citation></ref>
<ref id="osaf017-B115"><label>115</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Elapavalore</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Ross</surname><given-names>DH</given-names></string-name>, <string-name name-style="western"><surname>Grouès</surname><given-names>V</given-names></string-name></person-group>, <etal>et al</etal> <article-title>PubChemLite Plus Collision Cross Section (CCS) values for enhanced interpretation of nontarget environmental data</article-title>. <source>Environ Sci Technol Lett</source>. <year>2025</year>;<volume>12</volume>:<fpage>166</fpage>-<lpage>174</lpage>. <pub-id pub-id-type="doi">10.1021/acs.estlett.4c01003</pub-id></mixed-citation></ref>
<ref id="osaf017-B116"><label>116</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Barupal</surname><given-names>DK</given-names></string-name>, <string-name name-style="western"><surname>Fiehn</surname><given-names>O.</given-names></string-name></person-group> <article-title>Generating the blood exposome database using a comprehensive text mining and database fusion approach</article-title>. <source>Environ Health Perspect</source>. <year>2019</year>;<volume>127</volume>:<fpage>97008</fpage>.<pub-id pub-id-type="doi">10.1289/EHP4713</pub-id></mixed-citation></ref>
<ref id="osaf017-B117"><label>117</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Kanehisa</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Goto</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Hattori</surname><given-names>M</given-names></string-name></person-group>, <etal>et al</etal> <article-title>From genomics to chemical genomics: new developments in KEGG</article-title>. <source>Nucleic Acids Res</source>. <year>2006</year>;<volume>34</volume>:<fpage>D354</fpage>-<lpage>D357</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkj102</pub-id></mixed-citation></ref>
<ref id="osaf017-B118"><label>118</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Caspi</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Foerster</surname><given-names>H</given-names></string-name>, <string-name name-style="western"><surname>Fulcher</surname><given-names>CA</given-names></string-name></person-group>, <etal>et al</etal> <article-title>The MetaCyc Database of metabolic pathways and enzymes and the BioCyc collection of Pathway/Genome Databases</article-title>. <source>Nucleic Acids Res</source>. <year>2008</year>;<volume>36</volume>:<fpage>D623</fpage>-<lpage>D631</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkm900</pub-id></mixed-citation></ref>
<ref id="osaf017-B119"><label>119</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Sud</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Fahy</surname><given-names>E</given-names></string-name>, <string-name name-style="western"><surname>Cotter</surname><given-names>D</given-names></string-name></person-group>, <etal>et al</etal> <article-title>LMSD: LIPID MAPS structure database</article-title>. <source>Nucleic Acids Res</source>. <year>2007</year>;<volume>35</volume>:<fpage>D527</fpage>-<lpage>D532</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkl838</pub-id></mixed-citation></ref>
<ref id="osaf017-B120"><label>120</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wishart</surname><given-names>DS</given-names></string-name>, <string-name name-style="western"><surname>Oler</surname><given-names>E</given-names></string-name>, <string-name name-style="western"><surname>Peters</surname><given-names>H</given-names></string-name></person-group>, <etal>et al</etal> <article-title>MiMeDB: the human microbial metabolome database</article-title>. <source>Nucleic Acids Res</source>. <year>2023</year>;<volume>51</volume>:<fpage>D611</fpage>-<lpage>D620</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkac868</pub-id></mixed-citation></ref>
<ref id="osaf017-B121"><label>121</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Williams</surname><given-names>AJ</given-names></string-name>, <string-name name-style="western"><surname>Grulke</surname><given-names>CM</given-names></string-name>, <string-name name-style="western"><surname>Edwards</surname><given-names>J</given-names></string-name></person-group>, <etal>et al</etal> <article-title>The CompTox Chemistry Dashboard: a community data resource for environmental chemistry</article-title>. <source>J Cheminform</source>. <year>2017</year>;<volume>9</volume>:<fpage>61</fpage>.<pub-id pub-id-type="doi">10.1186/s13321-017-0247-6</pub-id></mixed-citation></ref>
<ref id="osaf017-B122"><label>122</label><mixed-citation publication-type="other"><year>Talavera Andújar B</year>. uniluxembourg/LCSB/Environmental Cheminformatics/Exposomics plots. GitLab. In: GitLab. Accessed July 21, 2025. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://gitlab.com/uniluxembourg/lcsb/eci/exposomics-plots">https://gitlab.com/uniluxembourg/lcsb/eci/exposomics-plots</ext-link></mixed-citation></ref>
<ref id="osaf017-B123"><label>123</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Samanipour</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Barron</surname><given-names>LP</given-names></string-name>, <string-name name-style="western"><surname>van Herwerden</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Praetorius</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Thomas</surname><given-names>KV</given-names></string-name>, <string-name name-style="western"><surname>O’Brien</surname><given-names>JW.</given-names></string-name></person-group> <article-title>Exploring the chemical space of the exposome: how far have we gone?</article-title> <source>JACS Au</source>. <year>2024</year>;<volume>4</volume>:<fpage>2412</fpage>-<lpage>2425</lpage>. <pub-id pub-id-type="doi">10.1021/jacsau.4c00220</pub-id></mixed-citation></ref>
<ref id="osaf017-B124"><label>124</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Palm</surname><given-names>EH</given-names></string-name>, <string-name name-style="western"><surname>Chirsir</surname><given-names>P</given-names></string-name>, <string-name name-style="western"><surname>Krier</surname><given-names>J</given-names></string-name></person-group>, <etal>et al</etal> <article-title>ShinyTPs: curating transformation products from text mining results</article-title>. <source>Environ Sci Technol Lett</source>. <year>2023</year>;<volume>10</volume>:<fpage>865</fpage>-<lpage>871</lpage>. <pub-id pub-id-type="doi">10.1021/acs.estlett.3c00537</pub-id></mixed-citation></ref>
<ref id="osaf017-B125"><label>125</label><mixed-citation publication-type="other">NORMAN-SLE. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://www.norman-network.com/nds/SLE/">https://www.norman-network.com/nds/SLE/</ext-link></mixed-citation></ref>
<ref id="osaf017-B126"><label>126</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Helmus</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Van De Velde</surname><given-names>B</given-names></string-name>, <string-name name-style="western"><surname>Brunner</surname><given-names>AM</given-names></string-name>, <string-name name-style="western"><surname>Ter Laak</surname><given-names>TL</given-names></string-name>, <string-name name-style="western"><surname>Van Wezel</surname><given-names>AP</given-names></string-name>, <string-name name-style="western"><surname>Schymanski</surname><given-names>EL.</given-names></string-name></person-group> <article-title>patRoon 2.0: improved non-target analysis workflowsincluding automated transformation product screening</article-title>. <source>Joss</source>. <year>2022</year>;<volume>7</volume>:<fpage>4029</fpage>.<pub-id pub-id-type="doi">10.21105/joss.04029</pub-id></mixed-citation></ref>
<ref id="osaf017-B127"><label>127</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Djoumbou-Feunang</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Fiamoncini</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Gil-de-la-Fuente</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Greiner</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Manach</surname><given-names>C</given-names></string-name>, <string-name name-style="western"><surname>Wishart</surname><given-names>DS.</given-names></string-name></person-group> <article-title>BioTransformer: a comprehensive computational tool for small molecule metabolism prediction and metabolite identification</article-title>. <source>J Cheminform</source>. <year>2019</year>;<volume>11</volume>:<fpage>2</fpage>.<pub-id pub-id-type="doi">10.1186/s13321-018-0324-5</pub-id></mixed-citation></ref>
<ref id="osaf017-B128"><label>128</label><mixed-citation publication-type="other">CompTox Chemicals Dashboard Chemical Lists. Accessed April 30, 2024. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://comptox.epa.gov/dashboard/chemical-lists">https://comptox.epa.gov/dashboard/chemical-lists</ext-link></mixed-citation></ref>
<ref id="osaf017-B129"><label>129</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Gertsman</surname><given-names>I</given-names></string-name>, <string-name name-style="western"><surname>Barshop</surname><given-names>BA.</given-names></string-name></person-group> <article-title>Promises and pitfalls of untargeted metabolomics</article-title>. <source>J Inherit Metab Dis</source>. <year>2018</year>;<volume>41</volume>:<fpage>355</fpage>-<lpage>366</lpage>. <pub-id pub-id-type="doi">10.1007/s10545-017-0130-7</pub-id></mixed-citation></ref>
<ref id="osaf017-B130"><label>130</label><mixed-citation publication-type="book"><person-group person-group-type="author"><string-name name-style="western"><surname>Karaman</surname><given-names>I.</given-names></string-name></person-group> <chapter-title>Preprocessing and pretreatment of metabolomics data for statistical analysis</chapter-title>. In: <person-group person-group-type="editor"><string-name name-style="western"><surname>Sussulini</surname><given-names>A</given-names></string-name></person-group>, ed. <source>Metabolomics: From Fundamentals to Clinical Applications</source>. <publisher-name>Springer International Publishing</publisher-name>; <year>2017</year>:<fpage>145</fpage>-<lpage>161</lpage>.</mixed-citation></ref>
<ref id="osaf017-B131"><label>131</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>van den Berg</surname><given-names>RA</given-names></string-name>, <string-name name-style="western"><surname>Hoefsloot</surname><given-names>HC</given-names></string-name>, <string-name name-style="western"><surname>Westerhuis</surname><given-names>JA</given-names></string-name>, <string-name name-style="western"><surname>Smilde</surname><given-names>AK</given-names></string-name>, <string-name name-style="western"><surname>van der Werf</surname><given-names>MJ.</given-names></string-name></person-group> <article-title>Centering, scaling, and transformations: improving the biological information content of metabolomics data</article-title>. <source>BMC Genomics</source>. <year>2006</year>;<volume>7</volume>:<fpage>142</fpage>.<pub-id pub-id-type="doi">10.1186/1471-2164-7-142</pub-id></mixed-citation></ref>
<ref id="osaf017-B132"><label>132</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Ren</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Hinzman</surname><given-names>AA</given-names></string-name>, <string-name name-style="western"><surname>Kang</surname><given-names>EL</given-names></string-name>, <string-name name-style="western"><surname>Szczesniak</surname><given-names>RD</given-names></string-name>, <string-name name-style="western"><surname>Lu</surname><given-names>LJ.</given-names></string-name></person-group> <article-title>Computational and statistical analysis of metabolomics data</article-title>. <source>Metabolomics</source>. <year>2015</year>;<volume>11</volume>:<fpage>1492</fpage>-<lpage>1513</lpage>. <pub-id pub-id-type="doi">10.1007/s11306-015-0823-6</pub-id></mixed-citation></ref>
<ref id="osaf017-B133"><label>133</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Misra</surname><given-names>BB.</given-names></string-name></person-group> <article-title>Data normalization strategies in metabolomics: current challenges, approaches, and tools</article-title>. <source>Eur J Mass Spectrom (Chichester)</source>. <year>2020</year>;<volume>26</volume>:<fpage>165</fpage>-<lpage>174</lpage>. <pub-id pub-id-type="doi">10.1177/1469066720918446</pub-id></mixed-citation></ref>
<ref id="osaf017-B134"><label>134</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wu</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Li</surname><given-names>L.</given-names></string-name></person-group> <article-title>Sample normalization methods in quantitative metabolomics</article-title>. <source>J Chromatogr A</source>. <year>2016</year>;<volume>1430</volume>:<fpage>80</fpage>-<lpage>95</lpage>. <pub-id pub-id-type="doi">10.1016/j.chroma.2015.12.007</pub-id></mixed-citation></ref>
<ref id="osaf017-B135"><label>135</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Barupal</surname><given-names>DK</given-names></string-name>, <string-name name-style="western"><surname>Fan</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Fiehn</surname><given-names>O.</given-names></string-name></person-group> <article-title>Integrating bioinformatics approaches for a comprehensive interpretation of metabolomics datasets</article-title>. <source>Curr Opin Biotechnol</source>. <year>2018</year>;<volume>54</volume>:<fpage>1</fpage>-<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1016/j.copbio.2018.01.010</pub-id></mixed-citation></ref>
<ref id="osaf017-B136"><label>136</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Chen</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Li</surname><given-names>E-M</given-names></string-name>, <string-name name-style="western"><surname>Xu</surname><given-names>L-Y.</given-names></string-name></person-group> <article-title>Guide to metabolomics analysis: a bioinformatics workflow</article-title>. <source>Metabolites</source>. <year>2022</year>;<volume>12</volume>:<fpage>357</fpage>.<pub-id pub-id-type="doi">10.3390/metabo12040357</pub-id></mixed-citation></ref>
<ref id="osaf017-B137"><label>137</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Vinaixa</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Samino</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Saez</surname><given-names>I</given-names></string-name>, <string-name name-style="western"><surname>Duran</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Guinovart</surname><given-names>JJ</given-names></string-name>, <string-name name-style="western"><surname>Yanes</surname><given-names>O.</given-names></string-name></person-group> <article-title>A guideline to univariate statistical analysis for LC/MS-based untargeted metabolomics-derived data</article-title>. <source>Metabolites</source>. <year>2012</year>;<volume>2</volume>:<fpage>775</fpage>-<lpage>795</lpage>. <pub-id pub-id-type="doi">10.3390/metabo2040775</pub-id></mixed-citation></ref>
<ref id="osaf017-B138"><label>138</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Pang</surname><given-names>Z</given-names></string-name>, <string-name name-style="western"><surname>Zhou</surname><given-names>G</given-names></string-name>, <string-name name-style="western"><surname>Ewald</surname><given-names>J</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Using MetaboAnalyst 5.0 for LC–HRMS spectra processing, multi-omics integration and covariate adjustment of global metabolomics data</article-title>. <source>Nat Protoc</source>. <year>2022</year>;<volume>17</volume>:<fpage>1735</fpage>-<lpage>1761</lpage>. <pub-id pub-id-type="doi">10.1038/s41596-022-00710-w</pub-id></mixed-citation></ref>
<ref id="osaf017-B139"><label>139</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Santos</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Maitre</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Warembourg</surname><given-names>C</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Applying the exposome concept in birth cohort research: a review of statistical approaches</article-title>. <source>Eur J Epidemiol</source>. <year>2020</year>;<volume>35</volume>:<fpage>193</fpage>-<lpage>204</lpage>. <pub-id pub-id-type="doi">10.1007/s10654-020-00625-4</pub-id></mixed-citation></ref>
<ref id="osaf017-B140"><label>140</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Broadhurst</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Goodacre</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Reinke</surname><given-names>SN</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Guidelines and considerations for the use of system suitability and quality control samples in mass spectrometry assays applied in untargeted clinical metabolomic studies</article-title>. <source>Metabolomics</source>. <year>2018</year>;<volume>14</volume>:<fpage>72</fpage>.<pub-id pub-id-type="doi">10.1007/s11306-018-1367-3</pub-id></mixed-citation></ref>
<ref id="osaf017-B141"><label>141</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Han</surname><given-names>W</given-names></string-name>, <string-name name-style="western"><surname>Li</surname><given-names>L.</given-names></string-name></person-group> <article-title>Evaluating and minimizing batch effects in metabolomics</article-title>. <source>Mass Spectrom Rev</source>. <year>2022</year>;<volume>41</volume>:<fpage>421</fpage>-<lpage>442</lpage>. <pub-id pub-id-type="doi">10.1002/mas.21672</pub-id></mixed-citation></ref>
<ref id="osaf017-B142"><label>142</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Fan</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Kind</surname><given-names>T</given-names></string-name>, <string-name name-style="western"><surname>Cajka</surname><given-names>T</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Systematic error removal using random forest for normalizing large-scale untargeted lipidomics data</article-title>. <source>Anal Chem</source>. <year>2019</year>;<volume>91</volume>:<fpage>3590</fpage>-<lpage>3596</lpage>. <pub-id pub-id-type="doi">10.1021/acs.analchem.8b05592</pub-id></mixed-citation></ref>
<ref id="osaf017-B143"><label>143</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Yu</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Mai</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Zheng</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Shi</surname><given-names>L.</given-names></string-name></person-group> <article-title>Assessing and mitigating batch effects in large-scale omics studies</article-title>. <source>Genome Biol</source>. <year>2024</year>;<volume>25</volume>:<fpage>254</fpage>.<pub-id pub-id-type="doi">10.1186/s13059-024-03401-9</pub-id></mixed-citation></ref>
<ref id="osaf017-B144"><label>144</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Chang</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Ewald</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Hui</surname><given-names>F</given-names></string-name>, <string-name name-style="western"><surname>Bayen</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Xia</surname><given-names>J.</given-names></string-name></person-group> <article-title>A data-centric perspective on exposomics data analysis</article-title>. <source>Exposome</source>. <year>2024</year>;<volume>4</volume>:<fpage>osae005</fpage>. <pub-id pub-id-type="doi">10.1093/exposome/osae005</pub-id></mixed-citation></ref>
<ref id="osaf017-B145"><label>145</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Huang</surname><given-names>S-Y</given-names></string-name>, <string-name name-style="western"><surname>Yang</surname><given-names>Y-X</given-names></string-name>, <string-name name-style="western"><surname>Chen</surname><given-names>S-D</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Investigating causal relationships between exposome and human longevity: a Mendelian randomization analysis</article-title>. <source>BMC Med</source>. <year>2021</year>;<volume>19</volume>:<fpage>150</fpage>.<pub-id pub-id-type="doi">10.1186/s12916-021-02030-4</pub-id></mixed-citation></ref>
<ref id="osaf017-B146"><label>146</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Domenighetti</surname><given-names>C</given-names></string-name>, <string-name name-style="western"><surname>Sugier</surname><given-names>P-E</given-names></string-name>, <string-name name-style="western"><surname>Ashok Kumar Sreelatha</surname><given-names>A</given-names></string-name></person-group>, <collab>Comprehensive Unbiased Risk Factor Assessment for Genetics and Environment in Parkinson’s Disease (Courage-PD) Consortium</collab>, <etal>et al</etal> <article-title>Dairy Intake and Parkinson’s Disease: a Mendelian Randomization Study</article-title>. <source>Mov Disord</source>. <year>2022</year>;<volume>37</volume>:<fpage>857</fpage>-<lpage>864</lpage>. <pub-id pub-id-type="doi">10.1002/mds.28902</pub-id></mixed-citation></ref>
<ref id="osaf017-B147"><label>147</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Li</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Zhou</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Cao</surname><given-names>Z</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Associations of environmental factors with neurodegeneration: an exposome-wide Mendelian randomization investigation</article-title>. <source>Ageing Res Rev</source>. <year>2024</year>;<volume>95</volume>:<fpage>102254</fpage>.<pub-id pub-id-type="doi">10.1016/j.arr.2024.102254</pub-id></mixed-citation></ref>
<ref id="osaf017-B148"><label>148</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Zhao</surname><given-names>Y-L</given-names></string-name>, <string-name name-style="western"><surname>Hao</surname><given-names>Y-N</given-names></string-name>, <string-name name-style="western"><surname>Ge</surname><given-names>Y-J</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Variables associated with cognitive function: an exposome-wide and mendelian randomization analysis</article-title>. <source>Alzheimers Res Ther</source>. <year>2025</year>;<volume>17</volume>:<fpage>13</fpage>.<pub-id pub-id-type="doi">10.1186/s13195-025-01670-5</pub-id></mixed-citation></ref>
<ref id="osaf017-B149"><label>149</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Maitre</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Guimbaud</surname><given-names>J-B</given-names></string-name>, <string-name name-style="western"><surname>Warembourg</surname><given-names>C</given-names></string-name></person-group>, <collab>Exposome Data Challenge Participant Consortium</collab>, <etal>et al</etal> <article-title>State-of-the-art methods for exposure-health studies: results from the exposome data challenge event</article-title>. <source>Environ Int</source>. <year>2022</year>;<volume>168</volume>:<fpage>107422</fpage>.<pub-id pub-id-type="doi">10.1016/j.envint.2022.107422</pub-id></mixed-citation></ref>
<ref id="osaf017-B150"><label>150</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Barupal</surname><given-names>DK</given-names></string-name>, <string-name name-style="western"><surname>Fiehn</surname><given-names>O.</given-names></string-name></person-group> <article-title>Chemical Similarity Enrichment Analysis (ChemRICH) as alternative to biochemical pathway mapping for metabolomic datasets</article-title>. <source>Sci Rep</source>. <year>2017</year>;<volume>7</volume>:<fpage>14567</fpage>.<pub-id pub-id-type="doi">10.1038/s41598-017-15231-w</pub-id></mixed-citation></ref>
<ref id="osaf017-B151"><label>151</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Johnson</surname><given-names>CH</given-names></string-name>, <string-name name-style="western"><surname>Ivanisevic</surname><given-names>J</given-names></string-name>, <string-name name-style="western"><surname>Siuzdak</surname><given-names>G.</given-names></string-name></person-group> <article-title>Metabolomics: beyond biomarkers and towards mechanisms</article-title>. <source>Nat Rev Mol Cell Biol</source>. <year>2016</year>;<volume>17</volume>:<fpage>451</fpage>-<lpage>459</lpage>. <pub-id pub-id-type="doi">10.1038/nrm.2016.25</pub-id></mixed-citation></ref>
<ref id="osaf017-B152"><label>152</label><mixed-citation publication-type="book"><person-group person-group-type="author"><string-name name-style="western"><surname>Xia</surname><given-names>J.</given-names></string-name></person-group> <chapter-title>Computational strategies for biological interpretation of metabolomics data</chapter-title>. In: <person-group person-group-type="editor"><string-name name-style="western"><surname>Sussulini</surname><given-names>A</given-names></string-name></person-group>, ed. <source>Metabolomics: From Fundamentals to Clinical Applications</source>. <publisher-name>Springer International Publishing</publisher-name>; <year>2017</year>:<fpage>191</fpage>-<lpage>206</lpage>.</mixed-citation></ref>
<ref id="osaf017-B153"><label>153</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Li</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Park</surname><given-names>Y</given-names></string-name>, <string-name name-style="western"><surname>Duraisingham</surname><given-names>S</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Predicting network activity from high throughput metabolomics</article-title>. <source>PLOS Comput Biol</source>. <year>2013</year>;<volume>9</volume>:<fpage>e1003123</fpage>.<pub-id pub-id-type="doi">10.1371/journal.pcbi.1003123</pub-id></mixed-citation></ref>
<ref id="osaf017-B154"><label>154</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Rohart</surname><given-names>F</given-names></string-name>, <string-name name-style="western"><surname>Gautier</surname><given-names>B</given-names></string-name>, <string-name name-style="western"><surname>Singh</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Cao</surname><given-names>K-AL.</given-names></string-name></person-group> <article-title>mixOmics: an R package for ‘omics feature selection and multiple data integration</article-title>. <source>PLOS Comput Biol</source>. <year>2017</year>;<volume>13</volume>:<fpage>e1005752</fpage>.<pub-id pub-id-type="doi">10.1371/journal.pcbi.1005752</pub-id></mixed-citation></ref>
<ref id="osaf017-B155"><label>155</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Zuffa</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Schmid</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Bauermeister</surname><given-names>A</given-names></string-name></person-group>, <etal>et al</etal> <article-title>microbeMASST: a taxonomically informed mass spectrometry search tool for microbial metabolomics data</article-title>. <source>Nat Microbiol</source>. <year>2024</year>;<volume>9</volume>:<fpage>336</fpage>-<lpage>345</lpage>. <pub-id pub-id-type="doi">10.1038/s41564-023-01575-9</pub-id></mixed-citation></ref>
<ref id="osaf017-B156"><label>156</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Fiehn</surname><given-names>O</given-names></string-name>, <string-name name-style="western"><surname>Robertson</surname><given-names>D</given-names></string-name>, <string-name name-style="western"><surname>Griffin</surname><given-names>J</given-names></string-name></person-group>, <etal>et al</etal> <article-title>The metabolomics standards initiative (MSI)</article-title>. <source>Metabolomics</source>. <year>2007</year>;<volume>3</volume>:<fpage>175</fpage>-<lpage>178</lpage>. <pub-id pub-id-type="doi">10.1007/s11306-007-0070-6</pub-id></mixed-citation></ref>
<ref id="osaf017-B157"><label>157</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Salek</surname><given-names>RM</given-names></string-name>, <string-name name-style="western"><surname>Neumann</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Schober</surname><given-names>D</given-names></string-name></person-group>, <etal>et al</etal> <article-title>COordination of Standards in MetabOlomicS (COSMOS): facilitating integrated metabolomics data access</article-title>. <source>Metabolomics</source>. <year>2015</year>;<volume>11</volume>:<fpage>1587</fpage>-<lpage>1597</lpage>. <pub-id pub-id-type="doi">10.1007/s11306-015-0810-y</pub-id></mixed-citation></ref>
<ref id="osaf017-B158"><label>158</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Vineis</surname><given-names>P</given-names></string-name>, <string-name name-style="western"><surname>Chadeau-Hyam</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Gmuender</surname><given-names>H</given-names></string-name></person-group>, <collab>EXPOsOMICS Consortium</collab>, <etal>et al</etal> <article-title>The exposome in practice: design of the EXPOsOMICS project</article-title>. <source>Int J Hyg Environ Health</source>. <year>2017</year>;<volume>220</volume>:<fpage>142</fpage>-<lpage>151</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijheh.2016.08.001</pub-id></mixed-citation></ref>
<ref id="osaf017-B159"><label>159</label><mixed-citation publication-type="other">The European Human Exposome Network. Home—The European Human Exposome Network (EHEN). Accessed May 3, 2024. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://www.humanexposome.eu/">https://www.humanexposome.eu/</ext-link></mixed-citation></ref>
<ref id="osaf017-B160"><label>160</label><mixed-citation publication-type="other">NEXUS. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://www.nexus-exposomics.org/">https://www.nexus-exposomics.org/</ext-link></mixed-citation></ref>
<ref id="osaf017-B161"><label>161</label><mixed-citation publication-type="book"><person-group person-group-type="author"><string-name name-style="western"><surname>Niedzwiecki</surname><given-names>MM</given-names></string-name>, <string-name name-style="western"><surname>Miller</surname><given-names>GW.</given-names></string-name></person-group> <chapter-title>HERCULES: an academic center to support exposome research</chapter-title>. In: <person-group person-group-type="editor"><string-name name-style="western"><surname>Dagnino</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Macherone</surname><given-names>A</given-names></string-name></person-group>, eds. <source>Unraveling the Exposome: A Practical View</source>. <publisher-name>Springer International Publishing</publisher-name>, <year>2019</year>:<fpage>339</fpage>-<lpage>348</lpage>.</mixed-citation></ref>
<ref id="osaf017-B162"><label>162</label><mixed-citation publication-type="other">Westat. Human Health Exposure Analysis Resource (HHEAR). Accessed July 15, 2025. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://hhearprogram.org/">https://hhearprogram.org/</ext-link></mixed-citation></ref>
<ref id="osaf017-B163"><label>163</label><mixed-citation publication-type="other">International Human Exposome Network. IHEN—The International Human Exposome Network. In: IHEN. Accessed July 15, 2025. <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://humanexposome.net/">https://humanexposome.net/</ext-link></mixed-citation></ref>
<ref id="osaf017-B164"><label>164</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Aharoni</surname><given-names>A</given-names></string-name>, <string-name name-style="western"><surname>Goodacre</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Fernie</surname><given-names>AR.</given-names></string-name></person-group> <article-title>Plant and microbial sciences as key drivers in the development of metabolomics research</article-title>. <source>Proc Natl Acad Sci U S A</source>. <year>2023</year>;<volume>120</volume>:<fpage>e2217383120</fpage>.<pub-id pub-id-type="doi">10.1073/pnas.2217383120</pub-id></mixed-citation></ref>
<ref id="osaf017-B165"><label>165</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Frigerio</surname><given-names>G</given-names></string-name>, <string-name name-style="western"><surname>Moruzzi</surname><given-names>C</given-names></string-name>, <string-name name-style="western"><surname>Mercadante</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Schymanski</surname><given-names>EL</given-names></string-name>, <string-name name-style="western"><surname>Fustinoni</surname><given-names>S.</given-names></string-name></person-group> <article-title>Development and application of an LC-MS/MS untargeted exposomics method with a separated pooled quality control strategy</article-title>. <source>Molecules</source>. <year>2022</year>;<volume>27</volume>:<fpage>2580</fpage>.<pub-id pub-id-type="doi">10.3390/molecules27082580</pub-id></mixed-citation></ref>
<ref id="osaf017-B166"><label>166</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Broeckling</surname><given-names>CD</given-names></string-name>, <string-name name-style="western"><surname>Beger</surname><given-names>RD</given-names></string-name>, <string-name name-style="western"><surname>Cheng</surname><given-names>LL</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Current practices in LC-MS untargeted metabolomics: a scoping review on the use of pooled quality control samples</article-title>. <source>Anal Chem</source>. <year>2023</year>;<volume>95</volume>:<fpage>18645</fpage>-<lpage>18654</lpage>. <pub-id pub-id-type="doi">10.1021/acs.analchem.3c02924</pub-id></mixed-citation></ref>
<ref id="osaf017-B167"><label>167</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Caballero-Casero</surname><given-names>N</given-names></string-name>, <string-name name-style="western"><surname>Belova</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Vervliet</surname><given-names>P</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Towards harmonised criteria in quality assurance and quality control of suspect and non-target LC-HRMS analytical workflows for screening of emerging contaminants in human biomonitoring</article-title>. <source>TrAC Trends Anal Chem</source>. <year>2021</year>;<volume>136</volume>:<fpage>116201</fpage>.<pub-id pub-id-type="doi">10.1016/j.trac.2021.116201</pub-id></mixed-citation></ref>
<ref id="osaf017-B168"><label>168</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Viant</surname><given-names>MR</given-names></string-name>, <string-name name-style="western"><surname>Ebbels</surname><given-names>TMD</given-names></string-name>, <string-name name-style="western"><surname>Beger</surname><given-names>RD</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Use cases, best practice and reporting standards for metabolomics in regulatory toxicology</article-title>. <source>Nat Commun</source>. <year>2019</year>;<volume>10</volume>:<fpage>3041</fpage>.<pub-id pub-id-type="doi">10.1038/s41467-019-10900-y</pub-id></mixed-citation></ref>
<ref id="osaf017-B169"><label>169</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Kirwan</surname><given-names>JA</given-names></string-name>, <string-name name-style="western"><surname>Gika</surname><given-names>H</given-names></string-name>, <string-name name-style="western"><surname>Beger</surname><given-names>RD</given-names></string-name></person-group>, <collab>metabolomics Quality Assurance and Quality Control Consortium (mQACC)</collab>, <etal>et al</etal> <article-title>Quality assurance and quality control reporting in untargeted metabolic phenotyping: mQACC recommendations for analytical quality management</article-title>. <source>Metabolomics</source>. <year>2022</year>;<volume>18</volume>:<fpage>70</fpage>.<pub-id pub-id-type="doi">10.1007/s11306-022-01926-3</pub-id></mixed-citation></ref>
<ref id="osaf017-B170"><label>170</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Haug</surname><given-names>K</given-names></string-name>, <string-name name-style="western"><surname>Cochrane</surname><given-names>K</given-names></string-name>, <string-name name-style="western"><surname>Nainala</surname><given-names>VC</given-names></string-name></person-group>, <etal>et al</etal> <article-title>MetaboLights: a resource evolving in response to the needs of its scientific community</article-title>. <source>Nucleic Acids Res</source>. <year>2020</year>;<volume>48</volume>:<fpage>D440</fpage>-<lpage>D444</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz1019</pub-id></mixed-citation></ref>
<ref id="osaf017-B171"><label>171</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Leao</surname><given-names>TF</given-names></string-name>, <string-name name-style="western"><surname>Clark</surname><given-names>CM</given-names></string-name>, <string-name name-style="western"><surname>Bauermeister</surname><given-names>A</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Quick-start infrastructure for untargeted metabolomics analysis in GNPS</article-title>. <source>Nat Metab</source>. <year>2021</year>;<volume>3</volume>:<fpage>880</fpage>-<lpage>882</lpage>. <pub-id pub-id-type="doi">10.1038/s42255-021-00429-0</pub-id></mixed-citation></ref>
<ref id="osaf017-B172"><label>172</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Chetnik</surname><given-names>K</given-names></string-name>, <string-name name-style="western"><surname>Petrick</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Pandey</surname><given-names>G.</given-names></string-name></person-group> <article-title>MetaClean: a machine learning-based classifier for reduced false positive peak detection in untargeted LC–MS metabolomics data</article-title>. <source>Metabolomics</source>. <year>2020</year>;<volume>16</volume>:<fpage>117</fpage>.<pub-id pub-id-type="doi">10.1007/s11306-020-01738-3</pub-id></mixed-citation></ref>
<ref id="osaf017-B173"><label>173</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Mosley</surname><given-names>JD</given-names></string-name>, <string-name name-style="western"><surname>Schock</surname><given-names>TB</given-names></string-name>, <string-name name-style="western"><surname>Beecher</surname><given-names>CW</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Establishing a framework for best practices for quality assurance and quality control in untargeted metabolomics</article-title>. <source>Metabolomics</source>. <year>2024</year>;<volume>20</volume>:<fpage>20</fpage>.<pub-id pub-id-type="doi">10.1007/s11306-023-02080-0</pub-id></mixed-citation></ref>
<ref id="osaf017-B174"><label>174</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Petrick</surname><given-names>LM</given-names></string-name>, <string-name name-style="western"><surname>Shomron</surname><given-names>N.</given-names></string-name></person-group> <article-title>AI/ML-driven advances in untargeted metabolomics and exposomics for biomedical applications</article-title>. <source>Cell Rep Phys Sci</source>. <year>2022</year>;<volume>3</volume>:<fpage>100978</fpage>.<pub-id pub-id-type="doi">10.1016/j.xcrp.2022.100978</pub-id></mixed-citation></ref>
<ref id="osaf017-B175"><label>175</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wan</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Simonin</surname><given-names>EM</given-names></string-name>, <string-name name-style="western"><surname>Johnson</surname><given-names>MM</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Exposomics: a review of methodologies, applications, and future directions in molecular medicine</article-title>. <source>EMBO Mol Med</source>. <year>2025</year>;<volume>17</volume>:<fpage>599</fpage>-<lpage>608</lpage>. <pub-id pub-id-type="doi">10.1038/s44321-025-00191-w</pub-id></mixed-citation></ref>
<ref id="osaf017-B176"><label>176</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Rappaport</surname><given-names>SM.</given-names></string-name></person-group> <article-title>Genetic factors are not the major causes of chronic diseases</article-title>. <source>PLoS One</source>. <year>2016</year>;<volume>11</volume>:<fpage>e0154387</fpage>.<pub-id pub-id-type="doi">10.1371/journal.pone.0154387</pub-id></mixed-citation></ref>
<ref id="osaf017-B177"><label>177</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Fuller</surname><given-names>R</given-names></string-name>, <string-name name-style="western"><surname>Landrigan</surname><given-names>PJ</given-names></string-name>, <string-name name-style="western"><surname>Balakrishnan</surname><given-names>K</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Pollution and health: a progress update</article-title>. <source>Lancet Planet Health</source>. <year>2022</year>;<volume>6</volume>:<fpage>e535</fpage>-<lpage>e547</lpage>. <pub-id pub-id-type="doi">10.1016/S2542-5196(22)00090-0</pub-id></mixed-citation></ref>
<ref id="osaf017-B178"><label>178</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Tisler</surname><given-names>S</given-names></string-name>, <string-name name-style="western"><surname>Savvidou</surname><given-names>P</given-names></string-name>, <string-name name-style="western"><surname>Jørgensen</surname><given-names>MB</given-names></string-name>, <string-name name-style="western"><surname>Castro</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Christensen</surname><given-names>JH.</given-names></string-name></person-group> <article-title>Supercritical fluid chromatography coupled to high-resolution mass spectrometry reveals persistent mobile organic compounds with unknown toxicity in wastewater effluents</article-title>. <source>Environ Sci Technol</source>. <year>2023</year>;<volume>57</volume>:<fpage>9287</fpage>-<lpage>9297</lpage>. <pub-id pub-id-type="doi">10.1021/acs.est.3c00120</pub-id></mixed-citation></ref>
<ref id="osaf017-B179"><label>179</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wild</surname><given-names>CP.</given-names></string-name></person-group> <article-title>The exposome at twenty: a personal account</article-title>. <source>Exposome</source>. <year>2025</year>;<volume>5</volume>:<fpage>osaf003</fpage>.<pub-id pub-id-type="doi">10.1093/exposome/osaf003</pub-id></mixed-citation></ref>
<ref id="osaf017-B180"><label>180</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Maitre</surname><given-names>L</given-names></string-name>, <string-name name-style="western"><surname>Bustamante</surname><given-names>M</given-names></string-name>, <string-name name-style="western"><surname>Hernández-Ferrer</surname><given-names>C</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Multi-omics signatures of the human early life exposome</article-title>. <source>Nat Commun</source>. <year>2022</year>;<volume>13</volume>:<fpage>7024</fpage>.<pub-id pub-id-type="doi">10.1038/s41467-022-34422-2</pub-id></mixed-citation></ref>
<ref id="osaf017-B181"><label>181</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Argentieri</surname><given-names>MA</given-names></string-name>, <string-name name-style="western"><surname>Amin</surname><given-names>N</given-names></string-name>, <string-name name-style="western"><surname>Nevado-Holgado</surname><given-names>AJ</given-names></string-name></person-group>, <etal>et al</etal> <article-title>Integrating the environmental and genetic architectures of aging and mortality</article-title>. <source>Nat Med</source>. <year>2025</year>;<volume>31</volume>:<fpage>1016</fpage>-<lpage>1025</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-024-03483-9</pub-id></mixed-citation></ref>
</ref-list>
</back>
</article>