<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Exp. Biol. Med.</journal-id>
<journal-title>Experimental Biology and Medicine</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Exp. Biol. Med.</abbrev-journal-title>
<issn pub-type="epub">1535-3699</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">10279</article-id>
<article-id pub-id-type="doi">10.3389/ebm.2024.10279</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Experimental Biology and Medicine</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Development of a comprehensive open access &#x201c;molecules with androgenic activity resource (MAAR)&#x201d; to facilitate risk assessment of chemicals</article-title>
<alt-title alt-title-type="left-running-head">Dong et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/ebm.2024.10279">10.3389/ebm.2024.10279</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Dong</surname>
<given-names>Fan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2083053/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Hardy</surname>
<given-names>Barry</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Jie</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2009453/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mohoric</surname>
<given-names>Tomaz</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Guo</surname>
<given-names>Wenjing</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Exner</surname>
<given-names>Thomas</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1577885/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tong</surname>
<given-names>Weida</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Dohler</surname>
<given-names>Joh</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bachler</surname>
<given-names>Daniel</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Hong</surname>
<given-names>Huixiao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/472005/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>National Center for Toxicological Research</institution>, <institution>US Food and Drug Administration</institution>, <addr-line>Jefferson</addr-line>, <addr-line>AR</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Edelweiss Connect Inc.</institution>, <addr-line>Durham</addr-line>, <addr-line>NC</addr-line>, <country>United States</country>
</aff>
<author-notes>
<corresp id="c001">&#x2a;Correspondence: Huixiao Hong, <email>huixiao.hong@fda.hhs.gov</email>; Barry Hardy, <email>barry.hardy@edelweissconnect.com</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>19</day>
<month>09</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>249</volume>
<elocation-id>10279</elocation-id>
<history>
<date date-type="received">
<day>07</day>
<month>06</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>27</day>
<month>08</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Dong, Hardy, Liu, Mohoric, Guo, Exner, Tong, Dohler, Bachler and Hong.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Dong, Hardy, Liu, Mohoric, Guo, Exner, Tong, Dohler, Bachler and Hong</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The increasing prevalence of endocrine-disrupting chemicals (EDCs) and their potential adverse effects on human health underscore the necessity for robust tools to assess and manage associated risks. The androgen receptor (AR) is a critical component of the endocrine system, playing a pivotal role in mediating the biological effects of androgens, which are male sex hormones. Exposure to androgen-disrupting chemicals during critical periods of development, such as fetal development or puberty, may result in adverse effects on reproductive health, including altered sexual differentiation, impaired fertility, and an increased risk of reproductive disorders. Therefore, androgenic activity data is critical for chemical risk assessment. A large amount of androgenic data has been generated using various experimental protocols. Moreover, the data are reported in different formats and in diverse sources. To facilitate utilization of androgenic activity data in chemical risk assessment, the Molecules with Androgenic Activity Resource (MAAR) was developed. MAAR is the first open-access platform designed to streamline and enhance the risk assessment of chemicals with androgenic activity. MAAR&#x2019;s development involved the integration of diverse data sources, including data from public databases and mining literature, to establish a reliable and versatile repository. The platform employs a user-friendly interface, enabling efficient navigation and extraction of pertinent information. MAAR is poised to advance chemical risk assessment by offering unprecedented access to information crucial for evaluating the androgenic potential of a wide array of chemicals. The open-access nature of MAAR promotes transparency and collaboration, fostering a collective effort to address the challenges posed by androgenic EDCs.</p>
</abstract>
<kwd-group>
<kwd>androgen receptor</kwd>
<kwd>risk assessment</kwd>
<kwd>chemicals</kwd>
<kwd>database</kwd>
<kwd>open access</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Impact statement</title>
<p>The prevalence of endocrine-disrupting chemicals (EDCs) and their potential health impacts necessitate robust tools for risk assessment. The androgen receptor is crucial in mediating the effects of male sex hormones, with disruption during critical developmental periods leading to reproductive health issues. To address this, the Molecules with Androgenic Activity Resource (MAAR) was developed. MAAR integrates diverse data sources to create an open-access platform facilitating chemical risk assessment. By offering easy navigation and extraction of androgenic activity data, MAAR enhances transparency and collaboration in addressing the challenges posed by androgenic EDCs.</p>
</sec>
<sec id="s2">
<title>Introduction</title>
<p>Endocrine-active chemicals are exogenous compounds that affect the endocrine system of humans and other vertebrates. Endocrine activity of chemicals has the potential to cause numerous adverse outcomes, including disrupting physiological function of endogenous hormones and altering homeostasis [<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>]. Evidence that certain man-made chemicals can disrupt the endocrine system by mimicking endogenous hormones sparked intense international scientific discussion and debate starting some 24&#xa0;years ago [<xref ref-type="bibr" rid="B3">3</xref>]. These discussions culminated in issuance of legislation that reauthorized the Safe Drinking Water Act<xref ref-type="fn" rid="fn1">
<sup>1</sup>
</xref> and authorization of the 1996 Food Quality Protection Act mandating that the US Environmental Protection Agency (EPA) develop a program for screening and testing chemicals with endocrine disrupting potential<xref ref-type="fn" rid="fn2">
<sup>2</sup>
</xref>. In 2015, the US Food and Drug Administration (FDA) published guidance to provide recommendations to sponsors of investigational new drug applications, new drug applications, and biologics license applications regulated by the FDA&#x2019;s Center for Drug Evaluation and Research (CDER) regarding nonclinical studies intended to identify the potential for a drug to cause endocrine-related toxicity<xref ref-type="fn" rid="fn3">
<sup>3</sup>
</xref>. FDA&#x2019;s National Center for Toxicological Research (NCTR) developed a program to meet the need for information systems focused on aggregating knowledge of chemicals with experimental results relevant to endocrine activity. These efforts resulted in the development of the endocrine disruptors knowledge base (EDKB) [<xref ref-type="bibr" rid="B4">4</xref>] and estrogenic activity database (EADB) [<xref ref-type="bibr" rid="B5">5</xref>], which have been used to help identify endocrine active chemicals, develop predictive toxicology models, and prioritize chemicals for laborious and expensive testing [<xref ref-type="bibr" rid="B6">6</xref>&#x2013;<xref ref-type="bibr" rid="B22">22</xref>]. However, as of today, androgenic activity data have not been comprehensively curated into a database.</p>
<p>Androgen receptors (ARs) are ligand-dependent transcription factors that belong to the nuclear receptor superfamily [<xref ref-type="bibr" rid="B23">23</xref>]. ARs are widely expressed in various tissues within the body [<xref ref-type="bibr" rid="B24">24</xref>]. They are the targets for drugs to treat hormone-related diseases including cancers of prostate, breast, ovary, pancreas, etc. [<xref ref-type="bibr" rid="B25">25</xref>]. On the other hand, chemicals can interfere with the endocrine system by interacting with ARs, which result in adverse effects [<xref ref-type="bibr" rid="B26">26</xref>]. Therefore, estimation of the androgenic activity of drugs and other chemicals is critical for the evaluation of drug safety and assessment of chemical risk.</p>
<p>Over the past decades, large numbers of chemicals have been assayed for androgenic activity by government agencies, industry, and academic research groups, with the results of these studies reported in the public domain. However, the data are distributed across different and diverse sources, obtained in multiple diverse assays, and stored in different formats, limiting the use of the data in research and regulation. Therefore, a comprehensive and reliable resource to provide open access to the data and enable modeling and prediction of androgenic activity for untested chemicals could facilitate advancement in developing strategies to mitigate the AR-driven toxicity and risk. To enable and optimize the use of the data generated by these studies, we have developed and are maintaining a comprehensive open access resource called Molecules with Androgenic Activity Resource (MAAR) to provide the scientific and regulatory communities with an up-to-date androgenic activity database for evaluating potential endocrine activity of chemicals.</p>
</sec>
<sec sec-type="methods" id="s3">
<title>Materials and methods</title>
<sec id="s3-1">
<title>Data collection</title>
<p>Androgenic activity data were collected from multiple sources which encompass published literature and public databases including PubChem [<xref ref-type="bibr" rid="B27">27</xref>], ChEMBL [<xref ref-type="bibr" rid="B28">28</xref>], BindingDB [<xref ref-type="bibr" rid="B29">29</xref>], EDKB [<xref ref-type="bibr" rid="B4">4</xref>], ToxCast [<xref ref-type="bibr" rid="B30">30</xref>], and the Comparative Toxicogenomics Database (CTD) [<xref ref-type="bibr" rid="B31">31</xref>]. Java programs were developed to automatically retrieve androgenic activity data points and associated data such as chemical structures, assays, species, and references from these public databases. In addition, androgenic activity data in the literature were manually searched and extracted. The collected androgenic activity data include both quantitative measurements for active compounds and qualitative descriptions for inactive chemicals. <xref ref-type="fig" rid="F1">Figure 1</xref> gives the sources from which the androgenic activity and related data were collected and the four types of data that were included in this database.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Androgenic Activity Data Collection and Curation. Data collection sources including ChemBL, PubChem, BindingDB, EDKB, CTD, Toxcast. After data pre-processing steps, Androgenic Activity Data are curated into four categories: Activity Data information, Reference information, Assay information, Chemical information.</p>
</caption>
<graphic xlink:href="ebm-249-10279-g001.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>Data curation</title>
<p>After data were collected from individual sources, data were pre-processed and integrated before they were implemented into the database. Given potential duplications in the data collected from different sources, an automated pre-process program was devised to check and remove duplicated data records by comparing chemicals, activity data, assays, and references. This program identified and removed duplicates by comparing CID, ChEMBL ID, PubMed ID, endpoint values, and assay descriptions across data sources. Geometric and optical isomers are considered duplicates only if they have the same CID or ChEMBL ID. This program also ensured data uniformity by transforming all collected activity data into standardized units. For different activity values of a compound from different sources where inconsistencies were found, a manual review was conducted to determine the most reliable value by examining the assay details. Following a cleaning procedure that removed duplicates to keep unique androgenic activity data, the pre-processed data were combined to make the final data that were included in the database. This program was developed in Java. It processes text file containing all activity information, specifies columns used for comparison, and identifies both duplicate and unique activity records to ensure that non-redundant data is included in the final dataset.</p>
</sec>
<sec id="s3-3">
<title>Data model</title>
<p>The data implemented in the database were organized into four categories: androgen activity data, references, assays, and chemical information. Properties for each of the four categories are summarized in <xref ref-type="table" rid="T1">Tables 1</xref>&#x2013;<xref ref-type="table" rid="T4">4</xref>. The four tables are interconnected through Chemical ID, Assay ID and Reference ID as depicted in the database schema in <xref ref-type="fig" rid="F2">Figure 2</xref>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Reference data table.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Data field</th>
<th align="left">Description</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Reference ID</td>
<td align="left">Internal ID for reference</td>
</tr>
<tr>
<td align="left">PMID</td>
<td align="left">PubMed ID for reference</td>
</tr>
<tr>
<td align="left">Journal_Name</td>
<td align="left">Reference journal name</td>
</tr>
<tr>
<td align="left">Year</td>
<td align="left">Publication year</td>
</tr>
<tr>
<td align="left">Volume</td>
<td align="left">Volume number</td>
</tr>
<tr>
<td align="left">Issue</td>
<td align="left">Issue number</td>
</tr>
<tr>
<td align="left">First_Page</td>
<td align="left">First page number</td>
</tr>
<tr>
<td align="left">Author</td>
<td align="left">Author names</td>
</tr>
<tr>
<td align="left">Title</td>
<td align="left">Publication title</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Assay data table.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Data field</th>
<th align="left">Description</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Assay ID</td>
<td align="left">Internal ID for assay</td>
</tr>
<tr>
<td align="left">Description</td>
<td align="left">Description of assay</td>
</tr>
<tr>
<td align="left">Assay_Name</td>
<td align="left">Assay name</td>
</tr>
<tr>
<td align="left">Assay_Group</td>
<td align="left">Assay group, e.g., HTS, Reporter gene</td>
</tr>
<tr>
<td align="left">Assay_Format</td>
<td align="left">Assay format, e.g., cell-based, protein-based</td>
</tr>
<tr>
<td align="left">Assay_Type</td>
<td align="left">Assay type, e.g., Agonist, Antagonist</td>
</tr>
<tr>
<td align="left">Species</td>
<td align="left">Species assay based on, e.g., <italic>Homo sapiens</italic>
</td>
</tr>
<tr>
<td align="left">AID</td>
<td align="left">Bioassay AID in PubChem</td>
</tr>
<tr>
<td align="left">ChEMBL Assay ID</td>
<td align="left">Assay ID in ChEMBL.</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Androgen activity data table.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Data field</th>
<th align="left">Description</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Activity ID</td>
<td align="left">Internal ID for activity data</td>
</tr>
<tr>
<td align="left">Chemical ID</td>
<td align="left">Internal ID for chemicals</td>
</tr>
<tr>
<td align="left">Assay ID</td>
<td align="left">Internal ID for assays</td>
</tr>
<tr>
<td align="left">Reference ID</td>
<td align="left">Internal ID for references</td>
</tr>
<tr>
<td align="left">Endpoint</td>
<td align="left">Activity endpoint, e.g., IC50, AC50, LogRBA</td>
</tr>
<tr>
<td align="left">Relation</td>
<td align="left">Relation to describe activity value, e.g., &#x3e;, &#x3d;, &#x3c;</td>
</tr>
<tr>
<td align="left">Value</td>
<td align="left">Activity value from endpoint measurement</td>
</tr>
<tr>
<td align="left">Units</td>
<td align="left">Activity data unit, e.g., nM, %</td>
</tr>
<tr>
<td align="left">Download</td>
<td align="left">Database where data downloaded, e.g., PubChem, ChEMBL</td>
</tr>
<tr>
<td align="left">Curation/Data source</td>
<td align="left">Date source, e.g., literatures, US Patent, Tox21, Abbott Labs</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Chemical data table.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Data field</th>
<th align="left">Description</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Chemical ID</td>
<td align="left">Internal chemical ID of chemical</td>
</tr>
<tr>
<td align="left">IUPAC_NAME</td>
<td align="left">IUPAC name of chemical</td>
</tr>
<tr>
<td align="left">Name</td>
<td align="left">Chemical name used in the system</td>
</tr>
<tr>
<td align="left">Synonyms</td>
<td align="left">Chemical synonyms (a string separated by &#x201c;&#x7c;&#x201d;)</td>
</tr>
<tr>
<td align="left">SMILES</td>
<td align="left">SMILES string of chemical</td>
</tr>
<tr>
<td align="left">InChIKey</td>
<td align="left">A fixed-length format directly derived from InChI</td>
</tr>
<tr>
<td align="left">InChI</td>
<td align="left">International Chemical Identifier</td>
</tr>
<tr>
<td align="left">Molecular_weight</td>
<td align="left">Molecular weight</td>
</tr>
<tr>
<td align="left">Molecular_formula</td>
<td align="left">Molecular formula</td>
</tr>
<tr>
<td align="left">CAS</td>
<td align="left">Chemical CAS registry number</td>
</tr>
<tr>
<td align="left">CID</td>
<td align="left">Compound ID in PubChem</td>
</tr>
<tr>
<td align="left">CHEMBL_ID</td>
<td align="left">Compound ID in ChEMBL</td>
</tr>
<tr>
<td align="left">BindingDB_ID</td>
<td align="left">Compound ID in BindingDB</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Database schema.</p>
</caption>
<graphic xlink:href="ebm-249-10279-g002.tif"/>
</fig>
</sec>
<sec id="s3-4">
<title>Database design</title>
<p>The curated tables were put into a cloud-based database based on EdelweissData that was developed by Edelweiss Connect, GmbH to tackle data management issues in life sciences. Some of the advantages offered by the EdelweissData solution are:<list list-type="simple">
<list-item>
<p>- Each published dataset is assigned a unique URL and is easily accessible through a web browser.</p>
</list-item>
<list-item>
<p>- Published datasets are automatically versioned.</p>
</list-item>
<list-item>
<p>- Published datasets are static, i.e., they cannot be changed unless a newer version is published.</p>
</list-item>
<list-item>
<p>- Published datasets are immediately available through a web service and can be consumed by numerous data analysis tools (Python, R, Excel, KNIME, etc.) via REST API (see also section Data model).</p>
</list-item>
<list-item>
<p>- Flexibility - there is no predefined schema for published datasets. Instead, the schema is inferred from the data during publishing. This allows for a quick and easy consumption of datasets with various structures.</p>
</list-item>
</list>
</p>
</sec>
<sec id="s3-5">
<title>Database implementation - EdelweissData</title>
<p>The MAAR Database is built as a simple web application with a back-end supported by EdelweissData and a front-end that lets the user easily explore the database. The most common use cases (such as search by compound or chemical similarity) are well covered by the web application as is, while more advanced queries or analyses could be made through the API (Application Programming Interface) enabled by EdelweissData.</p>
</sec>
</sec>
<sec sec-type="results" id="s4">
<title>Results</title>
<sec id="s4-1">
<title>Data collected and curated</title>
<p>In total, 125,519 androgenic activity data points for 13,648 chemicals were collected and curated from multiple sources and included in the MAAR database. These data were obtained from 923 assays. <xref ref-type="table" rid="T5">Table 5</xref> lists the statistics of the data collected.</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Statistics of the data collected in the androgenic activity database.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Chemicals</th>
<th colspan="2" align="left"/>
<th align="left">13,648</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="5" align="left">Activity data</td>
<td colspan="2" align="left">Quantitative data</td>
<td align="left">48,273</td>
</tr>
<tr>
<td rowspan="3" align="left">Qualitative data</td>
<td align="left">Active</td>
<td align="left">723</td>
</tr>
<tr>
<td align="left">Inactive</td>
<td align="left">71,630</td>
</tr>
<tr>
<td align="left">Not determined</td>
<td align="left">4,893</td>
</tr>
<tr>
<td colspan="2" align="left">Total</td>
<td align="left">125,519</td>
</tr>
<tr>
<td rowspan="7" align="left">Assays</td>
<td colspan="2" align="left">Binding</td>
<td align="left">379</td>
</tr>
<tr>
<td colspan="2" align="left">Reporter gene</td>
<td align="left">358</td>
</tr>
<tr>
<td colspan="2" align="left">Cell proliferation</td>
<td align="left">86</td>
</tr>
<tr>
<td colspan="2" align="left">
<italic>In vivo</italic>
</td>
<td align="left">60</td>
</tr>
<tr>
<td colspan="2" align="left">HTS</td>
<td align="left">24</td>
</tr>
<tr>
<td colspan="2" align="left">Other</td>
<td align="left">16</td>
</tr>
<tr>
<td colspan="2" align="left">Total</td>
<td align="left">923</td>
</tr>
<tr>
<td align="left">Species</td>
<td colspan="2" align="left"/>
<td align="left">6</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The androgenic activity data are presented in two types. The first type is quantitative value and 48,273 data points are in this type. A quantitative activity value indicates the androgenic activity is numerically determined. Another type of data is qualitative androgenic activity that is described using qualitative terms: active or positive indicates a chemical was tested using an assay and activity was observed but could not be numerically determined; inactive or negative means a chemical did not show androgenic activity in an assay; inconclusion or not determined or unspecified implies activity of a chemical in an assay was not able to be determined. There are 77,246 data that are qualitative. The data were generated using 923 assays, including 379 binding assays, 358 reporter gene assays, 86 cell proliferation assays, 60 <italic>in vivo</italic> assays, 24 high-throughput screening assays (HTS), and 16 other assays that could not be clearly put into any type of assays. Species used in the activity testing are also included in the database, including <italic>Bos taurus</italic>, Chimpanzee, Chinese hamster, <italic>Homo sapiens</italic>, <italic>Mus musculus</italic>, and <italic>Rattus norvegicus</italic>. Information on species for some assays could not be determined in the sources, and thus they are missed for the data generated using such assays.</p>
<p>A chemical could be tested in many laboratories using multiple assays. All androgenic activity data for the same chemicals were collected and presented in this database. The distribution of androgenic activity data for the same chemicals is given in <xref ref-type="fig" rid="F3">Figure 3</xref>.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Distribution of androgenic activity data for the same chemical. Each bar represents the number of chemicals. X-axis indicates the number of data records for the same chemicals. The chemicals with 41&#x2013;50 data records were grouped into the bar with x-axis value 41 and the chemicals with more than 50 data were grouped in the last bar with x-axis value 42.</p>
</caption>
<graphic xlink:href="ebm-249-10279-g003.tif"/>
</fig>
<p>The same chemical is often tested by a variety of assays and has multiple data records. Of the 13,648 chemicals in the database, 2,504 have only one androgenic activity data and the remaining 11,144 have more than one data. Many chemicals have more than 10 androgenic activity data reported and are included in this database. For example, 3,481 chemicals have 11 data records, and 54 chemicals even have more than 40 data records. The androgenic activity data obtained from the same type of assays in different laboratories could be inconsistent. For example, 127 chemicals each have four androgenic activity data generated using binding assays. As shown in <xref ref-type="fig" rid="F4">Figure 4</xref>, 79 chemicals are active for all four data (100% active) and 11 chemicals consistently show inactive (0% active), while the other (37 chemicals) have inconsistent androgenic activity data: one active and three inactive for 15 chemicals, three active and one inactive for six chemicals, and two active and two inactive for 16 chemicals. This database presents all androgenic activity data reported in different sources. Assessing data quality and selecting data for specific applications such as QSAR (quantitative structure-activity relationship) modelling are critically important. Users should make decisions on how to use the data tailored to their applications.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Ratio of active data among 4 binding assay data for 127 chemicals. Each bar represents the number of chemicals. X-axis indicates the ratio of active data.</p>
</caption>
<graphic xlink:href="ebm-249-10279-g004.tif"/>
</fig>
</sec>
<sec id="s4-2">
<title>Web resource</title>
<p>The MAAR database is made available through a web portal as an open science resource based on open data provided according to a Creative Commons license. We have established the resource as part of the OpenTox open knowledge infrastructure located at<xref ref-type="fn" rid="fn4">
<sup>4</sup>
</xref>. The main initial functionality supported allows the user to search for compounds or chemically similar compounds in the database (<xref ref-type="fig" rid="F5">Figure 5</xref>). The portal also supports the location of community-generated notebooks providing additional analysis of the data, starting with illustrative examples we have provided (see sections Method and Application Programming Interface).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>User interface of the web resource.</p>
</caption>
<graphic xlink:href="ebm-249-10279-g005.tif"/>
</fig>
</sec>
<sec id="s4-3">
<title>Application programming interface (API)</title>
<p>The MAAR database comes with a versatile API that simplifies the consumption of the data into other applications. Common data analysis tools that support Representational State Transfer (REST) APIs can obtain data in the database through a simple web request. In this way data can be easily transferred into a Python or R script/notebook, KNIME, Microsoft Excel, etc. To make it even easier for users, an example of an API call in Python and curl<xref ref-type="fn" rid="fn5">
<sup>5</sup>
</xref> is provided in the web application and could be copy-pasted to the user&#x2019;s script/notebook. API documentation is available from the EdelweissData main website<xref ref-type="fn" rid="fn6">
<sup>6</sup>
</xref>.</p>
<p>For the purpose of demonstrating programmatic data retrieval from the database, we show an example of how a particular dataset could be accessed with a web request. Each assay dataset in the database has its own unique ID and when the URL pointing to that dataset is called the database returns the dataset in the JSON format. For a dataset inside the database the URL for dataset with ID &#x201c;21b033c5-d048-41f5-b8a1-d5d8492f7048&#x201d; would be the following: <xref ref-type="fn" rid="fn7">
<sup>7</sup>
</xref>. And the response from the database is shown in <xref ref-type="fig" rid="F6">Figure 6</xref>.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>JSON response from the database.</p>
</caption>
<graphic xlink:href="ebm-249-10279-g006.tif"/>
</fig>
</sec>
<sec id="s4-4">
<title>Notebooks</title>
<p>The REST API service mentioned above is very well suited for different interactive notebooks that are nowadays a common tool for data analysis and visualization. There are many different notebooks available today that differ in the language, interactivity, etc. To build an interactive notebook for visualization of the MAAR data we decided to use Observable HQ notebooks<xref ref-type="fn" rid="fn8">
<sup>8</sup>
</xref> as they offer in our opinion a very good user experience even for technically less skilled users. The programming language in Observable notebooks is JavaScript, which is typically not the language of first choice for data analysis, however, it is very well suited for interactive visualizations that work as a web page.</p>
<p>The Observable notebook<xref ref-type="fn" rid="fn9">
<sup>9</sup>
</xref> for the MAAR database is available through a URL and can be easily shared with anyone. The notebook addresses a simple use case where a user wants to search the database for a particular compound. The notebook returns a list of chemically most similar compounds (based on the Tanimoto chemical similarity &#x2013; see <xref ref-type="fig" rid="F7">Figure 7</xref>, left) together with their activities in the assays. In the next step, users can narrow down the set of activities by filtering the assays based on format, group, type, species, or endpoint. Finally, the subset of compounds (on x axis) and their activities (colors) in various assays (y axis) is displayed as a heatmap (<xref ref-type="fig" rid="F7">Figure 7</xref>, right).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Two sections of the AADB Observable notebook: user interface for entering the input parameters (left) and visualization of filtered results (right).</p>
</caption>
<graphic xlink:href="ebm-249-10279-g007.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s5">
<title>Discussion</title>
<p>Androgens are hormones that play a key role in the development and maintenance of male characteristics. Understanding the androgenic activity of chemicals is important for assessing chemical risk through endocrine disruption. Therefore, androgenic activity data are important for comprehensive chemical risk assessments, providing insight into the potential endocrine-disrupting effects of substances and helping to establish guidelines and regulations to protect human health and the environment.</p>
<p>Vast amounts of androgenic activity data have been generated and reported in the public domain for many chemicals. However, accessing and using androgenic activity data in the public domain may pose several challenges. First, androgenic activity data are contained in different and diverse sources in the public domain. The lack of comprehensive datasets can hinder applications in chemical risk assessment. Second, the importance of data quality and reliability in scientific research cannot be overstated [<xref ref-type="bibr" rid="B32">32</xref>, <xref ref-type="bibr" rid="B33">33</xref>]. Sound scientific conclusions rest on the foundation of accurate and trustworthy data. The reliability and accuracy of available androgenic activity data vary. Incomplete or poorly curated datasets can compromise the validity of research findings. Third, androgenic activity data are sourced from various studies, experiments, or databases, leading to heterogeneity in data formats and measurement techniques. Lack of standardized protocols for androgenic activity assessment can make it challenging to compare data from different sources. Finally, without sufficient metadata or contextual information, it may be challenging to interpret and utilize androgenic activity data accurately. Inter-laboratory and species-specific variations in androgenic responses can complicate the interpretation of androgenic activity data. Therefore, to facilitate utilization of the available androgenic data in chemical risk assessment, we aim to develop an open resource of androgenic activity data of molecules so that the huge amount of androgenic activity data generated in the scientific community could be used to accelerate and improve chemical risk assessment.</p>
<p>In this article we report the development of an open science data resource for androgenic activity data. We followed principles established in previous projects including OpenTox<xref ref-type="fn" rid="fn10">
<sup>10</sup>
</xref>, OpenRiskNet<xref ref-type="fn" rid="fn11">
<sup>11</sup>
</xref> and EU-ToxRisk<xref ref-type="fn" rid="fn12">
<sup>12</sup>
</xref> [<xref ref-type="bibr" rid="B34">34</xref>&#x2013;<xref ref-type="bibr" rid="B41">41</xref>]. The work includes the careful collection and curation of data entering the database and a data model which includes harmonized data to structure the data in a database. Resource functionalities aligned to the FAIR (findability, accessibility, interoperability, and reusability) principles in the preparation and sharing of open science data and supporting further initiatives and use of the project knowledge. We also paid attention to data integrity principles in the construction of the database and the provision of data through harmonized application programming interfaces, supporting the building of web applications making reliable use of the data. This approach should support analysis and modelling goals of the community in making use of the open knowledge resource created by this work.</p>
<p>The MAAR database is an extensive compilation of chemical compounds, systematically curated and annotated for their androgenic properties, providing researchers, regulators, and industry stakeholders with a comprehensive resource for in-depth investigations. To evaluate the structural coverage of chemicals in the MAAR, we computed chemical spaces for both the MAAR and Tox21 [<xref ref-type="bibr" rid="B42">42</xref>] datasets using Mold2 descriptors [<xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B44">44</xref>]. Following the methodology outlined in our previous studies [<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B45">45</xref>], we performed principal component analysis to represent the chemical space for each dataset. <xref ref-type="fig" rid="F8">Figure 8</xref> illustrates the first three principal components of the compounds in MAAR and Tox21, demonstrating that the structural coverage of MAAR closely resembles that of Tox21. This comparison confirms that MAAR includes structurally diverse set of compounds, making it suitable for a wide range of applications. Development of the MAAR database represents a significant stride towards a more comprehensive and accessible approach to assessing the androgenic activity of chemicals. By providing a centralized platform for data integration and analysis, the MAAR database is poised to enhance our understanding of androgenic endocrine disruption and contribute to the development of effective risk management strategies in the face of evolving chemical landscapes.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Chemical spaces of MAAR and Tox21. Compounds in MAAR and Tox21 are plotted as blue and red circles, respectively. The x-, y-, and z-axes give the first three principal components.</p>
</caption>
<graphic xlink:href="ebm-249-10279-g008.tif"/>
</fig>
</sec>
<sec sec-type="conclusions" id="s6">
<title>Conclusions</title>
<p>We have reported here on a useful curated database for androgenic activity provided as an open science resource to the community, and available to enable searches for relevant information on the presence or absence of evidence on androgenic activity of compounds. We have also provided a model and resource with interfaces supporting additional community members to build additional analysis and modelling applications that work with the database. We hope the resource will prove useful and encourage additional development of the resource including addition of new data and its analysis.</p>
</sec>
</body>
<back>
<sec id="s7">
<title>Author contributions</title>
<p>Conceptualization, HH and BH; methodology, FD, TM, JL, TE, WG, TE, BH, and HH; software, TM, TE, JD, and BH; data curation, FD, JL, WG, and HH; writing&#x2013;original draft preparation, FD, JL, TM, BH, and HH; writing&#x2013;review and editing, WT, BH, and HH; supervision, BH and HH. All authors have read and agreed to the published version of the manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s8">
<title>Author disclaimer</title>
<p>This article reflects the views of the authors and does not necessarily reflect those of the U.S. Food and Drug Administration. Any mention of commercial products is for clarification only and is not intended as approval, endorsement, or recommendation.</p>
</sec>
<sec id="s9">
<title>Data availability</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <ext-link ext-link-type="uri" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="https://github.com/FANMISUA/AADB.git">https://github.com/FANMISUA/AADB.git</ext-link>.</p>
</sec>
<sec sec-type="funding-information" id="s10">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research, authorship, and/or publication of this article.</p>
</sec>
<sec sec-type="COI-statement" id="s11">
<title>Conflict of interest</title>
<p>Authors BH, TM, TE, JD, and DB were employed by Edelweiss Connect Inc.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<fn-group>
<fn id="fn1">
<label>1</label>
<p>
<ext-link ext-link-type="uri" xlink:href="http://www.epa.gov/safewater/sdwa/index.html">http://www.epa.gov/safewater/sdwa/index.html</ext-link>
</p>
</fn>
<fn id="fn2">
<label>2</label>
<p>
<ext-link ext-link-type="uri" xlink:href="http://www.epa.gov/scipoly/oscpendo/">http://www.epa.gov/scipoly/oscpendo/</ext-link>
</p>
</fn>
<fn id="fn3">
<label>3</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://www.fda.gov/media/86996/download">https://www.fda.gov/media/86996/download</ext-link>
</p>
</fn>
<fn id="fn4">
<label>4</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://opentox.net/MAAR/">https://opentox.net/MAAR/</ext-link>
</p>
</fn>
<fn id="fn5">
<label>5</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://en.wikipedia.org/wiki/CURL">https://en.wikipedia.org/wiki/CURL</ext-link>
</p>
</fn>
<fn id="fn6">
<label>6</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://edelweissdata.com/docs/about">https://edelweissdata.com/docs/about</ext-link>
</p>
</fn>
<fn id="fn7">
<label>7</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://api.aadb.cloud.edelweissconnect.com/datasets/21b033c5-d048-41f5-b8a1-d5d8492f7048/versions/latest">https://api.aadb.cloud.edelweissconnect.com/datasets/21b033c5-d048-41f5-b8a1-d5d8492f7048/versions/latest</ext-link>
</p>
</fn>
<fn id="fn8">
<label>8</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://observablehq.com/">https://observablehq.com/</ext-link>
</p>
</fn>
<fn id="fn9">
<label>9</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://observablehq.com/@saferworldbydesign/aadb-notebook">https://observablehq.com/@saferworldbydesign/aadb-notebook</ext-link>
</p>
</fn>
<fn id="fn10">
<label>10</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://opentox.net/">https://opentox.net/</ext-link>
</p>
</fn>
<fn id="fn11">
<label>11</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://openrisknet.org/">https://openrisknet.org/</ext-link>
</p>
</fn>
<fn id="fn12">
<label>12</label>
<p>
<ext-link ext-link-type="uri" xlink:href="http://www.eu-toxrisk.eu/">www.eu-toxrisk.eu</ext-link>
</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Adebayo</surname>
<given-names>OA</given-names>
</name>
<name>
<surname>Adesanoye</surname>
<given-names>OA</given-names>
</name>
<name>
<surname>Abolaji</surname>
<given-names>OA</given-names>
</name>
<name>
<surname>Kehinde</surname>
<given-names>AO</given-names>
</name>
<name>
<surname>Adaramoye</surname>
<given-names>OA</given-names>
</name>
</person-group>. <article-title>First-line antituberculosis drugs disrupt endocrine balance and induce ovarian and uterine oxidative stress in rats</article-title>. <source>J Basic Clin Physiol Pharmacol</source> (<year>2018</year>) <volume>29</volume>(<issue>2</issue>):<fpage>131</fpage>&#x2013;<lpage>40</lpage>. <pub-id pub-id-type="doi">10.1515/jbcpp-2017-0087</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Danzo</surname>
<given-names>BJ</given-names>
</name>
</person-group>. <article-title>Environmental xenobiotics may disrupt normal endocrine function by interfering with the binding of physiological ligands to steroid receptors and binding proteins</article-title>. <source>Environ Health Perspect</source> (<year>1997</year>) <volume>105</volume>(<issue>3</issue>):<fpage>294</fpage>&#x2013;<lpage>301</lpage>. <pub-id pub-id-type="doi">10.1289/ehp.97105294</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kavlock</surname>
<given-names>RJ</given-names>
</name>
<name>
<surname>Daston</surname>
<given-names>GP</given-names>
</name>
<name>
<surname>DeRosa</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Fenner-Crisp</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Gray</surname>
<given-names>LE</given-names>
</name>
<name>
<surname>Kaattari</surname>
<given-names>S</given-names>
</name>
<etal/>
</person-group> <article-title>Research needs for the risk assessment of health and environmental effects of endocrine disruptors: a report of the U.S. EPA-sponsored workshop</article-title>. <source>Environ Health Perspect</source> (<year>1996</year>) <volume>104</volume>(<issue>Suppl. 4</issue>):<fpage>715</fpage>&#x2013;<lpage>40</lpage>. <pub-id pub-id-type="doi">10.2307/3432708</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ding</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Perkins</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Harris</surname>
<given-names>S</given-names>
</name>
<etal/>
</person-group> <article-title>The EDKB: an established knowledge base for endocrine disrupting chemicals</article-title>. <source>BMC Bioinformatics</source> (<year>2010</year>) <volume>11</volume>(<issue>Suppl. 6</issue>):<fpage>S5</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-11-s6-s5</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shen</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Richard</surname>
<given-names>AM</given-names>
</name>
<name>
<surname>Bray</surname>
<given-names>JD</given-names>
</name>
<name>
<surname>Judson</surname>
<given-names>RS</given-names>
</name>
<etal/>
</person-group> <article-title>EADB: an estrogenic activity database for assessing potential endocrine activity</article-title>. <source>Toxicol Sci</source> (<year>2013</year>) <volume>135</volume>(<issue>2</issue>):<fpage>277</fpage>&#x2013;<lpage>91</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kft164</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>LM</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J</given-names>
</name>
<etal/>
</person-group> <article-title>Prediction of Estrogen Receptor Binding for 58,000 chemicals Using an Integrated system of a tree-based model with structural alerts</article-title>. <source>Environ Health Perspect</source> (<year>2002</year>) <volume>110</volume>(<issue>1</issue>):<fpage>29</fpage>&#x2013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.1289/ehp.0211029</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tong</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Perkins</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Fa Perkinsng</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>Branham</surname>
<given-names>SW</given-names>
</name>
<etal/>
</person-group> <article-title>Development of Quantitative Structure-Activity Relationships (QSARs) and their use for priority setting in the testing strategy of endocrine disruptors</article-title>. <source>Regul Res Perspect</source> (<year>2002</year>) <volume>1</volume>(<issue>3</issue>):<fpage>1</fpage>&#x2013;<lpage>16</lpage>.</citation>
</ref>
<ref id="B8">
<label>8.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>Perkins</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Sheehan</surname>
<given-names>DM</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W</given-names>
</name>
</person-group>. <article-title>Comparative molecular field analysis (CoMFA) model using a large diverse set of natural, synthetic and environmental chemicals for binding to the androgen receptor</article-title>. <source>SAR QSAR Environ Res</source> (<year>2003</year>) <volume>14</volume>(<issue>5-6</issue>):<fpage>373</fpage>&#x2013;<lpage>88</lpage>. <pub-id pub-id-type="doi">10.1080/10629360310001623962</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname>
<given-names>LM</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Perkins</surname>
<given-names>R</given-names>
</name>
<etal/>
</person-group> <article-title>An integrated 4-Phase approach for setting endocrine disruption screening priorities - phase I and II predictions of estrogen receptor binding affinity</article-title>. <source>SAR QSAR Environ Res</source> (<year>2002</year>) <volume>13</volume>(<issue>1</issue>):<fpage>69</fpage>&#x2013;<lpage>88</lpage>. <pub-id pub-id-type="doi">10.1080/10629360290002235</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sakkiah</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Kusko</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
</person-group>. <article-title>Computational prediction models for assessing endocrine disrupting potential of chemicals</article-title>. <source>J Environ Sci Health C</source> (<year>2018</year>) <volume>36</volume>(<issue>4</issue>):<fpage>192</fpage>&#x2013;<lpage>218</lpage>. <pub-id pub-id-type="doi">10.1080/10590501.2018.1537132</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ng</surname>
<given-names>HW</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Shu</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Perkins</surname>
<given-names>R</given-names>
</name>
<etal/>
</person-group> <article-title>Competitive molecular docking approach for predicting estrogen receptor subtype &#x3b1; agonists and antagonists</article-title>. <source>BMC Bioinformatics</source> (<year>2014</year>) <volume>15</volume>(<issue>Suppl. 11</issue>):<fpage>S4</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-15-s11-s4</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ng</surname>
<given-names>HW</given-names>
</name>
<name>
<surname>Doughty</surname>
<given-names>SW</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W</given-names>
</name>
<etal/>
</person-group> <article-title>Development and validation of decision forest model for estrogen receptor binding prediction of chemicals using large data sets</article-title>. <source>Chem Res Toxicol</source> (<year>2015</year>) <volume>28</volume>(<issue>12</issue>):<fpage>2343</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1021/acs.chemrestox.5b00358</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ng</surname>
<given-names>HW</given-names>
</name>
<name>
<surname>Shu</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Perkins</surname>
<given-names>R</given-names>
</name>
<etal/>
</person-group> <article-title>Estrogenic activity data extraction and <italic>in silico</italic> prediction show the endocrine disruption potential of bisphenol A replacement compounds</article-title>. <source>Chem Res Toxicol</source> (<year>2015</year>) <volume>28</volume>(<issue>9</issue>):<fpage>1784</fpage>&#x2013;<lpage>95</lpage>. <pub-id pub-id-type="doi">10.1021/acs.chemrestox.5b00243</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Rua</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Sakkiah</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Selvaraj</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W</given-names>
</name>
</person-group>. <article-title>Consensus modeling for prediction of estrogenic activity of ingredients commonly used in sunscreen products</article-title>. <source>Int J Environ Res Public Health</source> (<year>2016</year>) <volume>13</volume>(<issue>10</issue>):<fpage>958</fpage>. <pub-id pub-id-type="doi">10.3390/ijerph13100958</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Harvey</surname>
<given-names>BG</given-names>
</name>
<name>
<surname>Palmese</surname>
<given-names>GR</given-names>
</name>
<name>
<surname>Stanzione</surname>
<given-names>JF</given-names>
</name>
<name>
<surname>Ng</surname>
<given-names>HW</given-names>
</name>
<name>
<surname>Sakkiah</surname>
<given-names>S</given-names>
</name>
<etal/>
</person-group> <article-title>Experimental data extraction and <italic>in silico</italic> prediction of the estrogenic activity of renewable replacements for bisphenol A</article-title>. <source>Int J Environ Res Public Health</source> (<year>2016</year>) <volume>13</volume>(<issue>7</issue>):<fpage>705</fpage>. <pub-id pub-id-type="doi">10.3390/ijerph13070705</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ye</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Ng</surname>
<given-names>HW</given-names>
</name>
<name>
<surname>Meehan</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W</given-names>
</name>
<etal/>
</person-group> <article-title>Applying network analysis and Nebula (neighbor-edges based and unbiased leverage algorithm) to ToxCast data</article-title>. <source>Environ Int</source> (<year>2016</year>) <volume>89-90</volume>:<fpage>81</fpage>&#x2013;<lpage>92</lpage>. <pub-id pub-id-type="doi">10.1016/j.envint.2016.01.010</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17.</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Sakkiah</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Kusko</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
</person-group>. <article-title>Applications of molecular dynamics simulations in computational toxicology</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
</person-group>, editor. <source>Advances in computational toxicology: methodologies and applications in regulatory science</source>. <publisher-loc>Cham</publisher-loc>: <publisher-name>Springer International Publishing</publisher-name> (<year>2019</year>). p. <fpage>181</fpage>&#x2013;<lpage>212</lpage>.</citation>
</ref>
<ref id="B18">
<label>18.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sakkiah</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Selvaraj</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Patterson</surname>
<given-names>TA</given-names>
</name>
<etal/>
</person-group> <article-title>Elucidation of agonist and antagonist dynamic binding patterns in ER-&#x3b1; by integration of molecular docking, molecular dynamics simulations and quantum mechanical calculations</article-title>. <source>Int J Mol Sci</source> (<year>2021</year>) <volume>22</volume>(<issue>17</issue>):<fpage>9371</fpage>. <pub-id pub-id-type="doi">10.3390/ijms22179371</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tan</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Benfenati</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Giesy</surname>
<given-names>JP</given-names>
</name>
<name>
<surname>Gini</surname>
<given-names>GC</given-names>
</name>
<etal/>
</person-group> <article-title>Structures of endocrine-disrupting chemicals determine binding to and activation of the estrogen receptor &#x3b1; and androgen receptor</article-title>. <source>Environ Sci Technol</source> (<year>2020</year>) <volume>54</volume>(<issue>18</issue>):<fpage>11424</fpage>&#x2013;<lpage>33</lpage>. <pub-id pub-id-type="doi">10.1021/acs.est.0c02639</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Banerjee</surname>
<given-names>A</given-names>
</name>
<name>
<surname>De</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>V</given-names>
</name>
<name>
<surname>Kar</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Roy</surname>
<given-names>K</given-names>
</name>
</person-group>. <article-title>Quick and efficient quantitative predictions of androgen receptor binding affinity for screening Endocrine Disruptor Chemicals using 2D-QSAR and Chemical Read-Across</article-title>. <source>Chemosphere</source> (<year>2022</year>) <volume>309</volume>(<issue>Pt 1</issue>):<fpage>136579</fpage>. <pub-id pub-id-type="doi">10.1016/j.chemosphere.2022.136579</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wilkes</surname>
<given-names>JG</given-names>
</name>
<name>
<surname>Stoyanova-Slavova</surname>
<given-names>IB</given-names>
</name>
<name>
<surname>Buzatu</surname>
<given-names>DA</given-names>
</name>
</person-group>. <article-title>Alignment-independent technique for 3D QSAR analysis</article-title>. <source>J Comput Aided Mol Des</source> (<year>2016</year>) <volume>30</volume>(<issue>4</issue>):<fpage>331</fpage>&#x2013;<lpage>45</lpage>. <pub-id pub-id-type="doi">10.1007/s10822-016-9909-0</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Sedykh</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Tripathi</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Afantitis</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Mouchlis</surname>
<given-names>VD</given-names>
</name>
<etal/>
</person-group> <article-title>Identification of putative estrogen receptor-mediated endocrine disrupting chemicals using QSAR- and structure-based virtual screening approaches</article-title>. <source>Toxicol Appl Pharmacol</source> (<year>2013</year>) <volume>272</volume>(<issue>1</issue>):<fpage>67</fpage>&#x2013;<lpage>76</lpage>. <pub-id pub-id-type="doi">10.1016/j.taap.2013.04.032</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname>
<given-names>NZ</given-names>
</name>
<name>
<surname>Wardell</surname>
<given-names>SE</given-names>
</name>
<name>
<surname>Burnstein</surname>
<given-names>KL</given-names>
</name>
<name>
<surname>Defranco</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Fuller</surname>
<given-names>PJ</given-names>
</name>
<name>
<surname>Giguere</surname>
<given-names>V</given-names>
</name>
<etal/>
</person-group> <article-title>International Union of Pharmacology. LXV. The pharmacology and classification of the nuclear receptor superfamily: glucocorticoid, mineralocorticoid, progesterone, and androgen receptors</article-title>. <source>Pharmacol Rev</source> (<year>2006</year>) <volume>58</volume>(<issue>4</issue>):<fpage>782</fpage>&#x2013;<lpage>97</lpage>. <pub-id pub-id-type="doi">10.1124/pr.58.4.9</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sakkiah</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Ng</surname>
<given-names>HW</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
</person-group>. <article-title>Structures of androgen receptor bound with ligands: advancing understanding of biological functions and drug discovery</article-title>. <source>Expert Opin Ther Targets</source> (<year>2016</year>) <volume>20</volume>(<issue>10</issue>):<fpage>1267</fpage>&#x2013;<lpage>82</lpage>. <pub-id pub-id-type="doi">10.1080/14728222.2016.1192131</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mooradian</surname>
<given-names>AD</given-names>
</name>
<name>
<surname>Morley</surname>
<given-names>JE</given-names>
</name>
<name>
<surname>Korenman</surname>
<given-names>SG</given-names>
</name>
</person-group>. <article-title>Biological actions of androgens</article-title>. <source>Endocr Rev</source> (<year>1987</year>) <volume>8</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>28</lpage>. <pub-id pub-id-type="doi">10.1210/edrv-8-1-1</pub-id>
</citation>
</ref>
<ref id="B26">
<label>26.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Matsumoto</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Sakari</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Okada</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Yokoyama</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Takahashi</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Kouzmenko</surname>
<given-names>A</given-names>
</name>
<etal/>
</person-group> <article-title>The androgen receptor in health and disease</article-title>. <source>Annu Rev Physiol</source> (<year>2013</year>) <volume>75</volume>:<fpage>201</fpage>&#x2013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-physiol-030212-183656</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Gindulyte</surname>
<given-names>A</given-names>
</name>
<name>
<surname>He</surname>
<given-names>J</given-names>
</name>
<name>
<surname>He</surname>
<given-names>S</given-names>
</name>
<etal/>
</person-group> <article-title>PubChem 2019 update: improved access to chemical data</article-title>. <source>Nucleic Acids Res</source> (<year>2019</year>) <volume>47</volume>(<issue>D1</issue>):<fpage>D1102</fpage>&#x2013;<lpage>D1109</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gky1033</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mendez</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Gaulton</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Bento</surname>
<given-names>AP</given-names>
</name>
<name>
<surname>Chambers</surname>
<given-names>J</given-names>
</name>
<name>
<surname>De&#xa0;Veij</surname>
<given-names>M</given-names>
</name>
<name>
<surname>F&#xe9;lix</surname>
<given-names>E</given-names>
</name>
<etal/>
</person-group> <article-title>ChEMBL: towards direct deposition of bioassay data</article-title>. <source>Nucleic Acids Res</source> (<year>2019</year>) <volume>47</volume>(<issue>D1</issue>):<fpage>D930</fpage>&#x2013;<lpage>D940</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gky1075</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Jorissen</surname>
<given-names>RN</given-names>
</name>
<name>
<surname>Gilson</surname>
<given-names>MK</given-names>
</name>
</person-group>. <article-title>BindingDB: a web-accessible database of experimentally determined protein-ligand binding affinities</article-title>. <source>Nucleic Acids Res</source> (<year>2007</year>) <volume>35</volume>:<fpage>D198</fpage>&#x2013;<lpage>201</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkl999</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dix</surname>
<given-names>DJ</given-names>
</name>
<name>
<surname>Houck</surname>
<given-names>KA</given-names>
</name>
<name>
<surname>Martin</surname>
<given-names>MT</given-names>
</name>
<name>
<surname>Richard</surname>
<given-names>AM</given-names>
</name>
<name>
<surname>Setzer</surname>
<given-names>RW</given-names>
</name>
<name>
<surname>Kavlock</surname>
<given-names>RJ</given-names>
</name>
</person-group>. <article-title>The ToxCast program for prioritizing toxicity testing of environmental chemicals</article-title>. <source>Toxicol Sci</source> (<year>2007</year>) <volume>95</volume>(<issue>1</issue>):<fpage>5</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kfl103</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davis</surname>
<given-names>AP</given-names>
</name>
<name>
<surname>Grondin</surname>
<given-names>CJ</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>RJ</given-names>
</name>
<name>
<surname>Sciaky</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>TC</given-names>
</name>
<etal/>
</person-group> <article-title>Comparative toxicogenomics database (CTD): update 2021</article-title>. <source>Nucleic Acids Res</source> (<year>2021</year>) <volume>49</volume>(<issue>D1</issue>):<fpage>D1138</fpage>&#x2013;<lpage>43</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa891</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Jones</surname>
<given-names>WD</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Ning</surname>
<given-names>B</given-names>
</name>
<etal/>
</person-group> <article-title>Technical reproducibility of genotyping SNP arrays used in genome-wide association studies</article-title>. <source>PLoS One</source> (<year>2012</year>) <volume>7</volume>(<issue>9</issue>):<fpage>e44483</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0044483</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pan</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Kusko</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>C</given-names>
</name>
<etal/>
</person-group> <article-title>Correction to: similarities and differences between variants called with human reference genome HG19 or HG38</article-title>. <source>BMC Bioinformatics</source> (<year>2019</year>) <volume>20</volume>(<issue>1</issue>):<fpage>252</fpage>. <pub-id pub-id-type="doi">10.1186/s12859-019-2776-7</pub-id>
</citation>
</ref>
<ref id="B34">
<label>34.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hardy</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Douglas</surname>
<given-names>N</given-names>
</name>
<name>
<surname>Helma</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Rautenberg</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Jeliazkova</surname>
<given-names>N</given-names>
</name>
<name>
<surname>Jeliazkov</surname>
<given-names>V</given-names>
</name>
<etal/>
</person-group> <article-title>Collaborative development of predictive toxicology applications</article-title>. <source>J Cheminformatics</source> (<year>2010</year>) <volume>2</volume>(<issue>7</issue>):<fpage>7</fpage>. <pub-id pub-id-type="doi">10.1186/1758-2946-2-7</pub-id>
</citation>
</ref>
<ref id="B35">
<label>35.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hardy</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Apic</surname>
<given-names>G</given-names>
</name>
<name>
<surname>Carthew</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Clark</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Cook</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Dix</surname>
<given-names>I</given-names>
</name>
<etal/>
</person-group> <article-title>A toxicology ontology roadmap</article-title>. <source>ALTEX</source> (<year>2012</year>) <volume>29</volume>:<fpage>129</fpage>&#x2013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.14573/altex.2012.2.129</pub-id>
</citation>
</ref>
<ref id="B36">
<label>36.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hardy</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Apic</surname>
<given-names>G</given-names>
</name>
<name>
<surname>Carthew</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Clark</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Cook</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Dix</surname>
<given-names>I</given-names>
</name>
<etal/>
</person-group> <article-title>Toxicology ontology perspectives</article-title>. <source>ALTEX</source> (<year>2012</year>) <volume>29</volume>:<fpage>139</fpage>&#x2013;<lpage>56</lpage>. <pub-id pub-id-type="doi">10.14573/altex.2012.2.139</pub-id>
</citation>
</ref>
<ref id="B37">
<label>37.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kohonen</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Benfenati</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Bower</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Ceder</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Crump</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Cross</surname>
<given-names>K</given-names>
</name>
<etal/>
</person-group> <article-title>The ToxBank data warehouse: supporting the replacement of <italic>in vivo</italic> repeated dose systemic toxicity testing</article-title>. <source>Mol Inform</source> (<year>2013</year>) <volume>32</volume>(<issue>Issue 1</issue>):<fpage>47</fpage>&#x2013;<lpage>63</lpage>. <pub-id pub-id-type="doi">10.1002/minf.201200114</pub-id>
</citation>
</ref>
<ref id="B38">
<label>38.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fourches</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Muratov</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Tropsha</surname>
<given-names>A</given-names>
</name>
</person-group>. <article-title>Trust, but verify: on the importance of chemical structure curation in cheminformatics and QSAR modeling research</article-title>. <source>J Chem Inf Model</source> (<year>2010</year>) <volume>50</volume>:<fpage>1189</fpage>&#x2013;<lpage>204</lpage>. <pub-id pub-id-type="doi">10.1021/ci100176x</pub-id>
</citation>
</ref>
<ref id="B39">
<label>39.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fourches</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Muratov</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Tropsha</surname>
<given-names>A</given-names>
</name>
</person-group>. <article-title>Curation of chemogenomics data</article-title>. <source>Nat Chem Biol</source> (<year>2015</year>) <volume>11</volume>:<fpage>535</fpage>. <pub-id pub-id-type="doi">10.1038/nchembio.1881</pub-id>
</citation>
</ref>
<ref id="B40">
<label>40.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fourches</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Muratov</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Tropsha</surname>
<given-names>A</given-names>
</name>
</person-group>. <article-title>Trust, but Verify II: A Practical Guide to Chemogenomics Data Curation</article-title>. <source>J Chem Inf Model</source>. (<year>2016</year>) <volume>56</volume>(<issue>7</issue>):<fpage>1243</fpage>&#x2013;<lpage>1252</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.6b00129</pub-id>
</citation>
</ref>
<ref id="B41">
<label>41.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tropsha</surname>
<given-names>A</given-names>
</name>
</person-group>. <article-title>Best practices for QSAR model development, validation, and exploitation</article-title>. <source>Mol Inform</source> (<year>2010</year>) <volume>29</volume>(<issue>6-7</issue>):<fpage>476</fpage>&#x2013;<lpage>88</lpage>. <pub-id pub-id-type="doi">10.1002/minf.201000061</pub-id>
</citation>
</ref>
<ref id="B42">
<label>42.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Idakwo</surname>
<given-names>G</given-names>
</name>
<name>
<surname>Thangapandian</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Luttrell</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>N</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Z</given-names>
</name>
<etal/>
</person-group> <article-title>Structure-activity relationship-based chemical classification of highly imbalanced Tox21 datasets</article-title>. <source>J Cheminform</source> (<year>2020</year>) <volume>12</volume>(<issue>1</issue>):<fpage>66</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-020-00468-x</pub-id>
</citation>
</ref>
<ref id="B43">
<label>43.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Qian</surname>
<given-names>F</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>L</given-names>
</name>
<etal/>
</person-group> <article-title>Mold(2), molecular descriptors from 2D structures for chemoinformatics and toxicoinformatics</article-title>. <source>J Chem Inf Model</source> (<year>2008</year>) <volume>48</volume>(<issue>7</issue>):<fpage>1337</fpage>&#x2013;<lpage>44</lpage>. <pub-id pub-id-type="doi">10.1021/ci800038f</pub-id>
</citation>
</ref>
<ref id="B44">
<label>44.</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Sakkiah</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Yavas</surname>
<given-names>G</given-names>
</name>
<etal/>
</person-group> <article-title>Mold2 descriptors facilitate development of machine learning and deep learning models for predicting toxicity of chemicals</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Hong</surname>
<given-names>H</given-names>
</name>
</person-group>, editor. <source>Machine learning and deep learning in computational toxicology</source>. <publisher-loc>Cham</publisher-loc>: <publisher-name>Springer International Publishing</publisher-name> (<year>2023</year>). p. <fpage>297</fpage>&#x2013;<lpage>321</lpage>.</citation>
</ref>
<ref id="B45">
<label>45.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Khan</surname>
<given-names>MKH</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W</given-names>
</name>
<etal/>
</person-group> <article-title>Developing a SARS-CoV-2 main protease binding prediction random forest model for drug repurposing for COVID-19 treatment</article-title>. <source>Exp Biol Med (Maywood)</source> (<year>2023</year>) <volume>248</volume>(<issue>21</issue>):<fpage>1927</fpage>&#x2013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.1177/15353702231209413</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>