<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JBB</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Bioinform Biotech</journal-id>
      <journal-title>JMIR Bioinformatics and Biotechnology</journal-title>
      <issn pub-type="epub">2563-3570</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v5i1e56538</article-id>
      <article-id pub-id-type="pmid">39046787</article-id>
      <article-id pub-id-type="doi">10.2196/56538</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Deep Learning–Based Identification of Tissue of Origin for Carcinomas of Unknown Primary Using MicroRNA Expression: Algorithm Development and Validation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Uzun</surname>
            <given-names>Alper</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Robertson</surname>
            <given-names>Alan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Timmaraju</surname>
            <given-names>Venkata Arun</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Raghu</surname>
            <given-names>Ananya</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0002-4282-3163</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Raghu</surname>
            <given-names>Anisha</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0002-2192-5259</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Wise</surname>
            <given-names>Jillian F</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Department of Biology and Biomedical Sciences</institution>
            <institution>Salve Regina University</institution>
            <addr-line>100 Ochre Point Avenue</addr-line>
            <addr-line>Newport, RI, 02840</addr-line>
            <country>United States</country>
            <phone>1 401 847 6650 ext 2822</phone>
            <email>jillian.wise@salve.edu</email>
          </address>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2575-869X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Quarry Lane School</institution>
        <addr-line>San Ramon, CA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Biology and Biomedical Sciences</institution>
        <institution>Salve Regina University</institution>
        <addr-line>Newport, RI</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Broad Institute of MIT and Harvard</institution>
        <addr-line>Cambridge, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Pre-College Programs</institution>
        <institution>Tufts University</institution>
        <addr-line>Medford, MA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Jillian F Wise <email>jillian.wise@salve.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>24</day>
        <month>7</month>
        <year>2024</year>
      </pub-date>
      <volume>5</volume>
      <elocation-id>e56538</elocation-id>
      <history>
        <date date-type="received">
          <day>18</day>
          <month>1</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>6</day>
          <month>2</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>2</day>
          <month>4</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>25</day>
          <month>4</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Ananya Raghu, Anisha Raghu, Jillian F Wise. Originally published in JMIR Bioinformatics and Biotechnology (https://bioinform.jmir.org), 24.07.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Bioinformatics and Biotechnology, is properly cited. The complete bibliographic information, a link to the original publication on https://bioinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://bioinform.jmir.org/2024/1/e56538" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Carcinoma of unknown primary (CUP) is a subset of metastatic cancers in which the primary tissue source of the cancer cells remains unidentified. CUP is the eighth most common malignancy worldwide, accounting for up to 5% of all malignancies. Representing an exceptionally aggressive metastatic cancer, the median survival is approximately 3 to 6 months. The tissue in which cancer arises plays a key role in our understanding of sensitivities to various forms of cell death. Thus, the lack of knowledge on the tissue of origin (TOO) makes it difficult to devise tailored and effective treatments for patients with CUP. Developing quick and clinically implementable methods to identify the TOO of the primary site is crucial in treating patients with CUP. Noncoding RNAs may hold potential for origin identification and provide a robust route to clinical implementation due to their resistance against chemical degradation.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to investigate the potential of microRNAs, a subset of noncoding RNAs, as highly accurate biomarkers for detecting the TOO through data-driven, machine learning approaches for metastatic cancers.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We used microRNA expression data from The Cancer Genome Atlas data set and assessed various machine learning approaches, from simple classifiers to deep learning approaches. As a test of our classifiers, we evaluated the accuracy on a separate set of 194 primary tumor samples from the Sequence Read Archive. We used permutation feature importance to determine the potential microRNA biomarkers and assessed them with principal component analysis and t-distributed stochastic neighbor embedding visualizations.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our results show that it is possible to design robust classifiers to detect the TOO for metastatic samples on The Cancer Genome Atlas data set, with an accuracy of up to 97% (351/362), which may be used in situations of CUP. Our findings show that deep learning techniques enhance prediction accuracy. We progressed from an initial accuracy prediction of 62.5% (226/362) with decision trees to 93.2% (337/362) with logistic regression, finally achieving 97% (351/362) accuracy using deep learning on metastatic samples. On the Sequence Read Archive validation set, a lower accuracy of 41.2% (77/188) was achieved by the decision tree, while deep learning achieved a higher accuracy of 80.4% (151/188). Notably, our feature importance analysis showed the top 3 most important features for predicting TOO to be microRNA-10b, microRNA-205, and microRNA-196b, which aligns with previous work.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our findings highlight the potential of using machine learning techniques to devise accurate tests for detecting TOO for CUP. Since microRNAs are carried throughout the body via extracellular vesicles secreted from cells, they may serve as key biomarkers for liquid biopsy due to their presence in blood plasma. Our work serves as a foundation toward developing blood-based cancer detection tests based on the presence of microRNA.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>cancer genomics</kwd>
        <kwd>machine learning algorithms</kwd>
        <kwd>deep learning</kwd>
        <kwd>gene expression</kwd>
        <kwd>RNA</kwd>
        <kwd>RNAs</kwd>
        <kwd>cancer</kwd>
        <kwd>oncology</kwd>
        <kwd>tumor</kwd>
        <kwd>tumors</kwd>
        <kwd>tissue</kwd>
        <kwd>tissues</kwd>
        <kwd>metastatic</kwd>
        <kwd>microRNA</kwd>
        <kwd>microRNAs</kwd>
        <kwd>gene</kwd>
        <kwd>genes</kwd>
        <kwd>genomic</kwd>
        <kwd>genomics</kwd>
        <kwd>machine learning</kwd>
        <kwd>algorithm</kwd>
        <kwd>algorithms</kwd>
        <kwd>carcinoma</kwd>
        <kwd>genetics</kwd>
        <kwd>genome</kwd>
        <kwd>detection</kwd>
        <kwd>bioinformatics</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Carcinoma of unknown primary (CUP) originates when a patient presents at diagnosis with malignant disease across the body; yet, the cancer cells tissue of origin (TOO) remains unidentifiable. Thus, CUP is a unique subset of metastasized cancer representing an advanced stage in which cancer has gained the ability to thrive in new tissue sites and has spread from the primary tumor site. In the United States, an estimated 31,490 people were diagnosed with cases of cancer of unknown TOO in 2008. This accounts for nearly 3%-5% of all cancer cases [<xref ref-type="bibr" rid="ref1">1</xref>] and given the lack of knowledge on tissue response to current therapeutics the median survival of patients remains only 3-9 months [<xref ref-type="bibr" rid="ref2">2</xref>]. In many cases of CUP, the primary site is never identified, preventing the use of treatment that can be effective for the true TOO [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. It has been demonstrated that pinpointing the primary site can significantly increase survival rates by enabling precise and targeted treatment [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
      <p>Unfortunately, primary tumor identification poses various challenges. Techniques such as serum tumor markers and imaging tests are used to identify the TOO, although only 30% of these tests are successful. Moreover, some positive findings can be misleading [<xref ref-type="bibr" rid="ref6">6</xref>] and CUP diagnostic workups are often time-consuming, expensive, and unsuccessful [<xref ref-type="bibr" rid="ref7">7</xref>]. These difficulties have spurred interest in using genetic expression data, such as microRNA, to identify the TOO.</p>
      <p>MicroRNAs belong to a class of noncoding regulatory RNAs, small single-stranded RNA molecules that are between 19 and 25 nucleotides long and are involved in the regulation of gene expression of mRNAs. MicroRNAs hold promise as informative biomarkers for cancer due to their significant involvement in cellular processes such as cell division, apoptosis, proliferation, and oncogenesis [<xref ref-type="bibr" rid="ref8">8</xref>]. Beyond their intracellular role in gene regulation, microRNAs may be carried throughout the body via extracellular vesicles secreted from cells and have been identified in the blood. Additionally, microRNA, unlike mRNA, is characterized by resistance to extreme temperatures and pH. This makes microRNAs far more stable biomarkers [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      <p>Previous work [<xref ref-type="bibr" rid="ref11">11</xref>] demonstrates that microRNA expression is more informative in classifying tumor samples by their origin in comparison to mRNA. Specifically, microRNAs are better at classifying poorly differentiated tumors [<xref ref-type="bibr" rid="ref12">12</xref>]. Moreover, microRNAs have shown great potential for identifying TOO for cancers of unknown primary origin [<xref ref-type="bibr" rid="ref13">13</xref>]. MicroRNAs have been investigated as prognostic and diagnostic biomarkers extensively in the research community and have even been found to be deregulated in numerous cancers [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
      <p>With the wide availability of large data sets containing gene expression data, computational techniques such as machine learning have emerged as promising tools for improving TOO detection. Machine learning implementations have increased accuracy in predicting cancer and have the potential to improve the diagnosis, prognosis, and therapy selection for patients with cancer [<xref ref-type="bibr" rid="ref15">15</xref>]. The 3 traditional machine learning models are decision trees, random forests, and logistic regression. Decision trees [<xref ref-type="bibr" rid="ref16">16</xref>] attempt to partition the training set into subsets that contain samples of only one class, thereby predicting the class of interest. Random forests are ensemble classifiers, combining multiple trees for higher accuracy [<xref ref-type="bibr" rid="ref17">17</xref>]. In contrast, logistic regression is a predictive algorithm to find a model that can predict categorical output [<xref ref-type="bibr" rid="ref18">18</xref>]. Deep learning is a subset of machine learning designed to mimic the human brain through the use of artificial neural networks by using many layers and larger data sets. Generally, deep learning techniques are well suited for discovering and recognizing complex patterns in data that traditional machine learning methods can often miss. The increasing incorporation of deep learning in health care along with the availability of highly characterized cancer data sets has further accelerated research into the applications of deep learning in the analysis of the biology of cancer [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      <p>Given the complexities of diagnosing a TOO from a cancer that has spread throughout the body, previous investigators have applied machine learning methods to determine TOO for metastasized cancers [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. Longstanding techniques of microarrays and polymerase chain reaction have been used for the generation of machine learning models for CUP detection, including support vector machines with 89% accuracy [<xref ref-type="bibr" rid="ref22">22</xref>] and the k-nearest neighbor algorithm with 82% accuracy [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. LoCUP, a TOO classifier, was the first machine learning model using a multinomial logistic regression classifier with ridge penalties to incorporate tumor purity and reached a 95.8% accuracy [<xref ref-type="bibr" rid="ref25">25</xref>]. Cup AI Dx [<xref ref-type="bibr" rid="ref20">20</xref>] used mRNA gene expression data from The Cancer Genome Atlas (TCGA) data set to train a network based on the popular inception model [<xref ref-type="bibr" rid="ref22">22</xref>] to identify the TOO, achieving an accuracy of 96.7% on a validation set of 354 TCGA metastatic samples. The TOD-CUP method [<xref ref-type="bibr" rid="ref21">21</xref>] addressed the variation in mRNA platforms and used a gene expression rank–based majority vote algorithm to achieve an overall accuracy of 94%. Early work with microRNAs and nondeep learning machine learning algorithms showed 84% accuracy with k-nearest neighbor models [<xref ref-type="bibr" rid="ref26">26</xref>] and binary decision trees at 85% [<xref ref-type="bibr" rid="ref27">27</xref>]. However, the investigation of deep learning machine learning models may improve these accuracies with TOO detection by microRNA. MicroRNAs are also at the forefront of extracellular vesicle liquid biopsy development and may be better suited for the noninvasive classification of TOO [<xref ref-type="bibr" rid="ref28">28</xref>].</p>
      <p>This study sets out to explore the possibility of developing a model for using microRNA profiles from metastatic tissues to determine the TOO through the application of deep learning techniques. Successful TOO detection from microRNAs will provide a route for cancer detection without requiring samples from the primary tumor site in cases of CUP malignancies. We hypothesize that we would be able to predict the origin of metastatic tumors with higher accuracy than previous reports by leveraging larger data sets of microRNA profiles from both normal and primary site tissues to train the model.</p>
      <p>The data for this project were collected from TCGA data set [<xref ref-type="bibr" rid="ref29">29</xref>] and the Sequence Read Archive (SRA) [<xref ref-type="bibr" rid="ref30">30</xref>] from microRNA tissue expression database. The TCGA data set contains samples from 18 different cancer types representing 9648 samples, of which 365 were metastatic, 633 were solid normal, and 8650 were from the primary tumor site. Each sample consisted of microRNA expression data, available as RPM (reads per million mapped reads), as well as metadata including age and gender. We split TCGA data set into a combined primary tumor or solid normal samples training set and a metastatic sample test set. We then further split the primary tumor and solid normal samples into a training and validation set with a 9:1 ratio. The training set consisted of 8355 samples and the validation set consisted of 928 samples.</p>
      <p>We use 2 data sets for evaluating the performance of our models. The SRA test data set consisted of 194 samples from 5 different cancer types, all of which were from the primary tumor. We also used the metastatic samples from TCGA data set as our final test data set, which contained samples from 6 cancer types. We developed 4 machine learning models, a decision tree classifier, random forest, logistic regression, and finally, a deep learning model. Our deep learning model performed with the highest accuracy, achieving an accuracy of 97% in detecting TOO for metastatic samples and 80.4% on the nonmetastatic SRA cohort. Feature importance analysis revealed the top 3 differentiating microRNA targets as microRNA-10b, microRNA-196b, and microRNA-205, which confirms prior investigations on microRNAs associated with metastatic cancer [<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>].</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Sets</title>
        <p>In <xref rid="figure1" ref-type="fig">Figure 1</xref>, we outline the data preprocessing pipeline. Our study analyzed published data and did not generate any new sequencing data. TCGA data were obtained [<xref ref-type="bibr" rid="ref29">29</xref>]. Data were further filtered by querying the Genomics Data Commons via the Application Programming Interfaces specified [<xref ref-type="bibr" rid="ref34">34</xref>]. We restricted the tissue type to be one of the primary tumors, solid tissue normal, or metastatic. We further restricted the data to microRNA transcriptome profiling and picked data corresponding to 18 types of cancer each containing a sufficient number of samples, obtaining 9648 files (<xref rid="figure2" ref-type="fig">Figure 2</xref> and Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        <p>To obtain the SRA data, we used the microRNA tissue expression database portal and restricted the cancer types to 6 types of cancer, seen in further detail in <xref rid="figure2" ref-type="fig">Figure 2</xref>. We obtained 207 samples, each containing expression data for 2656 microRNAs. After removing samples with missing features, 194 samples were remaining.</p>
        <p>We selected microRNA features that were expressed in at least 50% (4824/9648) of the samples, which reduced the number of features in the TCGA data set from 1889 to 562. We then picked the common features between the SRA data set and the TCGA data set, reducing this number to 497. On both data sets, we normalized the RPM of the selected features per sample to sum to a million. We then transformed the RPM values using the transformation log(RPM + 1) to restrict the range of the input.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overview of our data processing pipeline. Data from the TCGA GDC portal and SRA miTED portal was obtained. Underexpressed microRNA and samples containing missing features from the miTED data were filtered. Common features were selected between both data sets, reducing the number of microRNA to 497. Features were normalized as reads per million per sample and log-transformed. TCGA data set was split into (1) the primary tissue and solid normal set and (2) the metastatic test set. The first, combined, set was further split into a training and validation set. GDC: Genomics Data Commons; miTED: microRNA tissue expression database; SRA: Sequence Read Archive; TCGA: The Cancer Genome Atlas.</p>
          </caption>
          <graphic xlink:href="bioinform_v5i1e56538_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>The Cancer Genome Atlas (TCGA) data set distribution across tissue of origin (TOO). Distribution of the different cancer samples in the TCGA data set that are from the primary tumor site, solid tissue, or metastatic. Note that metastatic samples primarily corresponded to the skin as the TOO.</p>
          </caption>
          <graphic xlink:href="bioinform_v5i1e56538_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Training Procedure</title>
        <p>For the implementation of decision tree, random forest, and logistic regression classifiers, the sklearn package was used [<xref ref-type="bibr" rid="ref35">35</xref>]. We used classification accuracy as the primary metric to evaluate our models. Deep learning models were created with PyTorch (Meta AI) [<xref ref-type="bibr" rid="ref36">36</xref>]. To optimize and train our neural network, we used Adam optimizer and trained for 50 epochs. Since our objective was classification, we used softmax with cross-entropy loss [<xref ref-type="bibr" rid="ref37">37</xref>] to optimize the model. We used the validation set to determine the hyperparameters of the models and picked the best-performing model for further evaluation on the test set. Feature importance was calculated with sklearn’s permutation feature importance function.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study was conducted in accordance with the ethical standards of the Salve Regina University ethical standards. The research study was reviewed by the institutional review board of Salve Regina University and was determined to be exempt from further review as per criteria contained in Title 45 CFR §46.104(d) section 4ii of federal regulations. As such, the study used only publicly available deidentified or anonymized data, and the project was reviewed (Exemption #Wise.2024.6.11).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>In order to develop a model to detect TOO, we set out to find the best-performing machine learning model for determining the TOO from the TCGA primary tumor and solid normal tissue cohorts. The models were then tested on the validation set, and we could accurately determine the TOO based on primary or normal microRNA profiles, with an accuracy of over 90% for 15 of 18 different tissue types using deep learning (<xref ref-type="table" rid="table1">Table 1</xref> and Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
      <p>We can note that the deep learning model performs consistently the highest on the validation set, with logistic regression and random forest classifiers providing comparable performance.</p>
      <p>We then set out to apply our best-performing deep learning model and evaluate its performance on the SRA test set that contains microRNA expression data from primary tumors (<xref ref-type="table" rid="table2">Table 2</xref>). We accurately determined the TOO with an accuracy of over 90% (90/100) for 3 of the 5 cancer types but saw a decrease in accuracy for bladder and colorectal cancer.</p>
      <p>Finally, we analyzed our deep learning model on microRNA expression data from metastatic tissue samples in the TCGA data set (<xref ref-type="table" rid="table3">Table 3</xref>). We accurately determined the TOO with an accuracy of over 85% (308/362) for all cancer types with an average of 97% (351/362).</p>
      <p>Since random forest and logistic regression classifiers provided comparable performance on the primary or normal validation set, we compared the classifier accuracy on both test sets for all created models (<xref ref-type="table" rid="table4">Table 4</xref>).</p>
      <p>The input features of our models consist of microRNA expression data common to TCGA and SRA data sets. <xref rid="figure3" ref-type="fig">Figure 3</xref> describes the overall architecture of the model, which consists of 2 linear layers. The second layer has 18 outputs, corresponding to each cancer type. The cancer type corresponds to the output with the maximum value.</p>
      <p>We used dropout for the input layer [<xref ref-type="bibr" rid="ref38">38</xref>] as it is a common technique to improve model accuracy and reduce overfitting. We also augmented our input data with noise.</p>
      <p>To evaluate the performance of our models, we computed confusion matrices for performance on metastatic samples (Figure S2A and S2B in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) and plotted the receiver operating characteristic curves for performance on metastatic skin cancer (Figure S2C and S2D in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), as the majority of the metastatic samples were obtained from skin cancer cases. We observed that the deep learning model performed significantly better than our decision tree model, which was consistent when evaluated on the SRA validation cohort (Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). To illustrate the effectiveness of our models, we created Sankey plots representing the deep learning model performance on metastatic samples from the TCGA data set and primary tissue sites from the SRA data set (<xref rid="figure4" ref-type="fig">Figure 4</xref>).</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Model accuracies on the validation test set. Performance of 4 models for the identification of tissue of origin. The validation set consists of both primary tumor and solid normal tissue samples from The Cancer Genome Atlas data set.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="260"/>
          <col width="170"/>
          <col width="180"/>
          <col width="220"/>
          <col width="170"/>
          <thead>
            <tr valign="top">
              <td>Cancer type</td>
              <td>Decision tree (%)</td>
              <td>Random forest (%)</td>
              <td>Logistic regression (%)</td>
              <td>Deep learning (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Breast (n=131)</td>
              <td>91.6</td>
              <td>99.2</td>
              <td>96.9</td>
              <td>99.2</td>
            </tr>
            <tr valign="top">
              <td>Uterus (n=73)</td>
              <td>76.7</td>
              <td>100</td>
              <td>90.4</td>
              <td>94.5</td>
            </tr>
            <tr valign="top">
              <td>Ovary (n=48)</td>
              <td>89.6</td>
              <td>91.6</td>
              <td>93.8</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Prostrate (n=54)</td>
              <td>94.5</td>
              <td>100</td>
              <td>100</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Testis (n=18)</td>
              <td>61.1</td>
              <td>94.5</td>
              <td>94.4</td>
              <td>88.9</td>
            </tr>
            <tr valign="top">
              <td>Lung (n=117)</td>
              <td>81.1</td>
              <td>95.7</td>
              <td>82.9</td>
              <td>98.2</td>
            </tr>
            <tr valign="top">
              <td>Kidney (n=116)</td>
              <td>94.8</td>
              <td>100</td>
              <td>99.1</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Bladder (n=35)</td>
              <td>71.4</td>
              <td>95.7</td>
              <td>88.5</td>
              <td>88.5</td>
            </tr>
            <tr valign="top">
              <td>Esophagus (n=24)</td>
              <td>33.3</td>
              <td>29.2</td>
              <td>54.1</td>
              <td>83.3</td>
            </tr>
            <tr valign="top">
              <td>Liver (n=42)</td>
              <td>97.6</td>
              <td>100</td>
              <td>97.6</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Pancreas (n=20)</td>
              <td>55.0</td>
              <td>95</td>
              <td>95.2</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Pleura (n=7)</td>
              <td>42.8</td>
              <td>85.7</td>
              <td>100</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Colorectal (n=57)</td>
              <td>85.6</td>
              <td>98.2</td>
              <td>94.7</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Skin (n=6)</td>
              <td>66.6</td>
              <td>100</td>
              <td>100</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Stomach (n =45)</td>
              <td>82.2</td>
              <td>97.8</td>
              <td>75.5</td>
              <td>91.1</td>
            </tr>
            <tr valign="top">
              <td>Brain (n=47)</td>
              <td>100</td>
              <td>100</td>
              <td>100</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Cervix (n=32)</td>
              <td>62.5</td>
              <td>78.1</td>
              <td>78.1</td>
              <td>93.7</td>
            </tr>
            <tr valign="top">
              <td>Thyroid (n=55)</td>
              <td>98.1</td>
              <td>100</td>
              <td>100</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Overall—across cancer types</td>
              <td>84.6</td>
              <td>95.3</td>
              <td>96.4</td>
              <td>97.2</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Performance of our deep learning model for the identification of tissue of origin on the primary tissue site cohorts from the SRA<sup>a</sup>.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="430"/>
          <col width="570"/>
          <thead>
            <tr valign="top">
              <td>Cancer type</td>
              <td>SRA test accuracy—deep learning (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Breast (n=44)</td>
              <td>91.6</td>
            </tr>
            <tr valign="top">
              <td>Prostrate (n=37)</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Lung (n=19)</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Bladder (n=10)</td>
              <td>80</td>
            </tr>
            <tr valign="top">
              <td>Colorectal (n=78)</td>
              <td>58.9</td>
            </tr>
            <tr valign="top">
              <td>Skin (n=0)</td>
              <td>N/A<sup>b</sup></td>
            </tr>
            <tr valign="top">
              <td>Overall—across cancer types</td>
              <td>80.4</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup>SRA: Sequence Read Archive.</p>
          </fn>
          <fn id="table2fn2">
            <p><sup>b</sup>N/A: not applicable.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Performance of our deep learning model for the identification of tissue of origin in metastatic tumor tissue.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="520"/>
          <col width="480"/>
          <thead>
            <tr valign="bottom">
              <td>Cancer type</td>
              <td>TCGA<sup>a</sup> metastatic test accuracy—deep learning (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Breast (n=7)</td>
              <td>85.7</td>
            </tr>
            <tr valign="top">
              <td>Prostrate (n=1)</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Lung (n=0)</td>
              <td>N/A<sup>b</sup></td>
            </tr>
            <tr valign="top">
              <td>Bladder (n=1)</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Colorectal (n=1)</td>
              <td>100</td>
            </tr>
            <tr valign="top">
              <td>Skin (n=352)</td>
              <td>97.4</td>
            </tr>
            <tr valign="top">
              <td>Overall—across cancer types</td>
              <td>97</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table3fn1">
            <p><sup>a</sup>TCGA: The Cancer Genome Atlas.</p>
          </fn>
          <fn id="table3fn2">
            <p><sup>b</sup>N/A: not applicable.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table4">
        <label>Table 4</label>
        <caption>
          <p>Accuracy of developed models on metastatic and SRA<sup>a</sup> test sets. The accuracy for all 4 models is presented on the TCGA<sup>b</sup> metastatic and SRA cohorts. The decision tree classifier had a depth of 14 and the random forest had a depth of 19.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="330"/>
          <col width="350"/>
          <col width="320"/>
          <thead>
            <tr valign="top">
              <td>Classifier</td>
              <td>Accuracy on TCGA metastatic test set (%)</td>
              <td>Accuracy on SRA test set (%)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Decision tree</td>
              <td>62.5</td>
              <td>41.2</td>
            </tr>
            <tr valign="top">
              <td>Random forest</td>
              <td>94.2</td>
              <td>74.2</td>
            </tr>
            <tr valign="top">
              <td>Logistic regression</td>
              <td>93.2</td>
              <td>71.6</td>
            </tr>
            <tr valign="top">
              <td>Deep learning</td>
              <td>97</td>
              <td>80.4</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table4fn1">
            <p><sup>a</sup>SRA: Sequence Read Archive.</p>
          </fn>
          <fn id="table4fn2">
            <p><sup>b</sup>TCGA: The Cancer Genome Atlas.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>A schematic of the machine learning model architecture. MiRNA: microRNA.</p>
        </caption>
        <graphic xlink:href="bioinform_v5i1e56538_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure4" position="float">
        <label>Figure 4</label>
        <caption>
          <p>Sankey plot for deep learning model on Sequence Read Archive (SRA) and The Cancer Genome Atlas (TCGA) test data sets. (A) On the TCGA data set, our deep learning model is able to correctly classify 333 out of 343 metastatic skin cancer samples, demonstrating high accuracy. (B) On the SRA test data set, we show representative plots for breast and colon cancers, showing high accuracy for breast cancer tissue of origin identification. (C) The model performance on colon cancer is less accurate due to microRNA expression consistently overlapping for colon and stomach cancers [<xref ref-type="bibr" rid="ref40">40</xref>].</p>
        </caption>
        <graphic xlink:href="bioinform_v5i1e56538_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>These results confirm our hypotheses and show that we were able to predict the TOO with high accuracy using deep learning. Furthermore, our findings demonstrated that deep learning techniques significantly increase the accuracy in comparison to decision tree, logistic regression, and random forest models.</p>
      <p>To reveal the significance of individual features, we performed feature importance analysis using the permutation feature importance method (<xref rid="figure5" ref-type="fig">Figure 5</xref>A). The top 3 microRNAs contributing to our deep learning model based on our combined normal and primary site training set are microRNA-10b, microRNA-196, and microRNA-205. MicroRNA-10b has been shown to function as a metastasis-promoting factor in many cancer types. In fact, it was one of the first microRNAs to have been discovered with aberrant expression in cancer cells [<xref ref-type="bibr" rid="ref31">31</xref>]. MicroRNA-196 has been linked to the progression of many cancers, notably metastatic colorectal cancer [<xref ref-type="bibr" rid="ref32">32</xref>], while microRNA-205 expression is downregulated in metastatic breast and prostate cancer [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
      <p>To further understand the significance of the identified important features, we compute a heat map (<xref rid="figure5" ref-type="fig">Figure 5</xref>B) showing the microRNA expression values for the top 10 microRNA features for samples in the training data set. Visually, it is apparent that the microRNA features can be used to distinguish the cancer type. To further validate this, we perform principal component analysis and t-SNE analysis using only the top 10 features (<xref rid="figure5" ref-type="fig">Figures 5</xref>C and 5D). We note that the t-SNE plot shows a clear separation of features into distinct clusters corresponding to each cancer type, showing the significance of the features for detecting the TOO.</p>
      <fig id="figure5" position="float">
        <label>Figure 5</label>
        <caption>
          <p>MicroRNA feature importance visualizations. (A) Permutation feature importance for the top 3 microRNA candidates. A bar graph of the importance values for the 3 top microRNA candidates for the logistic regression model. (B) MicroRNA expression heatmap. MicroRNA expression values for the top 10 most important features (as determined by permutation feature importance) for a subset of samples. The top 10 microRNA features can cluster cancer type. Low mir-205 and mir-944 and a high mir-10b are indicative of colorectal cancer. Similarly, low expressions for microRNA-429, microRNA-483, microRNA-215, microRNA-944, microRNA-1247, microRNA-375, and microRNA-205 are indicative of kidney cancer. (C) PCA visualization. (D) t-SNE visualization. PCA and t-SNE visualization of data corresponding to the 6 cancer types with the most samples in our data set, using only the top 10 microRNA features. In the PCA plot, note that there is significant overlap between the cancer types, while in the t-SNE plot, the cancer types are well separated, suggesting that with 10 microRNA features, machine learning models may correctly identify patterns and predict tissue of origin. PCA: principal component analysis; t-SNE: t-distributed stochastic neighbor embedding.</p>
        </caption>
        <graphic xlink:href="bioinform_v5i1e56538_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In these investigations, while using successively more powerful classifiers, we were able to detect the TOO on solely metastatic cancer samples with accuracies ranging from 62.5% (226/362) with a decision tree to 97% (351/362) with a deep learning model. Our methods show that one can leverage larger amounts of gene expression data for primary and solid tissue normal tumor samples (~10,000 samples) to come up with accurate classifiers to determine TOO for metastatic cancer (currently limited to ~300 samples). In order to verify the robustness of our model, we assessed its performance on primary tumor data from the SRA and obtained accuracies ranging from 41.2% (77/188) with decision tree to 80.4% (151/188) when using deep learning. Our methods have also identified promising microRNA candidates, reaffirming prior research in this field and demonstrating the potential of machine learning.</p>
        <p>The predominant failure of our model on the SRA test cohort was within colorectal cancer as can be seen in <xref rid="figure4" ref-type="fig">Figure 4</xref>C. Many colorectal samples were incorrectly classified as stomach or gastric cancer. This is consistent with previous research in this area as microRNA expression profiles for gastrointestinal cancers show significant overlap [<xref ref-type="bibr" rid="ref39">39</xref>]. In addition, colorectal and stomach cancer are often synchronous with probabilities ranging from 20.1% to 37.2% [<xref ref-type="bibr" rid="ref40">40</xref>].</p>
        <p>We used permutation feature importance, a model-agnostic metric that permutes features across samples in the test set to assess the change in model accuracy. The results are in line with existing research in this area and serve as a good indicator of the feasibility of machine learning techniques to identify promising biomarkers.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>To effectively use our model in clinical care, accuracy must be improved further. Our model currently performs with an accuracy of 97% (351/362). While this may seem impressive, clinical classifiers should be highly accurate so that there are a negligible number of cases with errors in identifying TOO. To improve the accuracy, the accumulation of larger data sets is necessary, and as the noncoding genome continues to reveal significant contributions to cancer, we predict that available data sets will expand. A further limitation to our study is that the available microRNA metastatic data sets are predominantly skin cancer. Thus, access to a larger, more varied, data set would improve our assessment of model performance. Furthermore, in order to develop a truly noninvasive method of TOO identification relevant to all cancers, it would be ideal to extend our method to microRNA expression data from blood samples. Detecting the TOO through blood-based microRNA biomarkers would significantly impact the diagnosis and treatment of patients with CUP. Additionally, our model cannot differentiate between tumor and solid tissue normal samples, as it was designed to identify the TOO specifically.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>To summarize, our developed machine learning models can accurately identify the TOO with high accuracy from microRNA expression data when trained on primary tumor and solid tissue samples. Importantly, our results identified key microRNA differentiators of tissue type. Our models are robust and perform well across different data sets (TCGA and the SRA data set). We look forward to developing further deep learning models that can accurately detect TOO as microRNA data sets expand, with the goal of having a noninvasive test for diagnosing the presence of cancer and determining cancer TOO with high accuracy.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Detailed analyses of feature importance and confusion matrices to support the study's findings on tissue of origin classification using microRNA features.</p>
        <media xlink:href="bioinform_v5i1e56538_app1.docx" xlink:title="DOCX File , 619 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">CUP</term>
          <def>
            <p>carcinoma of unknown primary</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">RPM</term>
          <def>
            <p>reads per million</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">SRA</term>
          <def>
            <p>Sequence Read Archive</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">TCGA</term>
          <def>
            <p>The Cancer Genome Atlas</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">TOO</term>
          <def>
            <p>tissue of origin</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We are grateful to The Cancer Genome Atlas Project and patients for providing the data used in this research. We are thankful to Soroush Hajizadeh for reviewing our code and providing insightful feedback. The results are in part based on data generated by The Cancer Genome Atlas Project Research Network [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data sets generated during and/or analyzed during this study are available in the github repository [<xref ref-type="bibr" rid="ref41">41</xref>].</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Qaseem</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Usman</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jayaraj</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Janapala</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kashif</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Cancer of unknown primary: a review on clinical guidelines in the development and targeted management of patients with the unknown primary site</article-title>
          <source>Cureus</source>
          <year>2019</year>
          <volume>11</volume>
          <issue>9</issue>
          <fpage>e5552</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31695975"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.5552</pub-id>
          <pub-id pub-id-type="medline">31695975</pub-id>
          <pub-id pub-id-type="pmcid">PMC6820325</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Monzon</surname>
              <given-names>FA</given-names>
            </name>
            <name name-style="western">
              <surname>Medeiros</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lyons-Weiler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Henner</surname>
              <given-names>WD</given-names>
            </name>
          </person-group>
          <article-title>Identification of tissue of origin in carcinoma of unknown primary with a microarray-based gene expression test</article-title>
          <source>Diagn Pathol</source>
          <year>2010</year>
          <volume>5</volume>
          <fpage>3</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://diagnosticpathology.biomedcentral.com/articles/10.1186/1746-1596-5-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1746-1596-5-3</pub-id>
          <pub-id pub-id-type="medline">20205775</pub-id>
          <pub-id pub-id-type="pii">1746-1596-5-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC2823680</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Laprovitera</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Riefolo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ambrosini</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Klec</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pichler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ferracin</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Cancer of unknown primary: challenges and progress in clinical management</article-title>
          <source>Cancers (Basel)</source>
          <year>2021</year>
          <volume>13</volume>
          <issue>3</issue>
          <fpage>451</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=cancers13030451"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/cancers13030451</pub-id>
          <pub-id pub-id-type="medline">33504059</pub-id>
          <pub-id pub-id-type="pii">cancers13030451</pub-id>
          <pub-id pub-id-type="pmcid">PMC7866161</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Case report: tissue origin identification for cancer of unknown primary: gene expression profiling approach</article-title>
          <source>Front Oncol</source>
          <year>2021</year>
          <volume>11</volume>
          <fpage>702887</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34858803"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fonc.2021.702887</pub-id>
          <pub-id pub-id-type="medline">34858803</pub-id>
          <pub-id pub-id-type="pmcid">PMC8632144</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Teschendorff</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Tumor origin detection with tissue-specific miRNA and DNA methylation markers</article-title>
          <source>Bioinformatics</source>
          <year>2018</year>
          <volume>34</volume>
          <issue>3</issue>
          <fpage>398</fpage>
          <lpage>406</lpage>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btx622</pub-id>
          <pub-id pub-id-type="medline">29028927</pub-id>
          <pub-id pub-id-type="pii">4265460</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greco</surname>
              <given-names>FA</given-names>
            </name>
            <name name-style="western">
              <surname>Burris</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Erland</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Kalman</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Schreeder</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Hainsworth</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Carcinoma of unknown primary site</article-title>
          <source>Cancer</source>
          <year>2000</year>
          <volume>89</volume>
          <issue>12</issue>
          <fpage>2655</fpage>
          <lpage>2660</lpage>
          <pub-id pub-id-type="medline">11135228</pub-id>
          <pub-id pub-id-type="pii">10.1002/1097-0142(20001215)89:12&lt;2655::AID-CNCR19&gt;3.0.CO;2-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schapira</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Jarrett</surname>
              <given-names>AR</given-names>
            </name>
          </person-group>
          <article-title>The need to consider survival, outcome, and expense when evaluating and treating patients with unknown primary carcinoma</article-title>
          <source>Arch Intern Med</source>
          <year>1995</year>
          <volume>155</volume>
          <issue>19</issue>
          <fpage>2050</fpage>
          <lpage>2054</lpage>
          <pub-id pub-id-type="medline">7575063</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cobb</surname>
              <given-names>GP</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>TA</given-names>
            </name>
          </person-group>
          <article-title>microRNAs as oncogenes and tumor suppressors</article-title>
          <source>Dev Biol</source>
          <year>2007</year>
          <volume>302</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0012-1606(06)01096-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ydbio.2006.08.028</pub-id>
          <pub-id pub-id-type="medline">16989803</pub-id>
          <pub-id pub-id-type="pii">S0012-1606(06)01096-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Dragomir</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Horst</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Calin</surname>
              <given-names>GA</given-names>
            </name>
          </person-group>
          <article-title>Targeting non-coding RNAs to overcome cancer therapy resistance</article-title>
          <source>Signal Transduct Target Ther</source>
          <year>2022</year>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>121</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41392-022-00975-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41392-022-00975-3</pub-id>
          <pub-id pub-id-type="medline">35418578</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41392-022-00975-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC9008121</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smolarz</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Durczyński</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Romanowicz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Szyłło</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hogendorf</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>miRNAs in cancer (review of literature)</article-title>
          <source>Int J Mol Sci</source>
          <year>2022</year>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>2805</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijms23052805"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijms23052805</pub-id>
          <pub-id pub-id-type="medline">35269947</pub-id>
          <pub-id pub-id-type="pii">ijms23052805</pub-id>
          <pub-id pub-id-type="pmcid">PMC8910953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chakrabortty</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Patton</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>BF</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>miRNAs: potential as biomarkers and therapeutic targets for cancer</article-title>
          <source>Genes (Basel)</source>
          <year>2023</year>
          <volume>14</volume>
          <issue>7</issue>
          <fpage>1375</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=genes14071375"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/genes14071375</pub-id>
          <pub-id pub-id-type="medline">37510280</pub-id>
          <pub-id pub-id-type="pii">genes14071375</pub-id>
          <pub-id pub-id-type="pmcid">PMC10378777</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Getz</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Miska</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Alvarez-Saavedra</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lamb</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Peck</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sweet-Cordero</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ebert</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Mak</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrando</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Downing</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Jacks</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Horvitz</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Golub</surname>
              <given-names>TR</given-names>
            </name>
          </person-group>
          <article-title>MicroRNA expression profiles classify human cancers</article-title>
          <source>Nature</source>
          <year>2005</year>
          <volume>435</volume>
          <issue>7043</issue>
          <fpage>834</fpage>
          <lpage>838</lpage>
          <pub-id pub-id-type="doi">10.1038/nature03702</pub-id>
          <pub-id pub-id-type="medline">15944708</pub-id>
          <pub-id pub-id-type="pii">nature03702</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosenfeld</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Aharonov</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Meiri</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenwald</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Spector</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zepeniuk</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Benjamin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Shabes</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Tabak</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lebanony</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Goren</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Silberschein</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Targan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ben-Ari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gilad</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sion-Vardy</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Tobar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Feinmesser</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kharenko</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Nativ</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Nass</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Perelman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yosepovich</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shalmon</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Polak-Charcon</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fridman</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Avniel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bentwich</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Bentwich</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chajut</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barshack</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>MicroRNAs accurately identify cancer tissue origin</article-title>
          <source>Nat Biotechnol</source>
          <year>2008</year>
          <volume>26</volume>
          <issue>4</issue>
          <fpage>462</fpage>
          <lpage>469</lpage>
          <pub-id pub-id-type="doi">10.1038/nbt1392</pub-id>
          <pub-id pub-id-type="medline">18362881</pub-id>
          <pub-id pub-id-type="pii">nbt1392</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tucci</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The role of microRNAs in cancer: functions, biomarkers and therapeutics</article-title>
          <source>Cancers (Basel)</source>
          <year>2022</year>
          <volume>14</volume>
          <issue>4</issue>
          <fpage>872</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=cancers14040872"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/cancers14040872</pub-id>
          <pub-id pub-id-type="medline">35205620</pub-id>
          <pub-id pub-id-type="pii">cancers14040872</pub-id>
          <pub-id pub-id-type="pmcid">PMC8870119</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Machine learning and AI in cancer prognosis, prediction, and treatment selection: a critical approach</article-title>
          <source>J Multidiscip Healthc</source>
          <year>2023</year>
          <volume>16</volume>
          <fpage>1779</fpage>
          <lpage>1791</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37398894"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/JMDH.S410301</pub-id>
          <pub-id pub-id-type="medline">37398894</pub-id>
          <pub-id pub-id-type="pii">410301</pub-id>
          <pub-id pub-id-type="pmcid">PMC10312208</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Song</surname>
              <given-names>YY</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Ying</given-names>
            </name>
          </person-group>
          <article-title>Decision tree methods: applications for classification and prediction</article-title>
          <source>Shanghai Arch Psychiatry</source>
          <year>2015</year>
          <volume>27</volume>
          <issue>2</issue>
          <fpage>130</fpage>
          <lpage>135</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26120265"/>
          </comment>
          <pub-id pub-id-type="doi">10.11919/j.issn.1002-0829.215044</pub-id>
          <pub-id pub-id-type="medline">26120265</pub-id>
          <pub-id pub-id-type="pii">sap-27-02-130</pub-id>
          <pub-id pub-id-type="pmcid">PMC4466856</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Breiman</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Random forests</article-title>
          <source>Mach Learn</source>
          <year>2001</year>
          <volume>45</volume>
          <fpage>5</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1023/A:1010933404324"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Introduction to Logistic Regression</source>
          <year>2020</year>
          <publisher-loc>Ithaca, NY</publisher-loc>
          <publisher-name>Cornell University</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Kondrashova</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Bradley</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Pearson</surname>
              <given-names>JV</given-names>
            </name>
            <name name-style="western">
              <surname>Waddell</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Deep learning in cancer diagnosis, prognosis and treatment selection</article-title>
          <source>Genome Med</source>
          <year>2021</year>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>152</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://genomemedicine.biomedcentral.com/articles/10.1186/s13073-021-00968-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13073-021-00968-x</pub-id>
          <pub-id pub-id-type="medline">34579788</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13073-021-00968-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC8477474</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Namburi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pattison</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Posner</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Balachander</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Paisie</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Reddi</surname>
              <given-names>HV</given-names>
            </name>
            <name name-style="western">
              <surname>Rueter</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gill</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Raghav</surname>
              <given-names>KPS</given-names>
            </name>
            <name name-style="western">
              <surname>Flynn</surname>
              <given-names>WF</given-names>
            </name>
            <name name-style="western">
              <surname>Tothill</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karuturi</surname>
              <given-names>RKM</given-names>
            </name>
            <name name-style="western">
              <surname>George</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>CUP-AI-Dx: a tool for inferring cancer tissue of origin and molecular subtype using RNA gene-expression data and artificial intelligence</article-title>
          <source>EBioMedicine</source>
          <year>2020</year>
          <volume>61</volume>
          <fpage>103030</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2352-3964(20)30406-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ebiom.2020.103030</pub-id>
          <pub-id pub-id-type="medline">33039710</pub-id>
          <pub-id pub-id-type="pii">S2352-3964(20)30406-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7553237</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Timko</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>TOD-CUP: a gene expression rank-based majority vote algorithm for tissue origin diagnosis of cancers of unknown primary</article-title>
          <source>Brief Bioinform</source>
          <year>2021</year>
          <volume>22</volume>
          <issue>2</issue>
          <fpage>2106</fpage>
          <lpage>2118</lpage>
          <pub-id pub-id-type="doi">10.1093/bib/bbaa031</pub-id>
          <pub-id pub-id-type="medline">32266390</pub-id>
          <pub-id pub-id-type="pii">5817479</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tothill</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Kowalczyk</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rischin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bousioutas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haviv</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>van Laar</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Waring</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Zalcberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Biankin</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Sutherland</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Henshall</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Fong</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pollack</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Bowtell</surname>
              <given-names>DDL</given-names>
            </name>
            <name name-style="western">
              <surname>Holloway</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>An expression-based site of origin diagnostic method designed for clinical application to cancer of unknown origin</article-title>
          <source>Cancer Res</source>
          <year>2005</year>
          <volume>65</volume>
          <issue>10</issue>
          <fpage>4031</fpage>
          <lpage>4040</lpage>
          <pub-id pub-id-type="doi">10.1158/0008-5472.CAN-04-3617</pub-id>
          <pub-id pub-id-type="medline">15899792</pub-id>
          <pub-id pub-id-type="pii">65/10/4031</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Laar</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>XJ</given-names>
            </name>
            <name name-style="western">
              <surname>de Jong</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wehkamp</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Floore</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Warmoes</surname>
              <given-names>MO</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Erlander</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>van't Veer</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Glas</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Implementation of a novel microarray-based diagnostic test for cancer of unknown primary</article-title>
          <source>Int J Cancer</source>
          <year>2009</year>
          <volume>125</volume>
          <issue>6</issue>
          <fpage>1390</fpage>
          <lpage>1397</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/doi/10.1002/ijc.24504"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/ijc.24504</pub-id>
          <pub-id pub-id-type="medline">19536816</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>XJ</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Salunga</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Murage</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tuggle</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stecker</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Raja</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Robin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Baunoch</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sgroi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Erlander</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Molecular classification of human cancers using a 92-gene real-time quantitative polymerase chain reaction assay</article-title>
          <source>Arch Pathol Lab Med</source>
          <year>2006</year>
          <volume>130</volume>
          <issue>4</issue>
          <fpage>465</fpage>
          <lpage>473</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://meridian.allenpress.com/aplm/article-lookup/doi/10.5858/2006-130-465-MCOHCU"/>
          </comment>
          <pub-id pub-id-type="doi">10.5858/2006-130-465-MCOHCU</pub-id>
          <pub-id pub-id-type="medline">16594740</pub-id>
          <pub-id pub-id-type="pii">OA51149</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Søndergaard</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nielsen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>CNS</given-names>
            </name>
            <name name-style="western">
              <surname>Besenbacher</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Prediction of primary tumors in cancers of unknown primary</article-title>
          <source>J Integr Bioinform</source>
          <year>2017</year>
          <volume>14</volume>
          <issue>2</issue>
          <fpage>20170013</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28686574"/>
          </comment>
          <pub-id pub-id-type="doi">10.1515/jib-2017-0013</pub-id>
          <pub-id pub-id-type="medline">28686574</pub-id>
          <pub-id pub-id-type="pii">/j/jib.ahead-of-print/jib-2017-0013/jib-2017-0013.xml</pub-id>
          <pub-id pub-id-type="pmcid">PMC6042823</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Varadhachary</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Spector</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Abbruzzese</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenwald</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Aharonov</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Carlson</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Karanth</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Macinskas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lenzi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chajut</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Edmonston</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Raber</surname>
              <given-names>MN</given-names>
            </name>
          </person-group>
          <article-title>Prospective gene signature study using microRNA to identify the tissue of origin in patients with carcinoma of unknown primary</article-title>
          <source>Clin Cancer Res</source>
          <year>2011</year>
          <volume>17</volume>
          <issue>12</issue>
          <fpage>4063</fpage>
          <lpage>4070</lpage>
          <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-10-2599</pub-id>
          <pub-id pub-id-type="medline">21531815</pub-id>
          <pub-id pub-id-type="pii">1078-0432.CCR-10-2599</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosenwald</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gilad</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Benjamin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lebanony</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Dromi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Faerman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Benjamin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tamir</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ezagouri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goren</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Barshack</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Nass</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tobar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Feinmesser</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenfeld</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Leizerman</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ashkenazi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Spector</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chajut</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Aharonov</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Validation of a microRNA-based qRT-PCR test for accurate identification of tumor tissue origin</article-title>
          <source>Mod Pathol</source>
          <year>2010</year>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>814</fpage>
          <lpage>823</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0893-3952(22)02700-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/modpathol.2010.57</pub-id>
          <pub-id pub-id-type="medline">20348879</pub-id>
          <pub-id pub-id-type="pii">S0893-3952(22)02700-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Miguel Pérez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez Martínez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ortigosa Palomo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Delgado Ureña</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia Puche</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Robles Remacho</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Exposito Hernandez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lorente Acosta</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Ortega Sánchez</surname>
              <given-names>FG</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Extracellular vesicle-miRNAs as liquid biopsy biomarkers for disease identification and prognosis in metastatic colorectal cancer patients</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>3974</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-020-60212-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-020-60212-1</pub-id>
          <pub-id pub-id-type="medline">32132553</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-60212-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7055306</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <article-title>The Cancer Genome Atlas Program (TCGA)</article-title>
          <source>National Cancer Institute</source>
          <access-date>2024-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cancer.gov/ccg/research/genome-sequencing/tcga">https://www.cancer.gov/ccg/research/genome-sequencing/tcga</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Leinonen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sugawara</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Shumway</surname>
              <given-names>M</given-names>
            </name>
            <collab>International Nucleotide Sequence Database Collaboration</collab>
          </person-group>
          <article-title>The sequence read archive</article-title>
          <source>Nucleic Acids Res</source>
          <year>2011</year>
          <volume>39</volume>
          <issue>Database issue</issue>
          <fpage>D19</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/21062823"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkq1019</pub-id>
          <pub-id pub-id-type="medline">21062823</pub-id>
          <pub-id pub-id-type="pii">gkq1019</pub-id>
          <pub-id pub-id-type="pmcid">PMC3013647</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sheedy</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Medarova</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>The fundamental role of miR-10b in metastatic cancer</article-title>
          <source>Am J Cancer Res</source>
          <year>2018</year>
          <volume>8</volume>
          <issue>9</issue>
          <fpage>1674</fpage>
          <lpage>1688</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30323962"/>
          </comment>
          <pub-id pub-id-type="medline">30323962</pub-id>
          <pub-id pub-id-type="pmcid">PMC6176190</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chauhan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dhasmana</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jaggi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chauhan</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Yallapu</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>miR-205: a potential biomedicine for cancer therapy</article-title>
          <source>Cells</source>
          <year>2020</year>
          <volume>9</volume>
          <issue>9</issue>
          <fpage>1957</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=cells9091957"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/cells9091957</pub-id>
          <pub-id pub-id-type="medline">32854238</pub-id>
          <pub-id pub-id-type="pii">cells9091957</pub-id>
          <pub-id pub-id-type="pmcid">PMC7564275</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yeh</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>miR-196, an emerging cancer biomarker for digestive tract cancers</article-title>
          <source>J Cancer</source>
          <year>2016</year>
          <volume>7</volume>
          <issue>6</issue>
          <fpage>650</fpage>
          <lpage>655</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27076845"/>
          </comment>
          <pub-id pub-id-type="doi">10.7150/jca.13460</pub-id>
          <pub-id pub-id-type="medline">27076845</pub-id>
          <pub-id pub-id-type="pii">jcav07p0650</pub-id>
          <pub-id pub-id-type="pmcid">PMC4829550</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <article-title>NCI Genomic Data Commons</article-title>
          <source>GDC Application Programming Interface (API)</source>
          <access-date>2024-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://gdc.cancer.gov/developers/gdc-application-programming-interface-api">https://gdc.cancer.gov/developers/gdc-application-programming-interface-api</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>Pedregosa, Fabian</collab>
            <collab>Varquaux, Gaël</collab>
            <collab>Gramfort, Alexandre</collab>
            <collab>Michel, Vincent</collab>
            <collab>Thirion, Bertrand</collab>
            <collab>Grisel, Olivier</collab>
            <collab>Blondel, Mathieu</collab>
            <collab>Pretternhofer, Peter</collab>
            <collab>Weiss, Ron</collab>
            <collab>Dubourg, Vincent</collab>
            <collab>Vanderplas, Jake</collab>
            <collab>Passos, Alexandre</collab>
            <collab>Cornapeau, David</collab>
            <collab>Brucher, Matthieu</collab>
            <collab>Perrot, Mathhieu</collab>
          </person-group>
          <article-title>Scikit-learn: machine learning in Python</article-title>
          <source>J Mach Learn Res</source>
          <year>2011</year>
          <fpage>2825</fpage>
          <lpage>2830</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf?ref=https:/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paszke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Massa</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Pytorch: an imperative style, high-performance deep learning library</article-title>
          <year>2019</year>
          <conf-name>arXiv.org</conf-name>
          <conf-date>Dec 3 2019</conf-date>
          <conf-loc>NA</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1912.01703"/>
          </comment>
          <pub-id pub-id-type="doi">https://doi.org/10.48550/arXiv.1912.01703</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mohri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Cross-entropy loss functions: theoretical analysis and applications</article-title>
          <year>2023</year>
          <conf-name>Proceedings of the 40th International Conference on Machine Learning</conf-name>
          <conf-date>July 2023</conf-date>
          <conf-loc>Honolulu, Hawaii</conf-loc>
          <publisher-name>PMLR</publisher-name>
          <fpage>23803</fpage>
          <lpage>23828</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Srivastava</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hinton</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Krizhevsky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Salakhutdinov</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>Dropout: A Simple Way to Prevent Neural Networks from Overfitting</source>
          <year>2014</year>
          <publisher-loc>Toronto</publisher-loc>
          <publisher-name>JMLR</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Laprovitera</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Riefolo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Porcellini</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Durante</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Garajova</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Vasuri</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Aigelsreiter</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dandachi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Benvenuto</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Agostinis</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sabbioni</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Berindan Neagoe</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Romualdi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ardizzoni</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Trerè</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pichler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>D'Errico</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ferracin</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>MicroRNA expression profiling with a droplet digital PCR assay enables molecular diagnosis and prognosis of cancers of unknown primary</article-title>
          <source>Mol Oncol</source>
          <year>2021</year>
          <volume>15</volume>
          <issue>10</issue>
          <fpage>2732</fpage>
          <lpage>2751</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34075699"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/1878-0261.13026</pub-id>
          <pub-id pub-id-type="medline">34075699</pub-id>
          <pub-id pub-id-type="pmcid">PMC8486570</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Suh</surname>
              <given-names>Byoung Jo</given-names>
            </name>
          </person-group>
          <article-title>Synchronous and metachronous colon cancers in patients with gastric cancer: report of 2 cases</article-title>
          <source>Case Rep Oncol</source>
          <year>2016</year>
          <volume>9</volume>
          <issue>3</issue>
          <fpage>752</fpage>
          <lpage>759</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1159/000452831"/>
          </comment>
          <pub-id pub-id-type="doi">10.1159/000452831</pub-id>
          <pub-id pub-id-type="medline">27990112</pub-id>
          <pub-id pub-id-type="pii">cro-0009-0752</pub-id>
          <pub-id pub-id-type="pmcid">PMC5156887</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <article-title>ANIHA234/identifying-tissue-of-origin-from-mirna</article-title>
          <source>GitHub</source>
          <year>2023</year>
          <access-date>2024-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/Anisha234/miRNA">https://github.com/Anisha234/miRNA</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
