<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "journalpublishing3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="en" article-type="research-article">
<?release-delay 0|0?>
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">BR</journal-id>
<journal-title-group>
<journal-title>Biomedical Reports</journal-title>
</journal-title-group>
<issn pub-type="ppub">2049-9434</issn>
<issn pub-type="epub">2049-9442</issn>
<publisher>
<publisher-name>D.A. Spandidos</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">BR-24-6-02147</article-id>
<article-id pub-id-type="doi">10.3892/br.2026.2147</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Articles</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Machine learning-based identification of key genes underlying sex differences in hepatocellular carcinoma and targeted drug screening</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Wang</surname><given-names>Zhen</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
<xref rid="fn1-BR-24-6-02147" ref-type="author-notes">&#x002A;</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ning</surname><given-names>Jinghua</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
<xref rid="af2-BR-24-6-02147" ref-type="aff">2</xref>
<xref rid="fn1-BR-24-6-02147" ref-type="author-notes">&#x002A;</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname><given-names>Hongyuan</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ruan</surname><given-names>Qingfen</given-names></name>
<xref rid="af3-BR-24-6-02147" ref-type="aff">3</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhao</surname><given-names>Yanhong</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Qu</surname><given-names>Run</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Lv</surname><given-names>Congcong</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Wu</surname><given-names>Yutong</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Liu</surname><given-names>Weidong</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname><given-names>Xiaoyin</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname><given-names>Ziming</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Liang</surname><given-names>Yi</given-names></name>
<xref rid="af4-BR-24-6-02147" ref-type="aff">4</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Zhang</surname><given-names>Yuzhe</given-names></name>
<xref rid="af1-BR-24-6-02147" ref-type="aff">1</xref>
<xref rid="af5-BR-24-6-02147" ref-type="aff">5</xref>
<xref rid="af6-BR-24-6-02147" ref-type="aff">6</xref>
<xref rid="c1-BR-24-6-02147" ref-type="corresp"/>
</contrib>
</contrib-group>
<aff id="af1-BR-24-6-02147"><label>1</label>Department of Biochemistry and Molecular Biology, College of Basic Medical Sciences, Dali University, Dali, Yunnan 671003, P.R. China</aff>
<aff id="af2-BR-24-6-02147"><label>2</label>Department of Pathology, Fumin County People&#x0027;s Hospital, Kunming, Yunnan 650400, P.R. China</aff>
<aff id="af3-BR-24-6-02147"><label>3</label>Department of Gastroenterology, The First Affiliated Hospital of Dali University, Dali, Yunnan 671003, P.R. China</aff>
<aff id="af4-BR-24-6-02147"><label>4</label>Princess Margaret Cancer Centre, University Health Network, TMDT-MaRS Centre, Toronto, Ontario ON M5G 1L7, Canada</aff>
<aff id="af5-BR-24-6-02147"><label>5</label>Yunnan Provincial Key Laboratory of Entomological Biopharmaceutical Research and Development, Dali University, Dali, Yunnan 671000, P.R. China</aff>
<aff id="af6-BR-24-6-02147"><label>6</label>Yunnan Key Laboratory of Screening and Research on Anti-pathogenic Plant Resources from West Yunnan (Cultivation), Dali, Yunnan 671000, P.R. China</aff>
<author-notes>
<corresp id="c1-BR-24-6-02147"><italic>Correspondence to:</italic> Dr Yuzhe Zhang, Department of Biochemistry and Molecular Biology, College of Basic Medical Sciences, Dali University, 22 Wanhua Road, Dali, Yunnan 671003, P.R. China <email>lzuzyz1568@hotmail.com</email></corresp>
<fn id="fn1-BR-24-6-02147"><p><sup>&#x002A;</sup>Contributed equally</p></fn>
</author-notes>
<pub-date pub-type="collection"><month>06</month><year>2026</year></pub-date>
<pub-date pub-type="epub"><day>24</day><month>04</month><year>2026</year></pub-date>
<volume>24</volume>
<issue>6</issue>
<elocation-id>74</elocation-id>
<history>
<date date-type="received">
<day>08</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>23</day>
<month>03</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright: &#x00A9; 2026 Wang et al.</copyright-statement>
<copyright-year>2026</copyright-year>
<license license-type="open-access">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by-nc-nd/4.0/">Creative Commons Attribution-NonCommercial-NoDerivs License</ext-link>, which permits use and distribution in any medium, provided the original work is properly cited, the use is non-commercial and no modifications or adaptations are made.</license-p></license>
</permissions>
<abstract>
<p>Hepatocellular carcinoma (HCC) shows a marked predominance in men, yet the molecular basis for this sex disparity remains unclear. The present study leveraged multi-omics data and machine learning algorithms to identify key genes associated with sex-specific differences in HCC and to screen for putative candidate compounds, aiming to provide new insights for sex-specific therapy. The mRNA expression data of male and female patients with HCC and paracancerous tissues were obtained from the GEO and TCGA databases. To mitigate overfitting, model performance was assessed using 10-fold cross-validation across the entire dataset. Candidate genes were screened by differential expression analysis and weighted gene co-expression network analysis. A total of four complementary algorithms, namely random forest, support vector machines, generalized linear models and extreme gradient boosting, were used to identify key genes with high predictive capability. CYP17A1 and IRX3 were identified as the top differentially expressed core genes associated with HCC in men. Pan-cancer analysis showed that CYP17A1 was lowly expressed in the majority of tumors, but significantly highly expressed in HCC, rectal adenocarcinoma and gastric cancer (P&#x003C;0.001). Functional cell-based assays showed that knockout of CYP17A1 inhibited the proliferation, migration and invasion ability of HCC cells (P&#x003C;0.001). Immunohistochemistry showed that CYP17A1 protein expression was significantly increased in HCC tissues from male patients when compared with that in paracancerous tissues (P&#x003C;0.001), whereas there was no significant difference in female patient tissues (P&#x003E;0.05). Notably, while IRX3 was identified computationally, its functional role remains to be experimentally validated. Molecular docking predicted a potential interaction between the natural compound Saikosaponin A and the CYP17A1 protein, and cellular assays revealed that it dose-dependently inhibits HCC cell malignant phenotypes. 
The present study suggests that CYP17A1 is associated with sex differences in HCC, potentially via the androgen signaling axis. Furthermore, IRX3 emerges as a novel hypothesis-generating candidate gene. Finally, the findings of the present study highlight Saikosaponin A as a putative therapeutic candidate for male patients with HCC, warranting further target-dependency investigations.</p>
</abstract>
<kwd-group>
<kwd>hepatocellular carcinoma</kwd>
<kwd>sex differences</kwd>
<kwd>machine learning</kwd>
<kwd>CYP17A1</kwd>
<kwd>Saikosaponin A</kwd>
</kwd-group>
<funding-group>
<funding-statement><bold>Funding:</bold> The author(s) declare that financial support was received for the research, authorship and/or publication of this article. The present study was supported by the following projects: General Project of the Joint Special Project of Local Universities in Yunnan Province (grant nos. 202001BA070001-064 and 202101BA070001-102), Dali University Doctoral Research Start-up Fund Project (grant no. KYBS2018012), Open Project of Yunnan Provincial Key Laboratory of Entomological Biopharmaceutical R&#x0026;D (grant no. AG2024002), Clinical Medicine Discipline Team Building Project of the First Affiliated Hospital of Dali University (grant no. DFYYB2024026), Open Project of Key Laboratory of Screening and Research of Resistant Plant Resources in West Yunnan, Yunnan Province (grant no. APKL2101) and Yunnan College Students Innovation and Entrepreneurship Training Project Fund (grant no. S202410679068).</funding-statement>
</funding-group>
</article-meta>
</front>
<body>
<sec sec-type="intro">
<title>Introduction</title>
<p>Hepatocellular carcinoma (HCC) is one of the leading causes of cancer-related mortality worldwide. It occupies a dominant position among primary types of liver cancer (<xref rid="b1-BR-24-6-02147" ref-type="bibr">1</xref>). Due to the insidious onset of HCC in its early stages and the lack of typical symptoms and signs, diagnosis is often delayed until the disease has reached an advanced stage (<xref rid="b2-BR-24-6-02147" ref-type="bibr">2</xref>). Patients with advanced HCC are frequently unsuitable for surgical treatment due to tumor metastasis, compromised liver function and poor systemic status, leading to a generally poor prognosis (<xref rid="b3-BR-24-6-02147" ref-type="bibr">3</xref>,<xref rid="b4-BR-24-6-02147" ref-type="bibr">4</xref>).</p>
<p>Epidemiologic data show that there is a considerable sex difference in the incidence of HCC, with a global prevalence that is 2.8-3 times higher in men than in women (<xref rid="b3-BR-24-6-02147" ref-type="bibr">3</xref>,<xref rid="b4-BR-24-6-02147" ref-type="bibr">4</xref>). In the present study, all analyses regarding these disparities are strictly based on biological sex (men vs. women) rather than sociocultural factors. Studies show that sex hormones play an important role in the development of HCC. Estrogens inhibit HCC by regulating the cytokine IL-6, whereas androgens promote HCC by inhibiting lipocalin secretion or directly activating pro-cancer signaling pathways (<xref rid="b5-BR-24-6-02147" ref-type="bibr">5</xref>,<xref rid="b6-BR-24-6-02147" ref-type="bibr">6</xref>). Testosterone, in particular, leads to reduced levels of lipocalin by inhibiting its secretion, a mechanism that is considered to be one of the most important reasons for the increased incidence of HCC in men (<xref rid="b7-BR-24-6-02147" ref-type="bibr">7</xref>). However, the effect of these hormones on the sex differences in mechanisms of HCC has not been fully clarified at the molecular level.</p>
<p>Machine learning, as an emerging bioinformatics analysis method, has shown great potential for application in the medical field and has been widely used in the analysis of clinical datasets (<xref rid="b8-BR-24-6-02147" ref-type="bibr">8</xref>). By constructing robust risk models to aid clinical decision-making and simultaneously redefining patient categories based on data characteristics, precision medicine can be realized in the future (<xref rid="b9-BR-24-6-02147" ref-type="bibr">9</xref>). Machine learning has been used to analyze high-dimensional transcriptomic data with promising results in identifying key genes for diseases, providing key clues for the study of disease mechanisms (<xref rid="b10-BR-24-6-02147" ref-type="bibr">10</xref>).</p>
<p>The present study combined differential expression analysis, weighted gene co-expression network analysis (WGCNA) and four machine learning algorithms, including random forest (RF), support vector machine (SVM), generalized linear model (GLM) and extreme gradient boosting (XGBoost), to systematically screen the core genes associated with sex differences in the development of HCC. This was then combined with pan-cancer analysis, functional cell-based assays and virtual drug screening to explore the potential molecular associations of the key genes and identify putative candidate compounds. Specifically, the screening in the present study highlighted Saikosaponin A as a promising therapeutic candidate. This will provide a theoretical basis for understanding the sex disparity in HCC incidence and proposing candidate compounds for further evaluation.</p>
</sec>
<sec sec-type="Materials|methods">
<title>Materials and methods</title>
<sec>
<title/>
<sec>
<title>Cell lines and reagents</title>
<p>The human liver cancer cell lines HepG2 and Huh7, and 293T cells, were purchased from Beijing Beina Chunglian Institute of Biotechnology and The Cell Bank of Type Culture Collection of The Chinese Academy of Sciences. The authenticity of the cell lines used in the present study was verified via short tandem repeat profiling. The plasmids used in the experiments &#x005B;including the CYP17A1 knockout plasmid (cat. no. L25930), pLenti-Control-sgRNA (cat. no. L00011) and lentiviral packaging vector set A (cat. no. L00002S)&#x005D; were obtained from Beyotime Biotechnology. According to the manufacturer, the sgRNA incorporated in the commercial CYP17A1 knockout plasmid (cat. no. L25930) was generated using Beyotime&#x0027;s CRISPR/Cas9 sgRNA rapid screening and validation system, and its efficacy had been pre-validated by a T7 endonuclease I (T7EI) assay. The primary reagents included DMEM containing 10&#x0025; fetal bovine serum (Gibco; Thermo Fisher Scientific, Inc.), 0.25&#x0025; trypsin-EDTA digest (Beijing Solarbio Science &#x0026; Technology Co., Ltd.), penicillin-streptomycin solution (100X; Beyotime Biotechnology), BCA Protein Quantification Kit (cat. no. 500T; Beyotime Biotechnology) and puromycin (cat. no. ST551; Beyotime Biotechnology). Cells were cultured at 37&#x02DA;C in a humidified incubator with 5&#x0025; CO<sub>2</sub>.</p>
</sec>
<sec>
<title>Data acquisition and pre-processing</title>
<p>The mRNA expression profiling data of HCC and corresponding paracancerous tissues were downloaded from the GEO database (<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/">https://www.ncbi.nlm.nih.gov/geo/</ext-link>; accession nos. GSE19665, GSE54236, GSE84402 and GSE121248), which included samples of both sexes and were generated in the original studies by Deng <italic>et al</italic> (<xref rid="b11-BR-24-6-02147" ref-type="bibr">11</xref>), Villa <italic>et al</italic> (<xref rid="b12-BR-24-6-02147" ref-type="bibr">12</xref>), Wang <italic>et al</italic> (<xref rid="b13-BR-24-6-02147" ref-type="bibr">13</xref>) and Wang <italic>et al</italic> (<xref rid="b14-BR-24-6-02147" ref-type="bibr">14</xref>). Batch effects were corrected using Surrogate Variable Analysis &#x005B;sva package, v3.54.0 (<xref rid="b15-BR-24-6-02147" ref-type="bibr">15</xref>)&#x005D; in R (v4.4.2; R Foundation for Statistical Computing), and the expression matrix of HCC vs. normal tissue was extracted for each sex group. Differentially expressed genes (DEGs) were screened using limma (v3.62.2) based on &#x007C;log2 fold change (FC)&#x007C;&#x2265;0.5 and an adjusted P&#x003C;0.05 after Benjamini-Hochberg correction.</p>
</sec>
<sec>
<title>WGCNA</title>
<p>A WGCN was constructed based on the expression matrix of DEGs, and a dynamic tree-cutting algorithm was used to divide the gene modules and screen for those significantly associated with the HCC phenotype (P&#x003C;0.05 for module significance). The &#x2018;WGCNA&#x2019; R package (v1.72) was utilized to construct the network. The network parameters were determined by setting a soft threshold of &#x03B2;=6 (scale-free topological fit index R&#x00B2;&#x003E;0.85). Modules significantly associated with HCC phenotypes were screened (Pearson correlation; P&#x003C;0.05) and the top 10&#x0025; of genes with high intra-module connectivity were extracted as candidate hub genes.</p>
</sec>
<sec>
<title>Machine learning-based core gene screening</title>
<p>The WGCNA hub genes were intersected with sex-specific DEGs (yielding a total of 36 candidate genes). Given the relatively limited sample size and the small, highly pre-filtered feature set (only 36 candidate genes), further dividing the dataset into separate training and testing cohorts would severely compromise the training process and the statistical power. Instead, to maximize data utility while strictly preventing overfitting, the present study relied entirely on a rigorous 10-fold cross-validation strategy across the entire dataset. A total of four machine learning algorithms, RF, SVM, GLM and XGBoost, were used to assess gene importance. During the 10-fold cross-validation process, the data were iteratively partitioned into training and validation folds, ensuring that the predictive performance of each model was robustly assessed on unseen data within each fold. The predictive performance was evaluated by calculating the area under the receiver operating characteristic curve (AUC), with all models achieving an AUC &#x003E;0.95. The overlapping genes (CYP17A1 and IRX3) ranked in the top ten for importance across all four algorithms were ultimately selected as the core genes. Their sex-specific differential expression profiles were further validated using the GEO database.</p>
</sec>
<sec>
<title>Bioinformatics validation</title>
<p>For pan-cancer expression analysis, the TIMER2.0 platform (<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="http://timer.cistrome.org/">http://timer.cistrome.org/</ext-link>) was used to analyze the expression differences of the core genes across 30 tumors in The Cancer Genome Atlas (TCGA) database (<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://portal.gdc.cancer.gov/">https://portal.gdc.cancer.gov/</ext-link>; Wilcoxon rank-sum test; with P&#x003C;0.05 as the criterion for determining statistically significant differences). For survival and clinical correlation analyses, TCGA clinical data were integrated and the association between core gene expression and patients&#x0027; overall survival was evaluated using the Kaplan-Meier method (R package &#x2018;survival&#x2019;; v3.3.1). Correlations with tumor grade and stage were analyzed using the Spearman rank correlation test. Gene set enrichment analysis was performed to identify the biological pathways associated with the core genes. For immune infiltration analysis, the CIBERSORT algorithm (R package &#x2018;CIBERSORT&#x2019;; v1.06) was applied to quantitatively analyze the infiltration levels of 22 immune cells and explore the correlation between core gene expression and the immune microenvironment (P&#x003C;0.05).</p>
</sec>
<sec>
<title>Collection of samples</title>
<p>Tumors and corresponding paracancerous tissues of liver cancer patients (n=18; 12 men and 6 women; age range, 40-75 years) were included in the present study. The samples were collected between January 2019 and June 2023. Specifically, samples dating from January 2019 to November 2022 were retrospectively accessed from historical archival formalin-fixed paraffin-embedded blocks, while samples from November 2022 to June 2023 were prospectively collected. Based on the study design, the precise inclusion criteria were: i) Patients who underwent radical resection for liver cancer; ii) pathologically confirmed primary liver cancer; iii) availability of matched paraffin-embedded tumor and paracancerous tissues (with paracancerous tissue strictly defined as being &#x003E;10 mm away from the tumor margin). The exclusion criteria were: i) Patients who received preoperative radiotherapy, chemotherapy or targeted therapy; ii) presence of other primary malignancies. Following surgical resection, fresh tissues were snap-frozen and stored at -80&#x02DA;C within 30 min, while matched tissue blocks were routinely formalin-fixed and paraffin-embedded for subsequent analysis. The present study was conducted with the approval of the Ethics Committee of the First Affiliated Hospital of Dali University (Approval no. OFY20221122001), which explicitly covered both the retrospective use of archived material and the prospective collection of new samples. Written informed consent was obtained from all patients prior to their participation; notably, for the newer prospectively collected samples, dedicated written informed consent for research use was strictly obtained prior to surgery. Strict confidentiality of patient identities was maintained. Detailed clinicopathological characteristics, including age, biological sex, tumor stage and viral hepatitis status, were retrospectively collected from medical records.</p>
</sec>
<sec>
<title>Immunohistochemistry (IHC)</title>
<p>Paraffin sections were deparaffinized with xylene and rehydrated with descending gradient ethanol. Antigen retrieval was performed in sodium citrate buffer (pH 6.0) at 100&#x02DA;C for 20 min. After blocking with goat serum blocking solution (cat. no. C0265; Beyotime Biotechnology) at room temperature for 10 min, the sections were incubated in a humidified chamber with rabbit anti-CYP17A1 primary antibody (1:200; cat. no. bsm-54306R; Bioss) overnight at 4&#x02DA;C, followed by an HRP-labeled goat anti-rabbit secondary antibody (1:1,000; cat. no. G1213-100UL; Wuhan Servicebio Technology) at 37&#x02DA;C for 30 min. Visualization was achieved using DAB, followed by hematoxylin counterstaining at room temperature for 15 sec. Staining intensity (0-3) and the percentage score of positive cells (1-4) were independently evaluated by two pathologists in a double-blind manner; the final IHC score was calculated as intensity x percentage score, and discordant cases were reviewed jointly to reach consensus.</p>
</sec>
<sec>
<title>Knockout cell line construction and functional experiments</title>
<p>To construct stable CYP17A1 knockout cells, 293T cells were transfected at 37&#x02DA;C using a third-generation lentiviral packaging system consisting of the CYP17A1 knockout plasmid (cat. no. L25930; Beyotime Biotechnology), pMDLg, Rev and VSV-g plasmids. For each 10-cm dish, 10 &#x00B5;g transfer plasmid, 6.5 &#x00B5;g pMDLg, 2.5 &#x00B5;g Rev and 3.5 &#x00B5;g VSV-g were mixed in 500 &#x00B5;l serum- and antibiotic-free DMEM and transfected using 40 &#x00B5;l Lipo6000 (cat. no. C0526; Beyotime Biotechnology) at 37&#x02DA;C for 6 h. The medium was replaced after 4-6 h, and viral supernatants were collected at 24 and 48 h, filtered through a 0.45-&#x00B5;m membrane, and used to infect HepG2 cells. Because a fixed MOI was not determined, transduction conditions were optimized empirically using 0.5-2.0 ml viral supernatant/well according to transduction efficiency; 1 ml viral supernatant plus Polybrene (8 &#x00B5;g/ml; cat. no. ST1380; Beyotime Biotechnology) was used for routine infection in 6-well plates. Cells were transduced for 48 h, after which puromycin selection was initiated at 2 &#x00B5;g/ml and maintained at the same concentration for &#x003E;1 week until stable knockout cells were obtained. The CYP17A1 sgRNA sequence was 5&#x0027;-GCACCAGGGCACCTTCTCTT-3&#x0027;, and an empty vector was used as the negative control (NC).</p>
</sec>
<sec>
<title>Reverse transcription-quantitative PCR (RT-qPCR)</title>
<p>Total RNA was extracted from cells using TRIzol<sup>&#x00AE;</sup> reagent (cat. no. 15596026; Invitrogen; Thermo Fisher Scientific, Inc.). Reverse transcription was performed using HiScript III All-in-one RT SuperMix Perfect for qPCR (cat. no. R333-01; Vazyme Biotech Co, Ltd.) according to the manufacturer&#x0027;s instructions (37&#x02DA;C for 15 min and 85&#x02DA;C for 5 sec). qPCR was performed using ChamQ Universal SYBR qPCR Master Mix (cat. no. Q311-02; Vazyme Biotech Co, Ltd.) on cDNA derived from the indicated cells, and relative mRNA expression was calculated using the 2<sup>-&#x0394;&#x0394;Cq</sup> method (<xref rid="b16-BR-24-6-02147" ref-type="bibr">16</xref>) with GAPDH as the internal reference. The thermocycling conditions were 95&#x02DA;C for 30 sec, followed by 40 cycles of 95&#x02DA;C for 10 sec and 60&#x02DA;C for 30 sec. The forward and reverse sequences of all primers used were as follows: CYP17A1 Forward: 5&#x0027;-AGAAGTTATCATCAATCTGTGGGC-3&#x0027;, Reverse: 5&#x0027;-CTGCTCCGAAGGGCAAATA-3&#x0027;; GAPDH Forward: 5&#x0027;-GGAAGCTTGTCATCAATGGAAATC-3&#x0027;, Reverse: 5&#x0027;-TGATGACCCTTTTGGCTCCC-3&#x0027;.</p>
</sec>
<sec>
<title>Western blotting</title>
<p>Total protein was extracted from cells using RIPA lysis buffer (cat. no. R0010; Beijing Solarbio Science &#x0026; Technology) supplemented with PMSF. Protein concentrations were determined using a BCA Protein Assay kit. Equal amounts of protein (20 &#x00B5;g/lane) were separated by 10&#x0025; SDS-PAGE and transferred onto PVDF membranes (cat. no. IPVH00010; MilliporeSigma) at 200 mA for 90 min. The membranes were blocked with 5&#x0025; non-fat milk in TBST (0.1&#x0025; Tween-20) at room temperature for 2 h and incubated with rabbit anti-CYP17A1 antibody (1:1,000; cat. no. bsm-54306R; Bioss) and mouse anti-GAPDH antibody (1:1,000; cat. no. GB12002-100; Wuhan Servicebio Technology) overnight at 4&#x02DA;C, followed by HRP-conjugated goat anti-rabbit IgG (1:5,000; cat. no. bs-0295G-HRP; Bioss) or HRP-conjugated goat anti-mouse IgG (1:5,000; cat. no. bs-0296G-HRP; Bioss) for 1 h at room temperature. Signals were visualized using BeyoECL Plus chemiluminescence reagent (cat. no. P0018S; Beyotime Biotechnology).</p>
</sec>
<sec>
<title>Cell proliferation</title>
<p>Cell Counting Kit-8 (CCK-8) was used to measure cell proliferation (Dojindo Laboratories, Inc.). Cells were seeded in 96-well plates (5x10&#x00B3; cells/well; six replicates per group) and cell viability was assessed at 0, 24, 48 and 72 h by measuring the OD450. In the functional cell-based assays, the KO-CYP17A1-HepG2 cell line was used as the experimental group, and the KO-Control-HepG2 cell line was used as the control group, to explore the effects of CYP17A1 knockout on the proliferation, migration and invasion ability of the cells.</p>
</sec>
<sec>
<title>Cell migration and invasion</title>
<p>Cell migration was evaluated using a scratch wound-healing assay. For CYP17A1 knockout experiments, HepG2 NC and KO cells were used; for Saikosaponin A experiments, HepG2 and Huh7 cells were treated with 20 &#x00B5;M Saikosaponin A (Aladdin Biochemical Technology Co., Ltd.). Cells were seeded in 6-well plates and allowed to reach &#x007E;100&#x0025; confluence, scratched with a 200-&#x00B5;l pipette tip, washed three times with PBS, and then cultured in complete medium. Images were captured at 0 and 24 h under an inverted light microscope (magnification, x100), and wound-healing area was quantified using ImageJ (v1.53; National Institutes of Health). For invasion assays, Matrigel (cat. no. M8370; Beijing Solarbio Science &#x0026; Technology Co., Ltd.) was diluted to &#x007E;200 &#x00B5;g/ml, 100 &#x00B5;l was added to each upper chamber and allowed to polymerize at 37&#x02DA;C for 4 h. Transwell inserts (8-&#x00B5;m pore size; cat. no. WG3422; Wuhan Servicebio Technology) were used. Cells were resuspended at 5x10<sup>5</sup> cells/ml in serum-free DMEM, and 200 &#x00B5;l cell suspension was added to the upper chamber, while 600 &#x00B5;l complete medium containing 10&#x0025; FBS was added to the lower chamber. After incubation for 24 h at 37&#x02DA;C, cells on the lower membrane surface were fixed with 4&#x0025; paraformaldehyde for 20 min at room temperature, stained with 0.1&#x0025; crystal violet for 10 min at room temperature, and counted in five random fields under an inverted light microscope (magnification, x200).</p>
</sec>
<sec>
<title>Virtual drug screening and molecular docking</title>
<p>The crystal structure of the CYP17A1 protein was retrieved from the PDB database (<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://www.rcsb.org/">https://www.rcsb.org/</ext-link>). Water molecules and co-crystallized ligands were removed using PyMOL (v2.5.2; <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://pymol.org/2/">https://pymol.org/2/</ext-link>). A Traditional Chinese Medicine monomer library containing 4,080 compounds was obtained from TargetMol (<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://www.targetmol.com/compound-library/traditional-chinese-medicine-monomers-library.html">https://www.targetmol.com/compound-library/traditional-chinese-medicine-monomers-library.html</ext-link>) and virtually screened using AutoDock Vina (v1.2.3). For compounds demonstrating binding energies &#x2264;-10 kcal/mol, molecular docking interactions with the CYP17A1 protein were further analyzed using PyMOL and PLIP software (<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://plip-tool.biotec.tu-dresden.de/plip-web/plip/index">https://plip-tool.biotec.tu-dresden.de/plip-web/plip/index</ext-link>). Saikosaponin A (Aladdin Biochemical Technology Co., Ltd.) exhibited the highest binding affinity for CYP17A1 and was therefore selected for subsequent <italic>in vitro</italic> validation. The concentration gradient of Saikosaponin A was 0-30 &#x00B5;M. In each experiment, the changes in cell proliferation, migration and invasion ability of HepG2 and Huh7 cells were observed under different concentrations of Saikosaponin A, and the dose-dependent inhibitory effects were analyzed.</p>
</sec>
<sec>
<title>Statistical analysis</title>
<p>Experimental data were analyzed using R (v4.4.2; R Foundation for Statistical Computing), GraphPad Prism (v6.0; Dotmatics) and ImageJ (v1.53; National Institutes of Health). Data are presented as mean &#x00B1; SD. Two-group comparisons were performed using unpaired, two-tailed Student&#x0027;s t-tests. For &#x003E;2 groups, one-way ANOVA followed by Tukey&#x0027;s post hoc test was used. Time-course proliferation data (CCK-8) were analyzed using two-way ANOVA with Bonferroni post hoc correction. Differential expression analyses were performed using limma (v3.62.2) with Benjamini-Hochberg false discovery rate correction. Pearson correlation analysis was used for WGCNA module-trait associations, Wilcoxon rank-sum tests were used for pan-cancer expression comparisons, and Spearman rank tests were used for correlations with tumor grade and stage. Survival analyses were performed using Kaplan-Meier curves and two-sided log-rank tests. Because late-stage crossover/convergence was observed in <xref rid="f3-BR-24-6-02147" ref-type="fig">Fig. 3C</xref>, sensitivity analyses were additionally conducted using i) administrative truncation at 7 years, ii) weighted Gehan-Breslow testing (rho=1) and iii) a two-stage test &#x005B;TSHRC package (v0.1-6)&#x005D;. P&#x003C;0.05 was considered statistically significant.</p>
</sec>
</sec>
</sec>
<sec sec-type="Results">
<title>Results</title>
<sec>
<title/>
<sec>
<title>Identification of core genes for sex differences in HCC</title>
<p>A total of 36 candidate genes were screened from samples from male and female patients with HCC by differential expression analysis combined with WGCNA (<xref rid="f1-BR-24-6-02147" ref-type="fig">Fig. 1A</xref> and <xref rid="f1-BR-24-6-02147" ref-type="fig">B</xref>). The evaluation results showed that the AUC of all models was &#x003E;0.95 (<xref rid="f1-BR-24-6-02147" ref-type="fig">Fig. 1C</xref>) and the residual analysis showed that the model residual values were &#x003C;0.25 (<xref rid="f1-BR-24-6-02147" ref-type="fig">Fig. 1D</xref>), which suggested that the constructed models achieved high discriminatory ability within the cross-validation framework. An intersectional analysis of the top ten genes ranked in importance by the four algorithms identified CYP17A1 and IRX3 as the core genes differentially expressed in HCC samples from men (<xref rid="f1-BR-24-6-02147" ref-type="fig">Fig. 1E</xref>).</p>
</sec>
<sec>
<title>Validation of sex-specific expression of CYP17A1 and IRX3</title>
<p>To verify the differences in the expression of CYP17A1 and IRX3 in HCC tissues of different sexes, their mRNA expression levels were further evaluated using the comprehensive GEO datasets. The results showed that CYP17A1 and IRX3 mRNA expression levels in HCC tissues from men were significantly higher when compared with those in paired paracancerous tissues (P&#x003C;0.001; <xref rid="f2-BR-24-6-02147" ref-type="fig">Fig. 2A</xref> and <xref rid="f2-BR-24-6-02147" ref-type="fig">C</xref>). However, there was no significant difference in CYP17A1 and IRX3 mRNA expression between HCC tissues from women and their paired paracancerous tissues (P&#x003E;0.05; <xref rid="f2-BR-24-6-02147" ref-type="fig">Fig. 2B</xref> and <xref rid="f2-BR-24-6-02147" ref-type="fig">D</xref>). Subgroup analysis further strictly compared tumor tissues to their sex-matched normal controls. The results showed that the expression levels of CYP17A1 and IRX3 were elevated in the male patient HCC group compared with the normal male group (both P&#x003C;0.001; <xref rid="f2-BR-24-6-02147" ref-type="fig">Fig. 2E</xref> and <xref rid="f2-BR-24-6-02147" ref-type="fig">F</xref>). These data verified that CYP17A1 and IRX3 were differentially expressed only in male patient HCC, suggesting a sex-specific regulatory pattern. Notably, while CYP17A1 was subjected to further experimental validation in the present study, IRX3 lacks functional validation and currently serves as a hypothesis-generating candidate gene warranting future investigation.</p>
</sec>
<sec>
<title>Pan-cancer exploratory analysis and HCC-specific clinical relevance of CYP17A1</title>
<p>To explore the broader context of CYP17A1, a pan-cancer expression analysis was performed. It showed that CYP17A1 was generally lowly expressed in the majority of tumors, such as cholangiocarcinoma and renal cancer, but exhibited specific high expression in HCC, rectal adenocarcinoma and gastric cancer (P&#x003C;0.001; <xref rid="f3-BR-24-6-02147" ref-type="fig">Fig. 3A</xref>). In a subsequent, strictly independent HCC-specific validation using the TCGA-LIHC dataset, the expression of CYP17A1 in HCC tissues was significantly increased compared with that in normal tissues (P&#x003C;0.001; <xref rid="f3-BR-24-6-02147" ref-type="fig">Fig. 3B</xref>). The survival analysis with the standard log-rank test indicated no statistically significant association with overall survival (log-rank P&#x003E;0.05; <xref rid="f3-BR-24-6-02147" ref-type="fig">Fig. 3C</xref>). Considering the late-stage curve crossover, additional sensitivity analyses were performed: A 7-year truncated log-rank (P&#x003E;0.05), weighted Gehan-Breslow (P&#x003C;0.05) and two-stage test (P&#x003E;0.05), indicating a trend-level but non-robust prognostic association. Furthermore, the correlation analysis of CYP17A1 expression and immune cell infiltration showed a positive correlation with M1 macrophage infiltration (R=0.33; P&#x003C;0.05; <xref rid="f3-BR-24-6-02147" ref-type="fig">Fig. 3D</xref>) and a negative correlation with activated dendritic cell infiltration (R=-0.3; P&#x003C;0.05; <xref rid="f3-BR-24-6-02147" ref-type="fig">Fig. 3E</xref>).</p>
</sec>
<sec>
<title>Validation of protein expression and functional mechanisms for CYP17A1</title>
<p>Validation of CYP17A1 protein expression by IHC suggested that CYP17A1 protein was significantly higher in male patient HCC tissues when compared with that in paracancerous tissues (P&#x003C;0.001; <xref rid="f4-BR-24-6-02147" ref-type="fig">Fig. 4A</xref> and <xref rid="f4-BR-24-6-02147" ref-type="fig">B</xref>). By contrast, there was no significant difference in female patient samples (P&#x003E;0.05; <xref rid="f4-BR-24-6-02147" ref-type="fig">Fig. 4C</xref> and <xref rid="f4-BR-24-6-02147" ref-type="fig">D</xref>). This protein-level result was consistent with the mRNA expression patterns. To investigate the functional mechanisms of CYP17A1 <italic>in vitro</italic>, stable knockout of CYP17A1 was established using lentivirus specifically in the HepG2 cell line. The mRNA (<xref rid="f5-BR-24-6-02147" ref-type="fig">Fig. 5A</xref>) and protein (<xref rid="f5-BR-24-6-02147" ref-type="fig">Fig. 5B</xref> and <xref rid="f5-BR-24-6-02147" ref-type="fig">C</xref>) expression levels of CYP17A1 in HepG2 cells were significantly reduced following CYP17A1 knockout (P&#x003C;0.001). Functional cell-based assays demonstrated that knockout of CYP17A1 inhibited HepG2 cell proliferation at 72 h (P&#x003C;0.001; <xref rid="f5-BR-24-6-02147" ref-type="fig">Fig. 5D</xref>; <xref rid="SD1-BR-24-6-02147" ref-type="supplementary-material">Table SI</xref>), reduced migration capacity by 78&#x0025; in the scratch healing assay (P&#x003C;0.001; <xref rid="f5-BR-24-6-02147" ref-type="fig">Fig. 5E</xref> and <xref rid="f5-BR-24-6-02147" ref-type="fig">F</xref>) and attenuated invasive capacity by 65&#x0025; in the Transwell assay (P&#x003C;0.001; <xref rid="f5-BR-24-6-02147" ref-type="fig">Fig. 5G</xref> and <xref rid="f5-BR-24-6-02147" ref-type="fig">H</xref>). These results suggest that CYP17A1 potentially contributes to the malignant phenotypes of HCC cells <italic>in vitro</italic>.</p>
</sec>
<sec>
<title>Virtual screening and in vitro validation of putative CYP17A1-targeting compounds</title>
<p>In a virtual screening of 4,080 herbal monomers using the CYP17A1 protein as a receptor, molecular docking predicted that Saikosaponin A possessed the highest binding affinity for the CYP17A1 protein, with a binding energy of -12.5 kcal/mol and the formation of 6 pairs of hydrogen bonds (<xref rid="tI-BR-24-6-02147" ref-type="table">Table I</xref>; <xref rid="f6-BR-24-6-02147" ref-type="fig">Fig. 6A</xref>). Based on these predictive docking data, Saikosaponin A was selected as a putative compound targeting CYP17A1 for further cellular validation. <italic>In vitro</italic> experiments evaluated the effects of Saikosaponin A on HCC cell phenotypes. Cell proliferation assays demonstrated that treatment with different concentrations of Saikosaponin A significantly inhibited the proliferation of HepG2 and Huh7 cells in a dose- and time-dependent manner (<xref rid="f6-BR-24-6-02147" ref-type="fig">Fig. 6B</xref> and <xref rid="f6-BR-24-6-02147" ref-type="fig">C</xref>; <xref rid="SD2-BR-24-6-02147" ref-type="supplementary-material">Tables SII</xref> and <xref rid="SD3-BR-24-6-02147" ref-type="supplementary-material">SIII</xref>). Furthermore, after treatment with 20 &#x00B5;M of Saikosaponin A for 24 h, the scratch healing rates of HepG2 and Huh7 cells were reduced by 63 and 58&#x0025;, respectively (P&#x003C;0.001; <xref rid="f6-BR-24-6-02147" ref-type="fig">Fig. 6D-G</xref>). In response to the image-quality query, representative wound-healing control images were replaced with fields showing continuous near-confluent monolayers outside the wound area, and quantification was recalculated from qualified fields (<xref rid="f6-BR-24-6-02147" ref-type="fig">Fig. 6F</xref>). Similarly, Transwell assays revealed that the number of invading HepG2 and Huh7 cells was reduced by 52 and 48&#x0025;, respectively (P&#x003C;0.01; <xref rid="f6-BR-24-6-02147" ref-type="fig">Fig. 6H-J</xref>). These inhibitory effects on migration and invasion were also dose-dependent. 
This suggests that Saikosaponin A exhibits a significant inhibitory effect on the malignant phenotypes of HCC cells, highlighting it as a potential therapeutic candidate, although direct CYP17A1-dependency requires further rescue validations.</p>
</sec>
</sec>
</sec>
<sec sec-type="Discussion">
<title>Discussion</title>
<p>HCC is considerably more prevalent in men than in women (<xref rid="b3-BR-24-6-02147" ref-type="bibr">3</xref>,<xref rid="b4-BR-24-6-02147" ref-type="bibr">4</xref>), and exploring the underlying molecular mechanisms of this sex difference is a prominent research topic in oncology. In the present study, by integrating multi-omics data and machine learning algorithms, CYP17A1 and IRX3 were computationally identified as key candidate genes associated with sex differences in HCC. The present study explored their potential mechanisms in influencing the progression of HCC, possibly through the modulation of the androgen signaling pathway. Virtual drug screening and <italic>in vitro</italic> functional validation revealed that the traditional Chinese medicine monomer Saikosaponin A could inhibit the malignant phenotypes of HCC cells, highlighting a putative new candidate for the treatment of HCC.</p>
<p>Cytochrome P450 enzyme (CYP17A1) is a key steroidogenic enzyme that plays an important role in the development of several tumors. It catalyzes the conversion of pregnenolone to dehydroepiandrosterone and promotes testosterone synthesis (<xref rid="b17-BR-24-6-02147" ref-type="bibr">17</xref>,<xref rid="b18-BR-24-6-02147" ref-type="bibr">18</xref>). Niu <italic>et al</italic> (<xref rid="b19-BR-24-6-02147" ref-type="bibr">19</xref>) found that CYP17A1 knockout <italic>in vitro</italic> considerably inhibits the proliferation and invasive ability of glioma cells, while promoting apoptosis. Moreover, in women, it has also been hypothesized that the androgen receptor (AR) can substitute for estrogen-dependent signaling to stimulate transcription of steroid-responsive genes that drive breast cancer (<xref rid="b20-BR-24-6-02147" ref-type="bibr">20</xref>). Altered expression levels of genes involved in the androgen expression pathway have been suggested as one of the key factors that may be associated with sex differences in the development of these tumors (<xref rid="b21-BR-24-6-02147 b22-BR-24-6-02147 b23-BR-24-6-02147" ref-type="bibr">21-23</xref>). The present study found that CYP17A1 was specifically highly expressed in male patient HCC tissues. This result aligns with the mechanism that CYP17A1 drives tumor progression by promoting androgen synthesis in prostate cancer. At the same time, previous studies have found that cell culture medium containing certain levels of androgens promotes the proliferative capacity of glioma cells and that average serum testosterone levels are markedly higher in patients with glioma (<xref rid="b24-BR-24-6-02147" ref-type="bibr">24</xref>,<xref rid="b25-BR-24-6-02147" ref-type="bibr">25</xref>). 
Taken together, the present study speculates that the higher incidence of HCC in men may be associated with CYP17A1-mediated elevations of local androgen levels, which potentially promote tumor cell proliferation through the activation of AR signaling pathways. Notably, while IRX3 was identified alongside CYP17A1 as a core gene, to the best of our knowledge, its association with sex differences has not yet been previously reported. IRX3 regulates cell differentiation in embryonic development, and its function in HCC may involve aberrant activation of the Wnt/&#x03B2;-catenin pathway. However, because no functional validation was performed for IRX3 in the present study, it must be viewed as a hypothesis-generating candidate gene that requires rigorous future experimental validation.</p>
<p>In the field of tumor therapy, natural products have been an important source for the development of chemotherapeutic drugs (<xref rid="b26-BR-24-6-02147" ref-type="bibr">26</xref>). In order to explore potential interventions, the present study found that Saikosaponin A, an important bioactive triterpene glycoside compound extracted from Chaihu (Radix Bupleuri), has a predicted binding affinity with CYP17A1 (<xref rid="b27-BR-24-6-02147" ref-type="bibr">27</xref>). Du <italic>et al</italic> (<xref rid="b28-BR-24-6-02147" ref-type="bibr">28</xref>) found that Saikosaponin A triggered apoptosis and inhibited the PI3K/Akt signaling pathway, exerting an anti-cervical cancer effect. Wang <italic>et al</italic> (<xref rid="b29-BR-24-6-02147" ref-type="bibr">29</xref>) showed that Saikosaponin A may induce apoptosis in gastric cancer cells. Zhang <italic>et al</italic> (<xref rid="b30-BR-24-6-02147" ref-type="bibr">30</xref>) found that Saikosaponin A has potent anti-angiogenic activity and inhibits tumor growth mainly by blocking the VEGFR2 signaling pathway. In the present study, molecular docking predicted a high affinity (binding energy=-12.5 kcal/mol) with the CYP17A1 protein, and <italic>in vitro</italic> experiments confirmed that it dose-dependently inhibited HCC cell migration and invasion. However, molecular docking alone does not establish direct enzymatic inhibition, presenting a limitation of the present study. Without target-dependency or rescue experiments, it remains inconclusive whether CYP17A1 is the primary functional target mediating the observed anti-migration and anti-invasion effects, as Saikosaponin A may act through pleiotropic mechanisms. In the future, enzymatic activity assays and rescue experiments in CYP17A1-knockout cells are necessary to comprehensively reveal its precise antitumor mechanism.</p>
<p>The sex-specific expression of CYP17A1 in HCC provides a new direction for the development of personalized treatment regimens for male patients. Abiraterone, an inhibitor of CYP17A1, has achieved significant efficacy in the treatment of prostate cancer, suggesting that targeting this gene axis might also be applicable to HCC (<xref rid="b31-BR-24-6-02147" ref-type="bibr">31</xref>). Despite these promising results, several limitations must be addressed. First, the clinical IHC sample size was small (n=18), and the subgroup analyses did not adequately control for potential confounding factors such as age, viral hepatitis status and alcohol consumption. Thus, it is premature to attribute the observed expression differences of CYP17A1 solely to biological sex without validation in a larger, multifactorial clinical cohort. Second, as indicated by the primary log-rank analysis (P=0.0726) and additional crossover-sensitive analyses (7-year truncated log-rank P=0.0933; weighted Gehan-Breslow P=0.0334; two-stage P=0.0908), the association between CYP17A1 expression and overall survival was not robust across methods, suggesting its role may be mechanistic or therapeutic rather than acting as a robust prognostic biomarker. Third, owing to the scarcity of comprehensive multi-omics HCC datasets with perfectly matched biological sex annotations, we were unable to construct a fully independent external validation cohort, which implies that the risk of overfitting cannot be entirely ruled out. Finally, the involvement of the androgen pathway is inferred from previous literature and our bioinformatics findings, rather than directly demonstrated through androgen level measurements or rescue experiments in this study. The <italic>in vivo</italic> efficacy and safety of Saikosaponin A also require systematic evaluation using humanized HCC mouse or patient-derived xenograft models in future studies.</p>
<p>In conclusion, the present study suggests that CYP17A1 is a key gene associated with HCC in men, potentially driving malignant phenotypes via the androgen signaling axis, while IRX3 emerges as a novel hypothesis-generating candidate. Furthermore, Saikosaponin A is highlighted as a putative therapeutic candidate. Future research efforts will focus on constructing a CYP17A1 conditional knockout mouse model to validate its necessity in HCC occurrence, performing target-dependency assays for Saikosaponin A and resolving the interaction network of IRX3 with sex-related signaling pathways. These studies are expected to provide a more solid theoretical basis for sex-specific strategies and personalized treatment in HCC.</p>
</sec>
<sec sec-type="supplementary-material">
<title>Supplementary Material</title>
<supplementary-material id="SD1-BR-24-6-02147" content-type="local-data">
<caption>
<title>Cell Counting Kit-8 assay of control and CYP17A1 knockout groups.</title>
</caption>
<media mimetype="application" mime-subtype="vnd.openxmlformats-officedocument.spreadsheetml.sheet" xlink:href="Supplementary_Data1.xlsx"/>
</supplementary-material>
<supplementary-material id="SD2-BR-24-6-02147" content-type="local-data">
<caption>
<title>Inhibitory effects of Saikosaponin A on the proliferation of HepG2 cells assessed by Cell Counting Kit-8 assay.</title>
</caption>
<media mimetype="application" mime-subtype="vnd.openxmlformats-officedocument.spreadsheetml.sheet" xlink:href="Supplementary_Data2.xlsx"/>
</supplementary-material>
<supplementary-material id="SD3-BR-24-6-02147" content-type="local-data">
<caption>
<title>Inhibitory effects of Saikosaponin A on the proliferation of Huh7 cells assessed by Cell Counting Kit-8 assay.</title>
</caption>
<media mimetype="application" mime-subtype="vnd.openxmlformats-officedocument.spreadsheetml.sheet" xlink:href="Supplementary_Data3.xlsx"/>
</supplementary-material>
</sec>
</body>
<back>
<ack>
<title>Acknowledgements</title>
<p>Not applicable.</p>
</ack>
<sec sec-type="data-availability">
<title>Availability of data and materials</title>
<p>The data generated in the present study may be requested from the corresponding author. The datasets analyzed for this study can be found in the GEO database (<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/">https://www.ncbi.nlm.nih.gov/geo/</ext-link>) under accession numbers GSE19665, GSE54236, GSE84402 and GSE121248, and in the TCGA-LIHC dataset via the TIMER2.0 platform.</p>
</sec>
<sec>
<title>Authors&#x0027; contributions</title>
<p>ZW and JN contributed to conceptualization, data curation, formal analysis, investigation, methodology, project administration, supervision, CYP17A1 protein expression and functional validation, visualization, writing of the original draft, and review and editing. HZ and WL contributed to conceptualization, formal analysis, investigation, supervision, visualization, and review and editing. ZL and XY contributed to methodology, bioinformatics data analysis, visualization and writing of the original draft. YZhao and YW contributed to data curation, formal analysis and writing of the original draft. RQ contributed to data processing, conducting experiments, visualization and writing of the original draft. CL contributed to bioinformatics data analysis, visualization and writing of the original draft. QR contributed to the acquisition of clinical data, interpretation of data, and review of the manuscript. YL and YZhang contributed to conceptualization, data curation, funding acquisition, investigation, methodology, project administration, resources, supervision, visualization, writing of the original draft and review and editing.</p>
</sec>
<sec>
<title>Ethics approval and consent to participate</title>
<p>The study of human tumor cells was approved by the ethics committee of the First Affiliated Hospital of Dali University, Dali, China (approval no. OFY20221122001). The present study was conducted in accordance with the local legislation and institutional requirements.</p>
</sec>
<sec>
<title>Patient consent for publication</title>
<p>All patients provided written informed consent for the publication of their anonymized clinical data obtained and analyzed in the present study. The consent process ensured that participants were aware that their data would be used for research purposes and potentially included in scientific publications, with all personally identifiable information removed to protect their privacy.</p>
</sec>
<sec sec-type="COI-statement">
<title>Competing interests</title>
<p>The authors declare that they have no competing financial interests.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="b1-BR-24-6-02147"><label>1</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Petrick</surname><given-names>JL</given-names></name><name><surname>McGlynn</surname><given-names>KA</given-names></name></person-group><article-title>The changing epidemiology of primary liver cancer</article-title><source>Curr Epidemiol Rep</source><volume>6</volume><fpage>104</fpage><lpage>111</lpage><year>2019</year><pub-id pub-id-type="pmid">31259140</pub-id><pub-id pub-id-type="doi">10.1007/s40471-019-00188-3</pub-id></element-citation></ref>
<ref id="b2-BR-24-6-02147"><label>2</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname><given-names>E</given-names></name><name><surname>Viatour</surname><given-names>P</given-names></name></person-group><article-title>Hepatocellular carcinoma: Old friends and new tricks</article-title><source>Exp Mol Med</source><volume>52</volume><fpage>1898</fpage><lpage>1907</lpage><year>2020</year><pub-id pub-id-type="pmid">33268834</pub-id><pub-id pub-id-type="doi">10.1038/s12276-020-00527-1</pub-id></element-citation></ref>
<ref id="b3-BR-24-6-02147"><label>3</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kulik</surname><given-names>L</given-names></name><name><surname>El-Serag</surname><given-names>HB</given-names></name></person-group><article-title>Epidemiology and management of hepatocellular carcinoma</article-title><source>Gastroenterology</source><volume>156</volume><fpage>477</fpage><lpage>491.e1</lpage><year>2019</year><pub-id pub-id-type="pmid">30367835</pub-id><pub-id pub-id-type="doi">10.1053/j.gastro.2018.08.065</pub-id></element-citation></ref>
<ref id="b4-BR-24-6-02147"><label>4</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bray</surname><given-names>F</given-names></name><name><surname>Ferlay</surname><given-names>J</given-names></name><name><surname>Soerjomataram</surname><given-names>I</given-names></name><name><surname>Siegel</surname><given-names>RL</given-names></name><name><surname>Torre</surname><given-names>LA</given-names></name><name><surname>Jemal</surname><given-names>A</given-names></name></person-group><article-title>Global cancer statistics 2018: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title><source>CA Cancer J Clin</source><volume>68</volume><fpage>394</fpage><lpage>424</lpage><year>2018</year><pub-id pub-id-type="pmid">30207593</pub-id><pub-id pub-id-type="doi">10.3322/caac.21492</pub-id></element-citation></ref>
<ref id="b5-BR-24-6-02147"><label>5</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nakatani</surname><given-names>T</given-names></name><name><surname>Roy</surname><given-names>G</given-names></name><name><surname>Fujimoto</surname><given-names>N</given-names></name><name><surname>Asahara</surname><given-names>T</given-names></name><name><surname>Ito</surname><given-names>A</given-names></name></person-group><article-title>Sex hormone dependency of diethylnitrosamine-induced liver tumors in mice and chemoprevention by leuprorelin</article-title><source>Jpn J Cancer Res</source><volume>92</volume><fpage>249</fpage><lpage>256</lpage><year>2001</year><pub-id pub-id-type="pmid">11267934</pub-id><pub-id pub-id-type="doi">10.1111/j.1349-7006.2001.tb01089.x</pub-id></element-citation></ref>
<ref id="b6-BR-24-6-02147"><label>6</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Naugler</surname><given-names>WE</given-names></name><name><surname>Sakurai</surname><given-names>T</given-names></name><name><surname>Kim</surname><given-names>S</given-names></name><name><surname>Maeda</surname><given-names>S</given-names></name><name><surname>Kim</surname><given-names>K</given-names></name><name><surname>Elsharkawy</surname><given-names>AM</given-names></name><name><surname>Karin</surname><given-names>M</given-names></name></person-group><article-title>Gender disparity in liver cancer due to sex differences in MyD88-dependent IL-6 production</article-title><source>Science</source><volume>317</volume><fpage>121</fpage><lpage>124</lpage><year>2007</year><pub-id pub-id-type="pmid">17615358</pub-id><pub-id pub-id-type="doi">10.1126/science.1140485</pub-id></element-citation></ref>
<ref id="b7-BR-24-6-02147"><label>7</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Manieri</surname><given-names>E</given-names></name><name><surname>Herrera-Melle</surname><given-names>L</given-names></name><name><surname>Mora</surname><given-names>A</given-names></name><name><surname>Tom&#x00E1;s-Loba</surname><given-names>A</given-names></name><name><surname>Leiva-Vega</surname><given-names>L</given-names></name><name><surname>Fern&#x00E1;ndez</surname><given-names>DI</given-names></name><name><surname>Rodr&#x00ED;guez</surname><given-names>E</given-names></name><name><surname>Mor&#x00E1;n</surname><given-names>L</given-names></name><name><surname>Hern&#x00E1;ndez-Cosido</surname><given-names>L</given-names></name><name><surname>Torres</surname><given-names>JL</given-names></name><etal/></person-group><article-title>Adiponectin accounts for gender differences in hepatocellular carcinoma incidence</article-title><source>J Exp Med</source><volume>216</volume><fpage>1108</fpage><lpage>1119</lpage><year>2019</year><pub-id pub-id-type="pmid">30944152</pub-id><pub-id pub-id-type="doi">10.1084/jem.20181288</pub-id></element-citation></ref>
<ref id="b8-BR-24-6-02147"><label>8</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lip</surname><given-names>GYH</given-names></name><name><surname>Nieuwlaat</surname><given-names>R</given-names></name><name><surname>Pisters</surname><given-names>R</given-names></name><name><surname>Lane</surname><given-names>DA</given-names></name><name><surname>Crijns</surname><given-names>HJGM</given-names></name></person-group><article-title>Refining clinical risk stratification for predicting stroke and thromboembolism in atrial fibrillation using a novel risk factor-based approach: The euro heart survey on atrial fibrillation</article-title><source>Chest</source><volume>137</volume><fpage>263</fpage><lpage>272</lpage><year>2010</year><pub-id pub-id-type="pmid">19762550</pub-id><pub-id pub-id-type="doi">10.1378/chest.09-1584</pub-id></element-citation></ref>
<ref id="b9-BR-24-6-02147"><label>9</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>O&#x0027;Mahony</surname><given-names>C</given-names></name><name><surname>Jichi</surname><given-names>F</given-names></name><name><surname>Pavlou</surname><given-names>M</given-names></name><name><surname>Monserrat</surname><given-names>L</given-names></name><name><surname>Anastasakis</surname><given-names>A</given-names></name><name><surname>Rapezzi</surname><given-names>C</given-names></name><name><surname>Biagini</surname><given-names>E</given-names></name><name><surname>Gimeno</surname><given-names>JR</given-names></name><name><surname>Limongelli</surname><given-names>G</given-names></name><name><surname>McKenna</surname><given-names>WJ</given-names></name><etal/></person-group><article-title>A novel clinical risk prediction model for sudden cardiac death in hypertrophic cardiomyopathy (HCM risk-SCD)</article-title><source>Eur Heart J</source><volume>35</volume><fpage>2010</fpage><lpage>2020</lpage><year>2014</year><pub-id pub-id-type="pmid">24126876</pub-id><pub-id pub-id-type="doi">10.1093/eurheartj/eht439</pub-id></element-citation></ref>
<ref id="b10-BR-24-6-02147"><label>10</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bogard</surname><given-names>N</given-names></name><name><surname>Linder</surname><given-names>J</given-names></name><name><surname>Rosenberg</surname><given-names>AB</given-names></name><name><surname>Seelig</surname><given-names>G</given-names></name></person-group><article-title>A deep neural network for predicting and engineering alternative polyadenylation</article-title><source>Cell</source><volume>178</volume><fpage>91</fpage><lpage>106.e23</lpage><year>2019</year><pub-id pub-id-type="pmid">31178116</pub-id><pub-id pub-id-type="doi">10.1016/j.cell.2019.04.046</pub-id></element-citation></ref>
<ref id="b11-BR-24-6-02147"><label>11</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Deng</surname><given-names>YB</given-names></name><name><surname>Nagae</surname><given-names>G</given-names></name><name><surname>Midorikawa</surname><given-names>Y</given-names></name><name><surname>Yagi</surname><given-names>K</given-names></name><name><surname>Tsutsumi</surname><given-names>S</given-names></name><name><surname>Yamamoto</surname><given-names>S</given-names></name><name><surname>Hasegawa</surname><given-names>K</given-names></name><name><surname>Kokudo</surname><given-names>N</given-names></name><name><surname>Aburatani</surname><given-names>H</given-names></name><name><surname>Kaneda</surname><given-names>A</given-names></name></person-group><article-title>Identification of genes preferentially methylated in hepatitis C virus-related hepatocellular carcinoma</article-title><source>Cancer Sci</source><volume>101</volume><fpage>1501</fpage><lpage>1510</lpage><year>2010</year><pub-id pub-id-type="pmid">20345479</pub-id><pub-id pub-id-type="doi">10.1111/j.1349-7006.2010.01549.x</pub-id></element-citation></ref>
<ref id="b12-BR-24-6-02147"><label>12</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Villa</surname><given-names>E</given-names></name><name><surname>Critelli</surname><given-names>R</given-names></name><name><surname>Lei</surname><given-names>B</given-names></name><name><surname>Marzocchi</surname><given-names>G</given-names></name><name><surname>Camm&#x00E0;</surname><given-names>C</given-names></name><name><surname>Giannelli</surname><given-names>G</given-names></name><name><surname>Pontisso</surname><given-names>P</given-names></name><name><surname>Cabibbo</surname><given-names>G</given-names></name><name><surname>Enea</surname><given-names>M</given-names></name><name><surname>Colopi</surname><given-names>S</given-names></name><etal/></person-group><article-title>Neoangiogenesis-related genes are hallmarks of fast-growing hepatocellular carcinomas and worst survival. Results from a prospective study</article-title><source>Gut</source><volume>65</volume><fpage>861</fpage><lpage>869</lpage><year>2016</year><pub-id pub-id-type="pmid">25666192</pub-id><pub-id pub-id-type="doi">10.1136/gutjnl-2014-308483</pub-id></element-citation></ref>
<ref id="b13-BR-24-6-02147"><label>13</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>H</given-names></name><name><surname>Huo</surname><given-names>X</given-names></name><name><surname>Yang</surname><given-names>XR</given-names></name><name><surname>He</surname><given-names>J</given-names></name><name><surname>Cheng</surname><given-names>L</given-names></name><name><surname>Wang</surname><given-names>N</given-names></name><name><surname>Deng</surname><given-names>X</given-names></name><name><surname>Jin</surname><given-names>H</given-names></name><name><surname>Wang</surname><given-names>N</given-names></name><name><surname>Wang</surname><given-names>C</given-names></name><etal/></person-group><article-title>STAT3-mediated upregulation of lncRNA HOXD-AS1 as a ceRNA facilitates liver cancer metastasis by regulating SOX4</article-title><source>Mol Cancer</source><volume>16</volume><issue>136</issue><year>2017</year><pub-id pub-id-type="pmid">28810927</pub-id><pub-id pub-id-type="doi">10.1186/s12943-017-0680-1</pub-id></element-citation></ref>
<ref id="b14-BR-24-6-02147"><label>14</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>SM</given-names></name><name><surname>Ooi</surname><given-names>LLPJ</given-names></name><name><surname>Hui</surname><given-names>KM</given-names></name></person-group><article-title>Identification and validation of a novel gene signature associated with the recurrence of human hepatocellular carcinoma</article-title><source>Clin Cancer Res</source><volume>13</volume><fpage>6275</fpage><lpage>6283</lpage><year>2007</year><pub-id pub-id-type="pmid">17975138</pub-id><pub-id pub-id-type="doi">10.1158/1078-0432.CCR-06-2236</pub-id></element-citation></ref>
<ref id="b15-BR-24-6-02147"><label>15</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Leek</surname><given-names>JT</given-names></name><name><surname>Johnson</surname><given-names>WE</given-names></name><name><surname>Parker</surname><given-names>HS</given-names></name><name><surname>Jaffe</surname><given-names>AE</given-names></name><name><surname>Storey</surname><given-names>JD</given-names></name></person-group><article-title>The sva package for removing batch effects and other unwanted variation in high-throughput experiments</article-title><source>Bioinformatics</source><volume>28</volume><fpage>882</fpage><lpage>883</lpage><year>2012</year><pub-id pub-id-type="pmid">22257669</pub-id><pub-id pub-id-type="doi">10.1093/bioinformatics/bts034</pub-id></element-citation></ref>
<ref id="b16-BR-24-6-02147"><label>16</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Livak</surname><given-names>KJ</given-names></name><name><surname>Schmittgen</surname><given-names>TD</given-names></name></person-group><article-title>Analysis of relative gene expression data using real-time quantitative PCR and the 2(-Delta Delta C(T)) method</article-title><source>Methods</source><volume>25</volume><fpage>402</fpage><lpage>408</lpage><year>2001</year><pub-id pub-id-type="pmid">11846609</pub-id><pub-id pub-id-type="doi">10.1006/meth.2001.1262</pub-id></element-citation></ref>
<ref id="b17-BR-24-6-02147"><label>17</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Abul-Hajj</surname><given-names>YJ</given-names></name><name><surname>Iverson</surname><given-names>R</given-names></name><name><surname>Kiang</surname><given-names>DT</given-names></name></person-group><article-title>Metabolism of pregnenolone by human breast cancer. Evidence for 17 alpha-hydroxylase and 17,20-lyase</article-title><source>Steroids</source><volume>34</volume><fpage>817</fpage><lpage>827</lpage><year>1979</year><pub-id pub-id-type="pmid">161434</pub-id><pub-id pub-id-type="doi">10.1016/0039-128x(79)90094-1</pub-id></element-citation></ref>
<ref id="b18-BR-24-6-02147"><label>18</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Parker</surname><given-names>C</given-names></name><name><surname>Sartor</surname><given-names>O</given-names></name></person-group><article-title>Abiraterone and increased survival in metastatic prostate cancer</article-title><source>N Engl J Med</source><volume>365</volume><fpage>767</fpage><year>2011</year><pub-id pub-id-type="pmid">21864180</pub-id><pub-id pub-id-type="doi">10.1056/NEJMc1107198</pub-id></element-citation></ref>
<ref id="b19-BR-24-6-02147"><label>19</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Niu</surname><given-names>WX</given-names></name><name><surname>Zhou</surname><given-names>CX</given-names></name><name><surname>Cheng</surname><given-names>CD</given-names></name><name><surname>Bao</surname><given-names>DJ</given-names></name><name><surname>Dong</surname><given-names>YF</given-names></name><name><surname>Li</surname><given-names>DX</given-names></name><name><surname>Yang</surname><given-names>Y</given-names></name><name><surname>He</surname><given-names>H</given-names></name><name><surname>Niu</surname><given-names>CS</given-names></name></person-group><article-title>Effects of lentivirus-mediated CYP17A1 gene silencing on the biological activity of glioma</article-title><source>Neurosci Lett</source><volume>692</volume><fpage>210</fpage><lpage>215</lpage><year>2019</year><pub-id pub-id-type="pmid">30439398</pub-id><pub-id pub-id-type="doi">10.1016/j.neulet.2018.11.017</pub-id></element-citation></ref>
<ref id="b20-BR-24-6-02147"><label>20</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Robinson</surname><given-names>JL</given-names></name><name><surname>Macarthur</surname><given-names>S</given-names></name><name><surname>Ross-Innes</surname><given-names>CS</given-names></name><name><surname>Tilley</surname><given-names>WD</given-names></name><name><surname>Neal</surname><given-names>DE</given-names></name><name><surname>Mills</surname><given-names>IG</given-names></name><name><surname>Carroll</surname><given-names>JS</given-names></name></person-group><article-title>Androgen receptor driven transcription in molecular apocrine breast cancer is mediated by FoxA1</article-title><source>EMBO J</source><volume>30</volume><fpage>3019</fpage><lpage>3027</lpage><year>2011</year><pub-id pub-id-type="pmid">21701558</pub-id><pub-id pub-id-type="doi">10.1038/emboj.2011.216</pub-id></element-citation></ref>
<ref id="b21-BR-24-6-02147"><label>21</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Camargo</surname><given-names>MC</given-names></name><name><surname>Goto</surname><given-names>Y</given-names></name><name><surname>Zabaleta</surname><given-names>J</given-names></name><name><surname>Morgan</surname><given-names>DR</given-names></name><name><surname>Correa</surname><given-names>P</given-names></name><name><surname>Rabkin</surname><given-names>CS</given-names></name></person-group><article-title>Sex hormones, hormonal interventions, and gastric cancer risk: A meta-analysis</article-title><source>Cancer Epidemiol Biomarkers Prev</source><volume>21</volume><fpage>20</fpage><lpage>38</lpage><year>2012</year><pub-id pub-id-type="pmid">22028402</pub-id><pub-id pub-id-type="doi">10.1158/1055-9965.EPI-11-0834</pub-id></element-citation></ref>
<ref id="b22-BR-24-6-02147"><label>22</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Marcinkiewicz</surname><given-names>K</given-names></name><name><surname>Scotland</surname><given-names>KB</given-names></name><name><surname>Boorjian</surname><given-names>SA</given-names></name><name><surname>Nilsson</surname><given-names>EM</given-names></name><name><surname>Persson</surname><given-names>JL</given-names></name><name><surname>Abrahamsson</surname><given-names>PA</given-names></name><name><surname>Allegrucci</surname><given-names>C</given-names></name><name><surname>Hughes</surname><given-names>IA</given-names></name><name><surname>Gudas</surname><given-names>LJ</given-names></name><name><surname>Mongan</surname><given-names>NP</given-names></name></person-group><article-title>The androgen receptor and stem cell pathways in prostate and bladder cancers (review)</article-title><source>Int J Oncol</source><volume>40</volume><fpage>5</fpage><lpage>12</lpage><year>2012</year><pub-id pub-id-type="pmid">21956088</pub-id><pub-id pub-id-type="doi">10.3892/ijo.2011.1212</pub-id></element-citation></ref>
<ref id="b23-BR-24-6-02147"><label>23</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>PJ</given-names></name><name><surname>Yeh</surname><given-names>SH</given-names></name><name><surname>Liu</surname><given-names>WH</given-names></name><name><surname>Lin</surname><given-names>CC</given-names></name><name><surname>Huang</surname><given-names>HC</given-names></name><name><surname>Chen</surname><given-names>CL</given-names></name><name><surname>Chen</surname><given-names>DS</given-names></name><name><surname>Chen</surname><given-names>PJ</given-names></name></person-group><article-title>Androgen pathway stimulates microRNA-216a transcription to suppress the tumor suppressor in lung cancer-1 gene in early hepatocarcinogenesis</article-title><source>Hepatology</source><volume>56</volume><fpage>632</fpage><lpage>643</lpage><year>2012</year><pub-id pub-id-type="pmid">22392644</pub-id><pub-id pub-id-type="doi">10.1002/hep.25695</pub-id></element-citation></ref>
<ref id="b24-BR-24-6-02147"><label>24</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ceccarelli</surname><given-names>I</given-names></name><name><surname>Rossi</surname><given-names>A</given-names></name><name><surname>Maddalena</surname><given-names>M</given-names></name><name><surname>Weber</surname><given-names>E</given-names></name><name><surname>Aloisi</surname><given-names>AM</given-names></name></person-group><article-title>Effects of morphine on testosterone levels in rat C6 glioma cells: Modulation by anastrozole</article-title><source>J Cell Physiol</source><volume>221</volume><fpage>1</fpage><lpage>4</lpage><year>2009</year><pub-id pub-id-type="pmid">19492405</pub-id><pub-id pub-id-type="doi">10.1002/jcp.21830</pub-id></element-citation></ref>
<ref id="b25-BR-24-6-02147"><label>25</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bao</surname><given-names>D</given-names></name><name><surname>Cheng</surname><given-names>C</given-names></name><name><surname>Lan</surname><given-names>X</given-names></name><name><surname>Xing</surname><given-names>R</given-names></name><name><surname>Chen</surname><given-names>Z</given-names></name><name><surname>Zhao</surname><given-names>H</given-names></name><name><surname>Sun</surname><given-names>J</given-names></name><name><surname>Wang</surname><given-names>Y</given-names></name><name><surname>Niu</surname><given-names>C</given-names></name><name><surname>Zhang</surname><given-names>B</given-names></name><name><surname>Fang</surname><given-names>S</given-names></name></person-group><article-title>Regulation of p53wt glioma cell proliferation by androgen receptor-mediated inhibition of small VCP/p97-interacting protein expression</article-title><source>Oncotarget</source><volume>8</volume><fpage>23142</fpage><lpage>23154</lpage><year>2017</year><pub-id pub-id-type="pmid">28423563</pub-id><pub-id pub-id-type="doi">10.18632/oncotarget.15509</pub-id></element-citation></ref>
<ref id="b26-BR-24-6-02147"><label>26</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mann</surname><given-names>J</given-names></name></person-group><article-title>Natural products in cancer chemotherapy: Past, present and future</article-title><source>Nat Rev Cancer</source><volume>2</volume><fpage>143</fpage><lpage>148</lpage><year>2002</year><pub-id pub-id-type="pmid">12635177</pub-id><pub-id pub-id-type="doi">10.1038/nrc723</pub-id></element-citation></ref>
<ref id="b27-BR-24-6-02147"><label>27</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>X</given-names></name><name><surname>Li</surname><given-names>X</given-names></name><name><surname>Huang</surname><given-names>N</given-names></name><name><surname>Liu</surname><given-names>R</given-names></name><name><surname>Sun</surname><given-names>R</given-names></name></person-group><article-title>A comprehensive review and perspectives on pharmacology and toxicology of saikosaponins</article-title><source>Phytomedicine</source><volume>50</volume><fpage>73</fpage><lpage>87</lpage><year>2018</year><pub-id pub-id-type="pmid">30466994</pub-id><pub-id pub-id-type="doi">10.1016/j.phymed.2018.09.174</pub-id></element-citation></ref>
<ref id="b28-BR-24-6-02147"><label>28</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Du</surname><given-names>J</given-names></name><name><surname>Song</surname><given-names>D</given-names></name><name><surname>Cao</surname><given-names>T</given-names></name><name><surname>Li</surname><given-names>Y</given-names></name><name><surname>Liu</surname><given-names>J</given-names></name><name><surname>Li</surname><given-names>B</given-names></name><name><surname>Li</surname><given-names>L</given-names></name></person-group><article-title>Saikosaponin-A induces apoptosis of cervical cancer through mitochondria- and endoplasmic reticulum stress-dependent pathway in vitro and in vivo: Involvement of PI3K/AKT signaling pathway</article-title><source>Cell Cycle</source><volume>20</volume><fpage>2221</fpage><lpage>2232</lpage><year>2021</year><pub-id pub-id-type="pmid">34520332</pub-id><pub-id pub-id-type="doi">10.1080/15384101.2021.1974791</pub-id></element-citation></ref>
<ref id="b29-BR-24-6-02147"><label>29</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>C</given-names></name><name><surname>Zhang</surname><given-names>R</given-names></name><name><surname>Chen</surname><given-names>X</given-names></name><name><surname>Yuan</surname><given-names>M</given-names></name><name><surname>Wu</surname><given-names>J</given-names></name><name><surname>Sun</surname><given-names>Q</given-names></name><name><surname>Miao</surname><given-names>C</given-names></name><name><surname>Jing</surname><given-names>Y</given-names></name></person-group><article-title>The potential effect and mechanism of Saikosaponin A against gastric cancer</article-title><source>BMC Complement Med Ther</source><volume>23</volume><issue>295</issue><year>2023</year><pub-id pub-id-type="pmid">37608281</pub-id><pub-id pub-id-type="doi">10.1186/s12906-023-04108-3</pub-id></element-citation></ref>
<ref id="b30-BR-24-6-02147"><label>30</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>P</given-names></name><name><surname>Lai</surname><given-names>X</given-names></name><name><surname>Zhu</surname><given-names>MH</given-names></name><name><surname>Long</surname><given-names>M</given-names></name><name><surname>Liu</surname><given-names>XL</given-names></name><name><surname>Wang</surname><given-names>ZX</given-names></name><name><surname>Zhang</surname><given-names>Y</given-names></name><name><surname>Guo</surname><given-names>RJ</given-names></name><name><surname>Dong</surname><given-names>J</given-names></name><name><surname>Lu</surname><given-names>Q</given-names></name><etal/></person-group><article-title>Saikosaponin A, a triterpene saponin, suppresses angiogenesis and tumor growth by blocking VEGFR2-mediated signaling pathway</article-title><source>Front Pharmacol</source><volume>12</volume><issue>713200</issue><year>2021</year><pub-id pub-id-type="pmid">34776948</pub-id><pub-id pub-id-type="doi">10.3389/fphar.2021.713200</pub-id></element-citation></ref>
<ref id="b31-BR-24-6-02147"><label>31</label><element-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fujita</surname><given-names>K</given-names></name><name><surname>Nonomura</surname><given-names>N</given-names></name></person-group><article-title>Role of androgen receptor in prostate cancer: A review</article-title><source>World J Mens Health</source><volume>37</volume><fpage>288</fpage><lpage>295</lpage><year>2019</year><pub-id pub-id-type="pmid">30209899</pub-id><pub-id pub-id-type="doi">10.5534/wjmh.180040</pub-id></element-citation></ref>
</ref-list>
</back>
<floats-group>
<fig id="f1-BR-24-6-02147" position="float">
<label>Figure 1</label>
<caption><p>Screening for genes central to sex differences in hepatocellular carcinoma incidence by four machine learning algorithms. (A) Genes that are differentially expressed only in male or female patients intersect with the hub genes of WGCNA. (B) A total of four machine learning algorithms score the importance of 36 candidate core genes. (C) Receiver operating characteristic curve of four machine learning algorithms on model prediction accuracy. (D) Residual values of predictive accuracy of four machine learning algorithms. (E) Venn diagram of the top 10 most important genes for four machine learning algorithms. WGCNA, weighted gene co-expression network analysis; Diffgene, differentially expressed genes; RF, random forest; SVM, support vector machine; XGB, extreme gradient boosting; GLM, generalized linear model.</p></caption>
<graphic xlink:href="br-24-06-02147-g00.tif"/>
</fig>
<fig id="f2-BR-24-6-02147" position="float">
<label>Figure 2</label>
<caption><p>Validation of sex-specific expression of CYP17A1 and IRX3. (A) Expression of CYP17A1 in male patients with HCC. (B) Expression of CYP17A1 in female patients with HCC. (C) Expression of IRX3 in male patients with HCC. (D) Expression of IRX3 in female patients with HCC. (E) Differences in CYP17A1 expression among four groups. (F) Differences in IRX3 expression among four groups. Con, control; Treat, treated; HCC, hepatocellular carcinoma; ns, not significant; <sup>&#x002A;</sup>P&#x003C;0.05; <sup>&#x002A;&#x002A;&#x002A;</sup>P&#x003C;0.001.</p></caption>
<graphic xlink:href="br-24-06-02147-g01.tif"/>
</fig>
<fig id="f3-BR-24-6-02147" position="float">
<label>Figure 3</label>
<caption><p>Pan-cancer analysis of CYP17A1 and single-gene analysis in HCC. (A) Expression of CYP17A1 in various tumors. (B) Expression of CYP17A1 in HCC and paracancerous tissues. (C) Kaplan-Meier survival curve of CYP17A1 high- and low-expression groups. (D) Correlation of CYP17A1 expression with M1 macrophages. (E) Correlation of CYP17A1 expression with activated dendritic cells. HCC, hepatocellular carcinoma; <sup>&#x002A;&#x002A;</sup>P&#x003C;0.01; <sup>&#x002A;&#x002A;&#x002A;</sup>P&#x003C;0.001.</p></caption>
<graphic xlink:href="br-24-06-02147-g02.tif"/>
</fig>
<fig id="f4-BR-24-6-02147" position="float">
<label>Figure 4</label>
<caption><p>Immunohistochemical validation of CYP17A1 protein in HCC tissues. (A) Immunohistochemical images from HCC and paired paracancerous tissues from a male patient. (B) Difference in CYP17A1 expression between HCC and paired paracancerous tissues from a male patient. (C) Immunohistochemical images from HCC and paired paracancerous tissues from a female patient. (D) Difference in CYP17A1 expression between HCC and paired paracancerous tissues from a female patient. HCC, hepatocellular carcinoma; ns, not significant; <sup>&#x002A;&#x002A;&#x002A;</sup>P&#x003C;0.001.</p></caption>
<graphic xlink:href="br-24-06-02147-g03.tif"/>
</fig>
<fig id="f5-BR-24-6-02147" position="float">
<label>Figure 5</label>
<caption><p>A preliminary investigation of the role of CYP17A1 in hepatocellular carcinoma based on CYP17A1 knockout and functional cell-based assays. (A) Relative expression of CYP17A1 mRNA in the control group and the KO group. (B) CYP17A1 protein expression in the control group and the KO group. (C) Difference analysis of CYP17A1 relative expression levels in the control group and the KO group. (D) Proliferation of the control group and the CYP17A1 gene KO group over 72 h. (E) Effect of CYP17A1 gene knockout on HepG2 migration ability under the microscope at 0 and 24 h (magnification, x100). (F) Difference analysis of scratch healing rates between the control group and the KO group. (G) Transwell results of the control group and the KO group under a microscope. (H) Analysis of the difference in the relative number of invasive cells in the control group and the KO group. NC, the control group; KO, the knockout group; OD, optical density; <sup>&#x002A;&#x002A;&#x002A;</sup>P&#x003C;0.001.</p></caption>
<graphic xlink:href="br-24-06-02147-g04.tif"/>
</fig>
<fig id="f6-BR-24-6-02147" position="float">
<label>Figure 6</label>
<caption><p>Screening and <italic>in vitro</italic> validation of drug candidates targeting CYP17A1. (A) Saikosaponin A interacts with the CYP17A1 protein. (B) Cell proliferation of HepG2 cells treated with different concentrations of Saikosaponin A for 24, 48 and 72 h. (C) Cell proliferation of Huh7 cells treated with different concentrations of Saikosaponin A for 24, 48 and 72 h. (D) Scratch healing of HepG2 control and Saikosaponin A-treated cells at 0 and 24 h under the microscope (magnification, x100). (E) Difference analysis of the scratch healing rate between the Control group and the drug-treated group. (F) Scratch healing of Huh7 Control and Saikosaponin A-treated cells at 0 and 24 h under the microscope (magnification, x100). (G) Difference analysis of scratch healing rates between the Control group and the drug-treated group. (H) Cell invasion of HepG2 and Huh7 cells in the Control group and the drug-treated group under the microscope. (I) Difference analysis of the relative cell number of HepG2 cells in the Control group and the drug-treated group. (J) Difference analysis of relative cell numbers of Huh7 cells in the Control group and the drug-treated group. <sup>&#x002A;</sup>P&#x003C;0.05; <sup>&#x002A;&#x002A;</sup>P&#x003C;0.01; <sup>&#x002A;&#x002A;&#x002A;</sup>P&#x003C;0.001.</p></caption>
<graphic xlink:href="br-24-06-02147-g05.tif"/>
</fig>
<table-wrap id="tI-BR-24-6-02147" position="float">
<label>Table I</label>
<caption><p>Virtual screening results for the 10 drugs with the highest binding affinity for the CYP17A1 protein and their interactions with it.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="middle">Ligand</th>
<th align="center" valign="middle">Chemical formula</th>
<th align="center" valign="middle">PubChem no.</th>
<th align="center" valign="middle">Molecular weight</th>
<th align="center" valign="middle">Affinity (kcal/mol)</th>
<th align="center" valign="middle">Interactions</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Wilforlide A</td>
<td align="center" valign="middle">C<sub>30</sub>H<sub>46</sub>O<sub>3</sub></td>
<td align="center" valign="middle">158477</td>
<td align="center" valign="middle">454.7</td>
<td align="center" valign="middle">-13.7</td>
<td align="left" valign="middle">5 hydrophobic interactions</td>
</tr>
<tr>
<td align="left" valign="middle">Epifriedelanol</td>
<td align="center" valign="middle">C<sub>30</sub>H<sub>52</sub>O</td>
<td align="center" valign="middle">119242</td>
<td align="center" valign="middle">428.7</td>
<td align="center" valign="middle">-13.4</td>
<td align="left" valign="middle">7 hydrophobic interactions</td>
</tr>
<tr>
<td align="left" valign="middle">&#x03B4;-Amyrenone</td>
<td align="center" valign="middle">C<sub>30</sub>H<sub>48</sub>O</td>
<td align="center" valign="middle">5318261</td>
<td align="center" valign="middle">424.7</td>
<td align="center" valign="middle">-13.2</td>
<td align="left" valign="middle">6 hydrophobic interactions</td>
</tr>
<tr>
<td align="left" valign="middle">Arnidiol</td>
<td align="center" valign="middle">C<sub>30</sub>H<sub>50</sub>O<sub>2</sub></td>
<td align="center" valign="middle">10478550</td>
<td align="center" valign="middle">442.7</td>
<td align="center" valign="middle">-13.1</td>
<td align="left" valign="middle">7 hydrophobic interactions</td>
</tr>
<tr>
<td align="left" valign="middle">&#x03B2;-Amyrin</td>
<td align="center" valign="middle">C<sub>30</sub>H<sub>50</sub>O</td>
<td align="center" valign="middle">73145</td>
<td align="center" valign="middle">426.7</td>
<td align="center" valign="middle">-12.8</td>
<td align="left" valign="middle">7 hydrophobic interactions</td>
</tr>
<tr>
<td align="left" valign="middle">Taraxasterol</td>
<td align="center" valign="middle">C<sub>30</sub>H<sub>50</sub>O</td>
<td align="center" valign="middle">115250</td>
<td align="center" valign="middle">426.7</td>
<td align="center" valign="middle">-12.7</td>
<td align="left" valign="middle">7 hydrophobic interactions</td>
</tr>
<tr>
<td align="left" valign="middle">Saikosaponin A</td>
<td align="center" valign="middle">C<sub>42</sub>H<sub>68</sub>O<sub>13</sub></td>
<td align="center" valign="middle">167928</td>
<td align="center" valign="middle">781.0</td>
<td align="center" valign="middle">-12.5</td>
<td align="left" valign="middle">4 hydrophobic interactions, 6 H-bonds</td>
</tr>
<tr>
<td align="left" valign="middle">Taraxasteryl acetate</td>
<td align="center" valign="middle">C<sub>32</sub>H<sub>52</sub>O<sub>2</sub></td>
<td align="center" valign="middle">13889352</td>
<td align="center" valign="middle">468.8</td>
<td align="center" valign="middle">-12.4</td>
<td align="left" valign="middle">7 hydrophobic interactions</td>
</tr>
<tr>
<td align="left" valign="middle">Glycyrrhetinic acid</td>
<td align="center" valign="middle">C<sub>30</sub>H<sub>46</sub>O<sub>4</sub></td>
<td align="center" valign="middle">10114</td>
<td align="center" valign="middle">470.7</td>
<td align="center" valign="middle">-12.3</td>
<td align="left" valign="middle">6 hydrophobic interactions</td>
</tr>
<tr>
<td align="left" valign="middle">Saikosaponin D</td>
<td align="center" valign="middle">C<sub>42</sub>H<sub>68</sub>O<sub>13</sub></td>
<td align="center" valign="middle">107793</td>
<td align="center" valign="middle">781.0</td>
<td align="center" valign="middle">-12.3</td>
<td align="left" valign="middle">4 hydrophobic interactions, 5 H-bonds</td>
</tr>
</tbody>
</table>
</table-wrap>
</floats-group>
</article>
