<?xml version="1.0" encoding="UTF-8"?>



<records>

  <record>
    <language>eng</language>
          <publisher>Oriental Scientific Publishing Company</publisher>
        <journalTitle>Biomedical and Pharmacology Journal</journalTitle>
          <issn>0974-6242</issn>
            <publicationDate>2025-09-30</publicationDate>
    
        <volume>18</volume>
        <issue>3</issue>

 
    <startPage>2014</startPage>
    <endPage>2023</endPage>

	 
      <doi>10.13005/bpj/3233</doi>
        <publisherRecordId>67353</publisherRecordId>
    <documentType>article</documentType>
    <title language="eng">Gene Expression Data-Based Interpretable Machine Learning Framework for Classifying Brain Cancer Subtypes</title>

    <authors>
	 


      <author>
       <name>Virendra Singh Kushwah</name>

 
		
	<affiliationId>1</affiliationId>
      </author>
    

	 


      <author>
       <name>Sivaneasan Bala Krishnan</name>


		
	<affiliationId>2</affiliationId>

      </author>
    

	 


      <author>
       <name>Kamal Upreti</name>

		
	<affiliationId>3</affiliationId>
      </author>
    

	 


      <author>
       <name>Pravin Kshirsagar</name>

		
	<affiliationId>4</affiliationId>
      </author>
    


	 


      <author>
       <name>Manoj Kumar</name>

		
	<affiliationId>5</affiliationId>
      </author>
    


	 


      <author>
       <name>Uma Shankar</name>

		
	<affiliationId>6</affiliationId>
      </author>
    
    </authors>
    
	    <affiliationsList>
	    
		
		<affiliationName affiliationId="1">Department of CSE and AI, VIT Bhopal University, Sehore, Madhya Pradesh, Indi</affiliationName>
    

		
		<affiliationName affiliationId="2">Department. of Electrical and Electronics Engineering, Singapore Institute of Technology, Singapore</affiliationName>
    
		
		<affiliationName affiliationId="3">Department of Computer Science, Christ University, Delhi NCR Campus, Ghaziabad, India</affiliationName>
    
		
		<affiliationName affiliationId="4">Department of Electronics and Telecommunication Engineering, J D College of Engineering and Management, Nagpur, India</affiliationName>
    
		
		<affiliationName affiliationId="5">Department of Mathematics and Statistics, Gurukula Kangri University, Haridwar, Uttarakhand, India</affiliationName>
    
		
		<affiliationName affiliationId="6">Department of Management and Social Sciences, Qaiwan International University, Sulaimanyah, Kurdistan, Iraq. </affiliationName>
    
	  </affiliationsList>






    <abstract language="eng">Early detection, therapeutic stratification, and precision medicine all rely on the precise classification of brain cancer subtypes.   To categorize brain tumor subtypes, we examine the application of ensemble machine learning models—Random Forest, XGBoost, and LightGBM—using high-dimensional gene expression data from the GSE50161 dataset (CuMiDa).   The top 1000 genes were selected using variance thresholding, and models were then trained and evaluated on a stratified split of the dataset.   Despite the availability of models achieving similar accuracies (~95–96%) in existing works, our framework integrates SHAP-based interpretability to identify biologically significant genes, such as CDK4, EGFR, and TP53, offering dual benefits of high predictive power and explainability. The use of SHAP (SHapley Additive exPlanations) values to assess model predictions and identify physiologically important gene features revealed that key gene probes, including as CDK4, EGFR, and TP53, were significant across different tumor subtypes. This study demonstrates how SHAP and interpretable ensemble learning may be used to diagnose brain tumors with excellent classification accuracy and physiologically meaningful gene identification.</abstract>

    <fullTextUrl format="html">https://biomedpharmajournal.org/vol18no3/gene-expression-data-based-interpretable-machine-learning-framework-for-classifying-brain-cancer-subtypes/</fullTextUrl>

<keywords language="eng">

      
        <keyword>Brain Cancer</keyword>
      

      
        <keyword> Biomarker Identification</keyword>
      

      
        <keyword> Cell Lines</keyword>
      

      
        <keyword> Gene-expression</keyword>
      

      
        <keyword> Machine Learning</keyword>
      

      
        <keyword> Microarray Data</keyword>
      
</keywords>
  </record>
</records>