﻿<?xml version="1.0" encoding="UTF-8"?>
<records>
  <record>
    <language>eng</language>
    <publisher>Science and Education Publishing</publisher>
    <journalTitle>Journal of Computer Sciences and Applications</journalTitle>
    <eissn>2328-725X</eissn>
    <publicationDate>2026-05-20</publicationDate>
    <volume>14</volume>
    <issue>1</issue>
    <startPage>21</startPage>
    <endPage>30</endPage>
    <doi>10.12691/jcsa-14-1-4</doi>
    <publisherRecordId>JCSA20261414</publisherRecordId>
    <documentType>article</documentType>
    <title language="eng">Improving Medical Multimodal Retrieval with Graph-Rag and Fusion Methods with Mmedrag++</title>
    <authors>
      <author>
        <name>Dr. A.Shilpa Gupta</name>
        <email>a.shilpagupta@gmail.com</email>
        <affiliationId>1</affiliationId>
      </author>
      <author>
        <name>M. Uday Reddy</name>
        <affiliationId>1</affiliationId>
      </author>
      <author>
        <name>K. Jayanth Kumar Reddy</name>
        <affiliationId>1</affiliationId>
      </author>
      <author>
        <name>P. Medha Goud</name>
        <affiliationId>1</affiliationId>
      </author>
      <author>
        <name>T. Harshitha Reddy</name>
        <affiliationId>1</affiliationId>
      </author>
      <author>
        <name>Aditi Jopat</name>
        <affiliationId>1</affiliationId>
      </author>
    </authors>
    <affiliationsList>
      <affiliationName affiliationId="1">Department of Computer Science Engineering, Keshav Memorial College of Engineering, Ibrahimpatnam, Telangana, India</affiliationName>
    </affiliationsList>
    <abstract language="eng">We introduce MMedRAG++,a medical multimodal retrieval system that uses fusion-based representation learning and graph-based reranking (Graph-RAG) to improve on conventional Retrieval-Augmented Generation (RAG). Unlike baseline systems, which do not incorporate fusion strategies or graph-based reranking, MMedRAG++ improves cross-modal embeddings and retrieval coherence. Experiments are conducted primarily on PMC-OA, a challenging dataset with only ~10% unique captions and many unrelated image-text pairs, and IU-Xray is used for modality- specific subtasks. Graph-RAG demonstrates improved retrieval centrality and diversity, and fusion strategies, including Cross- Attention and DeepSet Fusion, enhance embedding quality. Quantitative evaluation on PMC-OA and IU-Xray confirms improved retrieval coherence and cross-modal alignment over baseline configurations. Top-1 Accuracy: 18.7%, Top-10 Accuracy: 57.4%.</abstract>
    <fullTextUrl format="pdf">https://pubs.sciepub.com/jcsa/14/1/4/jcsa-14-1-4.pdf</fullTextUrl>
    <keywords language="eng">
      <keyword>Medical AI</keyword>
      <keyword>RAG</keyword>
      <keyword>Graph-RAG</keyword>
      <keyword>Multimodal Fusion</keyword>
      <keyword>Contrastive Learning</keyword>
      <keyword>Medical Image-text Retrieval</keyword>
    </keywords>
  </record>
</records>