% ACL Anthology record: NeuRAG paper, Findings of ACL 2026.
% Case-sensitive words in title/booktitle are protected with whole-word braces
% so sentence-casing styles keep their capitals.
% NOTE(review): `address` carries the location string as exported; it looks like
% the conference venue rather than the publisher's city -- confirm before reuse.
@inproceedings{zheng-etal-2026-neurag,
  title     = {{NeuRAG}: End-to-End Neural Knowledge Augmentation via Hyper-Neurons},
  author    = {Zheng, Liwei and
               Liu, Xuemin and
               Liu, Jie},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2026.findings-acl.1516/},
  doi       = {10.18653/v1/2026.findings-acl.1516},
  pages     = {30324--30343},
  isbn      = {979-8-89176-395-1},
  abstract  = {Retrieval-Augmented Generation (RAG) systems have become a standard approach for grounding large language models in external knowledge. However, they are constrained by a decoupled architecture: retrieval and reasoning operate as separate stages, with retrieved text merely prepended as passive context. This prevents deep integration of knowledge into the model{'}s parametric reasoning, leading to fragmented responses for complex queries requiring multi-document synthesis or conflict resolution. To bridge this gap, we propose NeuRAG, an end-to-end Neuralized RAG framework that unifies knowledge retrieval and fusion through Hyper-Neurons{---}parameterized modules encoding entire documents directly into the model{'}s parameter space. In NeuRAG, each document is encoded as a lightweight LoRA module, conceptualized as a knowledge neuron. These neurons collectively form a document-adaptive Hyper-Layer, which dynamically activates and fuses knowledge neurons via an attention mechanism conditioned on the input hidden-state query. This enables the model to jointly retrieve and reason within a single forward pass, seamlessly integrating external knowledge into its inference pathway. Extensive experiments across multiple datasets and LLMs demonstrate NeuRAG{'}s strong and consistent performance as a promising novel RAG paradigm.},
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <!-- MODS v3 record for citekey zheng-etal-2026-neurag. The top-level <name>
       elements are the paper's authors; the host <relatedItem> describes the
       containing proceedings volume (editors, publisher, place, ISBN). -->
  <mods ID="zheng-etal-2026-neurag">
    <titleInfo>
      <title>NeuRAG: End-to-End Neural Knowledge Augmentation via Hyper-Neurons</title>
    </titleInfo>
    <!-- Authors -->
    <name type="personal">
      <namePart type="given">Liwei</namePart>
      <namePart type="family">Zheng</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Xuemin</namePart>
      <namePart type="family">Liu</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Jie</namePart>
      <namePart type="family">Liu</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2026-07</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host publication: the proceedings volume and its editors -->
    <relatedItem type="host">
      <titleInfo>
        <title>Findings of the Association for Computational Linguistics: ACL 2026</title>
      </titleInfo>
      <name type="personal">
        <namePart type="given">Maria</namePart>
        <namePart type="family">Liakata</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Viviane</namePart>
        <namePart type="given">P</namePart>
        <namePart type="family">Moreira</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Jiajun</namePart>
        <namePart type="family">Zhang</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">David</namePart>
        <namePart type="family">Jurgens</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>Association for Computational Linguistics</publisher>
        <place>
          <placeTerm type="text">San Diego, California, United States</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
      <identifier type="isbn">979-8-89176-395-1</identifier>
    </relatedItem>
    <abstract>Retrieval-Augmented Generation (RAG) systems have become a standard approach for grounding large language models in external knowledge. However, they are constrained by a decoupled architecture: retrieval and reasoning operate as separate stages, with retrieved text merely prepended as passive context. This prevents deep integration of knowledge into the model’s parametric reasoning, leading to fragmented responses for complex queries requiring multi-document synthesis or conflict resolution. To bridge this gap, we propose NeuRAG, an end-to-end Neuralized RAG framework that unifies knowledge retrieval and fusion through Hyper-Neurons—parameterized modules encoding entire documents directly into the model’s parameter space. In NeuRAG, each document is encoded as a lightweight LoRA module, conceptualized as a knowledge neuron. These neurons collectively form a document-adaptive Hyper-Layer, which dynamically activates and fuses knowledge neurons via an attention mechanism conditioned on the input hidden-state query. This enables the model to jointly retrieve and reason within a single forward pass, seamlessly integrating external knowledge into its inference pathway. Extensive experiments across multiple datasets and LLMs demonstrate NeuRAG’s strong and consistent performance as a promising novel RAG paradigm.</abstract>
    <identifier type="citekey">zheng-etal-2026-neurag</identifier>
    <identifier type="doi">10.18653/v1/2026.findings-acl.1516</identifier>
    <location>
      <url>https://aclanthology.org/2026.findings-acl.1516/</url>
    </location>
    <!-- Page extent of the paper within the host volume -->
    <part>
      <date>2026-07</date>
      <extent unit="page">
        <start>30324</start>
        <end>30343</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T NeuRAG: End-to-End Neural Knowledge Augmentation via Hyper-Neurons
%A Zheng, Liwei
%A Liu, Xuemin
%A Liu, Jie
%Y Liakata, Maria
%Y Moreira, Viviane P.
%Y Zhang, Jiajun
%Y Jurgens, David
%S Findings of the Association for Computational Linguistics: ACL 2026
%D 2026
%8 July
%I Association for Computational Linguistics
%C San Diego, California, United States
%@ 979-8-89176-395-1
%F zheng-etal-2026-neurag
%X Retrieval-Augmented Generation (RAG) systems have become a standard approach for grounding large language models in external knowledge. However, they are constrained by a decoupled architecture: retrieval and reasoning operate as separate stages, with retrieved text merely prepended as passive context. This prevents deep integration of knowledge into the model’s parametric reasoning, leading to fragmented responses for complex queries requiring multi-document synthesis or conflict resolution. To bridge this gap, we propose NeuRAG, an end-to-end Neuralized RAG framework that unifies knowledge retrieval and fusion through Hyper-Neurons—parameterized modules encoding entire documents directly into the model’s parameter space. In NeuRAG, each document is encoded as a lightweight LoRA module, conceptualized as a knowledge neuron. These neurons collectively form a document-adaptive Hyper-Layer, which dynamically activates and fuses knowledge neurons via an attention mechanism conditioned on the input hidden-state query. This enables the model to jointly retrieve and reason within a single forward pass, seamlessly integrating external knowledge into its inference pathway. Extensive experiments across multiple datasets and LLMs demonstrate NeuRAG’s strong and consistent performance as a promising novel RAG paradigm.
%R 10.18653/v1/2026.findings-acl.1516
%U https://aclanthology.org/2026.findings-acl.1516/
%U https://doi.org/10.18653/v1/2026.findings-acl.1516
%P 30324-30343
Markdown (Informal)
[NeuRAG: End-to-End Neural Knowledge Augmentation via Hyper-Neurons](https://aclanthology.org/2026.findings-acl.1516/) (Zheng et al., Findings 2026)
ACL