@inproceedings{liu-etal-2026-llm,
title = "Do {LLM} Agents Really Mimic Humans? Diagnosing and Aligning Microeconomic Behaviors in Macro-{ABM}s",
author = "Liu, Guangya and
Wang, Cheng and
Li, Jiangtong and
Wu, Huafei and
Jiang, Changjun",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2026.findings-acl.1799/",
pages = "36102--36122",
ISBN = "979-8-89176-395-1",
abstract = "Large Language Models (LLMs) are increasingly adopted in macroeconomic agent-based modeling(ABM). However, existing research focuses on replicating macro-level stylized facts while often neglecting verification of micro-level decision-making. We investigate this gap by comparing LLM agents to human responses from the Survey of Consumer Expectations (SCE) dataset. Our empirical analysis identifies specific limitations: weak trend responsiveness, mode collapse, and a potential data leakage. We propose the Heterogeneous Shock-Response Causal Transmission Framework to tackle these issues. To ensure theoretical consistency, we use LLMs to build a literature-verified causal graph in which macroeconomic shocks influence decisions via generated mediator nodes, while agent profiles serve as edge moderators. Building on this, during inference, we perform a path search to retrieve relevant causal chains and inject them as an explicit Chain-of-Thought(CoT), prioritizing mechanistic logic over statistical pattern matching. To evaluate the effectiveness of our inference approach, we validate it via a two-stage process that combines micro-level dataset testing and macro-level simulation in the EconAgent system. Results from these experiments indicate that our framework improves alignment with human trends and effectively captures behavioral heterogeneity. Overall, this work contributes to the development of reliable and grounded economic simulations."
}<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="liu-etal-2026-llm">
<titleInfo>
<title>Do LLM Agents Really Mimic Humans? Diagnosing and Aligning Microeconomic Behaviors in Macro-ABMs</title>
</titleInfo>
<name type="personal">
<namePart type="given">Guangya</namePart>
<namePart type="family">Liu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Cheng</namePart>
<namePart type="family">Wang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jiangtong</namePart>
<namePart type="family">Li</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Huafei</namePart>
<namePart type="family">Wu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Changjun</namePart>
<namePart type="family">Jiang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2026-07</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Findings of the Association for Computational Linguistics: ACL 2026</title>
</titleInfo>
<name type="personal">
<namePart type="given">Maria</namePart>
<namePart type="family">Liakata</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Viviane</namePart>
<namePart type="given">P</namePart>
<namePart type="family">Moreira</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jiajun</namePart>
<namePart type="family">Zhang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">David</namePart>
<namePart type="family">Jurgens</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">San Diego, California, United States</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
<identifier type="isbn">979-8-89176-395-1</identifier>
</relatedItem>
<abstract>Large Language Models (LLMs) are increasingly adopted in macroeconomic agent-based modeling(ABM). However, existing research focuses on replicating macro-level stylized facts while often neglecting verification of micro-level decision-making. We investigate this gap by comparing LLM agents to human responses from the Survey of Consumer Expectations (SCE) dataset. Our empirical analysis identifies specific limitations: weak trend responsiveness, mode collapse, and a potential data leakage. We propose the Heterogeneous Shock-Response Causal Transmission Framework to tackle these issues. To ensure theoretical consistency, we use LLMs to build a literature-verified causal graph in which macroeconomic shocks influence decisions via generated mediator nodes, while agent profiles serve as edge moderators. Building on this, during inference, we perform a path search to retrieve relevant causal chains and inject them as an explicit Chain-of-Thought(CoT), prioritizing mechanistic logic over statistical pattern matching. To evaluate the effectiveness of our inference approach, we validate it via a two-stage process that combines micro-level dataset testing and macro-level simulation in the EconAgent system. Results from these experiments indicate that our framework improves alignment with human trends and effectively captures behavioral heterogeneity. Overall, this work contributes to the development of reliable and grounded economic simulations.</abstract>
<identifier type="citekey">liu-etal-2026-llm</identifier>
<location>
<url>https://aclanthology.org/2026.findings-acl.1799/</url>
</location>
<part>
<date>2026-07</date>
<extent unit="page">
<start>36102</start>
<end>36122</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Do LLM Agents Really Mimic Humans? Diagnosing and Aligning Microeconomic Behaviors in Macro-ABMs
%A Liu, Guangya
%A Wang, Cheng
%A Li, Jiangtong
%A Wu, Huafei
%A Jiang, Changjun
%Y Liakata, Maria
%Y Moreira, Viviane P.
%Y Zhang, Jiajun
%Y Jurgens, David
%S Findings of the Association for Computational Linguistics: ACL 2026
%D 2026
%8 July
%I Association for Computational Linguistics
%C San Diego, California, United States
%@ 979-8-89176-395-1
%F liu-etal-2026-llm
%X Large Language Models (LLMs) are increasingly adopted in macroeconomic agent-based modeling(ABM). However, existing research focuses on replicating macro-level stylized facts while often neglecting verification of micro-level decision-making. We investigate this gap by comparing LLM agents to human responses from the Survey of Consumer Expectations (SCE) dataset. Our empirical analysis identifies specific limitations: weak trend responsiveness, mode collapse, and a potential data leakage. We propose the Heterogeneous Shock-Response Causal Transmission Framework to tackle these issues. To ensure theoretical consistency, we use LLMs to build a literature-verified causal graph in which macroeconomic shocks influence decisions via generated mediator nodes, while agent profiles serve as edge moderators. Building on this, during inference, we perform a path search to retrieve relevant causal chains and inject them as an explicit Chain-of-Thought(CoT), prioritizing mechanistic logic over statistical pattern matching. To evaluate the effectiveness of our inference approach, we validate it via a two-stage process that combines micro-level dataset testing and macro-level simulation in the EconAgent system. Results from these experiments indicate that our framework improves alignment with human trends and effectively captures behavioral heterogeneity. Overall, this work contributes to the development of reliable and grounded economic simulations.
%U https://aclanthology.org/2026.findings-acl.1799/
%P 36102-36122
Markdown (Informal)
[Do LLM Agents Really Mimic Humans? Diagnosing and Aligning Microeconomic Behaviors in Macro-ABMs](https://aclanthology.org/2026.findings-acl.1799/) (Liu et al., Findings 2026)
ACL