@inproceedings{gondo-etal-2024-verification,
title = "Verification of Reasoning Ability using {BDI} Logic and Large Language Model in {AIW}olf",
author = "Gondo, Hiraku and
Sakaji, Hiroki and
Noda, Itsuki",
editor = "Kano, Yoshinobu",
booktitle = "Proceedings of the 2nd International AIWolfDial Workshop",
month = sep,
year = "2024",
address = "Tokyo, Japan",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.aiwolfdial-1.5",
pages = "40--47",
abstract = "We attempt to improve the reasoning capability of LLMs in the werewolf game by combining BDI logic with LLMs. While LLMs such as ChatGPT have been developed and used for various tasks, there remain several weaknesses of the LLMs. Logical reasoning is one such weakness. Therefore, we try to introduce BDI logic-based prompts to verify the logical reasoning ability of LLMs in dialogue of the werewolf game. Experiments and evaluations were conducted using {``}AI-Werewolf,{''} a communication game for AI with incomplete information. From the results of the game played by five agents, we compare the logical reasoning ability of LLMs by using the win rate and the vote rate against werewolf.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="gondo-etal-2024-verification">
<titleInfo>
<title>Verification of Reasoning Ability using BDI Logic and Large Language Model in AIWolf</title>
</titleInfo>
<name type="personal">
<namePart type="given">Hiraku</namePart>
<namePart type="family">Gondo</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Hiroki</namePart>
<namePart type="family">Sakaji</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Itsuki</namePart>
<namePart type="family">Noda</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2024-09</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 2nd International AIWolfDial Workshop</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yoshinobu</namePart>
<namePart type="family">Kano</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Tokyo, Japan</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>We attempt to improve the reasoning capability of LLMs in the werewolf game by combining BDI logic with LLMs. While LLMs such as ChatGPT have been developed and used for various tasks, there remain several weaknesses of the LLMs. Logical reasoning is one such weakness. Therefore, we try to introduce BDI logic-based prompts to verify the logical reasoning ability of LLMs in dialogue of the werewolf game. Experiments and evaluations were conducted using “AI-Werewolf,” a communication game for AI with incomplete information. From the results of the game played by five agents, we compare the logical reasoning ability of LLMs by using the win rate and the vote rate against werewolf.</abstract>
<identifier type="citekey">gondo-etal-2024-verification</identifier>
<location>
<url>https://aclanthology.org/2024.aiwolfdial-1.5</url>
</location>
<part>
<date>2024-09</date>
<extent unit="page">
<start>40</start>
<end>47</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Verification of Reasoning Ability using BDI Logic and Large Language Model in AIWolf
%A Gondo, Hiraku
%A Sakaji, Hiroki
%A Noda, Itsuki
%Y Kano, Yoshinobu
%S Proceedings of the 2nd International AIWolfDial Workshop
%D 2024
%8 September
%I Association for Computational Linguistics
%C Tokyo, Japan
%F gondo-etal-2024-verification
%X We attempt to improve the reasoning capability of LLMs in the werewolf game by combining BDI logic with LLMs. While LLMs such as ChatGPT have been developed and used for various tasks, there remain several weaknesses of the LLMs. Logical reasoning is one such weakness. Therefore, we try to introduce BDI logic-based prompts to verify the logical reasoning ability of LLMs in dialogue of the werewolf game. Experiments and evaluations were conducted using “AI-Werewolf,” a communication game for AI with incomplete information. From the results of the game played by five agents, we compare the logical reasoning ability of LLMs by using the win rate and the vote rate against werewolf.
%U https://aclanthology.org/2024.aiwolfdial-1.5
%P 40-47
Markdown (Informal)
[Verification of Reasoning Ability using BDI Logic and Large Language Model in AIWolf](https://aclanthology.org/2024.aiwolfdial-1.5) (Gondo et al., AIWolfDial-WS 2024)
ACL