@inproceedings{regino-dos-reis-2025-llms,
title = "Can {LLM}s be Knowledge Graph Curators for Validating Triple Insertions?",
author = "Regino, Andr{\'e} Gomes and
dos Reis, Julio Cesar",
editor = "Gesese, Genet Asefa and
Sack, Harald and
Paulheim, Heiko and
Merono-Penuela, Albert and
Chen, Lihu",
booktitle = "Proceedings of the Workshop on Generative AI and Knowledge Graphs (GenAIK)",
month = jan,
year = "2025",
address = "Abu Dhabi, UAE",
publisher = "International Committee on Computational Linguistics",
url = "https://aclanthology.org/2025.genaik-1.10/",
pages = "87--99",
abstract = "As Knowledge Graphs (KGs) become central to modern applications, automated methods for validating RDF triples before insertion into these graphs are essential. The complexity and scalability challenges in manual validation processes have led researchers to explore Large Language Models (LLMs) as potential automated validators. This study investigates the feasibility of using LLMs to validate RDF triples by focusing on four distinct and complementary validation tasks: class and property alignment, URI standardization, semantic consistency, and syntactic correctness. We propose a systematic validation method that uses prompts to guide LLMs through each stage of the triple evaluation of the RDF. In our experiments, four models are evaluated across these tasks. Our results reveal that more advanced models like Llama-3-70B-Instruct offer superior accuracy and consistency. Our findings emphasize the practical open challenges of deploying LLMs in real-world RDF validation scenarios, including domain generalization, semantic drift, and the need for human-in-the-loop interventions. This investigation advances the research on the refinement and integration of LLM-based RDF validation techniques into KG management workflows."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="regino-dos-reis-2025-llms">
<titleInfo>
<title>Can LLMs be Knowledge Graph Curators for Validating Triple Insertions?</title>
</titleInfo>
<name type="personal">
<namePart type="given">André</namePart>
<namePart type="given">Gomes</namePart>
<namePart type="family">Regino</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Julio</namePart>
<namePart type="given">Cesar</namePart>
<namePart type="family">dos Reis</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2025-01</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Workshop on Generative AI and Knowledge Graphs (GenAIK)</title>
</titleInfo>
<name type="personal">
<namePart type="given">Genet</namePart>
<namePart type="given">Asefa</namePart>
<namePart type="family">Gesese</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Harald</namePart>
<namePart type="family">Sack</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Heiko</namePart>
<namePart type="family">Paulheim</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Albert</namePart>
<namePart type="family">Merono-Penuela</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Lihu</namePart>
<namePart type="family">Chen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>International Committee on Computational Linguistics</publisher>
<place>
<placeTerm type="text">Abu Dhabi, UAE</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>As Knowledge Graphs (KGs) become central to modern applications, automated methods for validating RDF triples before insertion into these graphs are essential. The complexity and scalability challenges in manual validation processes have led researchers to explore Large Language Models (LLMs) as potential automated validators. This study investigates the feasibility of using LLMs to validate RDF triples by focusing on four distinct and complementary validation tasks: class and property alignment, URI standardization, semantic consistency, and syntactic correctness. We propose a systematic validation method that uses prompts to guide LLMs through each stage of the triple evaluation of the RDF. In our experiments, four models are evaluated across these tasks. Our results reveal that more advanced models like Llama-3-70B-Instruct offer superior accuracy and consistency. Our findings emphasize the practical open challenges of deploying LLMs in real-world RDF validation scenarios, including domain generalization, semantic drift, and the need for human-in-the-loop interventions. This investigation advances the research on the refinement and integration of LLM-based RDF validation techniques into KG management workflows.</abstract>
<identifier type="citekey">regino-dos-reis-2025-llms</identifier>
<location>
<url>https://aclanthology.org/2025.genaik-1.10/</url>
</location>
<part>
<date>2025-01</date>
<extent unit="page">
<start>87</start>
<end>99</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Can LLMs be Knowledge Graph Curators for Validating Triple Insertions?
%A Regino, André Gomes
%A dos Reis, Julio Cesar
%Y Gesese, Genet Asefa
%Y Sack, Harald
%Y Paulheim, Heiko
%Y Merono-Penuela, Albert
%Y Chen, Lihu
%S Proceedings of the Workshop on Generative AI and Knowledge Graphs (GenAIK)
%D 2025
%8 January
%I International Committee on Computational Linguistics
%C Abu Dhabi, UAE
%F regino-dos-reis-2025-llms
%X As Knowledge Graphs (KGs) become central to modern applications, automated methods for validating RDF triples before insertion into these graphs are essential. The complexity and scalability challenges in manual validation processes have led researchers to explore Large Language Models (LLMs) as potential automated validators. This study investigates the feasibility of using LLMs to validate RDF triples by focusing on four distinct and complementary validation tasks: class and property alignment, URI standardization, semantic consistency, and syntactic correctness. We propose a systematic validation method that uses prompts to guide LLMs through each stage of the triple evaluation of the RDF. In our experiments, four models are evaluated across these tasks. Our results reveal that more advanced models like Llama-3-70B-Instruct offer superior accuracy and consistency. Our findings emphasize the practical open challenges of deploying LLMs in real-world RDF validation scenarios, including domain generalization, semantic drift, and the need for human-in-the-loop interventions. This investigation advances the research on the refinement and integration of LLM-based RDF validation techniques into KG management workflows.
%U https://aclanthology.org/2025.genaik-1.10/
%P 87-99
Markdown (Informal)
[Can LLMs be Knowledge Graph Curators for Validating Triple Insertions?](https://aclanthology.org/2025.genaik-1.10/) (Regino & dos Reis, GenAIK 2025)
ACL