Among different characteristics of knowledge bases, data quality is one of the most relevant to maximize the benefits of the provided information. Knowledge base quality assessment poses a number of big data challenges such as high volume, variety, velocity, and veracity. In this article, we focus on answering questions related to the assessment of the veracity of facts through Deep Fact Validation (DeFacto), a triple validation framework designed to assess facts in RDF knowledge bases. Despite current developments in the research area, the underlying framework faces many challenges. This article pinpoints and discusses these issues and conducts a thorough analysis of its pipeline, aiming at reducing the error propagation through its components. Furthermore, we discuss recent developments related to this fact validation as well as describing advantages and drawbacks of state-of-the-art models. As a result of this exploratory analysis, we give insights and directions toward a better architecture to tackle the complex task of fact-checking in knowledge bases.
%0 Journal Article
%1 10.1145/3177873
%A Esteves, Diego
%A Rula, Anisa
%A Reddy, Aniketh Janardhan
%A Lehmann, Jens
%C New York, NY, USA
%D 2018
%I Association for Computing Machinery
%J J. Data and Information Quality
%K DeFacto, analysis benchmark, checking, data data, exploratory fact linked quality, trustworthiness,
%N 3
%R 10.1145/3177873
%T Toward Veracity Assessment in RDF Knowledge Bases: An Exploratory Analysis
%U https://doi.org/10.1145/3177873
%V 9
%X Among different characteristics of knowledge bases, data quality is one of the most relevant to maximize the benefits of the provided information. Knowledge base quality assessment poses a number of big data challenges such as high volume, variety, velocity, and veracity. In this article, we focus on answering questions related to the assessment of the veracity of facts through Deep Fact Validation (DeFacto), a triple validation framework designed to assess facts in RDF knowledge bases. Despite current developments in the research area, the underlying framework faces many challenges. This article pinpoints and discusses these issues and conducts a thorough analysis of its pipeline, aiming at reducing the error propagation through its components. Furthermore, we discuss recent developments related to this fact validation as well as describing advantages and drawbacks of state-of-the-art models. As a result of this exploratory analysis, we give insights and directions toward a better architecture to tackle the complex task of fact-checking in knowledge bases.
@article{10.1145/3177873,
abstract = {Among different characteristics of knowledge bases, data quality is one of the most relevant to maximize the benefits of the provided information. Knowledge base quality assessment poses a number of big data challenges such as high volume, variety, velocity, and veracity. In this article, we focus on answering questions related to the assessment of the veracity of facts through Deep Fact Validation (DeFacto), a triple validation framework designed to assess facts in RDF knowledge bases. Despite current developments in the research area, the underlying framework faces many challenges. This article pinpoints and discusses these issues and conducts a thorough analysis of its pipeline, aiming at reducing the error propagation through its components. Furthermore, we discuss recent developments related to this fact validation as well as describing advantages and drawbacks of state-of-the-art models. As a result of this exploratory analysis, we give insights and directions toward a better architecture to tackle the complex task of fact-checking in knowledge bases.},
added-at = {2024-09-10T11:54:51.000+0200},
address = {New York, NY, USA},
articleno = {16},
author = {Esteves, Diego and Rula, Anisa and Reddy, Aniketh Janardhan and Lehmann, Jens},
biburl = {https://puma.scadsai.uni-leipzig.de/bibtex/2c04b14bac3e7ec28f63cbd5af82f146d/scadsfct},
doi = {10.1145/3177873},
interhash = {949e173f5d0048bf03ab151fc6f41e8b},
intrahash = {c04b14bac3e7ec28f63cbd5af82f146d},
issn = {1936-1955},
issue_date = {September 2017},
journal = {J. Data and Information Quality},
keywords = {DeFacto, analysis benchmark, checking, data data, exploratory fact linked quality, trustworthiness,},
month = feb,
number = 3,
numpages = {26},
publisher = {Association for Computing Machinery},
timestamp = {2024-09-10T11:54:51.000+0200},
title = {Toward Veracity Assessment in RDF Knowledge Bases: An Exploratory Analysis},
url = {https://doi.org/10.1145/3177873},
volume = 9,
year = 2018
}