With knowledge graphs (KGs) at the center of numerous applications such as
recommender systems and question answering, the need for generalized pipelines
to construct and continuously update such KGs is increasing. While the
individual steps that are necessary to create KGs from unstructured (e.g. text)
and structured data sources (e.g. databases) are mostly well-researched for
their one-shot execution, their adoption for incremental KG updates and the
interplay of the individual steps have hardly been investigated in a systematic
manner so far. In this work, we first discuss the main graph models for KGs and
introduce the major requirement for future KG construction pipelines. Next, we
provide an overview of the necessary steps to build high-quality KGs, including
cross-cutting topics such as metadata management, ontology development, and
quality assurance. We then evaluate the state of the art of KG construction
w.r.t the introduced requirements for specific popular KGs as well as some
recent tools and strategies for KG construction. Finally, we identify areas in
need of further research and improvement.
Description
[2302.11509] Construction of Knowledge Graphs: State and Challenges
%0 Generic
%1 hofer2023construction
%A Hofer, Marvin
%A Obraczka, Daniel
%A Saeedi, Alieh
%A Köpcke, Hanna
%A Rahm, Erhard
%D 2023
%K data graph knowledge linked lod open semantic survey web
%T Construction of Knowledge Graphs: State and Challenges
%U http://arxiv.org/abs/2302.11509
%X With knowledge graphs (KGs) at the center of numerous applications such as
recommender systems and question answering, the need for generalized pipelines
to construct and continuously update such KGs is increasing. While the
individual steps that are necessary to create KGs from unstructured (e.g. text)
and structured data sources (e.g. databases) are mostly well-researched for
their one-shot execution, their adoption for incremental KG updates and the
interplay of the individual steps have hardly been investigated in a systematic
manner so far. In this work, we first discuss the main graph models for KGs and
introduce the major requirement for future KG construction pipelines. Next, we
provide an overview of the necessary steps to build high-quality KGs, including
cross-cutting topics such as metadata management, ontology development, and
quality assurance. We then evaluate the state of the art of KG construction
w.r.t the introduced requirements for specific popular KGs as well as some
recent tools and strategies for KG construction. Finally, we identify areas in
need of further research and improvement.
@misc{hofer2023construction,
abstract = {With knowledge graphs (KGs) at the center of numerous applications such as
recommender systems and question answering, the need for generalized pipelines
to construct and continuously update such KGs is increasing. While the
individual steps that are necessary to create KGs from unstructured (e.g. text)
and structured data sources (e.g. databases) are mostly well-researched for
their one-shot execution, their adoption for incremental KG updates and the
interplay of the individual steps have hardly been investigated in a systematic
manner so far. In this work, we first discuss the main graph models for KGs and
introduce the major requirement for future KG construction pipelines. Next, we
provide an overview of the necessary steps to build high-quality KGs, including
cross-cutting topics such as metadata management, ontology development, and
quality assurance. We then evaluate the state of the art of KG construction
w.r.t the introduced requirements for specific popular KGs as well as some
recent tools and strategies for KG construction. Finally, we identify areas in
need of further research and improvement.},
added-at = {2023-10-10T09:21:36.000+0200},
author = {Hofer, Marvin and Obraczka, Daniel and Saeedi, Alieh and Köpcke, Hanna and Rahm, Erhard},
biburl = {https://www.bibsonomy.org/bibtex/2592c52c278ad9b6fbd608255d016a0ed/jaeschke},
description = {[2302.11509] Construction of Knowledge Graphs: State and Challenges},
interhash = {1c70c8be84477a599ea2bd0e42d84b9d},
intrahash = {592c52c278ad9b6fbd608255d016a0ed},
keywords = {data graph knowledge linked lod open semantic survey web},
note = {cite arxiv:2302.11509Comment: 43 pages, 5 figures, 3 tables},
timestamp = {2023-10-10T09:21:36.000+0200},
title = {Construction of Knowledge Graphs: State and Challenges},
url = {http://arxiv.org/abs/2302.11509},
year = 2023
}