The rapid generation of large amounts of information about the coronavirus SARS-CoV-2 and the disease COVID-19 makes it increasingly difficult to gain a comprehensive overview of current insights related to the disease. With this work, we aim to support the rapid access to a comprehensive data source on COVID-19 targeted especially at researchers. Our knowledge graph, CovidPubGraph, an RDF knowledge graph of scientific publications, abides by the Linked Data and FAIR principles. The base dataset for the extraction is CORD-19, a dataset of COVID-19-related publications, which is updated regularly. Consequently, CovidPubGraph is updated biweekly. Our generation pipeline applies named entity recognition, entity linking and link discovery approaches to the original data. The current version of CovidPubGraph contains 268,108,670 triples and is linked to 9 other datasets by over 1 million links. In our use case studies, we demonstrate the usefulness of our knowledge graph for different applications. CovidPubGraph is publicly available under the Creative Commons Attribution 4.0 International license.
%0 Journal Article
%1 nature_sd_patents
%A Pestryakova, Svetlana
%A Vollmers, Daniel
%A Sherif, Mohamed Ahmed
%A Heindorf, Stefan
%A Saleem, Muhammad
%A Moussallem, Diego
%A Ngonga Ngomo, Axel-Cyrille
%D 2022
%I Nature Publishing Group
%J Scientific Data
%K dice ngonga saleem sherif vollmers
%T CovidPubGraph: A FAIR Knowledge Graph of COVID-19 Publications
%U https://papers.dice-research.org/2022/NSDJ_CovidPubGraph/public.pdf
%X The rapid generation of large amounts of information about the coronavirus SARS-CoV-2 and the disease COVID-19 makes it increasingly difficult to gain a comprehensive overview of current insights related to the disease. With this work, we aim to support the rapid access to a comprehensive data source on COVID-19 targeted especially at researchers. Our knowledge graph, CovidPubGraph, an RDF knowledge graph of scientific publications, abides by the Linked Data and FAIR principles. The base dataset for the extraction is CORD-19, a dataset of COVID-19-related publications, which is updated regularly. Consequently, CovidPubGraph is updated biweekly. Our generation pipeline applies named entity recognition, entity linking and link discovery approaches to the original data. The current version of CovidPubGraph contains 268,108,670 triples and is linked to 9 other datasets by over 1 million links. In our use case studies, we demonstrate the usefulness of our knowledge graph for different applications. CovidPubGraph is publicly available under the Creative Commons Attribution 4.0 International license.
@comment{Journal article record for the CovidPubGraph paper (Scientific Data, 2022); the biburl field points to a BibSonomy post.
Only the case-sensitive words in the title are brace-protected, so bibliography styles can still apply their own casing to the rest.
The last author is entered in "Last, First" form with the compound surname "Ngonga Ngomo".
NOTE(review): volume, number, pages and doi are not present in this record -- add them from the publisher's page.
NOTE(review): bdsk-url-1 repeats the url field; it is kept unchanged.}
@article{nature_sd_patents,
  abstract   = {The rapid generation of large amounts of information about the coronavirus SARS-CoV-2 and the disease COVID-19 makes it increasingly difficult to gain a comprehensive overview of current insights related to the disease. With this work, we aim to support the rapid access to a comprehensive data source on COVID-19 targeted especially at researchers. Our knowledge graph, CovidPubGraph, an RDF knowledge graph of scientific publications, abides by the Linked Data and FAIR principles. The base dataset for the extraction is CORD-19, a dataset of COVID-19-related publications, which is updated regularly. Consequently, CovidPubGraph is updated biweekly. Our generation pipeline applies named entity recognition, entity linking and link discovery approaches to the original data. The current version of CovidPubGraph contains 268,108,670 triples and is linked to 9 other datasets by over 1 million links. In our use case studies, we demonstrate the usefulness of our knowledge graph for different applications. CovidPubGraph is publicly available under the Creative Commons Attribution 4.0 International license.},
  added-at   = {2022-02-03T12:41:23.000+0100},
  author     = {Pestryakova, Svetlana and Vollmers, Daniel and Sherif, Mohamed Ahmed and Heindorf, Stefan and Saleem, Muhammad and Moussallem, Diego and Ngonga Ngomo, Axel-Cyrille},
  bdsk-url-1 = {https://papers.dice-research.org/2022/NSDJ_CovidPubGraph/public.pdf},
  biburl     = {https://www.bibsonomy.org/bibtex/24a08be85abeb4df17f52d22c7c390af5/dice-research},
  interhash  = {b6e1b27c01a29f3f93c8dd78603dabcc},
  intrahash  = {4a08be85abeb4df17f52d22c7c390af5},
  journal    = {Scientific Data},
  keywords   = {dice ngonga saleem sherif vollmers},
  publisher  = {Nature Publishing Group},
  timestamp  = {2023-04-25T16:33:53.000+0200},
  title      = {{CovidPubGraph}: A {FAIR} Knowledge Graph of {COVID-19} Publications},
  url        = {https://papers.dice-research.org/2022/NSDJ_CovidPubGraph/public.pdf},
  year       = {2022},
}