We introduce the novel task of identifying important citations in scholarly literature, i.e., citations that indicate that the cited work is used or extended in the new effort. We believe this task is a crucial component in algorithms that detect and follow research topics and in methods that measure the quality of publications.We model this task as a supervised classification problem at two levels of detail: a coarse one with classes (important vs. non-important), and a more detailed one with four importance classes. We annotate a dataset of approximately 450 citations with this information, and release it publicly. We propose a supervised classification approach that addresses this task with a battery of features that range from citation counts to where the citation appears in the body of the paper, and show that,our approach achieves a precision of 65% for a recall of 90%.
%0 Conference Paper
%1 valenzuela2015identifying
%A Valenzuela, Marco
%A Ha, Vu
%A Etzioni, Oren
%B AAAI Workshops
%D 2015
%K citation classification scientometrics type
%T Identifying Meaningful Citations
%U http://www.aaai.org/ocs/index.php/WS/AAAIW15/paper/view/10185
%X We introduce the novel task of identifying important citations in scholarly literature, i.e., citations that indicate that the cited work is used or extended in the new effort. We believe this task is a crucial component in algorithms that detect and follow research topics and in methods that measure the quality of publications.We model this task as a supervised classification problem at two levels of detail: a coarse one with classes (important vs. non-important), and a more detailed one with four importance classes. We annotate a dataset of approximately 450 citations with this information, and release it publicly. We propose a supervised classification approach that addresses this task with a battery of features that range from citation counts to where the citation appears in the body of the paper, and show that,our approach achieves a precision of 65% for a recall of 90%.
@inproceedings{valenzuela2015identifying,
abstract = {We introduce the novel task of identifying important citations in scholarly literature, i.e., citations that indicate that the cited work is used or extended in the new effort. We believe this task is a crucial component in algorithms that detect and follow research topics and in methods that measure the quality of publications.We model this task as a supervised classification problem at two levels of detail: a coarse one with classes (important vs. non-important), and a more detailed one with four importance classes. We annotate a dataset of approximately 450 citations with this information, and release it publicly. We propose a supervised classification approach that addresses this task with a battery of features that range from citation counts to where the citation appears in the body of the paper, and show that,our approach achieves a precision of 65% for a recall of 90%.},
added-at = {2015-11-03T18:01:21.000+0100},
author = {Valenzuela, Marco and Ha, Vu and Etzioni, Oren},
biburl = {https://www.bibsonomy.org/bibtex/2d81475ff345e7aa8f4fb0c3bff9e9ba7/jaeschke},
booktitle = {AAAI Workshops},
description = {Valenzuela},
interhash = {6fb4132fcf04a0d66b31ed98e858d9c5},
intrahash = {d81475ff345e7aa8f4fb0c3bff9e9ba7},
keywords = {citation classification scientometrics type},
timestamp = {2015-11-03T18:01:21.000+0100},
title = {Identifying Meaningful Citations},
url = {http://www.aaai.org/ocs/index.php/WS/AAAIW15/paper/view/10185},
year = 2015
}