Counts of hyperlinks between websites can be unreliable for webometrics studies so researchers have attempted to find alternate counting methods or have tried to identify the reasons why links in websites are created. Manual classification of individual links in websites is infeasible for large webometrics studies, so a more efficient approach to identifying the reasons for link creation is needed to fully harness the potential of hyperlinks for webometrics research. This paper describes a machine learning method to automatically classify hyperlink source and target page types in university websites. 78% accuracy was achieved for automatically classifying web page types and up to 74% accuracy for predicting link target page types from link source page characteristics.
%0 Journal Article
%1 kenekayoro2014automatic
%A Kenekayoro, Patrick
%A Buckley, Kevan
%A Thelwall, Mike
%D 2014
%J Scientometrics
%K academic classification ddm feature_evaluation gaw mk5.4 page type web
%N 2
%P 1015--1026
%R 10.1007/s11192-014-1292-9
%T Automatic classification of academic web page types
%U http://dx.doi.org/10.1007/s11192-014-1292-9
%V 101
%X Counts of hyperlinks between websites can be unreliable for webometrics studies so researchers have attempted to find alternate counting methods or have tried to identify the reasons why links in websites are created. Manual classification of individual links in websites is infeasible for large webometrics studies, so a more efficient approach to identifying the reasons for link creation is needed to fully harness the potential of hyperlinks for webometrics research. This paper describes a machine learning method to automatically classify hyperlink source and target page types in university websites. 78% accuracy was achieved for automatically classifying web page types and up to 74% accuracy for predicting link target page types from link source page characteristics.
@article{kenekayoro2014automatic,
abstract = {Counts of hyperlinks between websites can be unreliable for webometrics studies so researchers have attempted to find alternate counting methods or have tried to identify the reasons why links in websites are created. Manual classification of individual links in websites is infeasible for large webometrics studies, so a more efficient approach to identifying the reasons for link creation is needed to fully harness the potential of hyperlinks for webometrics research. This paper describes a machine learning method to automatically classify hyperlink source and target page types in university websites. 78% accuracy was achieved for automatically classifying web page types and up to 74% accuracy for predicting link target page types from link source page characteristics.},
added-at = {2017-06-13T13:06:11.000+0200},
author = {Kenekayoro, Patrick and Buckley, Kevan and Thelwall, Mike},
biburl = {https://www.bibsonomy.org/bibtex/2feb0e721762399008b699c99b02e5f7d/jaeschke},
doi = {10.1007/s11192-014-1292-9},
interhash = {ac5dde7d241eac857f83c574ced2d43a},
intrahash = {feb0e721762399008b699c99b02e5f7d},
issn = {1588-2861},
journal = {Scientometrics},
keywords = {academic classification ddm feature_evaluation gaw mk5.4 page type web},
number = 2,
pages = {1015--1026},
timestamp = {2021-06-11T14:18:08.000+0200},
title = {Automatic classification of academic web page types},
url = {http://dx.doi.org/10.1007/s11192-014-1292-9},
volume = 101,
year = 2014
}