% Conference paper in the ESWC 2017 proceedings (Springer LNCS series), pp. 3--18.
% Names are stored in "Last, First" form so they parse unambiguously.
% NOTE(review): the LNCS volume number is not present in this record; add `volume` once confirmed.
@inproceedings{ba156277a9854fe8b57229253f19910e,
  author    = {Costabello, Luca and Vandenbussche, {Pierre Yves} and Shukair, Gofran and Deliot, Corine and Wilson, Neil},
  title     = {Traffic analytics for linked data publishers},
  booktitle = {The Semantic Web - 14th International Conference, {ESWC} 2017, Proceedings},
  editor    = {Maynard, Diana and Gangemi, Aldo and Hoekstra, Rinke and Blomqvist, Eva and Hartig, Olaf and Hitzler, Pascal},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Verlag},
  year      = {2017},
  pages     = {3--18},
  doi       = {10.1007/978-3-319-58068-5_1},
  isbn      = {9783319580678},
  language  = {English},
  keywords  = {Data publication, Linked data, SPARQL, Traffic analytics},
  abstract  = {We present a traffic analytics platform for servers that publish Linked Data. To the best of our knowledge, this is the first system that mines access logs of registered Linked Data servers to extract traffic insights on daily basis and without human intervention. The framework extracts Linked Data-specific traffic metrics from log records of HTTP lookups and SPARQL queries, and provides insights not available in traditional web analytics tools. Among all, we detect visitor sessions with a variant of hierarchical agglomerative clustering. We also identify workload peaks of SPARQL endpoints by detecting heavy and light SPARQL queries with supervised learning. The platform has been tested on 13 months of access logs of the British National Bibliography RDF dataset.},
  note      = {Publisher Copyright: {\textcopyright} Springer International Publishing AG 2017.; 14th Extended Semantic Web Conference, ESWC 2017 ; Conference date: 28-05-2017 Through 01-06-2017},
}