% Workshop paper published in the CEUR Workshop Proceedings series, volume 2414.
% The citation key is kept exactly as exported so that existing citations keep resolving.
% The identifier urn:nbn:de:0074-2414-3 is stored in the non-standard "urn" field
% (ignored by standard styles); it is an identifier, not an edition statement.
@inproceedings{0270dbc35fa84b2c8e653a867f5f8cb4,
  author    = {Plank, Barbara and van Dalen, Reinard},
  title     = {{CiteTracked}: A Longitudinal Dataset of Peer Reviews and Citations},
  editor    = {Chandrasekaran, Muthu Kumar and Mayr, Philipp},
  booktitle = {4th Joint Workshop on Bibliometric-enhanced Information Retrieval and Natural Language Processing for Digital Libraries ({BIRNDL} 2019)},
  series    = {CEUR Workshop Proceedings},
  volume    = {2414},
  pages     = {116--122},
  publisher = {CEUR-WS.org},
  year      = {2019},
  month     = jul,
  day       = {25},
  language  = {English},
  urn       = {urn:nbn:de:0074-2414-3},
  keywords  = {Scientific dissemination, Peer reviews, Citation analysis, Machine learning publications, Interdisciplinary research},
  abstract  = {Scientific dissemination is of central importance for the scientific process. This paper presents CiteTracked, a dataset of peer reviews and citation statistics covering scientific papers from the machine learning community and spanning six years. We describe and analyze the data collection of over 3,000 published papers, their peer review texts and citation counts, and depict possible usage directions. The dataset aims at fertilizing novel interdisciplinary work between fields such as scientometrics, information retrieval, computational linguistics and natural language processing to study the scientific publishing process.},
}