% Short paper in the SIGIR 2015 proceedings (conference held in Santiago, Chile).
% The citation key is the exporter-generated identifier and is kept unchanged so
% existing citations keep resolving. `address` holds the publisher's location,
% not the conference venue; the venue and conference dates are recorded in `note`.
@inproceedings{5ca6556dd23347fcbee96a00be0ca015,
  author    = {Zhao, Y. and Hauff, C.},
  editor    = {Baeza-Yates, R. and Lalmas, M. and Moffat, A. and Ribeiro-Neto, B.},
  title     = {Sub-document Timestamping of {Web} Documents},
  booktitle = {Proceedings of the 38th International {ACM} {SIGIR} Conference on Research and Development in Information Retrieval, {SIGIR} 2015},
  publisher = {Association for Computing Machinery (ACM)},
  address   = {New York, NY, USA},
  year      = {2015},
  month     = aug,
  pages     = {1023--1026},
  doi       = {10.1145/2766462.2767803},
  isbn      = {978-1-4503-3621-5},
  language  = {English},
  keywords  = {timestamping, sub-documents, Web-archiving},
  abstract  = {Knowledge about a (Web) document's creation time has been shown to be an important factor in various temporal information retrieval settings. Commonly, it is assumed that such documents were created at a single point in time. While this assumption may hold for news articles and similar document types, it is a clear oversimplification for general Web documents. In this paper, we investigate to what extent (i) this simplifying assumption is violated for a corpus of Web documents, and, (ii) it is possible to accurately estimate the creation time of individual Web documents' components (so-called sub-documents).},
  note      = {SIGIR 2015, Santiago, Chile; conference date: 2015-08-09 through 2015-08-13},
}