@comment{
  Entry c28796aff7374eeea555d7127b2eb906: a titled contribution (pages 284--302)
  inside a volume that has its own booktitle, series and volume number.
  Typed as incollection so that classic BibTeX styles print the booktitle.

  NOTE(review): the last three author names are given by initials only, while
  the first five are spelled out. They may be volume editors that the export
  merged into the author list; verify against the publisher record and move
  them to an editor field if so.

  NOTE(review): the doi value carries no per-chapter suffix, so it may be the
  DOI of the whole volume rather than of this contribution; confirm.
}
@incollection{c28796aff7374eeea555d7127b2eb906,
  author    = {Roelleke, Thomas and Lalmas, Mounia and Kazai, Gabriella and Ruthven, Ian and Quicker, Stefan and Crestani, F. and Dunlop, M. and Mizzaro, S.},
  title     = {The accessibility dimension for structured document retrieval},
  booktitle = {Advances in Information Retrieval},
  series    = {Lecture Notes in Computer Science},
  volume    = {2291},
  publisher = {Springer},
  year      = {2002},
  month     = mar,
  day       = {25},
  pages     = {284--302},
  isbn      = {978-3-540-43343-9},
  doi       = {10.1007/3-540-45886-7},
  language  = {English},
  keywords  = {structured document retrieval, probabilistic relational algebra, accessibility dimension},
  abstract  = {Structured document retrieval aims at retrieving the document components that best satisfy a query, instead of merely retrieving pre-defined document units. This paper reports on an investigation of a tf-idf-acc approach, where tf and idf are the classical term frequency and inverse document frequency, and acc, a new parameter called accessibility, that captures the structure of documents. The tf-idf-acc approach is defined using a probabilistic relational algebra. To investigate the retrieval quality and estimate the acc values, we developed a method that automatically constructs diverse test collections of structured documents from a standard test collection, with which experiments were carried out. The analysis of the experiments provides estimates of the acc values.},
}