% Conference paper (Khoo et al., 2012) in "Theory and Practice of Digital Libraries",
% Lecture Notes in Computer Science vol. 7489, pp. 439--444.
% Citation key is an auto-generated export identifier; kept unchanged so existing \cite commands still resolve.
@inproceedings{73b3cbedea8b474db85bfdbb534ed806,
  author    = {Khoo, Michael and Tudhope, Douglas and Binding, Ceri and Abels, Eileen and Lin, Xia and Massam, Diana},
  title     = {Towards Digital Repository Interoperability: The {Document} {Indexing} and {Semantic} {Tagging} {Interface} for {Libraries} ({DISTIL})},
  booktitle = {Theory and Practice of Digital Libraries},
  editor    = {Zaphiris, Panayiotis and Buchanan, George and Rasmussen, Edie and Loizides, Fernando},
  series    = {Lecture Notes in Computer Science},
  volume    = {7489},
  pages     = {439--444},
  publisher = {Springer},
  address   = {Berlin, Heidelberg},
  year      = {2012},
  isbn      = {978-3-642-33289-0},
  doi       = {10.1007/978-3-642-33290-6_49},
  language  = {English},
  keywords  = {Dewey Decimal Classification, digital humanities, interoperability, Metadata, social sciences, tagging},
  abstract  = {The question of how to integrate diverse digital repositories into a unified information infrastructure, accessible and discoverable through simple interfaces, remains a central research issue for digital libraries. Many collections are described by specialized metadata, which currently has to be mapped and crosswalked to a standard format in order to be useful. However, this metadata work can be expensive and resource consuming. We describe work-in-progress with DISTIL (Document Indexing \& Semantic Tagging Interface for Libraries) to support federated cross-collection search in humanities and the social sciences. DISTIL proposes to support interoperability by generating Dewey Decimal Classification {\textquoteleft}tags{\textquoteright} from individual metadata records. The resulting tags can then be used to support cross-collection browsing. We focus here on some of the initial pre-processing stages of the metadata workflow, which include cleaning and formatting metadata records, in order to extract terms that can then be used to generate the DDC tags. Some initial strategies for and issues with this workflow are described.},
}