% Conference paper from INTERSPEECH 2004 - ICSLP (Jeju Island, Korea).
% The pdf and url fields intentionally carry the same link to the paper.
@inproceedings{0769Moreau2004,
  author    = {Moreau, Nicolas and Kim, Hyoung-Gook and Sikora, Thomas},
  title     = {Phonetic Confusion Based Document Expansion for Spoken Document Retrieval},
  booktitle = {{INTERSPEECH} 2004 - {ICSLP}},
  year      = {2004},
  month     = oct,
  address   = {Jeju Island, Korea},
  pdf       = {http://elvera.nue.tu-berlin.de/files/0769Moreau2004.pdf},
  url       = {http://elvera.nue.tu-berlin.de/files/0769Moreau2004.pdf},
  abstract  = {This paper presents a phone-based approach of spoken document retrieval (SDR), developed in the framework of the emerging MPEG-7 standard. We describe an indexing and retrieval system that uses phonetic information only. The retrieval method is based on the vector space IR model, using phone N-grams as indexing terms. We propose a technique to expand the representation of documents by means of phone confusion probabilities in order to improve the retrieval performance. This method is tested on a collection of short German spoken documents, using 10 city names as queries.},
}