@INPROCEEDINGS{1213Jin2009,
	AUTHOR = {Shan Jin and Hemant Misra and Thomas Sikora and Joemon Jose},
	TITLE = {Automatic Topic Detection Strategy for information retrieval in Spoken Document},
	BOOKTITLE = {Wiamis 2009},
	YEAR = {2009},
	MONTH = may,
	PDF = {http://elvera.nue.tu-berlin.de/files/1213Jin2009.pdf},
	URL = {http://elvera.nue.tu-berlin.de/files/1213Jin2009.pdf},
	ABSTRACT = {This paper suggests an alternative solution for the task of spoken
document retrieval (SDR). The proposed system runs retrieval on
multi-level transcriptions (word and phone) produced by word and
phone recognizers respectively, and their outputs are combined. We
propose to use latent Dirichlet allocation (LDA) model for capturing
the semantic information on word transcription. The LDA model
is employed for estimating topic distribution in queries and word
transcribed spoken documents, and the matching is performed at the
topic level. Acoustic matching between query words and phonetically
transcribed spoken documents is performed using phone-based
matching algorithm. The results of acoustic and topic level matching
methods are compared and shown to be complementary.}
}