% Conference paper (ICASSP 2005). The citation key is an opaque identifier
% (apparently auto-generated by the exporting tool -- confirm); it is kept
% unchanged so that existing citations continue to resolve.
@inproceedings{82add0181c514b469640b30219e92d23,
  author    = {Xie, Lexing and Kennedy, Lyndon and Chang, Shih-Fu and Divakaran, Ajay and Sun, Huifang and Lin, Ching-Yung},
  title     = {Layered dynamic mixture model for pattern discovery in asynchronous multi-modal streams},
  booktitle = {2005 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} '05 - Proceedings - Image and Multidimensional Signal Processing Multimedia Signal Processing},
  series    = {{ICASSP}, {IEEE} International Conference on Acoustics, Speech and Signal Processing - Proceedings},
  pages     = {II1053--II1056},
  year      = {2005},
  doi       = {10.1109/ICASSP.2005.1415589},
  isbn      = {0780388747},
  language  = {English},
  note      = {2005 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP '05 ; Conference date: 18-03-2005 Through 23-03-2005},
  abstract  = {We propose a layered dynamic mixture model for asynchronous multi-modal fusion for unsupervised pattern discovery in video. The lower layer of the model uses generative temporal structures such as a hierarchical hidden Markov model to convert the audiovisual streams into mid-level labels, it also models the correlations in text with probabilistic latent semantic analysis. The upper layer fuses the statistical evidence across diverse modalities with a flexible meta-mixture model that assumes loose temporal correspondence. Evaluation on a large news database shows that multi-modal clusters have better correspondence to news topics than audio-visual clusters alone; novel analysis techniques suggest that meaningful clusters occur when the prediction of salient features by the model concurs with those shown in the story clusters.},
}