% Workshop paper in the CBAIVL 2001 proceedings (conference date 14 Dec 2001).
% The proper noun and acronyms are brace-protected so sentence-casing styles keep them.
% copyright and eventdate carry metadata that should not print via the note field.
% NOTE(review): address holds a country, not the publisher's city -- confirm and replace.
@inproceedings{2214e20a25d44e5e9dfb4295a5aefd17,
title = "Audio-visual event detection using duration dependent input output {Markov} models",
abstract = "Analysis of audio-visual data and detection of semantic events with spatio-temporal support is a challenging multimedia understanding problem. The difficulty lies in the gap that exists between low level media features and high level semantic concept. We introduce a duration dependent input output Markov model (DDIOMM) to detect events based on multiple modalities. The DDIOMM combines the ability to model non-exponential duration densities with the mapping of input sequences to output sequences. We test the DDIOMM by modelling the audio-visual event explosion. We compare the detection performance of the DDIOMM with the IOMM as well as the HMM. Experiments reveal that modeling of duration improves detection performance.",
author = "Naphade, M. R. and Garg, A. and Huang, T. S.",
year = "2001",
month = dec,
doi = "10.1109/IVL.2001.990854",
language = "English (US)",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "39--43",
booktitle = "Proceedings - {IEEE} Workshop on Content-Based Access of Image and Video Libraries, {CBAIVL} 2001",
address = "United States",
eventdate = "2001-12-14",
copyright = "{\textcopyright} 2001 IEEE",
}