@inproceedings{05b5189e6a7c41fa85fc3800b3b93934,
title = "Video scene analysis of interactions between humans and vehicles using event context",
abstract = "We present a methodology to estimate a detailed state of a video scene involving multiple humans and vehicles. In order to automatically annotate and retrieve videos containing activities of humans and vehicles, the system must correctly identify their trajectories and relationships even in a complex dynamic environment. Our methodology constructs various joint 3-D models describing possible configurations of humans and vehicles in each image frame and performs maximum-a-posteriori tracking to obtain a sequence of scene states that matches the video. Reliable and view-independent scene state analysis is performed by taking advantage of event context. We focus on the fact that events occurring in a video must contextually coincide with scene states of humans and vehicles. Our experimental results verify that our system using event context is able to analyze and track 3-D scene states of complex human-vehicle interactions more reliably and accurately than previous systems.",
keywords = "Dynamic scene analysis, Event context, Scene state tracking",
author = "Ryoo, {M. S.} and Lee, {Jong Taek} and Aggarwal, {J. K.}",
year = "2010",
doi = "10.1145/1816041.1816109",
language = "English",
isbn = "9781450301176",
series = "CIVR 2010 - 2010 ACM International Conference on Image and Video Retrieval",
pages = "462--469",
booktitle = "CIVR 2010 - 2010 ACM International Conference on Image and Video Retrieval",
note = "ACM International Conference on Image and Video Retrieval, ACM-CIVR 2010 ; Conference date: 05-07-2010 Through 07-07-2010",
}