% Conference paper in the LNCS series (volume 9906), identified by the DOI below.
% - The acronym in the title is brace-protected so sentence-casing styles keep it uppercase.
% - Authors are given in "Last, First" form, which parses unambiguously.
% - address holds the publisher's city, not a country or the conference venue.
%   NOTE(review): "Cham" is inferred from the 978-3-319 ISBN prefix (Springer International
%   Publishing); confirm against the publisher's landing page for the DOI.
@inproceedings{c90fb939523a4b7f8e32c00dc3b6e382,
title = "{DAVE}: A Unified Framework for Fast Vehicle Detection and Annotation",
abstract = "Vehicle detection and annotation for streaming video data with complex scenes is an interesting but challenging task for urban traffic surveillance. In this paper, we present a fast framework of Detection and Annotation for Vehicles (DAVE), which effectively combines vehicle detection and attributes annotation. DAVE consists of two convolutional neural networks (CNNs): a fast vehicle proposal network (FVPN) for vehicle-like objects extraction and an attributes learning network (ALN) aiming to verify each proposal and infer each vehicle{\textquoteright}s pose, color and type simultaneously. These two nets are jointly optimized so that abundant latent knowledge learned from the ALN can be exploited to guide FVPN training. Once the system is trained, it can achieve efficient vehicle detection and annotation for real-world traffic surveillance data. We evaluate DAVE on a new self-collected UTS dataset and the public PASCAL VOC2007 car and LISA 2010 datasets, with consistent improvements over existing algorithms.",
keywords = "Vehicle Detection, Attributes Annotation, Latent Knowledge Guidance, Joint Learning, Deep Networks",
author = "Zhou, Yi and Liu, Li and Shao, Ling and Mellor, Matt",
year = "2016",
month = sep,
day = "17",
doi = "10.1007/978-3-319-46475-6_18",
language = "English",
isbn = "978-3-319-46474-9",
volume = "9906",
series = "Lecture Notes in Computer Science",
publisher = "Springer",
pages = "278--293",
booktitle = "European Conference on Computer Vision",
address = "Cham",
}