@inproceedings{cf986d324d9c4d398a121258fdd689a1,
title = "Temporal action detection based on hierarchical object detection networks",
abstract = "This paper addresses the problem of temporal action detection from untrimmed videos. Considering that actions can be recognized by the occurrence of objects and the corresponding moving information in the video, a hierarchical model is proposed which consists of two object detection networks to do temporal action detection. The first network is used to detect objects in each frame, and the second one is for temporal action detection. We also proposed a method which converts the object detection results of the first network into a new type of frame so that it can be fed to the second network. The generated frame has six channels with spatiotemporal information beneficial to action detection. Quantitative results on THUMOS14 dataset demonstrate the superior of the proposed model with satisfactory performance gains over state-of-the-art action detection methods.",
keywords = "Convolutional neural network (CNN), Temporal action detection",
author = "Wu, {Yi Hui} and Tsai, {Wen Jiin} and Chen, {Hua Tsung}",
year = "2019",
month = aug,
doi = "10.1109/Ubi-Media.2019.00031",
language = "English",
series = "Proceedings - 2019 12th International Conference on Ubi-Media Computing, Ubi-Media 2019",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "119--123",
booktitle = "Proceedings - 2019 12th International Conference on Ubi-Media Computing, Ubi-Media 2019",
address = "美國",
note = "12th International Conference on Ubi-Media Computing, Ubi-Media 2019 ; Conference date: 06-08-2019 Through 09-08-2019",
}