@inproceedings{d21125b7c8ac47c2889d9cbea7b7b495,
title = "Action recognition using three dimension convolution and long short term memory",
abstract = "The convolutional neural network (CNN) is more and more popular in computer vision and widely used in acoustic signal processing, image classification, and image segmentation. In this work, an architecture which is a combination of the 3-D convolutional neural network and the long short term memory (LSTM) was proposed for action recognition. It stacks the consecutive video frames, extracts spatial and time features, and trains the input dataset to achieve good recognition performance. Moreover, the LSTM model based on the relations among the frames in different time is adopted to consider the information of past frames. Simulations show that the proposed algorithm outperforms other neural network based methods and has even better performance for action recognition.",
author = "Liu, {Yu Cheng} and Ding, {Jian Jiun} and Chang, {Yao Jen} and Wang, {Chien Yao} and Wang, {Jia Ching}",
note = "Publisher Copyright: {\textcopyright} 2017 IEEE.; 4th IEEE International Conference on Consumer Electronics - Taiwan, ICCE-TW 2017 ; Conference date: 12-06-2017 Through 14-06-2017",
year = "2017",
month = jul,
day = "25",
doi = "10.1109/ICCE-China.2017.7991006",
language = "???core.languages.en_GB???",
series = "2017 IEEE International Conference on Consumer Electronics - Taiwan, ICCE-TW 2017",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "83--84",
booktitle = "2017 IEEE International Conference on Consumer Electronics - Taiwan, ICCE-TW 2017",
}