% Conference paper (SOCC 2021 proceedings, pp. 278--283) on a hierarchical,
% reconfigurable processing element for quantized neural networks.
% The citation key looks like an exporter-generated opaque ID; it is kept
% unchanged so that existing citations of this entry continue to resolve.
@inproceedings{dbeff2537e8447b3867882813bd336a4,
  author    = {Chen, {Yu Guang} and Hsu, {Chi Wei} and Chiang, {Hung Yi} and Hsieh, {Tsung Han} and Jou, {Jing Yang}},
  title     = {A Hierarchical and Reconfigurable Process Element Design for Quantized Neural Networks},
  booktitle = {Proceedings - 34th {IEEE} International System-on-Chip Conference, {SOCC} 2021},
  editor    = {Qu, Gang and Xiong, Jinjun and Zhao, Danella and Muthukumar, Venki and Reza, {Md Farhadur} and Sridhar, Ramalingam},
  series    = {International System on Chip Conference},
  publisher = {IEEE Computer Society},
  year      = {2021},
  pages     = {278--283},
  doi       = {10.1109/SOCC52499.2021.9739487},
  language  = {English},
  keywords  = {Processing Element (PE), Quantized Neural Networks (QNN), Reconfigurable Design},
  note      = {Publisher Copyright: {\textcopyright} 2021 IEEE.; Conference date: 14-09-2021 Through 17-09-2021},
  abstract  = {Convolution neural networks are very popular for various applications. However, data size and accuracy are the two major concerns to perform efficient and effective computations. In conventional CNN models, 32bits data are frequently used to maintain high accuracy. However, performing a bunch of 32bits multiply-and-accumulate (MAC) operations causes significant computing efforts as well as power consumptions. Therefore, recently researchers develop various methods to reduce data size and speed up calculations. Quantization is one of the techniques which reduces the number of the bits of data and the computational complexity at the cost of accuracy loss. To provide better computation effort and accuracy trade-off, different bitwidth may be applied to different layers within a CNN model. Therefore, a flexible Processing Element (PE) which can support operations of different bitwidth is in demand. In this paper, we propose a hierarchal PE structure that can support 8bits x 8bits, 8bits x 4bits, 4bits x 4bits and 2bits x 2bits operations. The structure applies the concept of reconfiguration and can avoid the redundant hardware for reconfiguration. Moreover, the concept of pipelining is also adopted in our design to provide better efficiency. The experimental results show that in 2bits x 2bits PE, we can achieve area reduction by 57\% and 68\% compared to a Precision-Scalable accelerator and Bit Fusion, respectively.},
}