% Conference paper: FLoPAD-GRU (SBCCI 2021). Cleaned repository export:
%   - author names in "Last, First" form; fixed the "Joachirn" -> "Joachim" typo
%   - acronyms in the title brace-protected against style recasing
%   - abstract made LaTeX-safe (escaped percent sign, math-mode times and superscript)
%   - dropped the series field, which was an exact duplicate of booktitle
% NOTE(review): address holds a country, not a publisher city -- kept as exported; confirm.
@inproceedings{c06936c3eedd43f4b4d73b1210d09bc8,
  author    = {Yaman, Ilayda and Andersen, Allan and Ferreira, Lucas and Rodrigues, Joachim},
  title     = {{FLoPAD-GRU}: A Flexible, Low Power, Accelerated {DSP} for Gated Recurrent Unit Neural Network},
  booktitle = {Proceedings - 34th SBC/SBMicro/IEEE/ACM Symposium on Integrated Circuits and Systems Design, SBCCI 2021},
  publisher = {IEEE - Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2021},
  month     = aug,
  day       = {23},
  doi       = {10.1109/SBCCI53441.2021.9529981},
  language  = {English},
  keywords  = {Deep Learning, Digital Signal Processor, GRU, Hardware Accelerator, RNN, SoC, Speech Recognition},
  abstract  = {Recurrent neural networks (RNNs) are efficient for classification of sequential data such as speech and audio due to their high precision on tasks. However, power efficiency, the required memory capacity and bandwidth requirements make them less suitable for battery powered devices. In this work, we introduce FLoPAD-GRU: a system on a chip (SoC) for efficient processing of gated recurrent unit (GRU) networks, that consists of a digital signal processor (DSP), supplemented with an optimized hardware accelerator, which reduces memory accesses and cost. The system is programmable and scalable, which allows for execution of different network sizes. Synthesized in 28 nm CMOS technology, real-time classification is achieved at 4 MHz, with an energy dissipation of 4.1 pJ/classification, an improvement of 15$\times$ compared to a pure DSP realization. The memory requirements are reduced by 75\%, which results in a silicon area of 0.7 mm$^2$ for the entire SoC.},
  note      = {Publisher Copyright: {\textcopyright} 2021 IEEE.; 34th SBC/SBMicro/IEEE/ACM Symposium on Integrated Circuits and Systems Design, SBCCI 2021 ; Conference date: 23-08-2021 Through 27-08-2021},
}