@inproceedings{b76c50202b0247a7be17ce07992e324f,
title = "Performance Optimization for MLP Accelerators using ILP-Based On-Chip Weight Allocation Strategy",
abstract = "It is generally impossible to store all weights into an MLP accelerator because of limited on-chip SRAM capacity. However, the performance can still be improved if a portion of weights are allocated in faster SRAM. In this paper, we first present an analytical method for performance evaluation under different weight allocation approaches. We then propose an ILP-based on-chip weight allocation strategy that can maximize the overall performance. Experiment results show that the proposed strategy constantly outperforms several trivial heuristic methods over a large set of various MLP models, MLP accelerator configurations, and on-chip SRAM capacities.",
keywords = "deep learning, ILP, MLP accelerator, performance optimization, weight allocation",
author = "Fan, {Kang Yi} and Chen, {Jyun Hua} and Liu, {Chien Nan} and Huang, {Juinn Dar}",
note = "Publisher Copyright: {\textcopyright} 2022 IEEE.; 2022 International Symposium on VLSI Design, Automation and Test, VLSI-DAT 2022 ; Conference date: 18-04-2022 Through 21-04-2022",
year = "2022",
doi = "10.1109/VLSI-DAT54769.2022.9768095",
language = "English",
series = "2022 International Symposium on VLSI Design, Automation and Test, VLSI-DAT 2022 - Proceedings",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
booktitle = "2022 International Symposium on VLSI Design, Automation and Test, VLSI-DAT 2022 - Proceedings",
address = "美國",
}