% Conference paper from ICISA 2020 (held 16-18 Dec 2020), published 2021 in Lecture Notes in Electrical Engineering.
@inproceedings{f0d8145e7a12470ea1d2bcfae2b36d9c,
  author    = {Baek, Nakhoon},
  title     = {A Prototype Implementation of {NNEF} Execution Framework with {CUDA} Acceleration},
  booktitle = {Information Science and Applications - Proceedings of {ICISA} 2020},
  editor    = {Kim, Hyuncheol and Kim, Kuinam J. and Park, Suhyun},
  series    = {Lecture Notes in Electrical Engineering},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2021},
  pages     = {129--132},
  doi       = {10.1007/978-981-33-6385-4_12},
  isbn      = {9789813363847},
  language  = {English},
  keywords  = {Acceleration, CUDA, Neural network, NNEF, Parallel processing},
  abstract  = {Recently, we have many research works on the neural networks and their related issues. For exchangeability of neural network frameworks, the Neural Network Exchange Format (NNEF) specification is now widely used. Due to very large size of these neural networks, their accelerations are actively explored, and can be achieved through parallel processing techniques. In this paper, we present a prototype implementation of NNEF execution system with parallel-processing accelerations based on CUDA (compute unified device architecture). We will tune the prototype acceleration to achieve more remarkable speed ups.},
  note      = {Publisher Copyright: {\textcopyright} 2021, The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd.; iCatse International Conference on Information Science and Applications, ICISA 2020 ; Conference date: 16-12-2020 Through 18-12-2020},
}