@inproceedings{f4c59d67f8f04ad790c95fdf08ca366f,
title = "A CNN-Based Multi-scale Super-Resolution Architecture on FPGA for 4K/8K UHD Applications",
abstract = "In this paper, based on our previous work, we present a multi-scale super-resolution (SR) hardware (HW) architecture using a convolutional neural network (CNN), where the up-scaling factors of 2, 3 and 4 are supported. In our dedicated multi-scale CNN-based SR HW, low-resolution (LR) input frames are processed line-by-line, and the number of convolutional filter parameters is significantly reduced by incorporating depth-wise separable convolutions with residual connections. As for 3× and 4× up-scaling, the number of channels for point-wise convolution layer before a pixel-shuffle layer is set to 9 and 16, respectively. Additionally, we propose an integrated timing generator that supports 3× and 4× up-scaling. For efficient HW implementation, we use a simple and effective quantization method with a minimal peak signal-to-noise ratio (PSNR) degradation. Also, we propose a compression method to efficiently store intermediate feature map data to reduce the number of line memories used in HW. Our CNN-based SR HW implementation on the FPGA can generate 4K ultra high-definition (UHD) frames of higher PSNR at 60 fps, which have higher visual quality compared to conventional CNN-based SR methods that were trained and tested in software. The resources in our CNN-based SR HW can be shared for multi-scale upscaling factors of 2, 3 and 4 so that can be implemented to generate 8K UHD frames from 2K FHD input frames.",
keywords = "4 K UHD, CNN, Deep learning, FPGA, Hardware, Multi-scale, Real-time, Super-resolution",
author = "Yongwoo Kim and Choi, \{Jae Seok\} and Jaehyup Lee and Munchurl Kim",
note = "Publisher Copyright: {\textcopyright} 2020, Springer Nature Switzerland AG.; 26th International Conference on MultiMedia Modeling, MMM 2020 ; Conference date: 05-01-2020 Through 08-01-2020",
year = "2020",
doi = "10.1007/978-3-030-37734-2\_63",
language = "English",
isbn = "9783030377335",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer",
pages = "739--744",
editor = "Ro, \{Yong Man\} and Junmo Kim and Jung-Woo Choi and Wen-Huang Cheng and Wei-Ta Chu and Peng Cui and Min-Chun Hu and \{De Neve\}, Wesley",
booktitle = "MultiMedia Modeling - 26th International Conference, MMM 2020, Proceedings",
address = "Germany",
}