@inproceedings{f46104983e8d410ab4e74d7927665024,
title = "Two-Layer Learning-Based P-Frame Coding with Super-Resolution and Content-Adaptive Conditional ANF",
abstract = "Deep-learning-based video compression technique has been rapidly growing in recent years. This paper adopts the Conditional Augmented Normalizing Flow video codec (CANF-VC) [8] as our basic system. To improve the quality of the condition signal (image) for CANF, we propose a two-layer structure learning-based video codec. At low cost of extra bit rate, the low-resolution base layer provides side information to improve the quality of motion-compensated reference frame through a super-resolution module with a merge-net. In addition, the base layer also provides information to the skip-mask generator. The skip-mask guides the coding mechanism to reduce the transmitted samples for the high-resolution enhancement layer. The experiment results indicate that the proposed two-layer coding scheme can provide 22.19% PSNR BD-Rate saving and 49.59% MS-SSIM BD-Rate saving over H.265 (HM 16.20) on the UVG test sequences.",
keywords = "deep video coding, merge-net, skip mode coding, two-layer coding, video compression",
author = "David Alexandre and Hsueh-Ming Hang and Peng, {Wen Hsiao}",
note = "Publisher Copyright: {\textcopyright} 2022 ACM.; 4th ACM International Conference on Multimedia in Asia, MMAsia 2022 ; Conference date: 13-12-2022 Through 16-12-2022",
year = "2022",
month = dec,
day = "13",
doi = "10.1145/3551626.3564953",
language = "English",
series = "Proceedings of the 4th ACM International Conference on Multimedia in Asia, MMAsia 2022",
publisher = "Association for Computing Machinery, Inc",
booktitle = "Proceedings of the 4th ACM International Conference on Multimedia in Asia, MMAsia 2022",
}