@inproceedings{36504305372f4bdeaa2aa371975577f5,
title = "Standard Compatible Efficient Video Coding with Jointly Optimized Neural Wrappers",
abstract = "We present a standard-compatible video coding scheme with end-to-end optimized neural wrapper over standard video codecs that achieves significant rate-distortion (R-D) performance gains and is still efficient in decoding. We train a pair of pre- and post-processor using a differential JPEG proxy. The pre-processor applies a learned transform to the video and downsamples the video by a factor of 2. It generates a bottleneck video to be coded by a standard codec as a YUV sequence. The post-processor takes the decoded bottleneck video, does the inverse transform, and upsamples it to the original resolution. We follow the design in [1] , where we configure downsample using a layer of strided convolution. We optimize the post-processor for efficiency by replacing convolutions with kernel size larger than 1×1 to depth-wise convolutions [2].",
keywords = "Efficient Video Coding, Neural Network, Postprocess, Preprocess, Video Coding",
author = "Yueyu Hu and Chenhao Zhang and Guleryuz, {Onur G.} and Debargha Mukherjee and Yao Wang",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; 2024 Data Compression Conference, DCC 2024 ; Conference date: 19-03-2024 Through 22-03-2024",
year = "2024",
doi = "10.1109/DCC58796.2024.00078",
language = "English (US)",
series = "Data Compression Conference Proceedings",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "561",
editor = "Ali Bilgin and Fowler, {James E.} and Joan Serra-Sagrista and Yan Ye and Storer, {James A.}",
booktitle = "Proceedings - DCC 2024",
}