@inproceedings{cd933519eb964103bb00a638aea60469,
title = "Efficient Bitrate Ladder Construction using Transfer Learning and Spatio-Temporal Features",
abstract = "Providing high-quality video with efficient bitrate is a main challenge in video industry. The traditional one-size-fits-all scheme for bitrate ladders is inefficient and reaching the best content-aware decision is computationally impractical due to extensive encodings required. To mitigate this, we propose a bitrate and complexity efficient bitrate ladder prediction method using transfer learning and spatio-temporal features. We propose: (1) using feature maps from well-known pre-trained DNNs to predict rate-quality behavior with limited training data; and (2) improving highest quality rung efficiency by predicting minimum bitrate for top quality and using it for the top rung. The method tested on 102 video scenes demonstrates 94.1% reduction in complexity versus brute-force at 1.71% BD-Rate expense. Additionally, transfer learning was thoroughly studied through four networks and ablation studies.",
keywords = "Bitrate ladder, CRF, HTTP Adaptive Streaming (HAS), Pareto Front, Transfer Learning",
author = "Ali Falahati and Safavi, {Mohammad Karim} and Ardavan Elahi and Farhad Pakdaman and Moncef Gabbouj",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; Iranian and International Conference on Machine Vision and Image Processing ; Conference date: 06-03-2024 Through 07-03-2024",
year = "2024",
doi = "10.1109/MVIP62238.2024.10491154",
language = "English",
series = "Iranian Conference on Machine Vision and Image Processing, MVIP",
publisher = "IEEE",
pages = "1--7",
booktitle = "Proceedings of the 13th Iranian and 3rd International Conference on Machine Vision and Image Processing, MVIP 2024",
}