% ICASSP 2023 conference paper; record exported from refbase.
% Authors use "Last, First" form so the two-part surname "Gorriz Blanch"
% is not split by BibTeX name parsing (NOTE(review): confirm surname split).
% The two duplicate optnote fields of the export are merged into one.
@inproceedings{MingyiYang2023,
  author    = {Yang, Mingyi and Herranz, Luis and Yang, Fei and Murn, Luka and Gorriz Blanch, Marc and Wan, Shuai and Yang, Fuzheng and Mrak, Marta},
  title     = {Semantic Preprocessor for Image Compression for Machines},
  booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing},
  year      = {2023},
  doi       = {10.1109/ICASSP49357.2023.10096472},
  abstract  = {Visual content is being increasingly transmitted and consumed by machines rather than humans to perform automated content analysis tasks. In this paper, we propose an image preprocessor that optimizes the input image for machine consumption prior to encoding by an off-the-shelf codec designed for human consumption. To achieve a better trade-off between the accuracy of the machine analysis task and bitrate, we propose leveraging pre-extracted semantic information to improve the preprocessor{\textquoteright}s ability to accurately identify and filter out task-irrelevant information. Furthermore, we propose a two-part loss function to optimize the preprocessor, consisted of a rate-task performance loss and a semantic distillation loss, which helps the reconstructed image obtain more information that contributes to the accuracy of the task. Experiments show that the proposed preprocessor can save up to 48.83\% bitrate compared with the method without the preprocessor, and save up to 36.24\% bitrate compared to existing preprocessors for machine vision.},
  optnote   = {MACO; LAMP; exported from refbase (http://158.109.8.37/show.php?record=3912), last updated on Fri, 19 Jan 2024 16:14:09 +0100},
  opturl    = {https://ieeexplore.ieee.org/document/10096472},
}