@inproceedings{f7fa144e17a64d96aefe2cf77e5ad6ef,
title = "TVFormer: Trajectory-guided Visual Quality Assessment on 360° Images with Transformers",
abstract = "Visual quality assessment (VQA) on 360° images plays an important role in optimizing immersive multimedia systems. Due to the absence of pristine 360° images in real world, blind VQA (BVQA) on 360° images has drawn much research attention. In subjective VQA on 360\textasciicircum{} images, human intuitively make the quality-scoring decisions through the quality degradation of each observed viewport on the head trajectories. Unfortunately, the existing BVQA works for 360° images neglect the dynamic property of head trajectories with viewport interactions, thus failing to obtain human-like quality scores. In this paper, we propose a novel Transformer-based approach for trajectory-guided VQA on 360° images (named TVFormer), in which both the tasks of head trajectory prediction and BVQA can be accomplished for 360° images. In the first task, we develop a trajectory-Aware memory updater (TMU) module, for maintaining the coherence and accuracy of predicted head trajectories. To capture the long-range quality dependency across time-ordered viewports, we propose a spatio-Temporal factorized self-Attention (STF) module in the encoder of TVFormer for the BVQA task. By implanting the predicted head trajectories into the BVQA task, we can obtain the human-like quality scores. Extensive experiments demonstrate the superior BVQA performance of TVFormer over state-of-The-Art approaches on three benchmark datasets.",
keywords = "360, BVQA, head trajectory, images, transformer",
author = "Li Yang and Mai Xu and Tie Liu and Liangyu Huo and Xinbo Gao",
note = "Publisher Copyright: {\textcopyright} 2022 ACM.; 30th ACM International Conference on Multimedia, MM 2022 ; Conference date: 10-10-2022 Through 14-10-2022",
year = "2022",
month = oct,
day = "10",
doi = "10.1145/3503161.3547748",
language = "英语",
series = "MM 2022 - Proceedings of the 30th ACM International Conference on Multimedia",
publisher = "Association for Computing Machinery, Inc",
pages = "799--808",
booktitle = "MM 2022 - Proceedings of the 30th ACM International Conference on Multimedia",
}