% Conference paper from the ICCCS 2023 revised selected papers (CCIS series).
% NOTE(review): `address` holds the publisher's country as it was exported;
% replace it with the publisher's city once confirmed.
@inproceedings{71197bb0925948f79506e49bc62cf3be,
  author    = {Kang, Zengxin and Chu, Zhongyi},
  title     = {{MS-MH-TCN}: Multi-Stage and Multi-Head Temporal Convolutional Network for Action Segmentation},
  booktitle = {Cognitive Computation and Systems - 2nd International Conference, {ICCCS} 2023, Revised Selected Papers},
  editor    = {Sun, Fuchun and Li, Jianmin},
  series    = {Communications in Computer and Information Science},
  pages     = {48--60},
  publisher = {{Springer Science and Business Media Deutschland GmbH}},
  address   = {Germany},
  year      = {2024},
  doi       = {10.1007/978-981-97-0885-7\_5},
  isbn      = {9789819708840},
  language  = {English},
  keywords  = {Action segmentation, Multi-head attention, Temporal convolutional network},
  abstract  = {The segmentation of manual action in long video has important application value in the fields of demonstration programming and human-computer interaction. The state-of-the-art manual action segmentation method uses multi-stage temporal convolution. Although it can capture the long temporal dependence between actions, there are still excessive segmentation errors in the predicted results. In this paper, we propose a multistage and multi-head temporal convolutional network (MS-MH-TCN) for improving the performance on the action segmentation task. A multi-head calculation is performed at each stage, and the results of the multi-head are pooled to average and fed into the next stage. This approach improves the model{\textquoteright}s prediction and generalization of input information, because different heads can focus on different aspects of the input and can adapt to learn how to combine them to generate final action predictions. We also propose a new segment smoothing loss function to punish over-segmentation errors. An extensive evaluation showed the effectiveness of the proposed model in capturing long-term dependencies and identifying action segments. Our model achieved the most advanced results on the 50salad dataset.},
  note      = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd. 2024.; 2nd International Conference on Cognitive Computation and Systems, ICCCS 2023 ; Conference date: 14-10-2023 Through 15-10-2023},
}