% Conference paper from ICA3PP 2013, published in Lecture Notes in Computer
% Science (Part I of the proceedings). Cleaned up from an automated export:
% the proceedings part is recorded in booktitle rather than in edition/number,
% the DOI is stored bare (no LaTeX escapes), and all field values are ASCII.
% NOTE(review): the LNCS volume number was added during cleanup; confirm it
% against the publisher's record for the print ISBN below.
@inproceedings{a6ada94193ed4d70981e8d6f6e73cea8,
  author    = {Wang, Kun and Wang, Rui and Luan, Zhongzhi and Qian, Depei},
  title     = {{M\&C}: A software solution to reduce errors caused by incoherent caches on {GPUs} in unstructured graphic algorithm},
  booktitle = {Algorithms and Architectures for Parallel Processing - 13th International Conference, {ICA3PP} 2013, Proceedings, Part I},
  series    = {Lecture Notes in Computer Science},
  volume    = {8285},
  pages     = {426--435},
  year      = {2013},
  doi       = {10.1007/978-3-319-03859-9_37},
  isbn      = {9783319038582},
  language  = {English},
  note      = {13th International Conference on Algorithms and Architectures for Parallel Processing, ICA3PP 2013; conference date: 18--20 December 2013},
  abstract  = {Recently, researchers have focused on addressing incoherent caches on GPUs as current GPUs lack hardware to support that. Moreover, the support for inter-block communication also lacks which limits the scalability of parallel programming especially in the unstructured algorithm in which program would share data between different threads. Barrier synchronization can be a solution but it becomes invalid because of incoherent caches. In this paper, we propose a set of rules for programming on current GPUs to avoid the errors caused by incoherent caches when applying barrier synchronization. We also leverage these rules into an unstructured graphic algorithm - constrained Delaunay triangulation. In comparison with traditional ways such as (1) disabling L1 cache and (2) using keyword volatile, we find that when vertices is over 300K the error rate is lesser than (1) by 91.19\% and than (2) by 84.2\% on average.},
}