@inproceedings{65a7c8b8d8bd49499bc9e6e4ea6817bc,
title = "PPLSA: Parallel probabilistic latent semantic analysis based on MapReduce",
abstract = "PLSA(Probabilistic Latent Semantic Analysis) is a popular topic modeling technique for exploring document collections. Due to the increasing prevalence of large datasets, there is a need to improve the scalability of computation in PLSA. In this paper, we propose a parallel PLSA algorithm called PPLSA to accommodate large corpus collections in the MapReduce framework. Our solution efficiently distributes computation and is relatively simple to implement.",
keywords = "EM, MapReduce, Parallel, Probabilistic Latent Semantic Analysis",
author = "Ning Li and Fuzhen Zhuang and Qing He and Zhongzhi Shi",
year = "2012",
doi = "10.1007/978-3-642-32891-6\_8",
language = "英语",
isbn = "9783642328909",
series = "IFIP Advances in Information and Communication Technology",
pages = "40--49",
booktitle = "Intelligent Information Processing VI - 7th IFIP TC 12 International Conference, IIP 2012, Proceedings",
note = "7th IFIP International Conference on Intelligent Information Processing, IIP 2012 ; Conference date: 12-10-2012 Through 15-10-2012",
}