@inproceedings{f9fcdb9708934154bcd4e4aa005b8761,
title = "Why simple models perform well in predicting popularity for caching?",
abstract = "Predicting file popularity is an important task for proactive caching, which has been shown a promising way to support the explosive increase of data traffic. Both linear and non-linear predictors have been proposed in literature to predict file popularity, and shallow neural networks have been shown to achieve good performance for caching. In this paper, we strive to explain why simple models perform well in predicting dynamic popularity with the historical number of requests. We consider linear regression, deep neural networks, random forest, support vector regression, and a persistence model for predicting popularity. We employ MovieLens and Youku datasets for analyzing the time-varying pattern of popularity and for evaluating the caching performance. We show that the cache hit ratios achieved by the caching policy with predicted popularity using linear models are close to that using non-linear models. We interpret the observation by first proving that deterministic popularity with typical profiles can be predicted with linear models and then showing that majority of the popular files are with these profiles in the real dataset.",
keywords = "File popularity, Interpretation, Linear predictor",
author = "Jiajun Wu and Chenyang Yang",
note = "Publisher Copyright: {\textcopyright} 2019 IEEE.; 25th Asia-Pacific Conference on Communications, APCC 2019 ; Conference date: 06-11-2019 Through 08-11-2019",
year = "2019",
month = nov,
doi = "10.1109/APCC47188.2019.9026481",
language = "英语",
series = "Proceedings of 2019 25th Asia-Pacific Conference on Communications, APCC 2019",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "7--12",
editor = "Bao, \{Vo Nguyen Quoc\} and Thanh, \{Tran Thien\}",
booktitle = "Proceedings of 2019 25th Asia-Pacific Conference on Communications, APCC 2019",
address = "美国",
}