@inproceedings{4286d53e98084222bbe3d7b0f32b51b0,
title = "Intelligent Resource Scheduling at Scale: A Machine Learning Perspective",
abstract = "Resource scheduling in a computing system addresses the problem of packing tasks with multi-dimensional resource requirements and non-functional constraints. The exhibited heterogeneity of workload and server characteristics in Cloud-scale or Internet-scale systems is adding further complexity and new challenges to the problem. Compared with existing solutions based on ad-hoc heuristics, Machine Learning (ML) has the potential to improve further the efficiency of resource management in large-scale systems. In this paper we will describe and discuss how ML could be used to understand automatically both workloads and environments, and to help to cope with scheduling-related challenges such as consolidating co-located workloads, handling resource requests, guaranteeing application's QoSs, and mitigating tailed stragglers. We will introduce a generalized ML-based solution to large-scale resource scheduling and demonstrate its effectiveness through a case study that deals with performance-centric node classification and straggler mitigation. We believe that an MLbased method will help to achieve architectural optimization and efficiency improvement.",
keywords = "Resource Scheduling, machine learning, resource management, straggler",
author = "Renyu Yang and Xue Ouyang and Yaofeng Chen and Paul Townend and Jie Xu",
note = "Publisher Copyright: {\textcopyright} 2018 IEEE.; 12th IEEE International Symposium on Service-Oriented System Engineering, SOSE 2018 and 9th International Workshop on Joint Cloud Computing, JCC 2018 ; Conference date: 26-03-2018 Through 29-03-2018",
year = "2018",
month = may,
day = "14",
doi = "10.1109/SOSE.2018.00025",
language = "英语",
series = "Proceedings - 12th IEEE International Symposium on Service-Oriented System Engineering, SOSE 2018 and 9th International Workshop on Joint Cloud Computing, JCC 2018",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "132--141",
booktitle = "Proceedings - 12th IEEE International Symposium on Service-Oriented System Engineering, SOSE 2018 and 9th International Workshop on Joint Cloud Computing, JCC 2018",
address = "美国",
}