% Conference paper from ICCD 2014 (Aguilera, Morrow, Kim) on fairness-aware
% allocation of GPU resources under spatial multitasking.
@inproceedings{249a76cb2c4f47c38488ca14080a73b8,
  author    = {Aguilera, Paula and Morrow, Katherine and Kim, {Nam Sung}},
  title     = {Fair share: Allocation of {GPU} resources for both performance and fairness},
  booktitle = {2014 32nd {IEEE} International Conference on Computer Design, {ICCD} 2014},
  pages     = {440--447},
  year      = {2014},
  month     = dec,
  day       = {3},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  doi       = {10.1109/ICCD.2014.6974717},
  language  = {English (US)},
  keywords  = {GPGPU computing, fairness, resource allocation},
  abstract  = {General-purpose computing on the GPU (GPGPU computing) is becoming widely adopted for an increasing variety of applications. However, it has been shown that as the available computing elements in the GPU increase with every generation some GPGPU applications fail to fully utilize the GPU resources. Spatial multitasking - subdividing GPU resources amongst concurrently-running applications - has been shown to increase overall system performance and utilization for GPGPU computing. However, dividing the computing resources among multiple applications to maximize system performance often results in one application having 'unfair' access to GPU resources. Yet, evenly dividing resources among applications does not guarantee equal speedups to each application; nor does it take into account overall system performance. In this paper we examine several different ways to characterize 'fairness' for GPGPU spatial multitasking, by balancing individual application's performance and overall system performance. We further present a run-time algorithm to predict and adjust the SM allocation at runtime to meet the desired fairness metric.},
  note      = {Publisher Copyright: {\textcopyright} 2014 IEEE.; 32nd IEEE International Conference on Computer Design, ICCD 2014 ; Conference date: 19-10-2014 Through 22-10-2014},
}