@inproceedings{861ab6f8c41b435e9651a79a6c397762,
title = "Optimizing energy consumption in GPUS through feedback-driven CTA scheduling",
abstract = "Emerging GPU architectures offer a cost-effective computing platform by providing thousands of energy-efficient compute cores and high bandwidth memory that facilitate the execution of highly parallel applications. In this paper, we show that different applications, and in fact different kernels from the same application might exhibit significantly varying utilizations of compute and memory resources. In order to improve the energy efficiency of the GPU system, we propose a run-time characterization strategy that classifies kernels as compute- or memory-intensive based on their resource utilizations. Using this knowledge, our proposed mechanism employs core shut-down technique for memory-intensive kernels in order to manage energy in a more efficient way. This strategy uses performance and memory bandwidth utilization information to determine the ideal hardware configuration at run-time. The proposed technique saves on average 21% of total chip energy for memory-intensive applications, which is within 8% of the optimal saving that can be obtained from an oracle scheme.",
author = "Amin Jadidi and Mohammad Arjomand and Kandemir, {Mahmut Taylan} and Das, {Chita R.}",
note = "Publisher Copyright: {\textcopyright}2017 Society for Modeling & Simulation International (SCS).; 25th High Performance Computing Symposium, HPC 2017, Part of the 2017 Spring Simulation Multi-Conference, SpringSim 2017 ; Conference date: 23-04-2017 Through 26-04-2017",
year = "2017",
language = "English (US)",
series = "Simulation Series",
publisher = "The Society for Modeling and Simulation International",
number = "3",
pages = "129--140",
editor = "Lukas Polok and William Thacker and Masha Sosonkina and Josef Weinbub",
booktitle = "Simulation Series",
address = "United States",
edition = "3",
}