% Siddiqui and Feki, ISC 2014: prediction-based tuning of OpenACC gang/vector clauses.
@inproceedings{1165ab0a4fd64bfba46b344a6c88c84d,
  author    = {Siddiqui, Shahzeb and Feki, Saber},
  title     = {Predictive Performance Tuning of {OpenACC} Accelerated Applications},
  booktitle = {Supercomputing - 29th International Conference, {ISC} 2014, Proceedings},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer Verlag},
  address   = {Germany},
  year      = {2014},
  pages     = {511--512},
  isbn      = {9783319075174},
  language  = {English (US)},
  note      = {29th International Supercomputing Conference, ISC 2014 ; Conference date: 22-06-2014 Through 26-06-2014},
  abstract  = {GPUs are gradually becoming mainstream in supercomputing as their capabilities to significantly accelerate a large spectrum of scientific applications have been identified and proven. Moreover, with the introduction of directive based programming models such as OpenACC, these devices are becoming more accessible and practical to use by a larger scientific community. However, performance optimization of OpenACC applications usually requires an indepth knowledge of the hardware and software specifications. We suggest a prediction-based performance tuning mechanism to quickly tune OpenACC parameters to dynamically adapt to the execution environment on a given system. This approach is applied to a finite difference kernel to tune the OpenACC gang and vector clauses for mapping the computations into the underlying accelerator architecture. Our experiments show a good performance improvement against the default compiler parameters and a faster tuning by an order of magnitude compared to the brute force search tuning.},
}