Powered by
8th Workshop on General Purpose Processing using GPUs (GPGPU 8), February 7, 2015,
San Francisco, CA, USA
8th Workshop on General Purpose Processing using GPUs (GPGPU 8)
Preface
HPC
A Comparative Investigation of Device-Specific Mechanisms for Exploiting HPC Accelerators
Ayman Tarakji,
Lukas Börger, and
Rainer Leupers
(RWTH Aachen University, Germany)
% NOTE(review): the listing gave pages as "1-0" (end before start); only the
% first page is kept until the real end page is confirmed. The empty doi
% field was dropped; add the DOI once it is known.
@InProceedings{GPGPU15p1,
  author    = {Tarakji, Ayman and B{\"o}rger, Lukas and Leupers, Rainer},
  title     = {A Comparative Investigation of Device-Specific Mechanisms for Exploiting {HPC} Accelerators},
  booktitle = {Proc.\ {GPGPU}},
  publisher = {ACM},
  pages     = {1},
  year      = {2015},
}
Cache and Shared Memory
GPU-SM: Shared Memory Multi-GPU Programming
Javier Cabezas,
Marc Jordà,
Isaac Gelado,
Nacho Navarro, and
Wen-mei Hwu
(Barcelona Supercomputing Center, Spain; NVIDIA, USA; Universitat Politècnica de Catalunya, Spain; University of Illinois at Urbana-Champaign, USA)
% NOTE(review): the listing gave pages as "13-12" (end before start); only the
% first page is kept until the real end page is confirmed. The empty doi
% field was dropped; add the DOI once it is known.
@InProceedings{GPGPU15p13,
  author    = {Cabezas, Javier and Jord{\`a}, Marc and Gelado, Isaac and Navarro, Nacho and Hwu, Wen-mei},
  title     = {{GPU-SM}: Shared Memory Multi-{GPU} Programming},
  booktitle = {Proc.\ {GPGPU}},
  publisher = {ACM},
  pages     = {13},
  year      = {2015},
}
Adaptive GPU Cache Bypassing
Yingying Tian,
Sooraj Puthoor,
Joseph L. Greathouse,
Bradford M. Beckmann, and
Daniel A. Jiménez
(Texas A&M University, USA; AMD Research, USA)
% NOTE(review): the listing gave pages as "25-24" (end before start); only the
% first page is kept until the real end page is confirmed. The empty doi
% field was dropped; add the DOI once it is known.
@InProceedings{GPGPU15p25,
  author    = {Tian, Yingying and Puthoor, Sooraj and Greathouse, Joseph L. and Beckmann, Bradford M. and Jim{\'e}nez, Daniel A.},
  title     = {Adaptive {GPU} Cache Bypassing},
  booktitle = {Proc.\ {GPGPU}},
  publisher = {ACM},
  pages     = {25},
  year      = {2015},
}
Efficient Utilization of GPGPU Cache Hierarchy
Mahmoud Khairy,
Mohamed Zahran, and
Amr G. Wassal
(Cairo University, Egypt; New York University, USA)
% NOTE(review): the listing gave pages as "37-36" (end before start); only the
% first page is kept until the real end page is confirmed. The empty doi
% field was dropped; add the DOI once it is known.
@InProceedings{GPGPU15p37,
  author    = {Khairy, Mahmoud and Zahran, Mohamed and Wassal, Amr G.},
  title     = {Efficient Utilization of {GPGPU} Cache Hierarchy},
  booktitle = {Proc.\ {GPGPU}},
  publisher = {ACM},
  pages     = {37},
  year      = {2015},
}
Optimization
Effects of Source-Code Optimizations on GPU Performance and Energy Consumption
Jared Coplin and
Martin Burtscher
(Texas State University, USA)
% NOTE(review): the listing gave pages as "49-48" (end before start); only the
% first page is kept until the real end page is confirmed. The empty doi
% field was dropped; add the DOI once it is known.
@InProceedings{GPGPU15p49,
  author    = {Coplin, Jared and Burtscher, Martin},
  title     = {Effects of Source-Code Optimizations on {GPU} Performance and Energy Consumption},
  booktitle = {Proc.\ {GPGPU}},
  publisher = {ACM},
  pages     = {49},
  year      = {2015},
}
Optimization for Performance and Energy for Batched Matrix Computations on GPUs
Azzam Haidar,
Tingxing Dong,
Piotr Luszczek,
Stanimire Tomov, and
Jack Dongarra
(University of Tennessee, USA; Oak Ridge National Laboratory, USA; University of Manchester, UK)
% NOTE(review): the listing gave pages as "61-60" (end before start); only the
% first page is kept until the real end page is confirmed. The empty doi
% field was dropped; add the DOI once it is known.
@InProceedings{GPGPU15p61,
  author    = {Haidar, Azzam and Dong, Tingxing and Luszczek, Piotr and Tomov, Stanimire and Dongarra, Jack},
  title     = {Optimization for Performance and Energy for Batched Matrix Computations on {GPUs}},
  booktitle = {Proc.\ {GPGPU}},
  publisher = {ACM},
  pages     = {61},
  year      = {2015},
}
Helium: A Transparent Inter-kernel Optimizer for OpenCL
Thibaut Lutz,
Christian Fensch, and
Murray Cole
(University of Edinburgh, UK; Heriot-Watt University, UK)
% NOTE(review): the listing gave pages as "73-72" (end before start); only the
% first page is kept until the real end page is confirmed. The empty doi
% field was dropped; add the DOI once it is known.
@InProceedings{GPGPU15p73,
  author    = {Lutz, Thibaut and Fensch, Christian and Cole, Murray},
  title     = {Helium: A Transparent Inter-kernel Optimizer for {OpenCL}},
  booktitle = {Proc.\ {GPGPU}},
  publisher = {ACM},
  pages     = {73},
  year      = {2015},
}
Applications
Stochastic Gradient Descent on GPUs
Rashid Kaleem,
Sreepathi Pai, and
Keshav Pingali
(University of Texas at Austin, USA)
% NOTE(review): the listing gave pages as "85-84" (end before start); only the
% first page is kept until the real end page is confirmed. The empty doi
% field was dropped; add the DOI once it is known.
@InProceedings{GPGPU15p85,
  author    = {Kaleem, Rashid and Pai, Sreepathi and Pingali, Keshav},
  title     = {Stochastic Gradient Descent on {GPUs}},
  booktitle = {Proc.\ {GPGPU}},
  publisher = {ACM},
  pages     = {85},
  year      = {2015},
}
High Performance Computing of Fiber Scattering Simulation
Leiming Yu,
Yan Zhang,
Xiang Gong,
Nilay Roy,
Lee Makowski, and
David Kaeli
(Northeastern University, USA)
% NOTE(review): the listing gave pages as "97-96" (end before start); only the
% first page is kept until the real end page is confirmed. The empty doi
% field was dropped; add the DOI once it is known.
@InProceedings{GPGPU15p97,
  author    = {Yu, Leiming and Zhang, Yan and Gong, Xiang and Roy, Nilay and Makowski, Lee and Kaeli, David},
  title     = {High Performance Computing of Fiber Scattering Simulation},
  booktitle = {Proc.\ {GPGPU}},
  publisher = {ACM},
  pages     = {97},
  year      = {2015},
}
Forma: A DSL for Image Processing Applications to Target GPUs and Multi-core CPUs
Mahesh Ravishankar,
Justin Holewinski, and
Vinod Grover
(NVIDIA, USA)
% NOTE(review): the listing gave pages as "121-120" (end before start); only
% the first page is kept until the real end page is confirmed. The empty doi
% field was dropped; add the DOI once it is known.
@InProceedings{GPGPU15p121,
  author    = {Ravishankar, Mahesh and Holewinski, Justin and Grover, Vinod},
  title     = {Forma: A {DSL} for Image Processing Applications to Target {GPUs} and Multi-core {CPUs}},
  booktitle = {Proc.\ {GPGPU}},
  publisher = {ACM},
  pages     = {121},
  year      = {2015},
}
proc time: 0.62