Powered by
20th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming (PPoPP 2015), February 7–11, 2015,
San Francisco, CA, USA
Frontmatter
Concurrency
Mon, Feb 9, 10:20 - 12:00
More Than You Ever Wanted to Know about Synchronization: Synchrobench, Measuring the Impact of the Synchronization on Concurrent Algorithms
Vincent Gramoli
(NICTA, Australia; University of Sydney, Australia)
% NOTE(review): source listed the impossible page range "1-0" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p1,
  author    = {Vincent Gramoli},
  title     = {More Than You Ever Wanted to Know about Synchronization: {Synchrobench}, Measuring the Impact of the Synchronization on Concurrent Algorithms},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {1},
  year      = {2015},
}
The SprayList: A Scalable Relaxed Priority Queue
Dan Alistarh,
Justin Kopinsky,
Jerry Li, and
Nir Shavit
(Microsoft Research, UK; Massachusetts Institute of Technology, USA; Tel Aviv University, Israel)
% NOTE(review): source listed the impossible page range "13-12" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p13,
  author    = {Dan Alistarh and Justin Kopinsky and Jerry Li and Nir Shavit},
  title     = {The {SprayList}: A Scalable Relaxed Priority Queue},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {13},
  year      = {2015},
}
Predicate RCU: An RCU for Scalable Concurrent Updates
Maya Arbel and
Adam Morrison
(Technion, Israel)
% NOTE(review): source listed the impossible page range "25-24" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p25,
  author    = {Maya Arbel and Adam Morrison},
  title     = {Predicate {RCU}: An {RCU} for Scalable Concurrent Updates},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {25},
  year      = {2015},
}
Automatic Scalable Atomicity via Semantic Locking
Guy Golan-Gueta,
G. Ramalingam,
Mooly Sagiv, and
Eran Yahav
(Yahoo Labs, Israel; Microsoft Research, India; Tel Aviv University, Israel; Technion, Israel)
% NOTE(review): source listed the impossible page range "37-36" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p37,
  author    = {Guy Golan-Gueta and G. Ramalingam and Mooly Sagiv and Eran Yahav},
  title     = {Automatic Scalable Atomicity via Semantic Locking},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {37},
  year      = {2015},
}
Code Generation
Mon, Feb 9, 13:30 - 14:45
A Framework for Practical Parallel Fast Matrix Multiplication
Austin R. Benson and
Grey Ballard
(Stanford University, USA; Sandia National Laboratories, USA)
% NOTE(review): source listed the impossible page range "49-48" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p49,
  author    = {Austin R. Benson and Grey Ballard},
  title     = {A Framework for Practical Parallel Fast Matrix Multiplication},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {49},
  year      = {2015},
}
Distributed Memory Code Generation for Mixed Irregular/Regular Computations
Mahesh Ravishankar,
Roshan Dathathri,
Venmugil Elango,
Louis-Noël Pouchet,
J. Ramanujam,
Atanas Rountev, and
P. Sadayappan
(Ohio State University, USA; Louisiana State University, USA)
% NOTE(review): source listed the impossible page range "73-72" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p73,
  author    = {Mahesh Ravishankar and Roshan Dathathri and Venmugil Elango and Louis-No{\"e}l Pouchet and J. Ramanujam and Atanas Rountev and P. Sadayappan},
  title     = {Distributed Memory Code Generation for Mixed Irregular/Regular Computations},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {73},
  year      = {2015},
}
Transactional Memory
Mon, Feb 9, 15:10 - 16:25
Software Partitioning of Hardware Transactions
Lingxiang Xiang and
Michael L. Scott
(University of Rochester, USA)
% NOTE(review): source listed the impossible page range "85-84" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p85,
  author    = {Lingxiang Xiang and Michael L. Scott},
  title     = {Software Partitioning of Hardware Transactions},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {85},
  year      = {2015},
}
Performance Implications of Dynamic Memory Allocators on Transactional Memory Systems
Alexandro Baldassin,
Edson Borin, and
Guido Araujo
(UNESP, Brazil; UNICAMP, Brazil)
% NOTE(review): source listed the impossible page range "97-96" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p97,
  author    = {Alexandro Baldassin and Edson Borin and Guido Araujo},
  title     = {Performance Implications of Dynamic Memory Allocators on Transactional Memory Systems},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {97},
  year      = {2015},
}
Low-Overhead Software Transactional Memory with Progress Guarantees and Strong Semantics
Minjia Zhang,
Jipeng Huang,
Man Cao, and
Michael D. Bond
(Ohio State University, USA)
% NOTE(review): source listed the impossible page range "109-108" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p109,
  author    = {Minjia Zhang and Jipeng Huang and Man Cao and Michael D. Bond},
  title     = {Low-Overhead Software Transactional Memory with Progress Guarantees and Strong Semantics},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {109},
  year      = {2015},
}
Large Scale Parallelism
Tue, Feb 10, 08:25 - 09:40
Barrier Elision for Production Parallel Programs
Milind Chabbi,
Wim Lavrijsen,
Wibe de Jong,
Koushik Sen,
John Mellor-Crummey, and
Costin Iancu
(Rice University, USA; Lawrence Berkeley National Laboratory, USA; University of California at Berkeley, USA)
% NOTE(review): source listed the impossible page range "121-120" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p121,
  author    = {Milind Chabbi and Wim Lavrijsen and Wibe de Jong and Koushik Sen and John Mellor-Crummey and Costin Iancu},
  title     = {Barrier Elision for Production Parallel Programs},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {121},
  year      = {2015},
}
Scalable and Efficient Implementation of 3D Unstructured Meshes Computation: A Case Study on Matrix Assembly
Loïc Thébault,
Eric Petit, and
Quang Dinh
(University of Versailles, France; Dassault Aviation, France)
% NOTE(review): source listed the impossible page range "133-132" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p133,
  author    = {Lo{\"\i}c Th{\'e}bault and Eric Petit and Quang Dinh},
  title     = {Scalable and Efficient Implementation of {3D} Unstructured Meshes Computation: A Case Study on Matrix Assembly},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {133},
  year      = {2015},
}
Diagnosing the Causes and Severity of One-Sided Message Contention
Nathan R. Tallent,
Abhinav Vishnu,
Hubertus Van Dam,
Jeff Daily,
Darren J. Kerbyson, and
Adolfy Hoisie
(Pacific Northwest National Laboratory, USA)
% NOTE(review): source listed the impossible page range "145-144" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
% NOTE(review): "Van Dam" is written in comma form so it is not split into given name "Hubertus Van" + surname "Dam"; assumes the surname is "Van Dam" -- confirm.
@InProceedings{PPoPP15p145,
  author    = {Nathan R. Tallent and Abhinav Vishnu and Van Dam, Hubertus and Jeff Daily and Darren J. Kerbyson and Adolfy Hoisie},
  title     = {Diagnosing the Causes and Severity of One-Sided Message Contention},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {145},
  year      = {2015},
}
Verification and Accelerators
Tue, Feb 10, 10:05 - 11:45
A Parallel Algorithm for Global States Enumeration in Concurrent Systems
Yen-Jung Chang and
Vijay K. Garg
(University of Texas at Austin, USA)
% NOTE(review): source listed the impossible page range "157-156" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p157,
  author    = {Yen-Jung Chang and Vijay K. Garg},
  title     = {A Parallel Algorithm for Global States Enumeration in Concurrent Systems},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {157},
  year      = {2015},
}
Dynamic Deadlock Verification for General Barrier Synchronisation
Tiago Cogumbreiro,
Raymond Hu,
Francisco Martins, and
Nobuko Yoshida
(Imperial College London, UK; University of Lisbon, Portugal)
% NOTE(review): source listed the impossible page range "169-168" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p169,
  author    = {Tiago Cogumbreiro and Raymond Hu and Francisco Martins and Nobuko Yoshida},
  title     = {Dynamic Deadlock Verification for General Barrier Synchronisation},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {169},
  year      = {2015},
}
VirtCL: A Framework for OpenCL Device Abstraction and Management
Yi-Ping You,
Hen-Jung Wu,
Yeh-Ning Tsai, and
Yen-Ting Chao
(National Chiao Tung University, Taiwan)
% NOTE(review): source listed the impossible page range "181-180" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p181,
  author    = {Yi-Ping You and Hen-Jung Wu and Yeh-Ning Tsai and Yen-Ting Chao},
  title     = {{VirtCL}: A Framework for {OpenCL} Device Abstraction and Management},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {181},
  year      = {2015},
}
On Optimizing Machine Learning Workloads via Kernel Fusion
Arash Ashari,
Shirish Tatikonda,
Matthias Boehm,
Berthold Reinwald,
Keith Campbell,
John Keenleyside, and
P. Sadayappan
(Ohio State University, USA; IBM, USA; IBM, Canada)
% NOTE(review): source listed the impossible page range "193-192" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p193,
  author    = {Arash Ashari and Shirish Tatikonda and Matthias Boehm and Berthold Reinwald and Keith Campbell and John Keenleyside and P. Sadayappan},
  title     = {On Optimizing Machine Learning Workloads via Kernel Fusion},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {193},
  year      = {2015},
}
Algorithms
Tue, Feb 10, 14:45 - 16:00
NUMA-Aware Graph-Structured Analytics
Kaiyuan Zhang,
Rong Chen, and
Haibo Chen
(Shanghai Jiao Tong University, China)
% NOTE(review): source listed the impossible page range "205-204" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p205,
  author    = {Kaiyuan Zhang and Rong Chen and Haibo Chen},
  title     = {{NUMA}-Aware Graph-Structured Analytics},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {205},
  year      = {2015},
}
SYNC or ASYNC: Time to Fuse for Distributed Graph-Parallel Computation
Chenning Xie,
Rong Chen,
Haibing Guan,
Binyu Zang, and
Haibo Chen
(Shanghai Jiao Tong University, China)
% NOTE(review): source listed the impossible page range "217-216" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p217,
  author    = {Chenning Xie and Rong Chen and Haibing Guan and Binyu Zang and Haibo Chen},
  title     = {{SYNC} or {ASYNC}: Time to Fuse for Distributed Graph-Parallel Computation},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {217},
  year      = {2015},
}
Cache-Oblivious Wavefront: Improving Parallelism of Recursive Dynamic Programming Algorithms without Losing Cache-Efficiency
Yuan Tang,
Ronghui You,
Haibin Kan,
Jesmin Jahan Tithi,
Pramod Ganapathi, and
Rezaul A. Chowdhury
(Fudan University, China; Stony Brook University, USA)
% NOTE(review): source listed the impossible page range "229-228" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p229,
  author    = {Yuan Tang and Ronghui You and Haibin Kan and Jesmin Jahan Tithi and Pramod Ganapathi and Rezaul A. Chowdhury},
  title     = {Cache-Oblivious Wavefront: Improving Parallelism of Recursive Dynamic Programming Algorithms without Losing Cache-Efficiency},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {229},
  year      = {2015},
}
Locking and Locality
Wed, Feb 11, 09:40 - 10:55
High Performance Locks for Multi-level NUMA Systems
Milind Chabbi,
Michael Fagan, and
John Mellor-Crummey
(Rice University, USA)
% NOTE(review): source listed the impossible page range "241-240" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p241,
  author    = {Milind Chabbi and Michael Fagan and John Mellor-Crummey},
  title     = {High Performance Locks for Multi-level {NUMA} Systems},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {241},
  year      = {2015},
}
MPI+Threads: Runtime Contention and Remedies
Abdelhalim Amer,
Huiwei Lu,
Yanjie Wei,
Pavan Balaji, and
Satoshi Matsuoka
(Tokyo Institute of Technology, Japan; Argonne National Laboratory, USA; Shenzhen Institute of Advanced Technologies at Chinese Academy of Sciences, China)
% NOTE(review): source listed the impossible page range "265-264" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p265,
  author    = {Abdelhalim Amer and Huiwei Lu and Yanjie Wei and Pavan Balaji and Satoshi Matsuoka},
  title     = {{MPI+Threads}: Runtime Contention and Remedies},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {265},
  year      = {2015},
}
Poster Abstracts
Sun, Feb 8, 18:15 - 20:00
Fence Placement for Legacy Data-Race-Free Programs via Synchronization Read Detection
Andrew J. McPherson,
Vijay Nagarajan,
Susmit Sarkar, and
Marcelo Cintra
(University of Edinburgh, UK; University of St. Andrews, UK; Intel, Germany)
% NOTE(review): source listed the impossible page range "277-276" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p277,
  author    = {Andrew J. McPherson and Vijay Nagarajan and Susmit Sarkar and Marcelo Cintra},
  title     = {Fence Placement for Legacy Data-Race-Free Programs via Synchronization Read Detection},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {277},
  year      = {2015},
}
JAWS: A JavaScript Framework for Adaptive CPU-GPU Work Sharing
Xianglan Piao,
Channoh Kim,
Younghwan Oh,
Huiying Li,
Jincheon Kim,
Hanjun Kim, and
Jae W. Lee
(Sungkyunkwan University, South Korea; Company 100, South Korea; POSTECH, South Korea)
% NOTE(review): source listed the impossible page range "279-278" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p279,
  author    = {Xianglan Piao and Channoh Kim and Younghwan Oh and Huiying Li and Jincheon Kim and Hanjun Kim and Jae W. Lee},
  title     = {{JAWS}: A {JavaScript} Framework for Adaptive {CPU-GPU} Work Sharing},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {279},
  year      = {2015},
}
GStream: A Graph Streaming Processing Method for Large-Scale Graphs on GPUs
Hyunseok Seo,
Jinwook Kim, and
Min-Soo Kim
(DGIST, South Korea)
% NOTE(review): source listed the impossible page range "281-280" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p281,
  author    = {Hyunseok Seo and Jinwook Kim and Min-Soo Kim},
  title     = {{GStream}: A Graph Streaming Processing Method for Large-Scale Graphs on {GPUs}},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {281},
  year      = {2015},
}
An OpenACC-Based Unified Programming Model for Multi-accelerator Systems
Jungwon Kim,
Seyong Lee, and
Jeffrey S. Vetter
(Oak Ridge National Laboratory, USA; Georgia Tech, USA)
% NOTE(review): source listed the impossible page range "285-284" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p285,
  author    = {Jungwon Kim and Seyong Lee and Jeffrey S. Vetter},
  title     = {An {OpenACC}-Based Unified Programming Model for Multi-accelerator Systems},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {285},
  year      = {2015},
}
Towards Batched Linear Solvers on Accelerated Hardware Platforms
Azzam Haidar,
Tingxing Dong,
Piotr Luszczek,
Stanimire Tomov, and
Jack Dongarra
(University of Tennessee, USA; Oak Ridge National Laboratory, USA; University of Manchester, UK)
% NOTE(review): source listed the impossible page range "289-288" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p289,
  author    = {Azzam Haidar and Tingxing Dong and Piotr Luszczek and Stanimire Tomov and Jack Dongarra},
  title     = {Towards Batched Linear Solvers on Accelerated Hardware Platforms},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {289},
  year      = {2015},
}
A Collection-Oriented Programming Model for Performance Portability
Saurav Muralidharan,
Michael Garland,
Bryan Catanzaro,
Albert Sidelnik, and
Mary Hall
(University of Utah, USA; NVIDIA, USA; Baidu, USA)
% NOTE(review): source listed the impossible page range "291-290" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p291,
  author    = {Saurav Muralidharan and Michael Garland and Bryan Catanzaro and Albert Sidelnik and Mary Hall},
  title     = {A Collection-Oriented Programming Model for Performance Portability},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {291},
  year      = {2015},
}
Gunrock: A High-Performance Graph Processing Library on the GPU
Yangzihao Wang,
Andrew Davidson,
Yuechao Pan,
Yuduo Wu,
Andy Riffel, and
John D. Owens
(University of California at Davis, USA)
% NOTE(review): source listed the impossible page range "293-292" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p293,
  author    = {Yangzihao Wang and Andrew Davidson and Yuechao Pan and Yuduo Wu and Andy Riffel and John D. Owens},
  title     = {Gunrock: A High-Performance Graph Processing Library on the {GPU}},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {293},
  year      = {2015},
}
Decoupled Load Balancing
Olga Pearce,
Todd Gamblin,
Bronis R. de Supinski,
Martin Schulz, and
Nancy M. Amato
(Texas A&M University, USA; Lawrence Livermore National Laboratory, USA)
% NOTE(review): source listed the impossible page range "295-294" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p295,
  author    = {Olga Pearce and Todd Gamblin and Bronis R. de Supinski and Martin Schulz and Nancy M. Amato},
  title     = {Decoupled Load Balancing},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {295},
  year      = {2015},
}
Combining Phase Identification and Statistic Modeling for Automated Parallel Benchmark Generation
Ye Jin,
Mingliang Liu,
Xiaosong Ma,
Qing Liu,
Jeremy Logan,
Norbert Podhorszki,
Jong Youl Choi, and
Scott Klasky
(North Carolina State University, USA; Qatar Computing Research Institute, Qatar; Oak Ridge National Laboratory, USA)
% NOTE(review): source listed the impossible page range "297-296" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p297,
  author    = {Ye Jin and Mingliang Liu and Xiaosong Ma and Qing Liu and Jeremy Logan and Norbert Podhorszki and Jong Youl Choi and Scott Klasky},
  title     = {Combining Phase Identification and Statistic Modeling for Automated Parallel Benchmark Generation},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {297},
  year      = {2015},
}
Optimization of Asynchronous Graph Processing on GPU with Hybrid Coloring Model
Xuanhua Shi,
Junling Liang,
Sheng Di,
Bingsheng He,
Hai Jin,
Lu Lu,
Zhixiang Wang,
Xuan Luo, and
Jianlong Zhong
(Huazhong University of Science and Technology, China; Argonne National Laboratory, USA; Nanyang Technological University, Singapore)
% NOTE(review): source listed the impossible page range "299-298" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p299,
  author    = {Xuanhua Shi and Junling Liang and Sheng Di and Bingsheng He and Hai Jin and Lu Lu and Zhixiang Wang and Xuan Luo and Jianlong Zhong},
  title     = {Optimization of Asynchronous Graph Processing on {GPU} with Hybrid Coloring Model},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {299},
  year      = {2015},
}
Efficient and Reasonable Object-Oriented Concurrency
Scott West,
Sebastian Nanz, and
Bertrand Meyer
(ETH Zurich, Switzerland)
% NOTE(review): source listed the impossible page range "301-300" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p301,
  author    = {Scott West and Sebastian Nanz and Bertrand Meyer},
  title     = {Efficient and Reasonable Object-Oriented Concurrency},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {301},
  year      = {2015},
}
A Programming Model and Runtime System for Significance-Aware Energy-Efficient Computing
Vassilis Vassiliadis,
Konstantinos Parasyris,
Charalambos Chalios,
Christos D. Antonopoulos,
Spyros Lalis,
Nikolaos Bellas,
Hans Vandierendonck, and
Dimitrios S. Nikolopoulos
(University of Thessaly, Greece; Centre for Research and Technology Hellas, Greece; Queen's University of Belfast, UK)
% NOTE(review): source listed the impossible page range "303-302" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p303,
  author    = {Vassilis Vassiliadis and Konstantinos Parasyris and Charalambos Chalios and Christos D. Antonopoulos and Spyros Lalis and Nikolaos Bellas and Hans Vandierendonck and Dimitrios S. Nikolopoulos},
  title     = {A Programming Model and Runtime System for Significance-Aware Energy-Efficient Computing},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {303},
  year      = {2015},
}
The Lock-Free k-LSM Relaxed Priority Queue
Martin Wimmer,
Jakob Gruber,
Jesper Larsson Träff, and
Philippas Tsigas
(TU Vienna, Austria; Chalmers University of Technology, Sweden)
% NOTE(review): source listed the impossible page range "305-304" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p305,
  author    = {Martin Wimmer and Jakob Gruber and Jesper Larsson Tr{\"a}ff and Philippas Tsigas},
  title     = {The Lock-Free {k-LSM} Relaxed Priority Queue},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {305},
  year      = {2015},
}
Static/Dynamic Validation of MPI Collective Communications in Multi-threaded Context
Emmanuelle Saillard,
Patrick Carribault, and
Denis Barthou
(CEA, France; Bordeaux Institute of Technology, France; LaBRI, France; INRIA, France)
% NOTE(review): source listed the impossible page range "307-306" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p307,
  author    = {Emmanuelle Saillard and Patrick Carribault and Denis Barthou},
  title     = {Static/Dynamic Validation of {MPI} Collective Communications in Multi-threaded Context},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {307},
  year      = {2015},
}
CASTLE: Fast Concurrent Internal Binary Search Tree using Edge-Based Locking
Arunmoezhi Ramachandran and
Neeraj Mittal
(University of Texas at Dallas, USA)
% NOTE(review): source listed the impossible page range "309-308" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p309,
  author    = {Arunmoezhi Ramachandran and Neeraj Mittal},
  title     = {{CASTLE}: Fast Concurrent Internal Binary Search Tree using Edge-Based Locking},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {309},
  year      = {2015},
}
Section Based Program Analysis to Reduce Overhead of Detecting Unsynchronized Thread Communication
Madan Das,
Gabriel Southern, and
Jose Renau
(University of California at Santa Cruz, USA)
% NOTE(review): source listed the impossible page range "311-310" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p311,
  author    = {Madan Das and Gabriel Southern and Jose Renau},
  title     = {Section Based Program Analysis to Reduce Overhead of Detecting Unsynchronized Thread Communication},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {311},
  year      = {2015},
}
A Hierarchical Approach to Reducing Communication in Parallel Graph Algorithms
Harshvardhan,
Nancy M. Amato, and
Lawrence Rauchwerger
(Texas A&M University, USA)
% NOTE(review): source listed the impossible page range "313-312" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
% The first author is listed under a single name; it is braced so it is always treated as one indivisible surname.
@InProceedings{PPoPP15p313,
  author    = {{Harshvardhan} and Nancy M. Amato and Lawrence Rauchwerger},
  title     = {A Hierarchical Approach to Reducing Communication in Parallel Graph Algorithms},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {313},
  year      = {2015},
}
Tiles: A New Language Mechanism for Heterogeneous Parallelism
Yifeng Chen,
Xiang Cui, and
Hong Mei
(Peking University, China)
% NOTE(review): source listed the impossible page range "315-314" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p315,
  author    = {Yifeng Chen and Xiang Cui and Hong Mei},
  title     = {Tiles: A New Language Mechanism for Heterogeneous Parallelism},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {315},
  year      = {2015},
}
Are Web Applications Ready for Parallelism?
Cosmin Radoi,
Stephan Herhut,
Jaswanth Sreeram, and
Danny Dig
(University of Illinois at Urbana-Champaign, USA; Intel, USA; Oregon State University, USA)
% NOTE(review): source listed the impossible page range "317-316" and an empty doi; only the start page is kept -- end page and DOI still need to be looked up.
@InProceedings{PPoPP15p317,
  author    = {Cosmin Radoi and Stephan Herhut and Jaswanth Sreeram and Danny Dig},
  title     = {Are Web Applications Ready for Parallelism?},
  booktitle = {Proc.\ PPoPP},
  publisher = {ACM},
  pages     = {317},
  year      = {2015},
}
proc time: 0.78