Powered by
2019 IEEE/ACM International Symposium on Code Generation and Optimization (CGO), February 16–20, 2019,
Washington, DC, USA
Frontmatter
Keynote
Research Papers
Binary Optimization
BOLT: A Practical Binary Optimizer for Data Centers and Beyond
Maksim Panchenko,
Rafael Auler,
Bill Nell, and
Guilherme Ottoni
(Facebook, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 100-99, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p100,
  author    = {Maksim Panchenko and Rafael Auler and Bill Nell and Guilherme Ottoni},
  title     = {{BOLT}: A Practical Binary Optimizer for Data Centers and Beyond},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {100},
  year      = {2019},
}
Artifacts Available
Artifacts Reusable
Results Replicated
Bugs and Security
Smokestack: Thwarting DOP Attacks with Runtime Stack Layout Randomization
Misiker Tadesse Aga and
Todd Austin
(University of Michigan, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 134-133, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p134,
  author    = {Misiker Tadesse Aga and Todd Austin},
  title     = {Smokestack: Thwarting {DOP} Attacks with Runtime Stack Layout Randomization},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {134},
  year      = {2019},
}
CSOD: Context-Sensitive Overflow Detection
Hongyu Liu,
Sam Silvestro,
Xiaoyin Wang,
Lide Duan, and
Tongping Liu
(University of Texas at San Antonio, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 168-167, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p168,
  author    = {Hongyu Liu and Sam Silvestro and Xiaoyin Wang and Lide Duan and Tongping Liu},
  title     = {{CSOD}: Context-Sensitive Overflow Detection},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {168},
  year      = {2019},
}
Reasoning about the Node.js Event Loop using Async Graphs
Haiyang Sun,
Daniele Bonetta,
Filippo Schiavio, and
Walter Binder
(USI Lugano, Switzerland; Oracle Labs, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 185-184, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p185,
  author    = {Haiyang Sun and Daniele Bonetta and Filippo Schiavio and Walter Binder},
  title     = {Reasoning about the {Node.js} Event Loop using Async Graphs},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {185},
  year      = {2019},
}
Artifacts Available
Artifacts Functional
Results Replicated
GPUs and Tensors
Automatic Generation of Warp-Level Primitives and Atomic Instructions for Fast and Portable Parallel Reduction on GPUs
Simon Garcia De Gonzalo,
Sitao Huang,
Juan Gómez-Luna,
Simon Hammond,
Onur Mutlu, and
Wen-mei Hwu
(University of Illinois at Urbana-Champaign, USA; ETH Zurich, Switzerland; Sandia National Laboratories, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 202-201, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p202,
  author    = {Simon Garcia De Gonzalo and Sitao Huang and Juan G{\'o}mez-Luna and Simon Hammond and Onur Mutlu and Wen-mei Hwu},
  title     = {Automatic Generation of Warp-Level Primitives and Atomic Instructions for Fast and Portable Parallel Reduction on {GPUs}},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {202},
  year      = {2019},
}
A Code Generator for High-Performance Tensor Contractions on GPUs
Jinsung Kim,
Aravind Sukumaran-Rajam,
Vineeth Thumma,
Sriram Krishnamoorthy,
Ajay Panyala,
Louis-Noël Pouchet,
Atanas Rountev, and
P. Sadayappan
(Ohio State University, USA; Pacific Northwest National Laboratory, USA; Colorado State University, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 219-218, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p219,
  author    = {Jinsung Kim and Aravind Sukumaran-Rajam and Vineeth Thumma and Sriram Krishnamoorthy and Ajay Panyala and Louis-No{\"e}l Pouchet and Atanas Rountev and P. Sadayappan},
  title     = {A Code Generator for High-Performance Tensor Contractions on {GPUs}},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {219},
  year      = {2019},
}
Artifacts Available
Artifacts Functional
Results Replicated
Potpourri
Transforming Query Sequences for High-Throughput B+ Tree Processing on Many-Core Processors
Ruiqin Tian,
Junqiao Qiu,
Zhijia Zhao,
Xu Liu, and
Bin Ren
(College of William and Mary, USA; University of California at Riverside, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 236-235, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p236,
  author    = {Ruiqin Tian and Junqiao Qiu and Zhijia Zhao and Xu Liu and Bin Ren},
  title     = {Transforming Query Sequences for High-Throughput {B+} Tree Processing on Many-Core Processors},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {236},
  year      = {2019},
}
Artifacts Available
Artifacts Functional
Results Replicated
Quantifying and Reducing Execution Variance in STM via Model Driven Commit Optimization
Girish Mururu,
Ada Gavrilovska, and
Santosh Pande
(Georgia Institute of Technology, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 253-252, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p253,
  author    = {Girish Mururu and Ada Gavrilovska and Santosh Pande},
  title     = {Quantifying and Reducing Execution Variance in {STM} via Model Driven Commit Optimization},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {253},
  year      = {2019},
}
Artifacts Available
Artifacts Functional
Results Replicated
White-Box Program Tuning
Wen-Chuan Lee,
Yingqi Liu,
Peng Liu,
Shiqing Ma,
Hongjun Choi,
Xiangyu Zhang, and
Rajiv Gupta
(Purdue University, USA; University of California at Riverside, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 270-269, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p270,
  author    = {Wen-Chuan Lee and Yingqi Liu and Peng Liu and Shiqing Ma and Hongjun Choi and Xiangyu Zhang and Rajiv Gupta},
  title     = {White-Box Program Tuning},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {270},
  year      = {2019},
}
Generation of In-Bounds Inputs for Arrays in Memory-Unsafe Languages
Marcus Rodrigues,
Breno Guimarães, and
Fernando Magno Quintão Pereira
(Federal University of Minas Gerais, Brazil)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 287-286, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p287,
  author    = {Marcus Rodrigues and Breno Guimar{\~a}es and Fernando Magno Quint{\~a}o Pereira},
  title     = {Generation of In-Bounds Inputs for Arrays in Memory-Unsafe Languages},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {287},
  year      = {2019},
}
Code Generation
Function Merging by Sequence Alignment
Rodrigo C. O. Rocha,
Pavlos Petoumenos,
Zheng Wang,
Murray Cole, and
Hugh Leather
(University of Edinburgh, UK; Lancaster University, UK)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 304-303, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p304,
  author    = {Rodrigo C. O. Rocha and Pavlos Petoumenos and Zheng Wang and Murray Cole and Hugh Leather},
  title     = {Function Merging by Sequence Alignment},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {304},
  year      = {2019},
}
Artifacts Available
Artifacts Functional
Results Replicated
An Optimization-Driven Incremental Inline Substitution Algorithm for Just-in-Time Compilers
Aleksandar Prokopec,
Gilles Duboscq,
David Leopoldseder, and
Thomas Würthinger
(Oracle Labs, Switzerland; JKU Linz, Austria)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 321-320, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p321,
  author    = {Aleksandar Prokopec and Gilles Duboscq and David Leopoldseder and Thomas W{\"u}rthinger},
  title     = {An Optimization-Driven Incremental Inline Substitution Algorithm for Just-in-Time Compilers},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {321},
  year      = {2019},
}
Artifacts Available
Artifacts Functional
Results Replicated
Tensor Algebra Compilation with Workspaces
Fredrik Kjolstad,
Peter Ahrens,
Shoaib Kamil, and
Saman Amarasinghe
(Massachusetts Institute of Technology, USA; Adobe, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 338-337, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p338,
  author    = {Fredrik Kjolstad and Peter Ahrens and Shoaib Kamil and Saman Amarasinghe},
  title     = {Tensor Algebra Compilation with Workspaces},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {338},
  year      = {2019},
}
Kernel Optimization
Tiramisu: A Polyhedral Compiler for Expressing Fast and Portable Code
Riyadh Baghdadi,
Jessica Ray,
Malek Ben Romdhane,
Emanuele Del Sozzo,
Abdurrahman Akkas,
Yunming Zhang,
Patricia Suriana,
Shoaib Kamil, and
Saman Amarasinghe
(Massachusetts Institute of Technology, USA; Politecnico di Milano, Italy; Google, USA; Adobe, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 355-354, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p355,
  author    = {Riyadh Baghdadi and Jessica Ray and Malek Ben Romdhane and Emanuele Del Sozzo and Abdurrahman Akkas and Yunming Zhang and Patricia Suriana and Shoaib Kamil and Saman Amarasinghe},
  title     = {Tiramisu: A Polyhedral Compiler for Expressing Fast and Portable Code},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {355},
  year      = {2019},
}
Artifacts Available
Artifacts Reusable
Results Replicated
Super-Node SLP: Optimized Vectorization for Code Sequences Containing Operators and Their Inverse Elements
Vasileios Porpodas,
Rodrigo C. O. Rocha,
Evgueni Brevnov,
Luís F. W. Góes, and
Timothy Mattson
(Intel, USA; University of Edinburgh, UK; PUC-MG, Brazil)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 372-371, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p372,
  author    = {Vasileios Porpodas and Rodrigo C. O. Rocha and Evgueni Brevnov and Lu{\'\i}s F. W. G{\'o}es and Timothy Mattson},
  title     = {Super-Node {SLP}: Optimized Vectorization for Code Sequences Containing Operators and Their Inverse Elements},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {372},
  year      = {2019},
}
Locus: A System and a Language for Program Optimization
Thiago S. F. X. Teixeira,
Corinne Ancourt,
David Padua, and
William Gropp
(University of Illinois at Urbana-Champaign, USA; MINES ParisTech, France)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 389-388, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p389,
  author    = {Thiago S. F. X. Teixeira and Corinne Ancourt and David Padua and William Gropp},
  title     = {Locus: A System and a Language for Program Optimization},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {389},
  year      = {2019},
}
GPUs
Decoding CUDA Binary
Ari B. Hayes,
Fei Hua,
Jin Huang,
Yanhao Chen, and
Eddy Z. Zhang
(Rutgers University, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 406-405, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p406,
  author    = {Ari B. Hayes and Fei Hua and Jin Huang and Yanhao Chen and Eddy Z. Zhang},
  title     = {Decoding {CUDA} Binary},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {406},
  year      = {2019},
}
Artifacts Available
Artifacts Reusable
Results Replicated
From Loop Fusion to Kernel Fusion: A Domain-Specific Approach to Locality Optimization
Bo Qiao,
Oliver Reiche,
Frank Hannig, and
Jürgen Teich
(University of Erlangen-Nuremberg, Germany)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 423-422, so only the start page is kept.
@InProceedings{CGO19p423,
  author    = {Bo Qiao and Oliver Reiche and Frank Hannig and J{\"u}rgen Teich},
  title     = {From Loop Fusion to Kernel Fusion: A Domain-Specific Approach to Locality Optimization},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {423},
  doi       = {10.1109/CGO.2019.8661176},
  year      = {2019},
}
Publisher's Version
Published Artifact
Artifacts Available
Artifacts Reusable
Results Replicated
IGC: The Open Source Intel Graphics Compiler
Anupama Chandrasekhar,
Gang Chen,
Po-Yu Chen,
Wei-Yu Chen,
Junjie Gu,
Peng Guo,
Shruthi Hebbur Prasanna Kumar,
Guei-Yuan Lueh,
Pankaj Mistry,
Wei Pan,
Thomas Raoux, and
Konrad Trifunovic
(Intel, USA; Intel, Poland)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 440-439, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p440,
  author    = {Anupama Chandrasekhar and Gang Chen and Po-Yu Chen and Wei-Yu Chen and Junjie Gu and Peng Guo and Shruthi Hebbur Prasanna Kumar and Guei-Yuan Lueh and Pankaj Mistry and Wei Pan and Thomas Raoux and Konrad Trifunovic},
  title     = {{IGC}: The Open Source {Intel} Graphics Compiler},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {440},
  year      = {2019},
}
Student Research Competition
Undergraduate
Graduate
A Shared BTB Design for Multicore Systems
Moumita Das,
Ansuman Banerjee, and
Bhaskar Sardar
(Jadavpur University, India; Indian Statistical Institute, India)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 459-458, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p459,
  author    = {Moumita Das and Ansuman Banerjee and Bhaskar Sardar},
  title     = {A Shared {BTB} Design for Multicore Systems},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {459},
  year      = {2019},
}
Optimizing RNA-RNA Interaction Computations
Swetha Varadarajan
(Colorado State University, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 461-460, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p461,
  author    = {Swetha Varadarajan},
  title     = {Optimizing {RNA-RNA} Interaction Computations},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {461},
  year      = {2019},
}
Code Generation from Formal Models for Automatic RTOS Portability
Renata Martins Gomes and
Marcel Baunach
(Graz University of Technology, Austria)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 463-462, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p463,
  author    = {Renata Martins Gomes and Marcel Baunach},
  title     = {Code Generation from Formal Models for Automatic {RTOS} Portability},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {463},
  year      = {2019},
}
Understanding RDMA Behavior in NUMA Systems
Jacob Nelson and
Roberto Palmieri
(Lehigh University, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 465-464, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p465,
  author    = {Jacob Nelson and Roberto Palmieri},
  title     = {Understanding {RDMA} Behavior in {NUMA} Systems},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {465},
  year      = {2019},
}
Accelerating GPU Computing at Runtime with Binary Optimization
Guangli Li,
Lei Liu, and
Xiaobing Feng
(Institute of Computing Technology at Chinese Academy of Sciences, China; University of Chinese Academy of Sciences, China)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 469-468, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p469,
  author    = {Guangli Li and Lei Liu and Xiaobing Feng},
  title     = {Accelerating {GPU} Computing at Runtime with Binary Optimization},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {469},
  year      = {2019},
}
Extending LLVM for Lightweight SPMD Vectorization: Using SIMD and Vector Instructions Easily from Any Language
Robin Kruppe,
Julian Oppermann,
Lukas Sommer, and
Andreas Koch
(TU Darmstadt, Germany)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 471-470, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p471,
  author    = {Robin Kruppe and Julian Oppermann and Lukas Sommer and Andreas Koch},
  title     = {Extending {LLVM} for Lightweight {SPMD} Vectorization: Using {SIMD} and Vector Instructions Easily from Any Language},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {471},
  year      = {2019},
}
Multi-target Compiler for the Deployment of Machine Learning Models
Oscar Castro-Lopez and
Ines F. Vega-Lopez
(Autonomous University of Sinaloa, Mexico)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 473-472, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p473,
  author    = {Oscar Castro-Lopez and Ines F. Vega-Lopez},
  title     = {Multi-target Compiler for the Deployment of Machine Learning Models},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {473},
  year      = {2019},
}
Kernel Fusion/Decomposition for Automatic GPU-Offloading
Alok Mishra,
Martin Kong, and
Barbara Chapman
(Stony Brook University, USA; Brookhaven National Laboratory, USA)
% NOTE(review): end page unknown -- the upstream listing gave the inverted range 477-476, so only the start page is kept; no DOI was listed.
@InProceedings{CGO19p477,
  author    = {Alok Mishra and Martin Kong and Barbara Chapman},
  title     = {Kernel Fusion/Decomposition for Automatic {GPU}-Offloading},
  booktitle = {Proc.\ CGO},
  publisher = {IEEE},
  pages     = {477},
  year      = {2019},
}
proc time: 0.06