Powered by
2021 IEEE/ACM International Symposium on Code Generation and Optimization (CGO), February 27 – March 3, 2021,
Virtual, Republic of Korea
Frontmatter
Keynote
Compiler Infrastructure
(Chair: Michael Kruse, Argonne National Laboratory, USA)
MLIR: Scaling Compiler Infrastructure for Domain Specific Computation
Chris Lattner,
Mehdi Amini,
Uday Bondhugula,
Albert Cohen,
Andy Davis,
Jacques Pienaar,
River Riddle,
Tatiana Shpeisman,
Nicolas Vasilache, and
Oleksandr Zinenko
(Google, USA; Indian Institute of Science, India; Google, France)
@InProceedings{CGO21p18,
author = {Chris Lattner and Mehdi Amini and Uday Bondhugula and Albert Cohen and Andy Davis and Jacques Pienaar and River Riddle and Tatiana Shpeisman and Nicolas Vasilache and Oleksandr Zinenko},
title = {{MLIR}: Scaling Compiler Infrastructure for Domain Specific Computation},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {18},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Reusable
Progressive Raising in Multi-level IR
Lorenzo Chelini,
Andi Drebes,
Oleksandr Zinenko,
Albert Cohen,
Nicolas Vasilache,
Tobias Grosser, and
Henk Corporaal
(Eindhoven University of Technology, Netherlands; Inria, France; ENS Paris, France; Google, France; Google, Switzerland; University of Edinburgh, UK)
@InProceedings{CGO21p35,
author = {Lorenzo Chelini and Andi Drebes and Oleksandr Zinenko and Albert Cohen and Nicolas Vasilache and Tobias Grosser and Henk Corporaal},
title = {Progressive Raising in Multi-level {IR}},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {35},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Functional
Results Reproduced
Towards a Domain-Extensible Compiler: Optimizing an Image Processing Pipeline on Mobile CPUs
Thomas Koehler and
Michel Steuwer
(University of Glasgow, UK; University of Edinburgh, UK)
@InProceedings{CGO21p52,
author = {Thomas Koehler and Michel Steuwer},
title = {Towards a Domain-Extensible Compiler: Optimizing an Image Processing Pipeline on Mobile {CPUs}},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {52},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Reusable
Results Reproduced
Dealing with Precision
(Chair: Uma Srinivasan, Twitter)
An Interval Compiler for Sound Floating-Point Computations
Joao Rivera,
Franz Franchetti, and
Markus Püschel
(ETH Zurich, Switzerland; Carnegie Mellon University, USA)
@InProceedings{CGO21p86,
author = {Joao Rivera and Franz Franchetti and Markus P{\"u}schel},
title = {An Interval Compiler for Sound Floating-Point Computations},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {86},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Reusable
Results Reproduced
Seamless Compiler Integration of Variable Precision Floating-Point Arithmetic
Tiago Trevisan Jost,
Yves Durand,
Christian Fabre,
Albert Cohen, and
Frédéric Pétrot
(Université Grenoble Alpes, France; CEA LIST, France; Google, France; CNRS, France; Grenoble INP, France; TIMA, France)
@InProceedings{CGO21p103,
author = {Tiago Trevisan Jost and Yves Durand and Christian Fabre and Albert Cohen and Fr{\'e}d{\'e}ric P{\'e}trot},
title = {Seamless Compiler Integration of Variable Precision Floating-Point Arithmetic},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {103},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Artifacts Functional
Results Reproduced
UNIT: Unifying Tensorized Instruction Compilation
Jian Weng,
Animesh Jain,
Jie Wang,
Leyuan Wang,
Yida Wang, and
Tony Nowatzki
(University of California at Los Angeles, USA; Amazon, USA)
@InProceedings{CGO21p120,
author = {Jian Weng and Animesh Jain and Jie Wang and Leyuan Wang and Yida Wang and Tony Nowatzki},
title = {{UNIT}: Unifying Tensorized Instruction Compilation},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {120},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Functional
Unleashing the Low-Precision Computation Potential of Tensor Cores on GPUs
Guangli Li,
Jingling Xue,
Lei Liu,
Xueying Wang,
Xiu Ma,
Xiao Dong,
Jiansong Li, and
Xiaobing Feng
(Institute of Computing Technology at Chinese Academy of Sciences, China; University of Chinese Academy of Sciences, China; UNSW, Australia; Jilin University, China)
@InProceedings{CGO21p137,
author = {Guangli Li and Jingling Xue and Lei Liu and Xueying Wang and Xiu Ma and Xiao Dong and Jiansong Li and Xiaobing Feng},
title = {Unleashing the Low-Precision Computation Potential of Tensor Cores on {GPUs}},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {137},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Binary Profiling, Tracing, Sampling
(Chair: Wei Wang, University of Texas at San Antonio, USA)
Cinnamon: A Domain-Specific Language for Binary Profiling and Monitoring
Mahwish Arif,
Ruoyu Zhou,
Hsi-Ming Ho, and
Timothy M. Jones
(University of Cambridge, UK; University of Sussex, UK)
@InProceedings{CGO21p154,
author = {Mahwish Arif and Ruoyu Zhou and Hsi-Ming Ho and Timothy M. Jones},
title = {Cinnamon: A Domain-Specific Language for Binary Profiling and Monitoring},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {154},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
GPA: A GPU Performance Advisor Based on Instruction Sampling
Keren Zhou,
Xiaozhu Meng,
Ryuichi Sai, and
John Mellor-Crummey
(Rice University, USA)
@InProceedings{CGO21p171,
author = {Keren Zhou and Xiaozhu Meng and Ryuichi Sai and John Mellor-Crummey},
title = {{GPA}: A {GPU} Performance Advisor Based on Instruction Sampling},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {171},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Reusable
Results Reproduced
ELFies: Executable Region Checkpoints for Performance Analysis and Simulation
Harish Patil,
Alexander Isaev,
Wim Heirman,
Alen Sabu,
Ali Hajiabadi, and
Trevor E. Carlson
(Intel Corporation, USA; Intel Corporation, Belgium; National University of Singapore, Singapore)
@InProceedings{CGO21p188,
author = {Harish Patil and Alexander Isaev and Wim Heirman and Alen Sabu and Ali Hajiabadi and Trevor E. Carlson},
title = {{ELFies}: Executable Region Checkpoints for Performance Analysis and Simulation},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {188},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Artifacts Functional
Results Reproduced
Vulkan Vision: Ray Tracing Workload Characterization using Automatic Graphics Instrumentation
David Pankratz,
Tyler Nowicki,
Ahmed Eltantawy, and
José Nelson Amaral
(University of Alberta, Canada; Huawei Technologies, Canada)
@InProceedings{CGO21p205,
author = {David Pankratz and Tyler Nowicki and Ahmed Eltantawy and Jos{\'e} Nelson Amaral},
title = {{Vulkan Vision}: Ray Tracing Workload Characterization using Automatic Graphics Instrumentation},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {205},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Artifacts Functional
Results Reproduced
Parallelism - Optimizing, Modeling, Testing
(Chair: Michael O'Boyle, University of Edinburgh, UK)
Loop Parallelization using Dynamic Commutativity Analysis
Christos Vasiladiotis,
Roberto Castañeda Lozano,
Murray Cole, and
Björn Franke
(University of Edinburgh, UK)
@InProceedings{CGO21p222,
author = {Christos Vasiladiotis and Casta{\~n}eda Lozano, Roberto and Murray Cole and Bj{\"o}rn Franke},
title = {Loop Parallelization using Dynamic Commutativity Analysis},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {222},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known). Second author is entered in comma form on the assumption that the surname is the compound Castaneda Lozano (TODO: confirm)},
}
Fine-Grained Pipeline Parallelization for Network Function Programs
Seungbin Song,
Heelim Choi, and
Hanjun Kim
(Yonsei University, South Korea)
@InProceedings{CGO21p239,
author = {Seungbin Song and Heelim Choi and Hanjun Kim},
title = {Fine-Grained Pipeline Parallelization for Network Function Programs},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {239},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
YaskSite: Stencil Optimization Techniques Applied to Explicit ODE Methods on Modern Architectures
Christie L. Alappat,
Johannes Seiferth,
Georg Hager,
Matthias Korch,
Thomas Rauber, and
Gerhard Wellein
(University of Erlangen-Nuremberg, Germany; University of Bayreuth, Germany)
@InProceedings{CGO21p256,
author = {Christie L. Alappat and Johannes Seiferth and Georg Hager and Matthias Korch and Thomas Rauber and Gerhard Wellein},
title = {{YaskSite}: Stencil Optimization Techniques Applied to Explicit {ODE} Methods on Modern Architectures},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {256},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Functional
Results Reproduced
GoBench: A Benchmark Suite of Real-World Go Concurrency Bugs
Ting Yuan,
Guangwei Li,
Jie Lu,
Chen Liu,
Lian Li, and
Jingling Xue
(Institute of Computing Technology at Chinese Academy of Sciences, China; University of Chinese Academy of Sciences, China; UNSW, Australia)
@InProceedings{CGO21p273,
author = {Ting Yuan and Guangwei Li and Jie Lu and Chen Liu and Lian Li and Jingling Xue},
title = {{GoBench}: A Benchmark Suite of Real-World {Go} Concurrency Bugs},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {273},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Functional
Results Reproduced
Memory Optimization and Safeness
(Chair: Eunjung Park, Los Alamos National Laboratory, USA)
Variable-Sized Blocks for Locality-Aware SpMV
Naveen Namashivayam,
Sanyam Mehta, and
Pen-Chung Yew
(HPE, USA; University of Minnesota at Twin Cities, USA)
@InProceedings{CGO21p307,
author = {Naveen Namashivayam and Sanyam Mehta and Pen-Chung Yew},
title = {Variable-Sized Blocks for Locality-Aware {SpMV}},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {307},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Object Versioning for Flow-Sensitive Pointer Analysis
Mohamad Barbar,
Yulei Sui, and
Shiping Chen
(University of Technology Sydney, Australia; CSIRO's Data61, Australia)
@InProceedings{CGO21p324,
author = {Mohamad Barbar and Yulei Sui and Shiping Chen},
title = {Object Versioning for Flow-Sensitive Pointer Analysis},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {324},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Functional
Results Reproduced
Scaling Up the IFDS Algorithm with Efficient Disk-Assisted Computing
Haofeng Li,
Haining Meng,
Hengjie Zheng,
Liqing Cao,
Jie Lu,
Lian Li, and
Lin Gao
(Institute of Computing Technology at Chinese Academy of Sciences, China; University of Chinese Academy of Sciences, China; TianqiSoft, China)
@InProceedings{CGO21p341,
author = {Haofeng Li and Haining Meng and Hengjie Zheng and Liqing Cao and Jie Lu and Lian Li and Lin Gao},
title = {Scaling Up the {IFDS} Algorithm with Efficient Disk-Assisted Computing},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {341},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Functional
Compiling Graph Algorithms, Compiling for GPUs
(Chair: Maria Garzaran, Intel Corporation and University of Illinois at Urbana-Champaign, USA)
Compiling Graph Applications for GPUs with GraphIt
Ajay Brahmakshatriya,
Yunming Zhang,
Changwan Hong,
Shoaib Kamil,
Julian Shun, and
Saman Amarasinghe
(Massachusetts Institute of Technology, USA; Adobe, USA)
@InProceedings{CGO21p358,
author = {Ajay Brahmakshatriya and Yunming Zhang and Changwan Hong and Shoaib Kamil and Julian Shun and Saman Amarasinghe},
title = {Compiling Graph Applications for {GPUs} with {GraphIt}},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {358},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Reusable
Results Reproduced
r3d3: Optimized Query Compilation on GPUs
Alexander Krolik,
Clark Verbrugge, and
Laurie Hendren
(McGill University, Canada)
@InProceedings{CGO21p392,
author = {Alexander Krolik and Clark Verbrugge and Laurie Hendren},
title = {{r3d3}: Optimized Query Compilation on {GPUs}},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {392},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Functional
Results Reproduced
C-for-Metal: High Performance SIMD Programming on Intel GPUs
Guei-Yuan Lueh,
Kaiyu Chen,
Gang Chen,
Joel Fuentes,
Wei-Yu Chen,
Fangwen Fu,
Hong Jiang,
Hongzheng Li, and
Daniel Rhee
(Intel Corporation, USA)
@InProceedings{CGO21p409,
author = {Guei-Yuan Lueh and Kaiyu Chen and Gang Chen and Joel Fuentes and Wei-Yu Chen and Fangwen Fu and Hong Jiang and Hongzheng Li and Daniel Rhee},
title = {{C-for-Metal}: High Performance {SIMD} Programming on {Intel} {GPUs}},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {409},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Functional
Results Reproduced
Compiling for Spatial, Quantum, and Embedded Devices
(Chair: Wei-Fen Lin, National Cheng Kung University, Taiwan)
Relaxed Peephole Optimization: A Novel Compiler Optimization for Quantum Circuits
Ji Liu,
Luciano Bello, and
Huiyang Zhou
(North Carolina State University, USA; IBM Research, USA)
@InProceedings{CGO21p426,
author = {Ji Liu and Luciano Bello and Huiyang Zhou},
title = {Relaxed Peephole Optimization: A Novel Compiler Optimization for Quantum Circuits},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {426},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Reusable
Results Reproduced
StencilFlow: Mapping Large Stencil Programs to Distributed Spatial Computing Systems
Johannes de Fine Licht,
Andreas Kuster,
Tiziano De Matteis,
Tal Ben-Nun,
Dominic Hofer, and
Torsten Hoefler
(ETH Zurich, Switzerland; MeteoSwiss, Switzerland)
@InProceedings{CGO21p443,
author = {Johannes de Fine Licht and Andreas Kuster and De Matteis, Tiziano and Tal Ben-Nun and Dominic Hofer and Torsten Hoefler},
title = {{StencilFlow}: Mapping Large Stencil Programs to Distributed Spatial Computing Systems},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {443},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known). Third author is entered in comma form because a capitalised particle would otherwise be parsed as a given name; assumes the surname is De Matteis (TODO: confirm)},
}
Published Artifact
Artifacts Available
Artifacts Reusable
Results Reproduced
Thread-Aware Area-Efficient High-Level Synthesis Compiler for Embedded Devices
Changsu Kim,
Shinnung Jeong,
Sungjun Cho,
Yongwoo Lee,
William Song,
Youngsok Kim, and
Hanjun Kim
(POSTECH, South Korea; Yonsei University, South Korea)
@InProceedings{CGO21p460,
author = {Changsu Kim and Shinnung Jeong and Sungjun Cho and Yongwoo Lee and William Song and Youngsok Kim and Hanjun Kim},
title = {Thread-Aware Area-Efficient High-Level Synthesis Compiler for Embedded Devices},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {460},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
JIT and Binary Translation; Optimizing for Code-Size
(Chair: Probir Roy, University of Michigan at Dearborn, USA)
Enhancing Atomic Instruction Emulation for Cross-ISA Dynamic Binary Translation
Ziyi Zhao,
Zhang Jiang,
Ying Chen,
Xiaoli Gong,
Wenwen Wang, and
Pen-Chung Yew
(Nankai University, China; University of Georgia, USA; University of Minnesota at Twin Cities, USA)
@InProceedings{CGO21p494,
author = {Ziyi Zhao and Zhang Jiang and Ying Chen and Xiaoli Gong and Wenwen Wang and Pen-Chung Yew},
title = {Enhancing Atomic Instruction Emulation for {Cross-ISA} Dynamic Binary Translation},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {494},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Reusable
Results Reproduced
An Experience with Code-Size Optimization for Production iOS Mobile Applications
Milind Chabbi,
Jin Lin, and
Raj Barik
(Uber Technologies, USA)
@InProceedings{CGO21p511,
author = {Milind Chabbi and Jin Lin and Raj Barik},
title = {An Experience with Code-Size Optimization for Production {iOS} Mobile Applications},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {511},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
Published Artifact
Artifacts Available
Artifacts Reusable
AnghaBench: A Suite with One Million Compilable C Benchmarks for Code-Size Reduction
Anderson Faustino da Silva,
Bruno Conde Kind,
José Wesley de Souza Magalhães,
Jerônimo Nunes Rocha,
Breno Campos Ferreira Guimarães, and
Fernando Magno Quintão Pereira
(State University of Maringá, Brazil; Federal University of Minas Gerais, Brazil)
@InProceedings{CGO21p528,
author = {Anderson Faustino da Silva and Bruno Conde Kind and Jos{\'e} Wesley de Souza Magalh{\~a}es and Jer{\^o}nimo Nunes Rocha and Breno Campos Ferreira Guimar{\~a}es and Fernando Magno Quint{\~a}o Pereira},
title = {{AnghaBench}: A Suite with One Million Compilable {C} Benchmarks for Code-Size Reduction},
booktitle = {Proc.\ CGO},
publisher = {IEEE},
pages = {528},
year = {2021},
internal-note = {Start page only; the end page and DOI were not available in the source listing (TODO: add once known)},
}
proc time: 0.04