|
% Conference paper in Advances in Neural Information Processing Systems,
% volume 33 (2020), by Moses and Churavy.
% The first author's middle initial is included so the name matches the
% "Moses, William S." spelling used by the other entries in this file.
% Editors are given in "Last, First" form so name parsing is unambiguous.
@inproceedings{NEURIPS2020_9332c513,
  author    = {Moses, William S. and Churavy, Valentin},
  title     = {Instead of Rewriting Foreign Code for Machine Learning, Automatically Synthesize Fast Gradients},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Larochelle, H. and Ranzato, M. and Hadsell, R. and Balcan, M. F. and Lin, H.},
  volume    = {33},
  pages     = {12472--12485},
  publisher = {Curran Associates, Inc.},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper/2020/file/9332c513ef44b682e9347822c2e457ac-Paper.pdf},
}
% SC '21 conference paper (article no. 61, 16 pages).
% "GPU" and "Enzyme" are brace-protected in the title so styles that apply
% sentence casing do not lowercase them.
% The umlaut in "Hueckelheim" is written as a brace group that starts with
% the accent command, the form BibTeX treats as a single letter when
% sorting and building labels.
% "address" is the publisher's city; "location" appears to record the
% conference venue (St. Louis) - confirm before mapping to other fields.
@inproceedings{10.1145/3458817.3476165,
  author    = {Moses, William S. and Churavy, Valentin and Paehler, Ludger and H{\"u}ckelheim, Jan and Narayanan, Sri Hari Krishna and Schanen, Michel and Doerfert, Johannes},
  title     = {Reverse-Mode Automatic Differentiation and Optimization of {GPU} Kernels via {Enzyme}},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis},
  series    = {SC '21},
  location  = {St. Louis, Missouri},
  articleno = {61},
  numpages  = {16},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  year      = {2021},
  isbn      = {9781450384421},
  doi       = {10.1145/3458817.3476165},
  url       = {https://doi.org/10.1145/3458817.3476165},
  keywords  = {CUDA, LLVM, ROCm, HPC, AD, GPU, automatic differentiation},
}
% SC '22 conference paper (article no. 60, 18 pages).
% The umlaut in "Hueckelheim" is written as a brace group that starts with
% the accent command, the form BibTeX treats as a single letter when
% sorting and building labels.
% The proceedings title uses "Conference for ...", matching the wording of
% the SC '21 entry in this file so the venue is named one way throughout.
@inproceedings{10.5555/3571885.3571964,
  author    = {Moses, William S. and Narayanan, Sri Hari Krishna and Paehler, Ludger and Churavy, Valentin and Schanen, Michel and H{\"u}ckelheim, Jan and Doerfert, Johannes and Hovland, Paul},
  title     = {Scalable Automatic Differentiation of Multiple Parallel Paradigms through Compiler Augmentation},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis},
  series    = {SC '22},
  location  = {Dallas, Texas},
  articleno = {60},
  numpages  = {18},
  publisher = {IEEE Press},
  year      = {2022},
  isbn      = {9784665454445},
  keywords  = {automatic differentiation, tasks, OpenMP, compiler, Julia, parallel, Enzyme, C++, RAJA, hybrid parallelization, MPI, distributed, LLVM},
}
0 commit comments