Copyrights to the following papers are held by the publishers. The attached
files are preprints. It is understood that all persons copying this
information will adhere to the terms and constraints invoked by each author's
copyright. These works may not be reposted without the explicit permission of
the copyright holder.
Journal
Safe Overclocking for CNN Accelerators through Algorithm-Level Error Detection, Thibaut Marty, Tomofumi Yuki, and Steven Derrien, IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems, 2020, (link), (BibTEX).
@article{marty2020safe,
  author  = {Thibaut Marty and Tomofumi Yuki and Steven Derrien},
  title   = {Safe Overclocking for {CNN} Accelerators through Algorithm-Level Error Detection},
  journal = {IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems},
  year    = {2020},
  pages   = {1--1},
  doi     = {10.1109/TCAD.2020.2981056}
}
Conference/Workshop
Sparse Computation Data Dependence Simplification for Efficient Compiler-generated Inspectors, Mahdi Soltan Mohammadi, Tomofumi Yuki, Kazem Cheshmi, Eddie C. Davis, Mary Hall, Maryam Mehri Dehnavi, Payal Nandy, Catherine Olschanowsky, Anand Venkat, and Michelle Mills Strout, 40th ACM SIGPLAN Conference on Programming Language Design and Implementation, 2019, (pdf), (BibTEX).
@inproceedings{mohammadi2019sparse,
  title     = {Sparse Computation Data Dependence Simplification for Efficient Compiler-generated Inspectors},
  author    = {Mohammadi, Mahdi Soltan and Yuki, Tomofumi and Cheshmi, Kazem and Davis, Eddie C. and Hall, Mary and Dehnavi, Maryam Mehri and Nandy, Payal and Olschanowsky, Catherine and Venkat, Anand and Strout, Michelle Mills},
  booktitle = {Proceedings of the 40th ACM SIGPLAN Conference on Programming Language Design and Implementation},
  series    = {PLDI '19},
  pages     = {594--609},
  numpages  = {16},
  month     = jun,
  year      = {2019},
  doi       = {10.1145/3314221.3314646}
}
The Limit of Polynomials, Tomofumi Yuki, 9th International Workshop on Polyhedral Compilation Techniques, 2019, (pdf)(slides-pptx), (BibTEX).
@inproceedings{yuki2019limit,
  title     = {The Limit of Polynomials},
  author    = {Yuki, Tomofumi},
  booktitle = {Proceedings of the 9th International Workshop on Polyhedral Compilation Techniques},
  series    = {IMPACT '19},
  month     = jan,
  year      = {2019}
}
Enabling Overclocking with HLS Tools through Algorithm-Level Error Detection, Thibaut Marty, Tomofumi Yuki, and Steven Derrien, 2018 International Conference on Field-Programmable Technology (to appear), 2018, (pdf), (BibTEX).
@inproceedings{marty2018enabling,
  title     = {Enabling Overclocking with {HLS} Tools through Algorithm-Level Error Detection},
  author    = {Thibaut Marty and Tomofumi Yuki and Steven Derrien},
  booktitle = {Proceedings of the 2018 International Conference on Field-Programmable Technology},
  series    = {ICFPT '18},
  location  = {Naha, Japan},
  month     = dec,
  year      = {2018},
  note      = {To appear}
}
Extending Index-Array Properties for Data Dependence Analysis, Mahdi Soltan Mohammadi, Kazem Cheshmi, Maryam Mehri Dehnavi, Anand Venkat, Tomofumi Yuki, and Michelle Mills Strout, 31st International Workshop on Languages and Compilers for Parallel Computing, 2018, (pdf), (BibTEX).
@inproceedings{mohammadi2018extending,
  title     = {Extending Index-Array Properties for Data Dependence Analysis},
  author    = {Mahdi Soltan Mohammadi and Kazem Cheshmi and Maryam Mehri Dehnavi and Anand Venkat and Tomofumi Yuki and Michelle Mills Strout},
  booktitle = {Proceedings of the 31st International Workshop on Languages and Compilers for Parallel Computing},
  series    = {LCPC '18},
  month     = oct,
  year      = {2018}
}
One Size Does Not Fit All: Implementation Trade-offs for Iterative Stencil Computations on FPGAs, Gaël Deest, Tomofumi Yuki, Sanjay Rajopadhye, and Steven Derrien, 27th International Conference on Field-Programmable Logic and Applications, 2017, (pdf), (BibTEX).
@inproceedings{deest2017onesize,
  title     = {One Size Does Not Fit All: Implementation Trade-offs for Iterative Stencil Computations on {FPGAs}},
  author    = {Ga{\"e}l Deest and Tomofumi Yuki and Sanjay Rajopadhye and Steven Derrien},
  booktitle = {Proceedings of the 27th International Conference on Field-Programmable Logic and Applications},
  series    = {FPL '17},
  location  = {Ghent, Belgium},
  month     = sep,
  year      = {2017}
}
EURECA compilation: Automatic optimisation of cycle-reconfigurable circuits, Xinyu Niu, Nicholas Ng, Tomofumi Yuki, Shaojun Wang, Nobuko Yoshida, and Wayne Luk, 26th International Conference on Field Programmable Logic and Applications, 2016, (pdf), (BibTEX).
@inproceedings{niu2016eureca,
  author    = {Xinyu Niu and Nicholas Ng and Tomofumi Yuki and Shaojun Wang and Nobuko Yoshida and Wayne Luk},
  title     = {{EURECA} compilation: Automatic optimisation of cycle-reconfigurable circuits},
  booktitle = {Proceedings of the 26th International Conference on Field Programmable Logic and Applications},
  series    = {FPL '16},
  pages     = {1--4},
  month     = aug,
  year      = {2016},
  doi       = {10.1109/FPL.2016.7577359}
}
Extended Lattice-based Memory Allocation, Alain Darte, Alexandre Isoard, and Tomofumi Yuki, 25th International Conference on Compiler Construction, 2016, (pdf)(slides), (BibTEX).
@inproceedings{darte2016extended,
  title     = {Extended Lattice-based Memory Allocation},
  author    = {Darte, Alain and Isoard, Alexandre and Yuki, Tomofumi},
  booktitle = {Proceedings of the 25th International Conference on Compiler Construction},
  series    = {CC '16},
  location  = {Barcelona, Spain},
  pages     = {218--228},
  numpages  = {11},
  year      = 2016,
  doi       = {10.1145/2892208.2892213}
}
Liveness Analysis in Explicitly-Parallel Programs, Alain Darte, Alexandre Isoard, and Tomofumi Yuki, 6th International Workshop on Polyhedral Compilation Techniques, 2016, (pdf)(slides),
Towards Scalable and Efficient FPGA Stencil Accelerators, Gaël Deest, Nicolas Estibals, Tomofumi Yuki, Steven Derrien, and Sanjay Rajopadhye, 6th International Workshop on Polyhedral Compilation Techniques, 2016, (pdf)(slides),
@inproceedings{yuki2015revisiting,
  title     = {Revisiting Loop Transformations with {X10} Clocks},
  author    = {Tomofumi Yuki},
  booktitle = {Proceedings of the ACM SIGPLAN Workshop on {X10}},
  series    = {X10'15},
  location  = {Portland, OR, USA},
  pages     = {1--6},
  numpages  = {6},
  year      = 2015,
  doi       = {10.1145/2771774.2771778},
}
Toward Scalable Source Level Accuracy Analysis for Floating-point to Fixed-point Conversion, Gaël Deest, Tomofumi Yuki, Olivier Sentieys, and Steven Derrien, 2014 International Conference on Computer-Aided Design, 2014, (pdf), (BibTEX).
@inproceedings{deest2014derivation,
  title     = {Toward Scalable Source Level Accuracy Analysis for Floating-point to Fixed-point Conversion},
  author    = {Ga{\"e}l Deest and Tomofumi Yuki and Olivier Sentieys and Steven Derrien},
  booktitle = {Proceedings of the 2014 International Conference on Computer-Aided Design},
  series    = {ICCAD '14},
  location  = {San Jose, CA},
  pages     = {726--733},
  month     = nov,
  year      = {2014}
}
Understanding PolyBench/C 3.2 Kernels, Tomofumi Yuki, 4th International Workshop on Polyhedral Compilation Techniques, 2014, (pdf)(slides), (BibTEX).
@inproceedings{yuki2014understanding,
  title     = {Understanding {PolyBench/C} 3.2 Kernels},
  author    = {Yuki, Tomofumi},
  booktitle = {Proceedings of the 4th International Workshop on Polyhedral Compilation Techniques},
  series    = {IMPACT '14},
  month     = jan,
  year      = {2014}
}
Derivation of Efficient FSM from Loop Nests, Tomofumi Yuki, Antoine Morvan, and Steven Derrien, 2013 International Conference on Field-Programmable Technology, 2013, (pdf)(slides)(slides-pptx), (BibTEX).
@inproceedings{yuki2013derivation,
  author    = {Tomofumi Yuki and Antoine Morvan and Steven Derrien},
  title     = {Derivation of Efficient {FSM} from Loop Nests},
  booktitle = {Proceedings of the 2013 International Conference on Field-Programmable Technology},
  series    = {ICFPT '13},
  location  = {Kyoto, Japan},
  pages     = {286--293},
  month     = dec,
  year      = 2013,
  doi       = {10.1109/FPT.2013.6718367},
}
Folklore Confirmed: Compiling for Speed = Compiling for Energy, Tomofumi Yuki and Sanjay Rajopadhye, 26th International Workshop on Languages and Compilers for Parallel Computing, 2013, (pdf)(slides)(slides-pptx), (BibTEX).
@inproceedings{yuki2013folklore,
  author    = {Tomofumi Yuki and Sanjay Rajopadhye},
  title     = {Folklore Confirmed: Compiling for Speed = Compiling for Energy},
  booktitle = {Proceedings of the 26th International Workshop on Languages and Compilers for Parallel Computing},
  series    = {LCPC '13},
  month     = sep,
  year      = 2013,
}
Coarse-Grain Optimization and Code Generation for Embedded Multicore Systems, Goulas, G. and Valouxis, C. and Alefragis, P. and Voros, N.S. and Oey, O. and Stripf, T. and Bruckschloegl, T. and Becker, J. and Gogos, C. and El Moussawi, A. and Naullet, M. and Yuki, T., Proceedings of the 2013 Euromicro Conference on Digital System Design, 2013, (link), (BibTEX).
@inproceedings{alma2013coarse,
  author    = {Goulas, G. and Valouxis, C. and Alefragis, P. and Voros, N. S. and Oey, O. and Stripf, T. and Bruckschloegl, T. and Becker, J. and Gogos, C. and El Moussawi, A. and Naullet, M. and Yuki, T.},
  title     = {Coarse-Grain Optimization and Code Generation for Embedded Multicore Systems},
  booktitle = {Proceedings of the 2013 Euromicro Conference on Digital System Design},
  pages     = {379--386},
  month     = sep,
  year      = {2013},
  doi       = {10.1109/DSD.2013.48}
}
GeCoS: A Framework for Prototyping Custom Hardware Design Flows, Antoine Floc'h, Tomofumi Yuki, Ali El-Moussawi, Antoine Morvan, Kevin Martin, Maxime Naullet,
Mythri Alle, Ludovic L'Hours, Nicolas Simon, Steven Derrien, François Charot, Christophe Wolinski, and Olivier Sentieys, 13th IEEE International Working Conference on Source Code Analysis and Manipulation, 2013, (pdf), (BibTEX).
@inproceedings{floch2013gecos,
  author    = {Antoine Floc'h and Tomofumi Yuki and Ali El-Moussawi and Antoine Morvan and
               Kevin Martin and Maxime Naullet and Mythri Alle and Ludovic L'Hours and
               Nicolas Simon and Steven Derrien and Fran\c{c}ois Charot and
               Christophe Wolinski and Olivier Sentieys},
  title     = {{GeCoS}: A Framework for Prototyping Custom Hardware Design Flows},
  booktitle = {Proceedings of the 13th IEEE International Working Conference on Source Code Analysis and Manipulation},
  series    = {SCAM'13},
  location  = {Eindhoven, Netherlands},
  pages     = {100--105},
  month     = sep,
  year      = 2013,
  doi       = {10.1109/SCAM.2013.6648190},
}
Determinacy Analysis of Polyhedral X10 Programs, Alain Ketterlin, Eric Violard, Paul Feautrier, Tomofumi Yuki, Sanjay Rajopadhye, and Vijay Saraswat, 17th Workshop on Compilers for Parallel Computing, 2013, (BibTEX).
@inproceedings{ketterlin2013determinacy,
  title     = {Determinacy Analysis of Polyhedral {X10} Programs},
  author    = {Alain Ketterlin and Eric Violard and Paul Feautrier and Tomofumi Yuki and Sanjay Rajopadhye and Vijay Saraswat},
  booktitle = {Proceedings of the 17th Workshop on Compilers for Parallel Computing},
  month     = jul,
  year      = {2013}
}
Array Dataflow Analysis for Polyhedral X10 Programs, Tomofumi Yuki, Paul Feautrier, Sanjay Rajopadhye and Vijay Saraswat, 18th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming, 2013, (pdf)(slides), (BibTEX).
@inproceedings{yuki2013array,
  author    = {Tomofumi Yuki and Paul Feautrier and Sanjay Rajopadhye and Vijay Saraswat},
  title     = {Array Dataflow Analysis for Polyhedral {X10} Programs},
  booktitle = {Proceedings of the 18th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming},
  series    = {PPoPP '13},
  location  = {Shenzhen, China},
  pages     = {23--34},
  month     = feb,
  year      = 2013,
  doi       = {10.1145/2442516.2442520},
}
Automatic Complexity Reduction with the Polyhedral Equational Model, Tomofumi Yuki, Sanjay Rajopadhye and Gautam Gupta, Workshop on Leveraging Abstractions and Semantics in High-performance Computing, 2013, (pdf),
Memory Allocations for Tiled Uniform Dependence Programs, Tomofumi Yuki and Sanjay Rajopadhye, 3rd International Workshop on Polyhedral Compilation Techniques, 2013, (pdf)(slides)(slides-pptx),
AlphaZ and the Polyhedral Equational Model, Tomofumi Yuki and Sanjay Rajopadhye, Second International Workshop on Domain-Specific Languages and High-Level Frameworks for High Performance Computing, 2012, (pdf)(slides), (BibTEX).
@inproceedings{yuki2012equational,
  title     = {{AlphaZ} and the Polyhedral Equational Model},
  author    = {Tomofumi Yuki and Sanjay Rajopadhye},
  booktitle = {Proceedings of the 2nd International Workshop on Domain-Specific Languages and High-Level Frameworks for High Performance Computing},
  year      = {2012}
}
AlphaZ: A System for Design Space Exploration in the Polyhedral Model, Tomofumi Yuki, Gautam Gupta, DaeGon Kim, Tanveer Pathan, and Sanjay Rajopadhye, 25th International Workshop on Languages and Compilers for Parallel Computing, 2012, (pdf)(slides)(slides-pptx), (BibTEX).
@inproceedings{yuki2012alphaz,
  author    = {Tomofumi Yuki and Gautam Gupta and DaeGon Kim and Tanveer Pathan and Sanjay Rajopadhye},
  title     = {{AlphaZ}: A System for Design Space Exploration in the Polyhedral Model},
  booktitle = {Proceedings of the 25th International Workshop on Languages and Compilers for Parallel Computing},
  series    = {LCPC '12},
  location  = {Tokyo, Japan},
  pages     = {17--31},
  month     = sep,
  year      = 2012,
  doi       = {10.1007/978-3-642-37658-0_2}
}
Model-Driven Engineering and Optimizing Compilers: A bridge too far?, Antoine Floch, Tomofumi Yuki, Clement Guy, Steven Derrien, Benoit Combemale, Sanjay Rajopadhye, and Robert France, International Conference on Model Driven Engineering Languages and Systems, 2011, (pdf), (BibTEX).
@inproceedings{floch2011model,
  author    = {Floch, Antoine and Yuki, Tomofumi and Guy, Clement and Derrien, Steven and Combemale, Benoit and Rajopadhye, Sanjay and France, Robert},
  title     = {Model-Driven Engineering and Optimizing Compilers: A bridge too far?},
  booktitle = {Proceedings of the 14th International Conference on Model Driven Engineering Languages and Systems},
  series    = {MODELS '11},
  location  = {Wellington, New Zealand},
  pages     = {608--622},
  month     = oct,
  year      = 2011,
  doi       = {10.1007/978-3-642-24485-8_45},
}
ompVerify: Polyhedral Analysis for the OpenMP Programmer, Vamshi Basupalli, Tomofumi Yuki, Sanjay Rajopadhye, Antoine Morvan, Steven Derrien, Patrice Quinton, and Dave Wonnacott, 7th International Workshop on OpenMP, 2011, (BibTEX).
@inproceedings{basupalli2011ompverify,
  author    = {Basupalli, Vamshi and Yuki, Tomofumi and Rajopadhye, Sanjay and Morvan, Antoine and Derrien, Steven and Quinton, Patrice and Wonnacott, Dave},
  title     = {{ompVerify}: Polyhedral Analysis for the {OpenMP} Programmer},
  booktitle = {Proceedings of the 7th International Workshop on OpenMP},
  series    = {IWOMP '11},
  location  = {Chicago, IL},
  pages     = {37--53},
  month     = jun,
  year      = 2011,
  doi       = {10.1007/978-3-642-21487-5_4},
}
Automatic Creation of Tile Size Selection Models, Tomofumi Yuki, Lakshminarayanan Renganarayanan, Sanjay Rajopadhye, Charles Anderson, Alexandre E. Eichenberger, and Kevin O'Brien, International Symposium on Code Generation and Optimization, April 24-28, 2010, (pdf)(slides), (BibTEX).
@inproceedings{yuki2010automatic,
  title     = {Automatic Creation of Tile Size Selection Models},
  author    = {Yuki, Tomofumi and Renganarayanan, Lakshminarayanan and Rajopadhye, Sanjay and Anderson, Charles and Eichenberger, Alex E. and O'Brien, Kevin},
  booktitle = {Proceedings of the 8th IEEE/ACM International Symposium on Code Generation and Optimization},
  series    = {CGO '10},
  location  = {Toronto, Canada},
  pages     = {190--199},
  month     = apr,
  year      = {2010},
  doi       = {10.1145/1772954.1772982}
}
Technical Reports
Sparse Matrix Code Dependence Analysis Simplification at Compile Time, Mahdi Soltan Mohammadi, Kazem Cheshmi, Ganesh Gopalakrishnan, Mary Hall, Maryam Mehri Dehnavi, Anand Venkat, Tomofumi Yuki, and Michelle Mills Strout, Technical Report arXiv:1807.10852 [cs.PL], 2018, (link), (BibTEX).
@article{mohammadi2018sparse,
  author        = {Mahdi Soltan Mohammadi and Kazem Cheshmi and Ganesh Gopalakrishnan and Mary Hall and Maryam Mehri Dehnavi and Anand Venkat and Tomofumi Yuki and Michelle Mills Strout},
  title         = {Sparse Matrix Code Dependence Analysis Simplification at Compile Time},
  journal       = {ArXiv e-prints},
  archivePrefix = {arXiv},
  eprint        = {1807.10852},
  primaryClass  = {cs.PL},
  year          = 2018,
  month         = jul,
  url           = {https://arxiv.org/abs/1807.10852},
  adsurl        = {http://adsabs.harvard.edu/abs/2018arXiv180710852S},
  adsnote       = {Provided by the SAO/NASA Astrophysics Data System}
}
Checking Race Freedom of Clocked X10 Programs, Tomofumi Yuki, Paul Feautrier, Sanjay Rajopadhye, and Vijay Saraswat, Technical Report arXiv:1311.4305 [cs.DC], 2013, (link), (BibTEX).
@techreport{yuki2013checking,
  title       = {Checking Race Freedom of Clocked {X10} Programs},
  author      = {Yuki, Tomofumi and Feautrier, Paul and Rajopadhye, Sanjay and Saraswat, Vijay},
  year        = 2013,
  institution = {arxiv/1311.4305},
  version     = 1,
  date        = {2013-11-18},
  eprinttype  = {arXiv},
  eprint      = {1311.4305},
  url         = {http://arxiv.org/abs/1311.4305}
}
Diminishing Returns of Frequency Scaling, Tomofumi Yuki and Sanjay Rajopadhye, Technical Report CS-13-107, Colorado State University, 2013, (pdf), (BibTEX).
@techreport{yuki2013dvfsTR,
  title       = {Diminishing Returns of Frequency Scaling},
  author      = {Yuki, Tomofumi and Rajopadhye, Sanjay},
  year        = {2013},
  number      = {CS-13-107},
  institution = {Colorado State University}
}
Parametrically Tiled Distributed Memory Parallelization of Polyhedral Programs, Tomofumi Yuki and Sanjay Rajopadhye, Technical Report CS-13-105, Colorado State University, 2013, (pdf), (BibTEX).
@techreport{yuki2013mpiTR,
  title       = {Parametrically Tiled Distributed Memory Parallelization of Polyhedral Programs},
  author      = {Yuki, Tomofumi and Rajopadhye, Sanjay},
  year        = {2013},
  number      = {CS-13-105},
  institution = {Colorado State University}
}
The Stencil Processing Unit: GPGPU Done Right, Sanjay Rajopadhye, Guillaume Iooss, Tomofumi Yuki, and Dan Connors, Technical Report CS-13-103, Colorado State University, 2013, (pdf), (BibTEX).
@techreport{rajopadhye2013gpgpuTR,
  title       = {The Stencil Processing Unit: {GPGPU} Done Right},
  author      = {Rajopadhye, Sanjay and Iooss, Guillaume and Yuki, Tomofumi and Connors, Dan},
  year        = {2013},
  number      = {CS-13-103},
  institution = {Colorado State University}
}
AlphaZ: A System for Analysis, Transformation, and Code Generation in the Polyhedral Equational Model, Tomofumi Yuki, Vamshi Basupalli, Gautam Gupta, Guillaume Iooss, DaeGon Kim, Tanveer Pathan, Pradeep Srinivasa, Yun Zou, and Sanjay Rajopadhye, Technical Report CS-12-101, Colorado State University, 2012, (pdf), (BibTEX).
@techreport{yuki2012alphazTR,
  title       = {{AlphaZ}: A System for Analysis, Transformation, and Code Generation in
                 the Polyhedral Equational Model},
  author      = {Yuki, Tomofumi and Basupalli, Vamshi and Gupta, Gautam and Iooss, Guillaume and
                 Kim, DaeGon and Pathan, Tanveer and Srinivasa, Pradeep and Zou, Yun and
                 Rajopadhye, Sanjay},
  year        = {2012},
  number      = {CS-12-101},
  institution = {Colorado State University}
}
Systematic Implementation of fast-i-loop in UNAfold using AlphaZ, Tomofumi Yuki, Gautam Gupta, Tanveer Pathan, and Sanjay Rajopadhye, Technical Report CS-12-102, Colorado State University, 2012, (pdf), (BibTEX).
@techreport{yuki2012unafold,
  title       = {Systematic Implementation of fast-i-loop in {UNAfold} using {AlphaZ}},
  author      = {Yuki, Tomofumi and Gupta, Gautam and Pathan, Tanveer and Rajopadhye, Sanjay},
  year        = {2012},
  number      = {CS-12-102},
  institution = {Colorado State University}
}
Canonic Multi-Projection: Memory Allocation for Distributed Memory Parallelization, Tomofumi Yuki and Sanjay Rajopadhye, Technical Report CS-11-106, Colorado State University, 2011, (pdf), (BibTEX).
@techreport{yuki2011canonic,
  title       = {Canonic Multi-Projection: Memory Allocation for Distributed Memory Parallelization},
  author      = {Tomofumi Yuki and Sanjay Rajopadhye},
  year        = {2011},
  number      = {CS-11-106},
  institution = {Colorado State University}
}
Talks
Far Fetched Prefetching?, Tomofumi Yuki, Antoine Morvan, and Steven Derrien, 6th French Compilation Days, 2013, (pdf)(pptx),
Leveraging Model-Driven Engineering Techniques in Optimizing Compiler Research, Tomofumi Yuki, Sanjay Rajopadhye, Robert France, Antoine Floch, Clement Guy, Steven Derrien, and Benoit Combemale, Workshop on Real-time, Embedded and Enterprise-Scale Time-Critical Systems, 2012, (pdf)(pptx),
Thesis
Beyond Shared Memory Loop Parallelism in the Polyhedral Model, Tomofumi Yuki, Colorado State University, December 17, 2012, (pdf)(slides)(slides-pptx), (BibTEX).
Automatic Creation of Tile Size Selection Models Using Neural Networks, Tomofumi Yuki, Colorado State University, December 4, 2009, (pdf), (BibTEX).