% LAPACK Working Note 291 (technical report; key 988 kept from the original export).
% NOTE(review): the techreport type requires an `institution` field, which the
%   exported record does not provide -- add it once the issuing institution is confirmed.
% NOTE(review): the abstract phrase "a light-weight realizing a vector operation"
%   appears to be missing a noun; left verbatim -- verify against the report PDF.
@techreport{988,
  author   = {Anzt, Hartwig and Chow, Edmond and Dongarra, Jack},
  title    = {On block-asynchronous execution on {GPUs}},
  type     = {LAPACK Working Note},
  number   = {291},
  year     = {2016},
  month    = nov,
  url      = {http://www.netlib.org/lapack/lawnspdf/lawn291.pdf},
  abstract = {This paper experimentally investigates how GPUs execute instructions when used for general purpose computing (GPGPU). We use a light-weight realizing a vector operation to analyze which vector entries are updated subsequently, and identify regions where parallel execution can be expected. The results help us to understand how GPUs operate, and map this operation mode to the mathematical concept of asynchronism. In particular it helps to understand the effects that can occur when implementing a fixed-point method using in-place updates on GPU hardware.},
}