% Philipsen, Pinke, Sciarra, Bach (2014): CL2QCD, lattice QCD based on OpenCL; PoS LATTICE2014, 038.
@article{Philipsen:2014mra,
    author        = {Philipsen, Owe and Pinke, Christopher and Sciarra, Alessandro and Bach, Matthias},
    title         = {{CL$^2$QCD - Lattice QCD based on OpenCL}},
    journal       = {PoS},
    volume        = {LATTICE2014},
    pages         = {038},
    year          = {2014},
    doi           = {10.22323/1.214.0038},
    eprint        = {1411.5219},
    archivePrefix = {arXiv},
    primaryClass  = {hep-lat},
}

% Alexandru, Lujan, Pelissier, Gamari, Lee (2011): overlap operator on multi-GPUs; SAAHPC'11, pp. 123--130.
% NOTE(review): the exported series value "IEEE Nucl.Sci.Symp.Conf.Rec." was dropped because it names a
% different conference record than the SAAHPC'11 booktitle/DOI; the publisher is inferred from the
% 10.1109 DOI prefix. Confirm both against the DOI landing page.
@inproceedings{Alexandru:2011sc,
    author        = {Alexandru, Andrei and Lujan, Michael and Pelissier, Craig and Gamari, Ben and Lee, Frank X.},
    title         = {{Efficient implementation of the overlap operator on multi-GPUs}},
    booktitle     = {{2011 Symposium on Application Accelerators in High-Performance Computing (SAAHPC'11)}},
    publisher     = {IEEE},
    pages         = {123--130},
    year          = {2011},
    doi           = {10.1109/SAAHPC.2011.13},
    eprint        = {1106.4964},
    archivePrefix = {arXiv},
    primaryClass  = {hep-lat},
}

% Alexandru, Pelissier, Gamari, Lee (2012): multi-mass solvers for lattice QCD on GPUs; J. Comput. Phys. 231.
% Given names are written out in full, using the spellings that entry Alexandru:2011sc gives for the
% same surnames, so both entries resolve to one name form per author.
% NOTE(review): assumes these are the same four people -- confirm against the published author list.
@article{Alexandru:2011ee,
    author        = {Alexandru, Andrei and Pelissier, Craig and Gamari, Ben and Lee, Frank X.},
    title         = {{Multi-mass solvers for lattice QCD on GPUs}},
    journal       = {J. Comput. Phys.},
    volume        = {231},
    pages         = {1866--1878},
    year          = {2012},
    doi           = {10.1016/j.jcp.2011.11.003},
    eprint        = {1103.5103},
    archivePrefix = {arXiv},
    primaryClass  = {hep-lat},
}

% Clark, Babich, Barros, Brower, Rebbi (2010): mixed precision solvers on GPUs; Comput. Phys. Commun. 181.
@article{Clark:2009wm,
    author        = {Clark, M. A. and Babich, R. and Barros, K. and Brower, R. C. and Rebbi, C.},
    collaboration = {QUDA},
    title         = {{Solving Lattice QCD systems of equations using mixed precision solvers on GPUs}},
    journal       = {Comput. Phys. Commun.},
    volume        = {181},
    pages         = {1517--1528},
    year          = {2010},
    doi           = {10.1016/j.cpc.2010.05.002},
    eprint        = {0911.3191},
    archivePrefix = {arXiv},
    primaryClass  = {hep-lat},
}
