% Bi et al., PoS volume LATTICE2019 (2020); arXiv:2001.05706 [hep-lat].
@article{Bi:2020wpt,
    author        = {Bi, Yu-Jiang and Xiao, Yi and Guo, Wei-Yi and Gong, Ming and Sun, Peng and Xu, Shun and Yang, Yi-Bo},
    title         = {{Lattice QCD package GWU-code and QUDA with HIP}},
    journal       = {PoS},
    volume        = {LATTICE2019},
    pages         = {286},
    year          = 2020,
    doi           = {10.22323/1.363.0286},
    eprint        = {2001.05706},
    archivePrefix = {arXiv},
    primaryClass  = {hep-lat},
}

% Brower, Clark, Strelchenko, Weinberg; Phys. Rev. D 97 (2018); arXiv:1801.07823 [hep-lat].
@article{Brower:2018ymy,
    author        = {Brower, Richard C. and Clark, M. A. and Strelchenko, Alexei and Weinberg, Evan},
    title         = {{Multigrid algorithm for staggered lattice fermions}},
    journal       = {Phys. Rev. D},
    volume        = {97},
    number        = {11},
    pages         = {114513},
    year          = 2018,
    doi           = {10.1103/PhysRevD.97.114513},
    eprint        = {1801.07823},
    archivePrefix = {arXiv},
    primaryClass  = {hep-lat},
    reportNumber  = {FERMILAB-PUB-18-073-CD},
}

% QUDA collaboration conference paper (2016); arXiv:1612.07873 [hep-lat].
% The month is given as the standard BibTeX macro (dec) so that each style
% formats it itself instead of printing a raw number.
@inproceedings{Clark:2016rdz,
    author = "Clark, M. A. and Jo{\'o}, B{\'a}lint and Strelchenko, Alexei and Cheng, Michael and Gambhir, Arjun and Brower, Richard C.",
    collaboration = "QUDA",
    title = "{Accelerating lattice QCD multigrid on GPUs using fine-grained parallelization}",
    booktitle = "{International Conference for High Performance Computing, Networking, Storage and Analysis}",
    eprint = "1612.07873",
    archivePrefix = "arXiv",
    primaryClass = "hep-lat",
    reportNumber = "FERMILAB-CONF-16-638-CD",
    doi = "10.5555/3014904.3014995",
    month = dec,
    year = "2016"
}

% QUDA collaboration conference paper (2011); arXiv:1109.2935 [hep-lat].
% The month is given as the standard BibTeX macro (sep) so that each style
% formats it itself; the surname Jo{\'o} carries its accent, matching the
% spelling used for this author in the Clark:2016rdz entry.
@inproceedings{Babich:2011np,
    author = "Babich, R. and Clark, M. A. and Jo{\'o}, B. and Shi, G. and Brower, R. C. and Gottlieb, S.",
    collaboration = "QUDA",
    title = "{Scaling lattice QCD beyond 100 GPUs}",
    booktitle = "{International Conference for High Performance Computing, Networking, Storage and Analysis}",
    eprint = "1109.2935",
    archivePrefix = "arXiv",
    primaryClass = "hep-lat",
    doi = "10.1145/2063384.2063478",
    month = sep,
    year = "2011"
}

% Alexandru et al., SAAHPC'11 symposium paper (2011); arXiv:1106.4964 [hep-lat].
% NOTE(review): the series value names a different conference record than the
% booktitle and may be an export artefact; kept unchanged, please confirm.
@inproceedings{Alexandru:2011sc,
    author        = {Alexandru, Andrei and Lujan, Michael and Pelissier, Craig and Gamari, Ben and Lee, Frank X.},
    title         = {{Efficient implementation of the overlap operator on multi-GPUs}},
    booktitle     = {{2011 Symposium on Application Accelerators in High-Performance Computing (SAAHPC'11)}},
    series        = {IEEE Nucl.Sci.Symp.Conf.Rec.},
    pages         = {123--130},
    year          = 2011,
    doi           = {10.1109/SAAHPC.2011.13},
    eprint        = {1106.4964},
    archivePrefix = {arXiv},
    primaryClass  = {hep-lat},
}

% Alexandru, Pelissier, Gamari, Lee; J. Comput. Phys. 231 (2012); arXiv:1103.5103 [hep-lat].
@article{Alexandru:2011ee,
    author        = {Alexandru, A. and Pelissier, C. and Gamari, B. and Lee, F.},
    title         = {{Multi-mass solvers for lattice QCD on GPUs}},
    journal       = {J. Comput. Phys.},
    volume        = {231},
    pages         = {1866--1878},
    year          = 2012,
    doi           = {10.1016/j.jcp.2011.11.003},
    eprint        = {1103.5103},
    archivePrefix = {arXiv},
    primaryClass  = {hep-lat},
}

% xQCD collaboration (Li and others); Phys. Rev. D 82 (2010); arXiv:1005.5424 [hep-lat].
@article{xQCD:2010pnl,
    author        = {Li, A. and others},
    collaboration = {xQCD},
    title         = {{Overlap Valence on 2+1 Flavor Domain Wall Fermion Configurations with Deflation and Low-mode Substitution}},
    journal       = {Phys. Rev. D},
    volume        = {82},
    pages         = {114501},
    year          = 2010,
    doi           = {10.1103/PhysRevD.82.114501},
    eprint        = {1005.5424},
    archivePrefix = {arXiv},
    primaryClass  = {hep-lat},
    reportNumber  = {UK-10-01},
}

% QUDA collaboration; Comput. Phys. Commun. 181 (2010); arXiv:0911.3191 [hep-lat].
@article{Clark:2009wm,
    author        = {Clark, M. A. and Babich, R. and Barros, K. and Brower, R. C. and Rebbi, C.},
    collaboration = {QUDA},
    title         = {{Solving Lattice QCD systems of equations using mixed precision solvers on GPUs}},
    journal       = {Comput. Phys. Commun.},
    volume        = {181},
    pages         = {1517--1528},
    year          = 2010,
    doi           = {10.1016/j.cpc.2010.05.002},
    eprint        = {0911.3191},
    archivePrefix = {arXiv},
    primaryClass  = {hep-lat},
}

% HPQCD and UKQCD collaborations; Phys. Rev. D 75 (2007); arXiv:hep-lat/0610092.
@article{Follana:2006rc,
    author        = {Follana, E. and Mason, Q. and Davies, C. and Hornbostel, K. and Lepage, G. P. and Shigemitsu, J. and Trottier, H. and Wong, K.},
    collaboration = {HPQCD, UKQCD},
    title         = {{Highly improved staggered quarks on the lattice, with applications to charm physics}},
    journal       = {Phys. Rev. D},
    volume        = {75},
    pages         = {054502},
    year          = 2007,
    doi           = {10.1103/PhysRevD.75.054502},
    eprint        = {hep-lat/0610092},
    archivePrefix = {arXiv},
}

% Edwards and Jo{\'o}; Nucl. Phys. B Proc. Suppl. 140 (2005); arXiv:hep-lat/0409003.
% The second author's name carries its accents, matching the spelling used for
% this author in the Clark:2016rdz entry.
@article{Edwards:2004sx,
    author = "Edwards, Robert G. and Jo{\'o}, B{\'a}lint",
    editor = "Bodwin, Geoffrey T. and Sinclair, D. K. and Eichten, E. and Holmgren, D. and Kronfeld, Andreas S. and Mackenzie, P. and Okamoto, M. and Simone, J. and El-Khadra, Aida X.",
    collaboration = "SciDAC, LHPC, UKQCD",
    title = "{The Chroma software system for lattice QCD}",
    eprint = "hep-lat/0409003",
    archivePrefix = "arXiv",
    reportNumber = "JLAB-THY-04-54",
    doi = "10.1016/j.nuclphysbps.2004.11.254",
    journal = "Nucl. Phys. B Proc. Suppl.",
    volume = "140",
    pages = "832",
    year = "2005"
}

% Jegerlehner, preprint (1996); arXiv:hep-lat/9612014, report IUHET-353.
% The entry has no journal field, so it is typed as misc rather than article
% (article requires a journal); the citation key is unchanged. The month is
% given as the standard BibTeX macro (dec).
@misc{Jegerlehner:1996pm,
    author = "Jegerlehner, Beat",
    title = "{Krylov space solvers for shifted linear systems}",
    eprint = "hep-lat/9612014",
    archivePrefix = "arXiv",
    reportNumber = "IUHET-353",
    month = dec,
    year = "1996"
}
