{
  "id": "3124202",
  "uuid": "753323f6-3edc-44e7-b22c-73c9d1bd29ff",
  "metadata": {
    "citation_count": 0,
    "publication_info": [
      {
        "cnum": "C25-11-02",
        "conference_record": {
          "$ref": "https://inspirehep.net/api/conferences/2798819"
        }
      }
    ],
    "citation_count_without_self_citations": 0,
    "core": true,
    "dois": [
      {
        "value": "10.22323/1.518.0027",
        "source": "arXiv",
        "material": "publication"
      }
    ],
    "titles": [
      {
        "title": "A novel gauge-equivariant neural-network architecture for preconditioners in lattice QCD",
        "source": "arXiv"
      }
    ],
    "$schema": "https://inspirehep.net/schemas/records/hep.json",
    "authors": [
      {
        "uuid": "0f12a0b4-e933-46ff-b0d3-cab6c1f86136",
        "emails": [
          "simon.pfahler@ur.de"
        ],
        "record": {
          "$ref": "https://inspirehep.net/api/authors/3140514"
        },
        "full_name": "Pfahler, Simon",
        "affiliations": [
          {
            "value": "Regensburg U.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/903753"
            },
            "curated_relation": true
          }
        ],
        "curated_relation": true
      },
      {
        "uuid": "6c1de0d2-a0c6-4a36-9639-88d96aa31cef",
        "record": {
          "$ref": "https://inspirehep.net/api/authors/3113173"
        },
        "full_name": "Knüttel, Daniel",
        "affiliations": [
          {
            "value": "Regensburg U.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/903753"
            },
            "curated_relation": true
          }
        ]
      },
      {
        "uuid": "074186c5-9c62-47c1-b836-a8f4a779a42e",
        "record": {
          "$ref": "https://inspirehep.net/api/authors/1063281"
        },
        "full_name": "Lehner, Christoph",
        "affiliations": [
          {
            "value": "Regensburg U.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/903753"
            },
            "curated_relation": true
          }
        ]
      },
      {
        "uuid": "a4c60617-38a8-47f0-8bd0-a1dce71dd3ba",
        "record": {
          "$ref": "https://inspirehep.net/api/authors/983711"
        },
        "full_name": "Wettig, Tilo",
        "affiliations": [
          {
            "value": "Regensburg U.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/903753"
            },
            "curated_relation": true
          }
        ]
      }
    ],
    "curated": true,
    "figures": [
      {
        "key": "ab7190f7644691311d50f6e2887d4870",
        "url": "https://inspirehep.net/files/ab7190f7644691311d50f6e2887d4870",
        "label": "fig:network_architecture",
        "source": "arxiv",
        "caption": "Exemplary network architecture using linear layers (L) and parallel-transport layers (PT). For deeper networks, the highlighted block consisting of a PT and an L layer can be repeated, with potentially different parallel-transport paths in each of the PT layers.",
        "filename": "network_architecture.png",
        "material": "preprint"
      },
      {
        "key": "c47ddde352bc503b6d8e2a04cf72cab3",
        "url": "https://inspirehep.net/files/c47ddde352bc503b6d8e2a04cf72cab3",
        "label": "fig:paths_and_filter",
        "source": "arxiv",
        "caption": "Left: Evolution of the residual during GMRES solves with and without preconditioners, comparing the choices $P_s$ and $P_\\ell$ of parallel-transport paths. Networks are trained with the cost function $C_N$ with $N=10$ filter iterations. Right: Operator applications needed in GMRES solves to reach a residual of $10^{-18}$ with and without preconditioners, where all neural networks use the set $P_\\ell$ of parallel-transport paths. Both plots show data for a lattice size of $8^3\\times 16$, a quenched gauge configuration at $\\beta=6$ with topological charge $Q=1$, and bare mass parameter $m=-0.555$ (such that $m-m_\\textrm{crit}\\approx5\\times10^{-4}$).",
        "filename": "short_vs_long_paths.png",
        "material": "preprint"
      },
      {
        "key": "47d84dca8756c7924a65780eb2308c4a",
        "url": "https://inspirehep.net/files/47d84dca8756c7924a65780eb2308c4a",
        "label": "fig:paths_and_filter",
        "source": "arxiv",
        "caption": "Left: Evolution of the residual during GMRES solves with and without preconditioners, comparing the choices $P_s$ and $P_\\ell$ of parallel-transport paths. Networks are trained with the cost function $C_N$ with $N=10$ filter iterations. Right: Operator applications needed in GMRES solves to reach a residual of $10^{-18}$ with and without preconditioners, where all neural networks use the set $P_\\ell$ of parallel-transport paths. Both plots show data for a lattice size of $8^3\\times 16$, a quenched gauge configuration at $\\beta=6$ with topological charge $Q=1$, and bare mass parameter $m=-0.555$ (such that $m-m_\\textrm{crit}\\approx5\\times10^{-4}$).",
        "filename": "filter_score.png",
        "material": "preprint"
      },
      {
        "key": "2656273393050a04727d959818b3f920",
        "url": "https://inspirehep.net/files/2656273393050a04727d959818b3f920",
        "label": "fig:CSD_8c16",
        "source": "arxiv",
        "caption": "Operator applications needed in GMRES solves to reach a residual of $10^{-18}$ with and without preconditioners, depending on the bare mass parameter. An $8^3\\times16$ lattice is used, and the topological charge of the gauge configuration is $Q=0$ (left) and $Q=1$ (right). Models are trained individually for each bare mass parameter. The dashed vertical line denotes the critical mass, defined as the largest bare mass parameter for which an eigenvalue of $D$ has zero real part.Same as \\cref{fig:CSD_8c16}, but for a $16^3\\times32$ lattice and topological charges $Q=0$ (left) and $Q=4$ (right).",
        "filename": "csd.png",
        "material": "preprint"
      },
      {
        "key": "d06f7f7072736acd29b9fbbaef3c3bb5",
        "url": "https://inspirehep.net/files/d06f7f7072736acd29b9fbbaef3c3bb5",
        "label": "fig:transfer",
        "source": "arxiv",
        "caption": "Application of a model trained on the $8^3\\times16$ lattice with a gauge configuration with $Q=0$ and $m=-0.56$ to a $8^3\\times16$ lattice with a gauge configuration with $Q=1$ and different masses (left), and to a $16^3\\times32$ lattice with a gauge configuration with $Q=0$ and different masses (right).",
        "filename": "transfer.png",
        "material": "preprint"
      }
    ],
    "license": [
      {
        "url": "http://arxiv.org/licenses/nonexclusive-distrib/1.0/",
        "license": "arXiv nonexclusive-distrib 1.0",
        "material": "preprint"
      }
    ],
    "texkeys": [
      "Pfahler:2026fpj"
    ],
    "citeable": true,
    "abstracts": [
      {
        "value": "Lattice QCD simulations are computationally expensive, with the solution of the Dirac equation being the major computational bottleneck of many calculations. We introduce a novel gauge-equivariant neural-network architecture for preconditioning the Dirac equation in the regime where critical slowing down occurs. We study the behavior of this preconditioner as a function of topological charge and lattice volume and show that it mitigates critical slowing down. We also show that this preconditioner transfers to unseen gauge configurations without any retraining, therefore enabling applications not possible with competing methods.",
        "source": "arXiv"
      }
    ],
    "references": [
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/756769"
        },
        "raw_refs": [
          {
            "value": "[1] J. Brannick, R.C. Brower, M.A. Clark, J.C. Osborn and C. Rebbi, Adaptive Multigrid Algorithm for Lattice QCD, Physical Review Letters 100 (2008) 041601.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevLett.100.041601"
          ],
          "misc": [
            "Adaptive Multigrid Algorithm for Lattice QCD"
          ],
          "label": "1",
          "texkey": "Brannick_2008",
          "authors": [
            {
              "full_name": "Brannick, J."
            },
            {
              "full_name": "Brower, R.C."
            },
            {
              "full_name": "Clark, M.A."
            },
            {
              "full_name": "Osborn, J.C."
            },
            {
              "full_name": "Rebbi, C."
            }
          ],
          "publication_info": {
            "year": 2008,
            "artid": "041601",
            "journal_title": "Phys.Rev.Lett.",
            "journal_volume": "100"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/855408"
        },
        "raw_refs": [
          {
            "value": "[2] R. Babich, J. Brannick, R.C. Brower, M.A. Clark, T.A. Manteuffel, S.F. McCormick et al., Adaptive multigrid algorithm for the lattice Wilson-Dirac operator, Physical Review Letters 105 (2010) 201602 [1005.3043].",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevLett.105.201602"
          ],
          "misc": [
            "Adaptive multigrid algorithm for the lattice Wilson-Dirac operator"
          ],
          "label": "2",
          "texkey": "Babich_2010",
          "authors": [
            {
              "full_name": "Babich, R."
            },
            {
              "full_name": "Brannick, J."
            },
            {
              "full_name": "Brower, R.C."
            },
            {
              "full_name": "Clark, M.A."
            },
            {
              "full_name": "Manteuffel, T.A."
            },
            {
              "full_name": "McCormick, S.F."
            }
          ],
          "arxiv_eprint": "1005.3043",
          "publication_info": {
            "year": 2010,
            "artid": "201602",
            "journal_title": "Phys.Rev.Lett.",
            "journal_volume": "105"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1222681"
        },
        "raw_refs": [
          {
            "value": "[3] A. Frommer, K. Kahl, S. Krieg, B. Leder and M. Rottmann, Adaptive Aggregation-Based Domain Decomposition Multigrid for the Lattice Wilson–Dirac Operator, SIAM Journal on Scientific Computing 36 (2014) A1581.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.1137/130919507"
          ],
          "misc": [
            "Adaptive Aggregation-Based Domain Decomposition Multigrid for the Lattice Wilson-Dirac Operator"
          ],
          "label": "3",
          "texkey": "Frommer_2014",
          "authors": [
            {
              "full_name": "Frommer, A."
            },
            {
              "full_name": "Kahl, K."
            },
            {
              "full_name": "Krieg, S."
            },
            {
              "full_name": "Leder, B."
            },
            {
              "full_name": "Rottmann, M."
            }
          ],
          "publication_info": {
            "year": 2014,
            "artid": "A1581",
            "page_start": "A1581",
            "journal_title": "SIAM J.Sci.Comput.",
            "journal_volume": "36"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1838186"
        },
        "raw_refs": [
          {
            "value": "[4] M. Favoni, A. Ipp, D.I. Müller and D. Schuh, Lattice Gauge Equivariant Convolutional Neural Networks, Physical Review Letters 128 (2022) 032003.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevLett.128.032003"
          ],
          "misc": [
            "Lattice Gauge Equivariant Convolutional Neural Networks"
          ],
          "label": "4",
          "texkey": "Favoni_2022",
          "authors": [
            {
              "full_name": "Favoni, M."
            },
            {
              "full_name": "Ipp, A."
            },
            {
              "full_name": "Müller, D.I."
            },
            {
              "full_name": "Schuh, D."
            }
          ],
          "publication_info": {
            "year": 2022,
            "artid": "032003",
            "journal_title": "Phys.Rev.Lett.",
            "journal_volume": "128"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1785309"
        },
        "raw_refs": [
          {
            "value": "[5] G. Kanwar, M.S. Albergo, D. Boyda, K. Cranmer, D.C. Hackett, S. Racanière et al., Equivariant Flow-Based Sampling for Lattice Gauge Theory, Physical Review Letters 125 (2020) 121601.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevLett.125.121601"
          ],
          "misc": [
            "Equivariant Flow-Based Sampling for Lattice Gauge Theory"
          ],
          "label": "5",
          "texkey": "Kanwar_2020",
          "authors": [
            {
              "full_name": "Kanwar, G."
            },
            {
              "full_name": "Albergo, M.S."
            },
            {
              "full_name": "Boyda, D."
            },
            {
              "full_name": "Cranmer, K."
            },
            {
              "full_name": "Hackett, D.C."
            },
            {
              "full_name": "Racanière, S."
            }
          ],
          "publication_info": {
            "year": 2020,
            "artid": "121601",
            "journal_title": "Phys.Rev.Lett.",
            "journal_volume": "125"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1842016"
        },
        "raw_refs": [
          {
            "value": "[6] M.S. Albergo, D. Boyda, D.C. Hackett, G. Kanwar, K. Cranmer, S. Racanière et al., Introduction to Normalizing Flows for Lattice Field Theory, Aug., 2021. 10.48550/arXiv.2101.08176.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "misc": [
            "Introduction to Normalizing Flows for Lattice Field Theory, Aug"
          ],
          "label": "6",
          "texkey": "Albergo_2021",
          "authors": [
            {
              "full_name": "Albergo, M.S."
            },
            {
              "full_name": "Boyda, D."
            },
            {
              "full_name": "Hackett, D.C."
            },
            {
              "full_name": "Kanwar, G."
            },
            {
              "full_name": "Cranmer, K."
            },
            {
              "full_name": "Racanière, S."
            }
          ],
          "arxiv_eprint": "2101.08176",
          "publication_info": {
            "year": 2021
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/2116899"
        },
        "raw_refs": [
          {
            "value": "[7] R. Abbott, M.S. Albergo, D. Boyda, K. Cranmer, D.C. Hackett, G. Kanwar et al., Gauge-equivariant flow models for sampling in lattice field theories with pseudofermions, Physical Review D 106 (2022) 074506.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevD.106.074506"
          ],
          "misc": [
            "Gauge-equivariant flow models for sampling in lattice field theories with pseudofermions"
          ],
          "label": "7",
          "texkey": "Abbott_2022",
          "authors": [
            {
              "full_name": "Abbott, R."
            },
            {
              "full_name": "Albergo, M.S."
            },
            {
              "full_name": "Boyda, D."
            },
            {
              "full_name": "Cranmer, K."
            },
            {
              "full_name": "Hackett, D.C."
            },
            {
              "full_name": "Kanwar, G."
            }
          ],
          "publication_info": {
            "year": 2022,
            "artid": "074506",
            "journal_title": "Phys.Rev.D",
            "journal_volume": "106"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/2132290"
        },
        "raw_refs": [
          {
            "value": "[8] S. Calì, D.C. Hackett, Y. Lin, P.E. Shanahan and B. Xiao, Neural-network preconditioners for solving the Dirac equation in lattice gauge theory, Physical Review D 107 (2023) 034508.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevD.107.034508"
          ],
          "misc": [
            "Neural-network preconditioners for solving the Dirac equation in lattice gauge theory"
          ],
          "label": "8",
          "texkey": "Cali_2023",
          "authors": [
            {
              "full_name": "Cal, S."
            },
            {
              "full_name": "Hackett, D.C."
            },
            {
              "full_name": "Lin, Y."
            },
            {
              "full_name": "Shanahan, P.E."
            },
            {
              "full_name": "Xiao, B."
            }
          ],
          "publication_info": {
            "year": 2023,
            "artid": "034508",
            "journal_title": "Phys.Rev.D",
            "journal_volume": "107"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/2969237"
        },
        "raw_refs": [
          {
            "value": "[9] Y. Sun, S. Eswar, Y. Lin, W. Detmold, P. Shanahan, X. Li et al., Matrix-free Neural Preconditioner for the Dirac Operator in Lattice Gauge Theory, Sept., 2025. 10.48550/arXiv.2509.10378.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "misc": [
            "Matrix-free Neural Preconditioner for the Dirac Operator in Lattice Gauge Theory, Sept"
          ],
          "label": "9",
          "texkey": "Sun_2025",
          "authors": [
            {
              "full_name": "Sun, Y."
            },
            {
              "full_name": "Eswar, S."
            },
            {
              "full_name": "Lin, Y."
            },
            {
              "full_name": "Detmold, W."
            },
            {
              "full_name": "Shanahan, P."
            },
            {
              "full_name": "Li, X."
            }
          ],
          "arxiv_eprint": "2509.10378",
          "publication_info": {
            "year": 2025
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/2631052"
        },
        "raw_refs": [
          {
            "value": "[10] C. Lehner and T. Wettig, Gauge-equivariant neural networks as preconditioners in lattice QCD, Physical Review D 108 (2023) 034503.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevD.108.034503"
          ],
          "misc": [
            "Gauge-equivariant neural networks as preconditioners in lattice QCD"
          ],
          "label": "10",
          "texkey": "Lehner_2023",
          "authors": [
            {
              "full_name": "Lehner, C."
            },
            {
              "full_name": "Wettig, T."
            }
          ],
          "publication_info": {
            "year": 2023,
            "artid": "034503",
            "journal_title": "Phys.Rev.D",
            "journal_volume": "108"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/2752000"
        },
        "raw_refs": [
          {
            "value": "[11] D. Knüttel, C. Lehner and T. Wettig, Gauge-equivariant multigrid neural networks, PoS LATTICE2023 (2024) 037.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.22323/1.453.0037"
          ],
          "misc": [
            "Gauge-equivariant multigrid neural networks"
          ],
          "label": "11",
          "texkey": "Knuttel_2024",
          "authors": [
            {
              "full_name": "Knüttel, D."
            },
            {
              "full_name": "Lehner, C."
            },
            {
              "full_name": "Wettig, T."
            }
          ],
          "publication_info": {
            "year": 2024,
            "artid": "037",
            "page_start": "037",
            "journal_title": "PoS",
            "journal_volume": "LATTICE2023"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/2652849"
        },
        "raw_refs": [
          {
            "value": "[12] C. Lehner and T. Wettig, Gauge-equivariant pooling layers for preconditioners in lattice QCD, Physical Review D 110 (2024) 034517.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevD.110.034517"
          ],
          "misc": [
            "Gauge-equivariant pooling layers for preconditioners in lattice QCD"
          ],
          "label": "12",
          "texkey": "Lehner_2024",
          "authors": [
            {
              "full_name": "Lehner, C."
            },
            {
              "full_name": "Wettig, T."
            }
          ],
          "publication_info": {
            "year": 2024,
            "artid": "034517",
            "journal_title": "Phys.Rev.D",
            "journal_volume": "110"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "[13] J.W. Pearson and J. Pestana, Preconditioners for Krylov subspace methods: An overview, GAMM-Mitteilungen 43 (2020) e202000015.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "dois": [
            "10.1002/gamm.202000015"
          ],
          "misc": [
            "Preconditioners for Krylov subspace methods: An overview"
          ],
          "label": "13",
          "texkey": "Pearson_2020",
          "authors": [
            {
              "full_name": "Pearson, J.W."
            },
            {
              "full_name": "Pestana, J."
            }
          ],
          "publication_info": {
            "year": 2020,
            "artid": "e202000015",
            "journal_title": "GAMM Mitt.",
            "journal_volume": "43"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "[14] P. Hovland and J. Hückelheim, Differentiating Through Linear Solvers, May, 2024. 10.48550/arXiv.2404.17039.",
            "schema": "text",
            "source": "arXiv"
          }
        ],
        "reference": {
          "misc": [
            "Differentiating Through Linear Solvers, May"
          ],
          "label": "14",
          "texkey": "Hovland_2024",
          "authors": [
            {
              "full_name": "Hovland, P."
            },
            {
              "full_name": "Hückelheim, J."
            }
          ],
          "arxiv_eprint": "2404.17039",
          "publication_info": {
            "year": 2024
          }
        }
      }
    ],
    "public_notes": [
      {
        "value": "proceedings of Lattice 2025, 10 pages, 5 figures",
        "source": "arXiv"
      }
    ],
    "arxiv_eprints": [
      {
        "value": "2602.23840",
        "categories": [
          "hep-lat"
        ]
      }
    ],
    "document_type": [
      "conference paper"
    ],
    "preprint_date": "2026-02-27",
    "control_number": 3124202,
    "number_of_pages": 10,
    "inspire_categories": [
      {
        "term": "Lattice",
        "source": "arxiv"
      }
    ]
  },
  "revision_id": 8,
  "updated": "2026-04-24T04:02:44.758639+00:00",
  "created": "2026-03-02T04:03:01.435336+00:00",
  "links": {
    "bibtex": "https://inspirehep.net/api/literature/3124202?format=bibtex",
    "latex-eu": "https://inspirehep.net/api/literature/3124202?format=latex-eu",
    "latex-us": "https://inspirehep.net/api/literature/3124202?format=latex-us",
    "json": "https://inspirehep.net/api/literature/3124202?format=json",
    "json-expanded": "https://inspirehep.net/api/literature/3124202?format=json-expanded",
    "cv": "https://inspirehep.net/api/literature/3124202?format=cv",
    "citations": "https://inspirehep.net/api/literature/?q=refersto%3Arecid%3A3124202"
  }
}