{
  "uuid": "a0a4e0cb-3479-45ea-a2be-ea82103ee483",
  "links": {
    "bibtex": "https://inspirehep.net/api/literature/1854165?format=bibtex",
    "latex-eu": "https://inspirehep.net/api/literature/1854165?format=latex-eu",
    "latex-us": "https://inspirehep.net/api/literature/1854165?format=latex-us",
    "json": "https://inspirehep.net/api/literature/1854165?format=json",
    "json-expanded": "https://inspirehep.net/api/literature/1854165?format=json-expanded",
    "cv": "https://inspirehep.net/api/literature/1854165?format=cv",
    "citations": "https://inspirehep.net/api/literature/?q=refersto%3Arecid%3A1854165"
  },
  "id": "1854165",
  "revision_id": 43,
  "metadata": {
    "citation_count": 21,
    "publication_info": [
      {
        "year": 2021,
        "artid": "074504",
        "material": "publication",
        "journal_issue": "7",
        "journal_title": "Phys.Rev.D",
        "journal_record": {
          "$ref": "https://inspirehep.net/api/journals/1613970"
        },
        "journal_volume": "104",
        "pubinfo_freetext": "Phys. Rev. D 104, 074504 (2021)"
      }
    ],
    "citation_count_without_self_citations": 13,
    "core": true,
    "dois": [
      {
        "value": "10.1103/PhysRevD.104.074504",
        "source": "APS",
        "material": "publication"
      },
      {
        "value": "10.1103/PhysRevD.104.074504",
        "source": "arXiv",
        "material": "publication"
      }
    ],
    "titles": [
      {
        "title": "Generalization capabilities of translationally equivariant neural networks",
        "source": "APS"
      },
      {
        "title": "Generalization capabilities of translationally equivariant neural networks",
        "source": "arXiv"
      }
    ],
    "$schema": "https://inspirehep.net/schemas/records/hep.json",
    "authors": [
      {
        "uuid": "6e458953-d8bb-46da-9af3-eb311cf94ff3",
        "emails": [
          "sbulusu@hep.itp.tuwien.ac.at"
        ],
        "record": {
          "$ref": "https://inspirehep.net/api/authors/1940268"
        },
        "full_name": "Bulusu, Srinath",
        "affiliations": [
          {
            "value": "Vienna, Tech. U.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/903325"
            }
          }
        ],
        "signature_block": "BALASs",
        "raw_affiliations": [
          {
            "value": "Institute for Theoretical Physics, TU Wien, Austria",
            "source": "APS"
          }
        ]
      },
      {
        "uuid": "f807487c-49f6-43f0-9bbf-22d3b9b372c1",
        "emails": [
          "favoni@hep.itp.tuwien.ac.at"
        ],
        "record": {
          "$ref": "https://inspirehep.net/api/authors/1940269"
        },
        "full_name": "Favoni, Matteo",
        "affiliations": [
          {
            "value": "Vienna, Tech. U.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/903325"
            }
          }
        ],
        "signature_block": "FAVANm",
        "raw_affiliations": [
          {
            "value": "Institute for Theoretical Physics, TU Wien, Austria",
            "source": "APS"
          }
        ]
      },
      {
        "uuid": "137a7f69-f2d1-4b2d-9bd8-1ac89bbb14cc",
        "emails": [
          "ipp@hep.itp.tuwien.ac.at"
        ],
        "record": {
          "$ref": "https://inspirehep.net/api/authors/1020396"
        },
        "full_name": "Ipp, Andreas",
        "affiliations": [
          {
            "value": "Vienna, Tech. U.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/903325"
            }
          }
        ],
        "signature_block": "IPa",
        "raw_affiliations": [
          {
            "value": "Institute for Theoretical Physics, TU Wien, Austria",
            "source": "APS"
          }
        ]
      },
      {
        "uuid": "6a177a06-7cd6-41c1-bf10-c6f217cdd035",
        "emails": [
          "dmueller@hep.itp.tuwien.ac.at"
        ],
        "record": {
          "$ref": "https://inspirehep.net/api/authors/1465774"
        },
        "full_name": "Müller, David I.",
        "affiliations": [
          {
            "value": "Vienna, Tech. U.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/903325"
            }
          }
        ],
        "signature_block": "MALARd",
        "curated_relation": true,
        "raw_affiliations": [
          {
            "value": "Institute for Theoretical Physics, TU Wien, Austria",
            "source": "APS"
          }
        ]
      },
      {
        "uuid": "495954d5-d0e3-4b93-81d4-a53da8082bfd",
        "emails": [
          "schuh@hep.itp.tuwien.ac.at"
        ],
        "record": {
          "$ref": "https://inspirehep.net/api/authors/1940270"
        },
        "full_name": "Schuh, Daniel",
        "affiliations": [
          {
            "value": "Vienna, Tech. U.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/903325"
            }
          }
        ],
        "signature_block": "Sd",
        "raw_affiliations": [
          {
            "value": "Institute for Theoretical Physics, TU Wien, Austria",
            "source": "APS"
          }
        ]
      }
    ],
    "curated": true,
    "figures": [
      {
        "key": "94e7e9cd1ae44a0071e19f5cceb7ed2c",
        "url": "https://inspirehep.net/files/94e7e9cd1ae44a0071e19f5cceb7ed2c",
        "label": "fig:architectures",
        "source": "arxiv",
        "caption": "Equivariant architecture (EQ)",
        "filename": "cnn_eq_labeled.png",
        "material": "preprint"
      },
      {
        "key": "ad2448dcfc9712d1d70036dca8ae7b3b",
        "url": "https://inspirehep.net/files/ad2448dcfc9712d1d70036dca8ae7b3b",
        "label": "fig:architectures",
        "source": "arxiv",
        "caption": "Strided architecture (ST); Flattening architecture (FL)",
        "filename": "cnn_st_labeled.png",
        "material": "preprint"
      },
      {
        "key": "dcbec020a0372f88db66aa132eaf6f59",
        "url": "https://inspirehep.net/files/dcbec020a0372f88db66aa132eaf6f59",
        "label": "fig:architectures",
        "source": "arxiv",
        "caption": "The three different architecture types used in this study. The checkmark (\\textcolor{Green}{\\ding{51}}) or cross (\\textcolor{Red}{\\ding{55}}) indicate spatial operations in which translational symmetry is respected or violated, respectively. Translational symmetry can be violated by convolutional or pooling layers with a stride greater than one or by a flattening layer. A global pooling layer allows for the application of the same network to different lattice sizes. Each of the layers can have a number of channels (not depicted) without affecting the translational symmetry properties.",
        "filename": "cnn_flat_labeled.png",
        "material": "preprint"
      },
      {
        "key": "b2592e43d4e4be53e9215809d8f09cd0",
        "url": "https://inspirehep.net/files/b2592e43d4e4be53e9215809d8f09cd0",
        "label": "fig:test_loss_60_times_4",
        "source": "arxiv",
        "caption": "Test loss on the whole test set on the \\mbox{$60 \\times 4$}~lattice against the size of the training set (number of samples in the training set) on which the respective model has been trained. At the top, the results of the three architecture types (trained without data augmentation) are shown. In the middle and at the bottom, the effect of data augmentation during training of \\ST{} and \\FLAT{} models, respectively, is depicted. The plots display the best and worst loss (solid lines), the arithmetic mean of all ten random initializations for training (dashed lines) and the $20\\%$ quantiles (shaded regions). The symbols visualize the positions of the measurements; the lines are there to guide the eye.",
        "filename": "reg_loss_over_training_data.png",
        "material": "preprint"
      },
      {
        "key": "9dd621174f2cc13427a4997f57831fef",
        "url": "https://inspirehep.net/files/9dd621174f2cc13427a4997f57831fef",
        "label": "fig:reg_observables_over_mu",
        "source": "arxiv",
        "caption": "Predicted and true values for ensemble averages $\\left< n \\right>$ and $\\left< \\lvert \\phi \\rvert^2 \\right>$ as a function of chemical potential $\\mu$ on a $60 \\times 4$ lattice. The predictions in this plot are made by the \\EQ{} model with the smallest test loss. The model has been trained on data generated with $\\mu = 1.05$ only but shows remarkable generalization capabilities to other values of $\\mu$. In this and in subsequent plots, the training point is highlighted by a rectangle.",
        "filename": "reg_losses_over_mu.png",
        "material": "preprint"
      },
      {
        "key": "accce2b506b047cbdba6d6bf5e8d9350",
        "url": "https://inspirehep.net/files/accce2b506b047cbdba6d6bf5e8d9350",
        "label": "fig:test_plots_mu_60_times_4",
        "source": "arxiv",
        "caption": "Predicted versus true observables for the best and the worst \\ST{} network that have been trained on $18000$ samples. It shows that the \\ST{} architecture's best instance is able to accurately estimate the whole ranges of observable values (top) and that its worst instance is failing to do so for smaller values of~$n$ and~$\\lvert \\phi \\rvert^2$ (middle). The reason for this is that the training set includes only larger values of the observables (bottom) and that the worst model is not able to generalize beyond that. The top and the middle plot show $1\\%$ of the test data; the bottom plot shows $4\\%$ of the training data.",
        "filename": "regression_scatter.png",
        "material": "preprint"
      },
      {
        "key": "bc31bea8fc963e143a7c1e89d9fcae32",
        "url": "https://inspirehep.net/files/bc31bea8fc963e143a7c1e89d9fcae32",
        "label": "fig:test_loss_various_lattice_sizes",
        "source": "arxiv",
        "caption": "Overall test loss (top) and its two parts (middle and bottom) that come from each observable, on various lattice sizes. The training has taken place on the \\mbox{$60\\times 4$} lattice. Both architectures generalize well to lattice sizes different from the one they were trained on, but the \\ST{} architecture (blue) performs visibly worse on the \\mbox{$100 \\times 5$}~lattice. The reason for this is the spatial pooling layer within the architecture, which drops $20 \\%$ of the data, leading to a less accurate prediction for both observables.",
        "filename": "reg_loss_over_lattice_size.png",
        "material": "preprint"
      },
      {
        "key": "7491078e3b66b331a18f4bf337af5477",
        "url": "https://inspirehep.net/files/7491078e3b66b331a18f4bf337af5477",
        "label": "fig:silver_blaze_prediction_larger_lattice_sizes",
        "source": "arxiv",
        "caption": "Predicted and true mean values of each observable for each individual~$\\mu$ on the larger lattices. The predictions come from the \\EQ{} model that has the lowest validation loss from all \\EQ{} models that have been trained on $20000$ training samples. The training has been performed at $\\mu = 1.05$. The kinks in the curves allow for an estimate of the Silver Blaze phase transition, which is indicated by the color gradient from the shaded region to the white background.",
        "filename": "silver_blaze.png",
        "material": "preprint"
      },
      {
        "key": "da4294dde3957e3e4560fbd664f36d7c",
        "url": "https://inspirehep.net/files/da4294dde3957e3e4560fbd664f36d7c",
        "label": "fig:reg_scatter_higher_mu",
        "source": "arxiv",
        "caption": "Predicted versus true observables for the best (according to the validation loss) model of each architecture evaluated on the test set generated from \\mbox{$\\mu \\in [1.1, 1.5]$} on the \\mbox{$60 \\times 4$} lattice. Each model is able to predict higher values of~$n$ than given during training, but the generalization of~$\\lvert \\phi \\rvert^2$ exhibits a clear difference between the generalization capabilities of the models. All these plots show $6.25\\%$ of the test data.",
        "filename": "reg_scatter_higher_mu.png",
        "material": "preprint"
      },
      {
        "key": "621d1f5e546ee0fc448de6062a1b407f",
        "url": "https://inspirehep.net/files/621d1f5e546ee0fc448de6062a1b407f",
        "label": "fig:reg_loss_over_mu",
        "source": "arxiv",
        "caption": "Total test loss and its parts corresponding to the individual observables~$n$ and $\\lvert \\phi \\rvert^2$ over the chemical potential on the  \\mbox{$60 \\times 4$} lattice. It displays the ensemble of models that have been trained on $20000$ training samples corresponding to each architecture. The large difference in the quality of the predictions for \\mbox{$\\mu \\le 1.05$} is also visible in Fig.~\\ref{fig:test_loss_60_times_4}. For \\mbox{$\\mu > 1.05$}, the performance is more similar, although for \\mbox{$\\mu = 1.5$}, the mean value of the total test loss of the \\ST{} models still differs from the mean values of the other architecture's models by roughly one order of magnitude.",
        "filename": "reg_loss_over_mu.png",
        "material": "preprint"
      },
      {
        "key": "5864f6b77a53b6d9efa6b29f41f59cd6",
        "url": "https://inspirehep.net/files/5864f6b77a53b6d9efa6b29f41f59cd6",
        "label": "fig:openworm_schematic",
        "source": "arxiv",
        "caption": " : ~Example field configuration",
        "filename": "openworm_schematic_a.png",
        "material": "preprint"
      },
      {
        "key": "a4913349bdc51703491806ab5210d023",
        "url": "https://inspirehep.net/files/a4913349bdc51703491806ab5210d023",
        "label": "fig:openworm_schematic",
        "source": "arxiv",
        "caption": "Feature maps of convolutional network in best \\EQ{} and \\ST{} models : Visualization of an open worm field configuration and of the best models' predictions. (a) An example field configuration including an open worm (highlighted in brown) and the resulting flux violation given by Eq.~\\eqref{eq:flux_conservation}. The point-like violations occur at the two open ends of the worm (shown as crosses). (b) Feature maps of the convolutional part of the best \\EQ{} (top, green) and \\ST{} (bottom, blue) model showing the first four channels (of 32 and 16, respectively). Because of overparameterization, only some of the channels detect the violation (e.g.~channels 2 and 3 for \\EQ{} and 1 and 3 for \\ST{}), while other channels (e.g.~0 and 1 for \\EQ{} and 0 and 2 for \\ST{}) do not produce easily interpretable output.",
        "filename": "openworm_schematic_b.png",
        "material": "preprint"
      },
      {
        "key": "5e7368607ce276bdbdaf808e66c7d0bc",
        "url": "https://inspirehep.net/files/5e7368607ce276bdbdaf808e66c7d0bc",
        "label": "fig:class_res_8x8",
        "source": "arxiv",
        "caption": "Top: test loss for best equivariant (\\EQ{}, green), non-equivariant strided (\\ST{}, blue) and non-equivariant flattening (\\FLAT{}, red) classification architectures as a function of the chemical potential $\\mu$ on $8 \\times 8$ lattices. Training was performed on data with $\\mu=1$ and $1.5$ only. Bottom: test accuracy as a function of $\\mu$. The colored bands show the ensemble uncertainty from all 50 randomly initialized models with the thick line indicating the median loss (accuracy) and the dashed line showing the mean loss (accuracy). Both \\EQ{} and \\ST{} architectures outperform the \\FLAT{} architecture.",
        "filename": "class_loss_and_acc_8x8.png",
        "material": "preprint"
      },
      {
        "key": "9eb70954825cd8e5abdb1dda18dea2ee",
        "url": "https://inspirehep.net/files/9eb70954825cd8e5abdb1dda18dea2ee",
        "label": "fig:class_res",
        "source": "arxiv",
        "caption": "Top: test loss for best equivariant (\\EQ{}, green) and non-equivariant strided (\\ST{}, blue) classification architectures as a function of  lattice size. Bottom: test accuracy as a function of lattice size. The networks have been trained on the $8 \\times 8$ lattice only. We observe that both types of architecture lead to good generalization across lattice sizes with slightly less variation in the performance of the \\EQ{} architecture.",
        "filename": "class_loss_and_acc.png",
        "material": "preprint"
      },
      {
        "key": "2db34bdd5922a4161b5ea67a4c8b39f6",
        "url": "https://inspirehep.net/files/2db34bdd5922a4161b5ea67a4c8b39f6",
        "label": "fig:reg2_val_mean_res_8x8",
        "source": "arxiv",
        "caption": "Test loss (top) and test accuracy (bottom) of the best architectures according to the mean of the validation loss tested on all $8\\times8$ lattices as functions of the number of open worms. Training and validation are carried out at $N_\\mathrm{worms} = 0$ and $N_\\mathrm{worms} = 5$, while test results are shown for $N_\\mathrm{worms} \\in [0, 10]$.",
        "filename": "reg2_loss_and_acc_vs_worms_val_mean_8.png",
        "material": "preprint"
      },
      {
        "key": "8e7fc02694a1e8644aeff1800a34ee87",
        "url": "https://inspirehep.net/files/8e7fc02694a1e8644aeff1800a34ee87",
        "label": "fig:reg2_val_mean_res",
        "source": "arxiv",
        "caption": "Test loss (top) and test accuracy (bottom) of the best architectures according to the mean of the validation loss tested as functions of the lattice size. Training and validation are carried out on the smallest lattice ($8 \\times 8$), while testing is performed on all lattice sizes.",
        "filename": "reg2_loss_and_acc_vs_size_val_mean.png",
        "material": "preprint"
      },
      {
        "key": "a55e9dc615ee5170dfc5b443d530337d",
        "url": "https://inspirehep.net/files/a55e9dc615ee5170dfc5b443d530337d",
        "label": "fig:reg2_tloss_vloss_8x8",
        "source": "arxiv",
        "caption": "Test loss on $8\\times8$ lattices versus validation loss of every instance for each architecture. This scatter plot shows 20 models obtained during retraining for the three winning architectures of each type (\\EQ{}, \\ST{} and \\FLAT{}). The diagonal black line indicates where validation loss equals test loss. Networks have been trained and validated for $N_\\mathrm{worms}\\in\\{0,5\\}$ and $(\\eta,\\mu)\\in\\{(4.01,1.5),(4.25,1)\\}$ on an $8 \\times 8$ lattice. Generalization (test loss) is checked with zero to ten open worms, $\\mu \\in  \\{1.0, 1.25, 1.5 \\}$, $\\eta \\in \\{ 4.01, 4.04, 4.25\\}$ and a fixed lattice size of $8 \\times 8$. The closer a particular point lies to the black line, the better it generalizes. This appears to be generally the case for \\EQ{} architectures (green circles).",
        "filename": "reg2_tloss_vs_vloss_8.png",
        "material": "preprint"
      },
      {
        "key": "1f768ba281a771a35a07fdd39eb84e0f",
        "url": "https://inspirehep.net/files/1f768ba281a771a35a07fdd39eb84e0f",
        "label": "fig:reg2_tloss_vloss",
        "source": "arxiv",
        "caption": "Scatter plot of test loss on all lattice sizes versus validation loss of every instance for \\EQ{} and \\ST{} architectures. Similar to Fig.~\\ref{fig:reg2_tloss_vloss_8x8}, we demonstrate the generalization capabilities of our models to different lattice sizes from $8 \\times 8$ up to $64 \\times 64$ and different physical parameters, while being trained on only $8 \\times 8$. In particular, \\EQ{} models (green circles) are closer to the black line where test loss and validation loss agree.",
        "filename": "reg2_tloss_vs_vloss.png",
        "material": "preprint"
      },
      {
        "key": "212275c1d4ffcde4ae78ff69b072fc5a",
        "url": "https://inspirehep.net/files/212275c1d4ffcde4ae78ff69b072fc5a",
        "label": "fig:data_distr_reg_kt",
        "source": "arxiv",
        "caption": "Distributions of the link field $k_t$. These histograms feature the distributions of $k_t$ in the training set (top), test set~A (middle) and test set~B (bottom). The test sets maintain a similar distribution along different lattice sizes. Even though training and test set~A cover the same domains, their distributions are different, which is the origin of the generalization issues of some architectures. The distribution of test set~B also reaches higher values of $k_t$, which can make a generalization to data in test set~B even more difficult than to data in test set~A. Bars corresponding to weights smaller than $10^{-4}$ in each plot are not shown.",
        "filename": "data_distribution_reg_kt.png",
        "material": "preprint"
      },
      {
        "key": "aaaa681d8aaeeb26537e447709328b68",
        "url": "https://inspirehep.net/files/aaaa681d8aaeeb26537e447709328b68",
        "label": "fig:data_distr_reg_f",
        "source": "arxiv",
        "caption": "Distributions of $f$ and ratio of $W(f)$. The histograms show the distributions of $f$ in the training set (top), test set~A (middle) and test set~B (bottom). The last plot portrays $W(f+2)/W(f)$ evaluated with the same physical parameters used throughout the task, $\\eta=4.01$ and $\\lambda=1$. The markers represent even integer values of $f$, which enter the computation of $|\\phi|^2$. In every histogram, we do not report weights below $10^{-4}$.",
        "filename": "data_distribution_reg_f_W.png",
        "material": "preprint"
      },
      {
        "key": "778016a39f044ddabc1d6eafe30e327a",
        "url": "https://inspirehep.net/files/778016a39f044ddabc1d6eafe30e327a",
        "label": "fig:data_distr_reg2_kt",
        "source": "arxiv",
        "caption": "Distributions of the link field $k_t$. These two histograms feature the distributions of $k_t$ in the training set (top) and in the test set (bottom).",
        "filename": "data_distribution_reg2_kt.png",
        "material": "preprint"
      },
      {
        "key": "8ce731f530808151fa3a28a41e5f2755",
        "url": "https://inspirehep.net/files/8ce731f530808151fa3a28a41e5f2755",
        "label": "fig:data_distr_reg2_kx",
        "source": "arxiv",
        "caption": "Distributions of the link field $k_x$. These two histograms feature the distributions of $k_x$ in the training set (top) and in the test set (bottom).",
        "filename": "data_distribution_reg2_kx.png",
        "material": "preprint"
      },
      {
        "key": "7ba5e871a84eab899a614c0a756edb99",
        "url": "https://inspirehep.net/files/7ba5e871a84eab899a614c0a756edb99",
        "label": "fig:test_loss_various_lattice_sizes_only_part_of_input",
        "source": "arxiv",
        "caption": "Test loss (top) and its two parts (middle and bottom) that come from each observable, corresponding to discarding $20 \\%$ of the input data, on various lattice sizes. The networks are trained on a $60\\times 4$ lattice. The dimension along which the input data are occluded is marked in red. For~$n$, the predictions become worse if the data are concealed in the spatial direction. For $\\lvert \\phi \\rvert^2$, the predictions become worse if any data are hidden, but they are slightly worse if data are suppressed in the spatial direction. The reason for this lies in the nature of the observables.",
        "filename": "reg_loss_over_lattice_size_minus_20.png",
        "material": "preprint"
      }
    ],
    "license": [
      {
        "url": "https://creativecommons.org/licenses/by/4.0/",
        "license": "CC BY 4.0",
        "material": "publication"
      },
      {
        "url": "http://arxiv.org/licenses/nonexclusive-distrib/1.0/",
        "license": "arXiv nonexclusive-distrib 1.0",
        "material": "preprint"
      }
    ],
    "texkeys": [
      "Bulusu:2021rqz"
    ],
    "citeable": true,
    "imprints": [
      {
        "date": "2021-10-01"
      }
    ],
    "keywords": [
      {
        "value": "particle physics",
        "schema": "INSPIRE"
      },
      {
        "value": "field theory: scalar: complex",
        "schema": "INSPIRE"
      },
      {
        "value": "group: translation",
        "schema": "INSPIRE"
      },
      {
        "value": "dimension: 2",
        "schema": "INSPIRE"
      },
      {
        "value": "neural network",
        "schema": "INSPIRE"
      },
      {
        "value": "lattice",
        "schema": "INSPIRE"
      },
      {
        "value": "lattice field theory",
        "schema": "INSPIRE"
      },
      {
        "value": "performance",
        "schema": "INSPIRE"
      },
      {
        "value": "computer",
        "schema": "INSPIRE"
      }
    ],
    "refereed": true,
    "abstracts": [
      {
        "value": "The rising adoption of machine learning in high-energy physics and lattice field theory necessitates the reevaluation of common methods that are widely used in computer vision, which, when applied to problems in physics, can lead to significant drawbacks in terms of performance and generalizability. One particular example for this is the use of neural network architectures that do not reflect the underlying symmetries of the given physical problem. In this work, we focus on complex scalar field theory on a two-dimensional lattice and investigate the benefits of using group equivariant convolutional neural network architectures based on the translation group. For a meaningful comparison, we conduct a systematic search for equivariant and nonequivariant neural network architectures and apply them to various regression and classification tasks. We demonstrate that in most of these tasks our best equivariant architectures can perform and generalize significantly better than their nonequivariant counterparts, which applies not only to physical parameters beyond those represented in the training set, but also to different lattice sizes.",
        "source": "APS"
      },
      {
        "value": "The rising adoption of machine learning in high energy physics and lattice field theory necessitates the re-evaluation of common methods that are widely used in computer vision, which, when applied to problems in physics, can lead to significant drawbacks in terms of performance and generalizability. One particular example for this is the use of neural network architectures that do not reflect the underlying symmetries of the given physical problem. In this work, we focus on complex scalar field theory on a two-dimensional lattice and investigate the benefits of using group equivariant convolutional neural network architectures based on the translation group. For a meaningful comparison, we conduct a systematic search for equivariant and non-equivariant neural network architectures and apply them to various regression and classification tasks. We demonstrate that in most of these tasks our best equivariant architectures can perform and generalize significantly better than their non-equivariant counterparts, which applies not only to physical parameters beyond those represented in the training set, but also to different lattice sizes.",
        "source": "arXiv"
      }
    ],
    "copyright": [
      {
        "year": 2021,
        "holder": "authors",
        "material": "publication",
        "statement": "Published by the American Physical Society"
      }
    ],
    "references": [
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/2735401"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c1\"><label>[1]</label><mixed-citation publication-type=\"journal\"><object-id>1</object-id><person-group person-group-type=\"author\"><string-name>K. Fukushima</string-name></person-group>, <article-title>Neocognitron: A self-organizing neural network model for a mechanism of pattern recognition unaffected by shift in position</article-title>, <source>Biol. Cybern.</source> <volume>36</volume>, <page-range>193</page-range> (<year>1980</year>).<pub-id pub-id-type=\"coden\">BICYAF</pub-id><issn>0340-1200</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1007/BF00344251</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1007/BF00344251"
          ],
          "label": "1",
          "title": {
            "title": "Neocognitron: A self-organizing neural network model for a mechanism of pattern recognition unaffected by shift in position"
          },
          "authors": [
            {
              "full_name": "Fukushima, K.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 1980,
            "artid": "193",
            "page_start": "193",
            "journal_title": "Biol. Cybern.",
            "journal_volume": "36"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c2\"><label>[2]</label><mixed-citation publication-type=\"journal\"><object-id>2</object-id><person-group person-group-type=\"author\"><string-name>K. Fukushima</string-name></person-group>, <article-title>Cognitron: A self-organizing multilayered neural network</article-title>, <source>Biol. Cybern.</source> <volume>20</volume>, <page-range>121</page-range> (<year>1975</year>).<pub-id pub-id-type=\"coden\">BICYAF</pub-id><issn>0340-1200</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1007/BF00342633</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1007/BF00342633"
          ],
          "label": "2",
          "title": {
            "title": "Cognitron: A self-organizing multilayered neural network"
          },
          "authors": [
            {
              "full_name": "Fukushima, K.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 1975,
            "artid": "121",
            "page_start": "121",
            "journal_title": "Biol. Cybern.",
            "journal_volume": "20"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1620758"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c3\"><label>[3]</label><mixed-citation publication-type=\"journal\"><object-id>3</object-id><person-group person-group-type=\"author\"><string-name>O. Russakovsky</string-name>, <string-name>J. Deng</string-name>, <string-name>H. Su</string-name>, <string-name>J. Krause</string-name>, <string-name>S. Satheesh</string-name>, <string-name>S. Ma</string-name>, <string-name>Z. Huang</string-name>, <string-name>A. Karpathy</string-name>, <string-name>A. Khosla</string-name>, <string-name>M. Bernstein</string-name>, <string-name>A. C. Berg</string-name>, and <string-name>L. Fei-Fei</string-name></person-group>, <article-title>Imagenet large scale visual recognition challenge</article-title>, <source>Int. J. Comput. Vis.</source> <volume>115</volume>, <page-range>211</page-range> (<year>2015</year>).<pub-id pub-id-type=\"coden\">IJCVEQ</pub-id><issn>0920-5691</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1007/s11263-015-0816-y</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1007/s11263-015-0816-y"
          ],
          "label": "3",
          "title": {
            "title": "Imagenet large scale visual recognition challenge"
          },
          "authors": [
            {
              "full_name": "Russakovsky, O.",
              "inspire_role": "author"
            },
            {
              "full_name": "Deng, J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Su, H.",
              "inspire_role": "author"
            },
            {
              "full_name": "Krause, J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Satheesh, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Ma, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Huang, Z.",
              "inspire_role": "author"
            },
            {
              "full_name": "Karpathy, A.",
              "inspire_role": "author"
            },
            {
              "full_name": "Khosla, A.",
              "inspire_role": "author"
            },
            {
              "full_name": "Bernstein, M.",
              "inspire_role": "author"
            },
            {
              "full_name": "Berg, A.C.",
              "inspire_role": "author"
            },
            {
              "full_name": "Fei-Fei, L.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2015,
            "artid": "211",
            "page_start": "211",
            "journal_title": "Int. J. Comput. Vis.",
            "journal_volume": "115"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/2902509"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c4\"><label>[4]</label><mixed-citation publication-type=\"journal\"><object-id>4</object-id><person-group person-group-type=\"author\"><string-name>A. Krizhevsky</string-name>, <string-name>I. Sutskever</string-name>, and <string-name>G. E. Hinton</string-name></person-group>, <article-title>Imagenet classification with deep convolutional neural networks</article-title>, <source>Commun. ACM</source> <volume>60</volume>, <page-range>84</page-range> (<year>2017</year>).<pub-id pub-id-type=\"coden\">CACMA2</pub-id><issn>0001-0782</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1145/3065386</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1145/3065386"
          ],
          "label": "4",
          "title": {
            "title": "Imagenet classification with deep convolutional neural networks"
          },
          "authors": [
            {
              "full_name": "Krizhevsky, A.",
              "inspire_role": "author"
            },
            {
              "full_name": "Sutskever, I.",
              "inspire_role": "author"
            },
            {
              "full_name": "Hinton, G.E.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2017,
            "artid": "84",
            "page_start": "84",
            "journal_title": "Commun.ACM",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1214805"
            },
            "journal_volume": "60"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/2735408"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c5\"><label>[5]</label><mixed-citation publication-type=\"journal\"><object-id>5</object-id><person-group person-group-type=\"author\"><string-name>Y. Lecun</string-name>, <string-name>L. Bottou</string-name>, <string-name>Y. Bengio</string-name>, and <string-name>P. Haffner</string-name></person-group>, <article-title>Gradient-based learning applied to document recognition</article-title>, <source>Proc. IEEE</source> <volume>86</volume>, <page-range>2278</page-range> (<year>1998</year>).<pub-id pub-id-type=\"coden\">IEEPAD</pub-id><issn>0018-9219</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1109/5.726791</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1109/5.726791"
          ],
          "label": "5",
          "title": {
            "title": "Gradient-based learning applied to document recognition"
          },
          "authors": [
            {
              "full_name": "Lecun, Y.",
              "inspire_role": "author"
            },
            {
              "full_name": "Bottou, L.",
              "inspire_role": "author"
            },
            {
              "full_name": "Bengio, Y.",
              "inspire_role": "author"
            },
            {
              "full_name": "Haffner, P.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 1998,
            "artid": "2278",
            "page_start": "2278",
            "journal_title": "IEEE Proc.",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1214725"
            },
            "journal_volume": "86"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c6\"><label>[6]</label><mixed-citation publication-type=\"eprint\"><object-id>6</object-id><person-group person-group-type=\"author\"><string-name>M. Lin</string-name>, <string-name>Q. Chen</string-name>, and <string-name>S. Yan</string-name></person-group>, <article-title>Network in network</article-title>, <pub-id pub-id-type=\"arxiv\">arXiv:1312.4400</pub-id>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "label": "6",
          "title": {
            "title": "Network in network"
          },
          "authors": [
            {
              "full_name": "Lin, M.",
              "inspire_role": "author"
            },
            {
              "full_name": "Chen, Q.",
              "inspire_role": "author"
            },
            {
              "full_name": "Yan, S.",
              "inspire_role": "author"
            }
          ],
          "arxiv_eprint": "1312.4400"
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c7\"><label>[7]</label><mixed-citation publication-type=\"proc\"><object-id>7</object-id><person-group person-group-type=\"author\"><string-name>K. He</string-name>, <string-name>X. Zhang</string-name>, <string-name>S. Ren</string-name>, and <string-name>J. Sun</string-name></person-group>, <article-title>Deep residual learning for image recognition</article-title>, in <source>Proceedings of the 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2016</source> (<publisher-name>IEEE</publisher-name>, Las Vegas, USA, <year>2016</year>), pp. <page-range>770–778</page-range>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2016 (IEEE, Las Vegas, USA, 2016), pp. 770–778"
          ],
          "label": "7",
          "title": {
            "title": "Deep residual learning for image recognition"
          },
          "authors": [
            {
              "full_name": "He, K.",
              "inspire_role": "author"
            },
            {
              "full_name": "Zhang, X.",
              "inspire_role": "author"
            },
            {
              "full_name": "Ren, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Sun, J.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "IEEE"
          },
          "publication_info": {
            "year": 2016,
            "page_end": "778",
            "page_start": "770"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c8\"><label>[8]</label><mixed-citation publication-type=\"proc\"><object-id>8</object-id><person-group person-group-type=\"author\"><string-name>T. S. Cohen</string-name> and <string-name>M. Welling</string-name></person-group>, <article-title>Group equivariant convolutional networks</article-title>, in <source>Proceedings of the 33rd International Conference on Machine Learning, Vol. 48, PMLR, 2016</source> (<publisher-name>JMLR</publisher-name>, New York, USA, <year>2016</year>), pp. <page-range>2990–2999</page-range>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the 33rd International Conference on Machine Learning, Vol. 48, PMLR, 2016 (JMLR, New York, USA, 2016), pp. 2990–2999"
          ],
          "label": "8",
          "title": {
            "title": "Group equivariant convolutional networks"
          },
          "authors": [
            {
              "full_name": "Cohen, T.S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Welling, M.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "JMLR"
          },
          "publication_info": {
            "year": 2016,
            "page_end": "2999",
            "page_start": "2990"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c9\"><label>[9]</label><mixed-citation publication-type=\"proc\"><object-id>9</object-id><person-group person-group-type=\"author\"><string-name>T. S. Cohen</string-name> and <string-name>M. Welling</string-name></person-group>, <article-title>Steerable CNNs</article-title>, in <source>Proceedings of the International Conference on Learning Representations (ICLR), 2017</source> (<publisher-name>OpenReview</publisher-name>, Toulon, France, <year>2017</year>).</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the International Conference on Learning Representations (ICLR), 2017 (OpenReview, Toulon, France, 2017)"
          ],
          "label": "9",
          "title": {
            "title": "Steerable CNNs"
          },
          "authors": [
            {
              "full_name": "Cohen, T.S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Welling, M.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "OpenReview"
          },
          "publication_info": {
            "year": 2017
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c10\"><label>[10]</label><mixed-citation publication-type=\"proc\"><object-id>10</object-id><person-group person-group-type=\"author\"><string-name>D. E. Worrall</string-name>, <string-name>S. J. Garbin</string-name>, <string-name>D. Turmukhambetov</string-name>, and <string-name>G. J. Brostow</string-name></person-group>, <article-title>Harmonic networks: Deep translation and rotation equivariance</article-title>, in <source>Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2017</source> (<publisher-name>IEEE</publisher-name>, Honolulu, USA, <year>2017</year>), pp. <page-range>7168–7177</page-range>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2017 (IEEE, Honolulu, USA, 2017), pp. 7168–7177"
          ],
          "label": "10",
          "title": {
            "title": "Harmonic networks: Deep translation and rotation equivariance"
          },
          "authors": [
            {
              "full_name": "Worrall, D.E.",
              "inspire_role": "author"
            },
            {
              "full_name": "Garbin, S.J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Turmukhambetov, D.",
              "inspire_role": "author"
            },
            {
              "full_name": "Brostow, G.J.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "IEEE"
          },
          "publication_info": {
            "year": 2017,
            "page_end": "7177",
            "page_start": "7168"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c11\"><label>[11]</label><mixed-citation publication-type=\"proc\"><object-id>11</object-id><person-group person-group-type=\"author\"><string-name>D. Worrall</string-name> and <string-name>G. Brostow</string-name></person-group>, <article-title>CubeNet: Equivariance to 3D rotation and translation</article-title>, in <source>Proceedings of the European Conference on Computer Vision (ECCV), 2018</source> (<publisher-name>Springer</publisher-name>, Cham; Munich, Germany, <year>2018</year>), pp. <page-range>567–584</page-range>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the European Conference on Computer Vision (ECCV), 2018 (Springer, Cham; Munich, Germany, 2018), pp. 567–584"
          ],
          "label": "11",
          "title": {
            "title": "CubeNet: Equivariance to 3D rotation and translation"
          },
          "authors": [
            {
              "full_name": "Worrall, D.",
              "inspire_role": "author"
            },
            {
              "full_name": "Brostow, G.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "Springer"
          },
          "publication_info": {
            "year": 2018,
            "page_end": "584",
            "page_start": "567"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c12\"><label>[12]</label><mixed-citation publication-type=\"proc\"><object-id>12</object-id><person-group person-group-type=\"author\"><string-name>A. S. Ecker</string-name>, <string-name>F. H. Sinz</string-name>, <string-name>E. Froudarakis</string-name>, <string-name>P. G. Fahey</string-name>, <string-name>S. A. Cadena</string-name>, <string-name>E. Y. Walker</string-name>, <string-name>E. Cobos</string-name>, <string-name>J. Reimer</string-name>, <string-name>A. S. Tolias</string-name>, and <string-name>M. Bethge</string-name></person-group>, <article-title>A rotation-equivariant convolutional neural network model of primary visual cortex</article-title>, in <source>Proceedings of the International Conference on Learning Representations (ICLR), 2019</source> (<publisher-name>OpenReview</publisher-name>, New Orleans, USA, <year>2019</year>).</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the International Conference on Learning Representations (ICLR), 2019 (OpenReview, New Orleans, USA, 2019)"
          ],
          "label": "12",
          "title": {
            "title": "A rotation-equivariant convolutional neural network model of primary visual cortex"
          },
          "authors": [
            {
              "full_name": "Ecker, A.S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Sinz, F.H.",
              "inspire_role": "author"
            },
            {
              "full_name": "Froudarakis, E.",
              "inspire_role": "author"
            },
            {
              "full_name": "Fahey, P.G.",
              "inspire_role": "author"
            },
            {
              "full_name": "Cadena, S.A.",
              "inspire_role": "author"
            },
            {
              "full_name": "Walker, E.Y.",
              "inspire_role": "author"
            },
            {
              "full_name": "Cobos, E.",
              "inspire_role": "author"
            },
            {
              "full_name": "Reimer, J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Tolias, A.S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Bethge, M.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "OpenReview"
          },
          "publication_info": {
            "year": 2019
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c13\"><label>[13]</label><mixed-citation publication-type=\"book\"><object-id>13</object-id><person-group person-group-type=\"author\"><string-name>B. S. Veeling</string-name>, <string-name>J. Linmans</string-name>, <string-name>J. Winkens</string-name>, <string-name>T. Cohen</string-name>, and <string-name>M. Welling</string-name></person-group>, <article-title>Rotation equivariant CNNs for digital pathology</article-title>, in <source>Medical Image Computing and Computer-Assisted Intervention (MICCAI), 2018</source> (<publisher-name>Springer International Publishing</publisher-name>, Granada, Spain, <year>2018</year>), pp. <page-range>210–218</page-range>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
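        ],
        "reference": {
          "misc": [
            "in Medical Image Computing and Computer-Assisted Intervention (MICCAI), 2018 (Springer International Publishing, Granada, Spain, 2018), pp. 210–218"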
          ],
          "label": "13",
          "title": {
            "title": "Rotation equivariant CNNs for digital pathology"
          },
          "authors": [
            {
              "full_name": "Veeling, B.S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Linmans, J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Winkens, J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Cohen, T.",
              "inspire_role": "author"
            },
            {
              "full_name": "Welling, M.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "Springer International Publishing"
          },
          "publication_info": {
            "year": 2018,
            "page_end": "218",
            "page_start": "210",
            "parent_title": "Medical Image Computing and Computer-Assisted Intervention (MICCAI), 2018"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c14\"><label>[14]</label><mixed-citation publication-type=\"proc\"><object-id>14</object-id><person-group person-group-type=\"author\"><string-name>T. S. Cohen</string-name>, <string-name>M. Weiler</string-name>, <string-name>B. Kicanaoglu</string-name>, and <string-name>M. Welling</string-name></person-group>, <article-title>Gauge equivariant convolutional networks and the icosahedral CNN</article-title>, in <source>Proceedings of the 36th International Conference on Machine Learning, Vol. 97, PMLR, 2019</source> (<publisher-name>JMLR</publisher-name>, Long Beach, USA, <year>2019</year>), pp. <page-range>1321–1330</page-range>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the 36th International Conference on Machine Learning, Vol. 97, PMLR, 2019 (JMLR, Long Beach, USA, 2019), pp. 1321–1330"
          ],
          "label": "14",
          "title": {
            "title": "Gauge equivariant convolutional networks and the icosahedral CNN"
          },
          "authors": [
            {
              "full_name": "Cohen, T.S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Weiler, M.",
              "inspire_role": "author"
            },
            {
              "full_name": "Kicanaoglu, B.",
              "inspire_role": "author"
            },
            {
              "full_name": "Welling, M.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "JMLR"
          },
          "publication_info": {
            "year": 2019,
            "page_end": "1330",
            "page_start": "1321"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c15\"><label>[15]</label><mixed-citation publication-type=\"journal\"><object-id>15</object-id><person-group person-group-type=\"author\"><string-name>M. W. Lafarge</string-name>, <string-name>E. J. Bekkers</string-name>, <string-name>J. P. W. Pluim</string-name>, <string-name>R. Duits</string-name>, and <string-name>M. Veta</string-name></person-group>, <article-title>Roto-translation equivariant convolutional networks: Application to histopathology image analysis</article-title>, <source>Med. Image Anal.</source> <volume>68</volume>, <page-range>101849</page-range> (<year>2021</year>).<pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1016/j.media.2020.101849</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1016/j.media.2020.101849"
          ],
          "label": "15",
          "title": {
            "title": "Roto-translation equivariant convolutional networks: Application to histopathology image analysis"
          },
          "authors": [
            {
              "full_name": "Lafarge, M.W.",
              "inspire_role": "author"
            },
            {
              "full_name": "Bekkers, E.J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Pluim, J.P.W.",
              "inspire_role": "author"
            },
            {
              "full_name": "Duits, R.",
              "inspire_role": "author"
            },
            {
              "full_name": "Veta, M.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2021,
            "artid": "101849",
            "journal_title": "Med. Image Anal.",
            "journal_volume": "68"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c16\"><label>[16]</label><mixed-citation publication-type=\"eprint\"><object-id>16</object-id><person-group person-group-type=\"author\"><string-name>S. Pang</string-name>, <string-name>A. Du</string-name>, <string-name>M. A. Orgun</string-name>, <string-name>Y. Wang</string-name>, <string-name>Q. Sheng</string-name>, <string-name>S. Wang</string-name>, <string-name>X. Huang</string-name>, and <string-name>Z. Yu</string-name></person-group>, <article-title>Beyond CNNs: Exploiting further inherent symmetries in medical images for segmentation</article-title>, <pub-id pub-id-type=\"arxiv\">arXiv:2005.03924</pub-id>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "label": "16",
          "title": {
            "title": "Beyond CNNs: Exploiting further inherent symmetries in medical images for segmentation"
          },
          "authors": [
            {
              "full_name": "Pang, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Du, A.",
              "inspire_role": "author"
            },
            {
              "full_name": "Orgun, M.A.",
              "inspire_role": "author"
            },
            {
              "full_name": "Wang, Y.",
              "inspire_role": "author"
            },
            {
              "full_name": "Sheng, Q.",
              "inspire_role": "author"
            },
            {
              "full_name": "Wang, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Huang, X.",
              "inspire_role": "author"
            },
            {
              "full_name": "Yu, Z.",
              "inspire_role": "author"
            }
          ],
          "arxiv_eprint": "2005.03924"
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1806791"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c17\"><label>[17]</label><mixed-citation publication-type=\"journal\"><object-id>17</object-id><person-group person-group-type=\"author\"><string-name>K. A. Nicoli</string-name>, <string-name>C. J. Anders</string-name>, <string-name>L. Funcke</string-name>, <string-name>T. Hartung</string-name>, <string-name>K. Jansen</string-name>, <string-name>P. Kessel</string-name>, <string-name>S. Nakajima</string-name>, and <string-name>P. Stornati</string-name></person-group>, <article-title>Estimation of Thermodynamic Observables in Lattice Field Theories with Deep Generative Models</article-title>, <source>Phys. Rev. Lett.</source> <volume>126</volume>, <page-range>032001</page-range> (<year>2021</year>).<pub-id pub-id-type=\"coden\">PRLTAO</pub-id><issn>0031-9007</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1103/PhysRevLett.126.032001</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevLett.126.032001"
          ],
          "label": "17",
          "title": {
            "title": "Estimation of Thermodynamic Observables in Lattice Field Theories with Deep Generative Models"
          },
          "authors": [
            {
              "full_name": "Nicoli, K.A.",
              "inspire_role": "author"
            },
            {
              "full_name": "Anders, C.J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Funcke, L.",
              "inspire_role": "author"
            },
            {
              "full_name": "Hartung, T.",
              "inspire_role": "author"
            },
            {
              "full_name": "Jansen, K.",
              "inspire_role": "author"
            },
            {
              "full_name": "Kessel, P.",
              "inspire_role": "author"
            },
            {
              "full_name": "Nakajima, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Stornati, P.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2021,
            "artid": "032001",
            "journal_title": "Phys.Rev.Lett.",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1214495"
            },
            "journal_volume": "126"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c18\"><label>[18]</label><mixed-citation publication-type=\"journal\"><object-id>18</object-id><person-group person-group-type=\"author\"><string-name>A. M. M. Scaife</string-name> and <string-name>F. Porter</string-name></person-group>, <article-title>Fanaroff-riley classification of radio galaxies using group-equivariant convolutional neural networks</article-title>, <source>Mon. Not. R. Astron. Soc.</source> <volume>503</volume>, <page-range>2369</page-range> (<year>2021</year>).<pub-id pub-id-type=\"coden\">MNRAA4</pub-id><issn>0035-8711</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1093/mnras/stab530</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1093/mnras/stab530"
          ],
          "label": "18",
          "title": {
            "title": "Fanaroff-riley classification of radio galaxies using group-equivariant convolutional neural networks"
          },
          "authors": [
            {
              "full_name": "Scaife, A.M.M.",
              "inspire_role": "author"
            },
            {
              "full_name": "Porter, F.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2021,
            "artid": "2369",
            "page_start": "2369",
            "journal_title": "Mon. Not. R. Astron. Soc.",
            "journal_volume": "503"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1785309"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c19\"><label>[19]</label><mixed-citation publication-type=\"journal\"><object-id>19</object-id><person-group person-group-type=\"author\"><string-name>G. Kanwar</string-name>, <string-name>M. S. Albergo</string-name>, <string-name>D. Boyda</string-name>, <string-name>K. Cranmer</string-name>, <string-name>D. C. Hackett</string-name>, <string-name>S. Racanière</string-name>, <string-name>D. J. Rezende</string-name>, and <string-name>P. E. Shanahan</string-name></person-group>, <article-title>Equivariant Flow-Based Sampling for Lattice Gauge Theory</article-title>, <source>Phys. Rev. Lett.</source> <volume>125</volume>, <page-range>121601</page-range> (<year>2020</year>).<pub-id pub-id-type=\"coden\">PRLTAO</pub-id><issn>0031-9007</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1103/PhysRevLett.125.121601</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevLett.125.121601"
          ],
          "label": "19",
          "title": {
            "title": "Equivariant Flow-Based Sampling for Lattice Gauge Theory"
          },
          "authors": [
            {
              "full_name": "Kanwar, G.",
              "inspire_role": "author"
            },
            {
              "full_name": "Albergo, M.S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Boyda, D.",
              "inspire_role": "author"
            },
            {
              "full_name": "Cranmer, K.",
              "inspire_role": "author"
            },
            {
              "full_name": "Hackett, D.C.",
              "inspire_role": "author"
            },
            {
              "full_name": "Racanière, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Rezende, D.J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Shanahan, P.E.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2020,
            "artid": "121601",
            "journal_title": "Phys.Rev.Lett.",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1214495"
            },
            "journal_volume": "125"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1811378"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c20\"><label>[20]</label><mixed-citation publication-type=\"journal\"><object-id>20</object-id><person-group person-group-type=\"author\"><string-name>D. Boyda</string-name>, <string-name>G. Kanwar</string-name>, <string-name>S. Racanière</string-name>, <string-name>D. J. Rezende</string-name>, <string-name>M. S. Albergo</string-name>, <string-name>K. Cranmer</string-name>, <string-name>D. C. Hackett</string-name>, and <string-name>P. E. Shanahan</string-name></person-group>, <article-title>Sampling using <inline-formula><math display=\"inline\"><mi>S</mi><mi>U</mi><mo stretchy=\"false\">(</mo><mi>N</mi><mo stretchy=\"false\">)</mo></math></inline-formula> gauge equivariant flows</article-title>, <source>Phys. Rev. D</source> <volume>103</volume>, <page-range>074504</page-range> (<year>2021</year>).<pub-id pub-id-type=\"coden\">PRVDAQ</pub-id><issn>2470-0010</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1103/PhysRevD.103.074504</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevD.103.074504"
          ],
          "label": "20",
          "title": {
            "title": "Sampling using SU(N) gauge equivariant flows"
          },
          "authors": [
            {
              "full_name": "Boyda, D.",
              "inspire_role": "author"
            },
            {
              "full_name": "Kanwar, G.",
              "inspire_role": "author"
            },
            {
              "full_name": "Racanière, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Rezende, D.J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Albergo, M.S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Cranmer, K.",
              "inspire_role": "author"
            },
            {
              "full_name": "Hackett, D.C.",
              "inspire_role": "author"
            },
            {
              "full_name": "Shanahan, P.E.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2021,
            "artid": "074504",
            "journal_title": "Phys.Rev.D",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1613970"
            },
            "journal_volume": "103"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1838186"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c21\"><label>[21]</label><mixed-citation publication-type=\"eprint\"><object-id>21</object-id><person-group person-group-type=\"author\"><string-name>M. Favoni</string-name>, <string-name>A. Ipp</string-name>, <string-name>D. I. Müller</string-name>, and <string-name>D. Schuh</string-name></person-group>, <article-title>Lattice gauge equivariant convolutional neural networks</article-title>, <pub-id pub-id-type=\"arxiv\">arXiv:2012.12901</pub-id>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "label": "21",
          "title": {
            "title": "Lattice gauge equivariant convolutional neural networks"
          },
          "authors": [
            {
              "full_name": "Favoni, M.",
              "inspire_role": "author"
            },
            {
              "full_name": "Ipp, A.",
              "inspire_role": "author"
            },
            {
              "full_name": "Müller, D.I.",
              "inspire_role": "author"
            },
            {
              "full_name": "Schuh, D.",
              "inspire_role": "author"
            }
          ],
          "arxiv_eprint": "2012.12901"
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1700994"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c22\"><label>[22]</label><mixed-citation publication-type=\"journal\"><object-id>22</object-id><person-group person-group-type=\"author\"><string-name>K. Zhou</string-name>, <string-name>G. Endrődi</string-name>, <string-name>L.-G. Pang</string-name>, and <string-name>H. Stöcker</string-name></person-group>, <article-title>Regressive and generative neural networks for scalar field theory</article-title>, <source>Phys. Rev. D</source> <volume>100</volume>, <page-range>011501</page-range> (<year>2019</year>).<pub-id pub-id-type=\"coden\">PRVDAQ</pub-id><issn>2470-0010</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1103/PhysRevD.100.011501</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevD.100.011501"
          ],
          "label": "22",
          "title": {
            "title": "Regressive and generative neural networks for scalar field theory"
          },
          "authors": [
            {
              "full_name": "Zhou, K.",
              "inspire_role": "author"
            },
            {
              "full_name": "Endrődi, G.",
              "inspire_role": "author"
            },
            {
              "full_name": "Pang, L.-G.",
              "inspire_role": "author"
            },
            {
              "full_name": "Stöcker, H.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2019,
            "artid": "011501",
            "journal_title": "Phys.Rev.D",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1613970"
            },
            "journal_volume": "100"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1599848"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c23\"><label>[23]</label><mixed-citation publication-type=\"journal\"><object-id>23</object-id><person-group person-group-type=\"author\"><string-name>S. J. Wetzel</string-name> and <string-name>M. Scherzer</string-name></person-group>, <article-title>Machine learning of explicit order parameters: From the Ising model to SU(2) lattice gauge theory</article-title>, <source>Phys. Rev. B</source> <volume>96</volume>, <page-range>184410</page-range> (<year>2017</year>).<pub-id pub-id-type=\"coden\">PRBMDO</pub-id><issn>2469-9950</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1103/PhysRevB.96.184410</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevB.96.184410"
          ],
          "label": "23",
          "title": {
            "title": "Machine learning of explicit order parameters: From the Ising model to SU(2) lattice gauge theory"
          },
          "authors": [
            {
              "full_name": "Wetzel, S.J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Scherzer, M.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2017,
            "artid": "184410",
            "journal_title": "Phys.Rev.B",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1613968"
            },
            "journal_volume": "96"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1804513"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c24\"><label>[24]</label><mixed-citation publication-type=\"journal\"><object-id>24</object-id><person-group person-group-type=\"author\"><string-name>D. Bachtis</string-name>, <string-name>G. Aarts</string-name>, and <string-name>B. Lucini</string-name></person-group>, <article-title>Mapping distinct phase transitions to a neural network</article-title>, <source>Phys. Rev. E</source> <volume>102</volume>, <page-range>053306</page-range> (<year>2020</year>).<pub-id pub-id-type=\"coden\">PRESCM</pub-id><issn>2470-0045</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1103/PhysRevE.102.053306</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevE.102.053306"
          ],
          "label": "24",
          "title": {
            "title": "Mapping distinct phase transitions to a neural network"
          },
          "authors": [
            {
              "full_name": "Bachtis, D.",
              "inspire_role": "author"
            },
            {
              "full_name": "Aarts, G.",
              "inspire_role": "author"
            },
            {
              "full_name": "Lucini, B.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2020,
            "artid": "053306",
            "journal_title": "Phys.Rev.E",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1613971"
            },
            "journal_volume": "102"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1793473"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c25\"><label>[25]</label><mixed-citation publication-type=\"journal\"><object-id>25</object-id><person-group person-group-type=\"author\"><string-name>D. Bachtis</string-name>, <string-name>G. Aarts</string-name>, and <string-name>B. Lucini</string-name></person-group>, <article-title>Extending machine learning classification capabilities with histogram reweighting</article-title>, <source>Phys. Rev. E</source> <volume>102</volume>, <page-range>033303</page-range> (<year>2020</year>).<pub-id pub-id-type=\"coden\">PRESCM</pub-id><issn>2470-0045</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1103/PhysRevE.102.033303</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevE.102.033303"
          ],
          "label": "25",
          "title": {
            "title": "Extending machine learning classification capabilities with histogram reweighting"
          },
          "authors": [
            {
              "full_name": "Bachtis, D.",
              "inspire_role": "author"
            },
            {
              "full_name": "Aarts, G.",
              "inspire_role": "author"
            },
            {
              "full_name": "Lucini, B.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2020,
            "artid": "033303",
            "journal_title": "Phys.Rev.E",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1613971"
            },
            "journal_volume": "102"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1783730"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c26\"><label>[26]</label><mixed-citation publication-type=\"journal\"><object-id>26</object-id><person-group person-group-type=\"author\"><string-name>S. Blücher</string-name>, <string-name>L. Kades</string-name>, <string-name>J. M. Pawlowski</string-name>, <string-name>N. Strodthoff</string-name>, and <string-name>J. M. Urban</string-name></person-group>, <article-title>Towards novel insights in lattice field theory with explainable machine learning</article-title>, <source>Phys. Rev. D</source> <volume>101</volume>, <page-range>094507</page-range> (<year>2020</year>).<pub-id pub-id-type=\"coden\">PRVDAQ</pub-id><issn>2470-0010</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1103/PhysRevD.101.094507</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevD.101.094507"
          ],
          "label": "26",
          "title": {
            "title": "Towards novel insights in lattice field theory with explainable machine learning"
          },
          "authors": [
            {
              "full_name": "Blücher, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Kades, L.",
              "inspire_role": "author"
            },
            {
              "full_name": "Pawlowski, J.M.",
              "inspire_role": "author"
            },
            {
              "full_name": "Strodthoff, N.",
              "inspire_role": "author"
            },
            {
              "full_name": "Urban, J.M.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2020,
            "artid": "094507",
            "journal_title": "Phys.Rev.D",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1613970"
            },
            "journal_volume": "101"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c27\"><label>[27]</label><mixed-citation publication-type=\"eprint\"><object-id>27</object-id><person-group person-group-type=\"author\"><string-name>K. Padavala</string-name>, <string-name>A. Singh</string-name>, and <string-name>J. Kundu</string-name></person-group>, <article-title>Machine learned phase transitions in a system of anisotropic particles on a square lattice</article-title>, <pub-id pub-id-type=\"arxiv\">arXiv:2102.03006</pub-id>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "label": "27",
          "title": {
            "title": "Machine learned phase transitions in a system of anisotropic particles on a square lattice"
          },
          "authors": [
            {
              "full_name": "Padavala, K.",
              "inspire_role": "author"
            },
            {
              "full_name": "Singh, A.",
              "inspire_role": "author"
            },
            {
              "full_name": "Kundu, J.",
              "inspire_role": "author"
            }
          ],
          "arxiv_eprint": "2102.03006"
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c28\"><label>[28]</label><mixed-citation publication-type=\"eprint\"><object-id>28</object-id><person-group person-group-type=\"author\"><string-name>Y. Wang</string-name>, <string-name>Z. Cao</string-name>, and <string-name>A. B. Farimani</string-name></person-group>, <article-title>Deep reinforcement learning optimizes graphene nanopores for efficient desalination</article-title>, <pub-id pub-id-type=\"arxiv\">arXiv:2101.07399</pub-id>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "label": "28",
          "title": {
            "title": "Deep reinforcement learning optimizes graphene nanopores for efficient desalination"
          },
          "authors": [
            {
              "full_name": "Wang, Y.",
              "inspire_role": "author"
            },
            {
              "full_name": "Cao, Z.",
              "inspire_role": "author"
            },
            {
              "full_name": "Farimani, A.B.",
              "inspire_role": "author"
            }
          ],
          "arxiv_eprint": "2101.07399"
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c29\"><label>[29]</label><mixed-citation publication-type=\"eprint\"><object-id>29</object-id><person-group person-group-type=\"author\"><string-name>K. Zhang</string-name>, <string-name>S. Lederer</string-name>, <string-name>K. Choo</string-name>, <string-name>T. Neupert</string-name>, <string-name>G. Carleo</string-name>, and <string-name>E.-A. Kim</string-name></person-group>, <article-title>Hamiltonian reconstruction as metric for variational studies</article-title>, <pub-id pub-id-type=\"arxiv\">arXiv:2102.00019</pub-id>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "label": "29",
          "title": {
            "title": "Hamiltonian reconstruction as metric for variational studies"
          },
          "authors": [
            {
              "full_name": "Zhang, K.",
              "inspire_role": "author"
            },
            {
              "full_name": "Lederer, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Choo, K.",
              "inspire_role": "author"
            },
            {
              "full_name": "Neupert, T.",
              "inspire_role": "author"
            },
            {
              "full_name": "Carleo, G.",
              "inspire_role": "author"
            },
            {
              "full_name": "Kim, E.-A.",
              "inspire_role": "author"
            }
          ],
          "arxiv_eprint": "2102.00019"
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c30\"><label>[30]</label><mixed-citation publication-type=\"proc\"><object-id>30</object-id><person-group person-group-type=\"author\"><string-name>T. Akiba</string-name>, <string-name>S. Sano</string-name>, <string-name>T. Yanase</string-name>, <string-name>T. Ohta</string-name>, and <string-name>M. Koyama</string-name></person-group>, <article-title>Optuna: A next-generation hyperparameter optimization framework</article-title>, in <source>Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, Association for Computing Machinery, 2019</source> (<publisher-name>Association for Computing Machinery</publisher-name>, New York, NY, USA; Anchorage, AK, USA, <year>2019</year>), pp. <page-range>2623–2631</page-range>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, Association for Computing Machinery, 2019 (New York, NY, USA; Anchorage, AK, USA)"
          ],
          "label": "30",
          "title": {
            "title": "Optuna: A next-generation hyperparameter optimization framework"
          },
          "authors": [
            {
              "full_name": "Akiba, T.",
              "inspire_role": "author"
            },
            {
              "full_name": "Sano, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Yanase, T.",
              "inspire_role": "author"
            },
            {
              "full_name": "Ohta, T.",
              "inspire_role": "author"
            },
            {
              "full_name": "Koyama, M.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "Association for Computing Machinery"
          },
          "publication_info": {
            "year": 2019,
            "page_end": "2631",
            "page_start": "2623"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c31\"><label>[31]</label><mixed-citation publication-type=\"journal\"><object-id>31</object-id><person-group person-group-type=\"author\"><string-name>E. Noether</string-name></person-group>, <article-title>Invariante Variationsprobleme, Nachrichten von der Gesellschaft der Wissenschaften zu Göttingen</article-title>, <source>Math.-Phys. Kl.</source> <volume>1918</volume>, <page-range>235</page-range> (<year>1918</year>), <ext-link ext-link-type=\"uri\" href=\"http://eudml.org/doc/59024\">http://eudml.org/doc/59024</ext-link>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "http://eudml.org/doc/59024"
          ],
          "label": "31",
          "title": {
            "title": "Invariante Variationsprobleme, Nachrichten von der Gesellschaft der Wissenschaften zu Göttingen"
          },
          "authors": [
            {
              "full_name": "Noether, E.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 1918,
            "artid": "235",
            "page_start": "235",
            "journal_title": "Math.-Phys. Kl.",
            "journal_volume": "1918"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1118274"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c32\"><label>[32]</label><mixed-citation publication-type=\"journal\"><object-id>32</object-id><person-group person-group-type=\"author\"><string-name>C. Gattringer</string-name> and <string-name>T. Kloiber</string-name></person-group>, <article-title>Lattice study of the Silver Blaze phenomenon for a charged scalar <inline-formula><math display=\"inline\"><msup><mi>ϕ</mi><mn>4</mn></msup></math></inline-formula> field</article-title>, <source>Nucl. Phys.</source> <volume>B869</volume>, <page-range>56</page-range> (<year>2013</year>).<pub-id pub-id-type=\"coden\">NUPBBO</pub-id><issn>0550-3213</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1016/j.nuclphysb.2012.12.005</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1016/j.nuclphysb.2012.12.005"
          ],
          "label": "32",
          "title": {
            "title": "Lattice study of the Silver Blaze phenomenon for a charged scalar ϕ^4 field"
          },
          "authors": [
            {
              "full_name": "Gattringer, C.",
              "inspire_role": "author"
            },
            {
              "full_name": "Kloiber, T.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2013,
            "artid": "56",
            "page_start": "56",
            "journal_title": "Nucl.Phys.",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1214548"
            },
            "journal_volume": "B869"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/581060"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c33\"><label>[33]</label><mixed-citation publication-type=\"journal\"><object-id>33</object-id><person-group person-group-type=\"author\"><string-name>N. Prokof’ev</string-name> and <string-name>B. Svistunov</string-name></person-group>, <article-title>Worm Algorithms for Classical Statistical Models</article-title>, <source>Phys. Rev. Lett.</source> <volume>87</volume>, <page-range>160601</page-range> (<year>2001</year>).<pub-id pub-id-type=\"coden\">PRLTAO</pub-id><issn>0031-9007</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1103/PhysRevLett.87.160601</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevLett.87.160601"
          ],
          "label": "33",
          "title": {
            "title": "Worm Algorithms for Classical Statistical Models"
          },
          "authors": [
            {
              "full_name": "Prokof'ev, N.",
              "inspire_role": "author"
            },
            {
              "full_name": "Svistunov, B.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2001,
            "artid": "160601",
            "journal_title": "Phys.Rev.Lett.",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1214495"
            },
            "journal_volume": "87"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/2731270"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c34\"><label>[34]</label><mixed-citation publication-type=\"journal\"><object-id>34</object-id><person-group person-group-type=\"author\"><string-name>G. Cybenko</string-name></person-group>, <article-title>Approximation by superpositions of a sigmoidal function</article-title>, <source>Math. Control Signals Syst.</source> <volume>2</volume>, <page-range>303</page-range> (<year>1989</year>).<pub-id pub-id-type=\"coden\">MCSYE8</pub-id><issn>0932-4194</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1007/BF02551274</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1007/BF02551274"
          ],
          "label": "34",
          "title": {
            "title": "Approximation by superpositions of a sigmoidal function"
          },
          "authors": [
            {
              "full_name": "Cybenko, G.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 1989,
            "artid": "303",
            "page_start": "303",
            "journal_title": "Math.Control Signals Syst.",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1212869"
            },
            "journal_volume": "2"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c35\"><label>[35]</label><mixed-citation publication-type=\"journal\"><object-id>35</object-id><person-group person-group-type=\"author\"><string-name>Z. Lu</string-name>, <string-name>H. Pu</string-name>, <string-name>F. Wang</string-name>, <string-name>Z. Hu</string-name>, and <string-name>L. Wang</string-name></person-group>, <article-title>The expressive power of neural networks: A view from the width</article-title>, <source>Adv. Neural Inf. Process. Syst.</source> <volume>30</volume> (<year>2017</year>), <ext-link ext-link-type=\"uri\" href=\"https://papers.nips.cc/paper/2017/hash/32cbf687880eb1674a07bf717761dd3a-Abstract.html\">https://papers.nips.cc/paper/2017/hash/32cbf687880eb1674a07bf717761dd3a-Abstract.html</ext-link>.<issn>1049-5258</issn></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "https://papers.nips.cc/paper/2017/hash/32cbf687880eb1674a07bf717761dd3a-Abstract.html"
          ],
          "label": "35",
          "title": {
            "title": "The expressive power of neural networks: A view from the width"
          },
          "authors": [
            {
              "full_name": "Lu, Z.",
              "inspire_role": "author"
            },
            {
              "full_name": "Pu, H.",
              "inspire_role": "author"
            },
            {
              "full_name": "Wang, F.",
              "inspire_role": "author"
            },
            {
              "full_name": "Hu, Z.",
              "inspire_role": "author"
            },
            {
              "full_name": "Wang, L.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2017,
            "journal_title": "Adv.Neural Inf.Process.Syst.",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1213182"
            },
            "journal_volume": "30"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c36\"><label>[36]</label><mixed-citation publication-type=\"journal\"><object-id>36</object-id><person-group person-group-type=\"author\"><string-name>A. Paszke</string-name> <etal/></person-group>, <article-title><sc>p</sc>y<sc>t</sc>orch: An imperative style, high-performance deep learning library</article-title>, <source>Adv. Neural Inf. Process Syst.</source> <volume>32</volume> (<year>2019</year>), <ext-link ext-link-type=\"uri\" href=\"https://papers.nips.cc/paper/2019/hash/bdbca288fee7f92f2bfa9f7012727740-Abstract.html\">https://papers.nips.cc/paper/2019/hash/bdbca288fee7f92f2bfa9f7012727740-Abstract.html</ext-link>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "https://papers.nips.cc/paper/2019/hash/bdbca288fee7f92f2bfa9f7012727740-Abstract.html"
          ],
          "label": "36",
          "title": {
            "title": "PyTorch: An imperative style, high-performance deep learning library"
          },
          "authors": [
            {
              "full_name": "Paszke, A.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2019,
            "journal_title": "Adv.Neural Inf.Process.Syst.",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1213182"
            },
            "journal_volume": "32"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c37\"><label>[37]</label><mixed-citation publication-type=\"proc\"><object-id>37</object-id><person-group person-group-type=\"author\"><string-name>F. Yu</string-name> and <string-name>V. Koltun</string-name></person-group>, <article-title>Multi-scale context aggregation by dilated convolutions</article-title>, in <source>Proceedings of the International Conference on Learning Representations (ICLR), 2016</source> (<publisher-name>OpenReview</publisher-name>, San Juan, Puerto Rico, <year>2016</year>).</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the International Conference on Learning Representations (ICLR), 2016 (San Juan, Puerto Rico)"
          ],
          "label": "37",
          "title": {
            "title": "Multi-scale context aggregation by dilated convolutions"
          },
          "authors": [
            {
              "full_name": "Yu, F.",
              "inspire_role": "author"
            },
            {
              "full_name": "Koltun, V.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "OpenReview"
          },
          "publication_info": {
            "year": 2016
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c38\"><label>[38]</label><mixed-citation publication-type=\"proc\"><object-id>38</object-id><person-group person-group-type=\"author\"><string-name>A. L. Maas</string-name>, <string-name>A. Y. Hannun</string-name>, and <string-name>A. Y. Ng</string-name></person-group>, <article-title>Rectifier nonlinearities improve neural network acoustic models</article-title>, in <source>Proceedings of the ICML Workshop on Deep Learning for Audio, Speech and Language Processing, 2013</source> (<publisher-name>ICML</publisher-name>, Atlanta, USA, <year>2013</year>), <ext-link ext-link-type=\"uri\" href=\"https://sites.google.com/site/deeplearningicml2013/relu_hybrid_icml2013_final.pdf\">https://sites.google.com/site/deeplearningicml2013/relu_hybrid_icml2013_final.pdf</ext-link>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the ICML Workshop on Deep Learning for Audio, Speech and Language Processing, 2013 (Atlanta, USA), https://sites.google.com/site/deeplearningicml2013/relu_hybrid_icml2013_final.pdf"
          ],
          "label": "38",
          "title": {
            "title": "Rectifier nonlinearities improve neural network acoustic models"
          },
          "authors": [
            {
              "full_name": "Maas, A.L.",
              "inspire_role": "author"
            },
            {
              "full_name": "Hannun, A.Y.",
              "inspire_role": "author"
            },
            {
              "full_name": "Ng, A.Y.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "ICML"
          },
          "publication_info": {
            "year": 2013
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c39\"><label>[39]</label><mixed-citation publication-type=\"proc\"><object-id>39</object-id><person-group person-group-type=\"author\"><string-name>S. J. Reddi</string-name>, <string-name>S. Kale</string-name>, and <string-name>S. Kumar</string-name></person-group>, <article-title>On the convergence of Adam and beyond</article-title>, in <source>Proceedings of the International Conference on Learning Representations (ICLR), 2018</source> (<publisher-name>ICLR</publisher-name>, Scottsdale, USA, <year>2018</year>).</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the International Conference on Learning Representations (ICLR), 2018 (Scottsdale, USA)"
          ],
          "label": "39",
          "title": {
            "title": "On the convergence of Adam and beyond"
          },
          "authors": [
            {
              "full_name": "Reddi, S.J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Kale, S.",
              "inspire_role": "author"
            },
            {
              "full_name": "Kumar, S.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "ICLR"
          },
          "publication_info": {
            "year": 2018
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c40\"><label>[40]</label><mixed-citation publication-type=\"proc\"><object-id>40</object-id><person-group person-group-type=\"author\"><string-name>I. Loshchilov</string-name> and <string-name>F. Hutter</string-name></person-group>, <article-title>Fixing weight decay regularization in Adam</article-title>, in <source>Proceedings of the International Conference on Learning Representations (ICLR), 2019</source> (<publisher-name>OpenReview</publisher-name>, New Orleans, USA, <year>2019</year>).</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "in Proceedings of the International Conference on Learning Representations (ICLR), 2019 (New Orleans, USA)"
          ],
          "label": "40",
          "title": {
            "title": "Fixing weight decay regularization in Adam"
          },
          "authors": [
            {
              "full_name": "Loshchilov, I.",
              "inspire_role": "author"
            },
            {
              "full_name": "Hutter, F.",
              "inspire_role": "author"
            }
          ],
          "imprint": {
            "publisher": "OpenReview"
          },
          "publication_info": {
            "year": 2019
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/622900"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c41\"><label>[41]</label><mixed-citation publication-type=\"journal\"><object-id>41</object-id><person-group person-group-type=\"author\"><string-name>T. D. Cohen</string-name></person-group>, <article-title>Functional Integrals for QCD at Nonzero Chemical Potential and Zero Density</article-title>, <source>Phys. Rev. Lett.</source> <volume>91</volume>, <page-range>222001</page-range> (<year>2003</year>).<pub-id pub-id-type=\"coden\">PRLTAO</pub-id><issn>0031-9007</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1103/PhysRevLett.91.222001</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1103/PhysRevLett.91.222001"
          ],
          "label": "41",
          "title": {
            "title": "Functional Integrals for QCD at Nonzero Chemical Potential and Zero Density"
          },
          "authors": [
            {
              "full_name": "Cohen, T.D.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2003,
            "artid": "222001",
            "journal_title": "Phys.Rev.Lett.",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1214495"
            },
            "journal_volume": "91"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1207597"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c42\"><label>[42]</label><mixed-citation publication-type=\"journal\"><object-id>42</object-id><person-group person-group-type=\"author\"><string-name>C. Gattringer</string-name> and <string-name>T. Kloiber</string-name></person-group>, <article-title>Spectroscopy in finite density lattice field theory: An exploratory study in the relativistic bose gas</article-title>, <source>Phys. Lett. B</source> <volume>720</volume>, <page-range>210</page-range> (<year>2013</year>).<pub-id pub-id-type=\"coden\">PYLBAJ</pub-id><issn>0370-2693</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1016/j.physletb.2013.01.068</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1016/j.physletb.2013.01.068"
          ],
          "label": "42",
          "title": {
            "title": "Spectroscopy in finite density lattice field theory: An exploratory study in the relativistic bose gas"
          },
          "authors": [
            {
              "full_name": "Gattringer, C.",
              "inspire_role": "author"
            },
            {
              "full_name": "Kloiber, T.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2013,
            "artid": "210",
            "page_start": "210",
            "journal_title": "Phys.Lett.B",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1613966"
            },
            "journal_volume": "720"
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1424850"
        },
        "raw_refs": [
          {
            "value": "<ref id=\"c43\"><label>[43]</label><mixed-citation publication-type=\"journal\"><object-id>43</object-id><person-group person-group-type=\"author\"><string-name>T. Rindlisbacher</string-name>, <string-name>O. Åkerlund</string-name>, and <string-name>P. de Forcrand</string-name></person-group>, <article-title>Sampling of general correlators in worm-algorithm based simulations</article-title>, <source>Nucl. Phys.</source> <volume>B909</volume>, <page-range>542</page-range> (<year>2016</year>).<pub-id pub-id-type=\"coden\">NUPBBO</pub-id><issn>0550-3213</issn><pub-id pub-id-type=\"doi\" specific-use=\"suppress-display\">10.1016/j.nuclphysb.2016.05.026</pub-id></mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "dois": [
            "10.1016/j.nuclphysb.2016.05.026"
          ],
          "label": "43",
          "title": {
            "title": "Sampling of general correlators in worm-algorithm based simulations"
          },
          "authors": [
            {
              "full_name": "Rindlisbacher, T.",
              "inspire_role": "author"
            },
            {
              "full_name": "Åkerlund, O.",
              "inspire_role": "author"
            },
            {
              "full_name": "de Forcrand, P.",
              "inspire_role": "author"
            }
          ],
          "publication_info": {
            "year": 2016,
            "artid": "542",
            "page_start": "542",
            "journal_title": "Nucl.Phys.",
            "journal_record": {
              "$ref": "https://inspirehep.net/api/journals/1214548"
            },
            "journal_volume": "B909"
          }
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c44\"><label>[44]</label><mixed-citation publication-type=\"eprint\"><object-id>44</object-id><person-group person-group-type=\"author\"><string-name>G. Gao</string-name>, <string-name>J. Gao</string-name>, <string-name>Q. Liu</string-name>, <string-name>Q. Wang</string-name>, and <string-name>Y. Wang</string-name></person-group>, <article-title>CNN-based density estimation and crowd counting: A survey</article-title>, <pub-id pub-id-type=\"arxiv\">arXiv:2003.12783</pub-id>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "label": "44",
          "title": {
            "title": "CNN-based density estimation and crowd counting: A survey"
          },
          "authors": [
            {
              "full_name": "Gao, G.",
              "inspire_role": "author"
            },
            {
              "full_name": "Gao, J.",
              "inspire_role": "author"
            },
            {
              "full_name": "Liu, Q.",
              "inspire_role": "author"
            },
            {
              "full_name": "Wang, Q.",
              "inspire_role": "author"
            },
            {
              "full_name": "Wang, Y.",
              "inspire_role": "author"
            }
          ],
          "arxiv_eprint": "2003.12783"
        }
      },
      {
        "raw_refs": [
          {
            "value": "<ref id=\"c45\"><label>[45]</label><mixed-citation publication-type=\"misc\"><object-id>45</object-id>See <ext-link ext-link-type=\"uri\" href=\"https://gitlab.com/openpixi/scalar_ml\">https://gitlab.com/openpixi/scalar_ml</ext-link>.</mixed-citation></ref>",
            "schema": "JATS",
            "source": "APS"
          }
        ],
        "reference": {
          "misc": [
            "See https://gitlab.com/openpixi/scalar_ml"
          ],
          "label": "45"
        }
      }
    ],
    "public_notes": [
      {
        "value": "28 pages, 20 figures, v3: equivalent to the version published in PRD",
        "source": "arXiv"
      }
    ],
    "arxiv_eprints": [
      {
        "value": "2103.14686",
        "categories": [
          "hep-lat",
          "cs.LG",
          "hep-ph",
          "stat.ML"
        ]
      }
    ],
    "document_type": [
      "article"
    ],
    "preprint_date": "2021-03-26",
    "control_number": 1854165,
    "legacy_version": "20210501100327.0",
    "number_of_pages": 28,
    "inspire_categories": [
      {
        "term": "Lattice",
        "source": "arxiv"
      },
      {
        "term": "Computing",
        "source": "arxiv"
      },
      {
        "term": "Phenomenology-HEP",
        "source": "arxiv"
      },
      {
        "term": "Other",
        "source": "arxiv"
      },
      {
        "term": "Lattice"
      },
      {
        "term": "Computing"
      },
      {
        "term": "Phenomenology-HEP"
      },
      {
        "term": "Other"
      }
    ],
    "legacy_creation_date": "2021-03-30"
  },
  "updated": "2026-02-09T11:50:32.905225+00:00",
  "created": "2021-03-30T00:00:00+00:00"
}