{
  "revision_id": 94,
  "created": "2015-12-07T00:00:00+00:00",
  "links": {
    "bibtex": "https://inspirehep.net/api/literature/1408296?format=bibtex",
    "latex-eu": "https://inspirehep.net/api/literature/1408296?format=latex-eu",
    "latex-us": "https://inspirehep.net/api/literature/1408296?format=latex-us",
    "json": "https://inspirehep.net/api/literature/1408296?format=json",
    "json-expanded": "https://inspirehep.net/api/literature/1408296?format=json-expanded",
    "cv": "https://inspirehep.net/api/literature/1408296?format=cv",
    "citations": "https://inspirehep.net/api/literature/?q=refersto%3Arecid%3A1408296"
  },
  "id": "1408296",
  "uuid": "af35a277-6377-4a55-8c3f-c952c95dcc0b",
  "metadata": {
    "documents": [
      {
        "key": "9634fa18e43e264cb26f181a482106a9",
        "url": "https://inspirehep.net/files/9634fa18e43e264cb26f181a482106a9",
        "source": "PoS",
        "filename": "PoS(LATTICE 2015)022.pdf",
        "fulltext": true
      }
    ],
    "citation_count_without_self_citations": 0,
    "publication_info": [
      {
        "cnum": "C15-07-14",
        "year": 2016,
        "artid": "022",
        "page_start": "022",
        "journal_title": "PoS",
        "parent_record": {
          "$ref": "https://inspirehep.net/api/literature/1391574"
        },
        "journal_record": {
          "$ref": "https://inspirehep.net/api/journals/1213080"
        },
        "journal_volume": "LATTICE2015",
        "conference_record": {
          "$ref": "https://inspirehep.net/api/conferences/1323575"
        }
      }
    ],
    "citation_count": 0,
    "core": true,
    "dois": [
      {
        "value": "10.22323/1.251.0022"
      }
    ],
    "urls": [
      {
        "value": "http://pos.sissa.it/archive/conferences/251/022/LATTICE%202015_022.pdf",
        "description": "PoS server"
      }
    ],
    "titles": [
      {
        "title": "Optimizing the domain wall fermion Dirac operator using the R-Stream source-to-source compiler",
        "source": "arXiv"
      }
    ],
    "$schema": "https://inspirehep.net/schemas/records/hep.json",
    "authors": [
      {
        "uuid": "977939ee-a043-4009-ba64-97bdb290a627",
        "record": {
          "$ref": "https://inspirehep.net/api/authors/1049380"
        },
        "full_name": "Lin, Meifeng",
        "affiliations": [
          {
            "value": "Brookhaven Natl. Lab.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/1268258"
            }
          }
        ],
        "signature_block": "LANm",
        "raw_affiliations": [
          {
            "value": "Brookhaven National Laboratory"
          }
        ]
      },
      {
        "uuid": "7b6f3edd-2f84-4653-9f15-404ca55b3e6f",
        "record": {
          "$ref": "https://inspirehep.net/api/authors/2510315"
        },
        "full_name": "Papenhausen, Eric",
        "affiliations": [
          {
            "value": "SUNY, Stony Brook",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/903237"
            }
          }
        ],
        "signature_block": "PAPANASANe",
        "raw_affiliations": [
          {
            "value": "Stony Brook Univeristy"
          }
        ]
      },
      {
        "uuid": "34e4c356-e295-4d71-a104-4409a22be495",
        "record": {
          "$ref": "https://inspirehep.net/api/authors/1020606"
        },
        "full_name": "Langston, M. Harper",
        "signature_block": "LANGSTANm",
        "raw_affiliations": [
          {
            "value": "Reservoir Labs Inc., New York"
          },
          {
            "value": "Reservoir Labs Inc"
          }
        ]
      },
      {
        "uuid": "b1447fe9-5d82-40e3-9a72-58bf9374c9ee",
        "record": {
          "$ref": "https://inspirehep.net/api/authors/2510321"
        },
        "full_name": "Meister, Benoit",
        "signature_block": "MASTARb",
        "raw_affiliations": [
          {
            "value": "Reservoir Labs Inc., New York"
          },
          {
            "value": "Reservoir Labs Inc"
          }
        ]
      },
      {
        "uuid": "22d5e7e5-fabd-4554-bdba-99de13f19ef1",
        "record": {
          "$ref": "https://inspirehep.net/api/authors/2510329"
        },
        "full_name": "Baskaran, Muthu",
        "signature_block": "BASCARANm",
        "raw_affiliations": [
          {
            "value": "Reservoir Labs Inc., New York"
          },
          {
            "value": "Reservoir Labs Inc."
          }
        ]
      },
      {
        "uuid": "2d9ae89e-e920-44d4-89f5-0254e2141a21",
        "record": {
          "$ref": "https://inspirehep.net/api/authors/1004674"
        },
        "full_name": "Izubuchi, Taku",
        "affiliations": [
          {
            "value": "Brookhaven Natl. Lab.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/1268258"
            }
          },
          {
            "value": "RIKEN BNL",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/907483"
            }
          }
        ],
        "signature_block": "ISABACt",
        "raw_affiliations": [
          {
            "value": "Brookhaven National Laboratory"
          }
        ]
      },
      {
        "uuid": "65ed62f5-c4a8-4526-8ea8-d6866b022695",
        "record": {
          "$ref": "https://inspirehep.net/api/authors/1274259"
        },
        "full_name": "Jung, Chulwoo",
        "affiliations": [
          {
            "value": "Brookhaven Natl. Lab.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/1268258"
            }
          },
          {
            "value": "Columbia U.",
            "record": {
              "$ref": "https://inspirehep.net/api/institutions/902749"
            }
          }
        ],
        "signature_block": "JANGc",
        "raw_affiliations": [
          {
            "value": "Brookhaven National Laboratory"
          }
        ]
      }
    ],
    "curated": true,
    "figures": [
      {
        "key": "234960151496375fb8296c109c7c1366",
        "url": "https://inspirehep.net/files/234960151496375fb8296c109c7c1366",
        "source": "arxiv",
        "filename": "wilson_time_implementation.png"
      },
      {
        "key": "199b8b08066a06fa52eefd4bfb3b24b9",
        "url": "https://inspirehep.net/files/199b8b08066a06fa52eefd4bfb3b24b9",
        "source": "arxiv",
        "caption": "Single-node performance for the Wilson Dslash on a $16^4$ lattice. Figure~\\protect\\ref{fig:wilson-all} shows the comparison of wall-clock time for four implementations of the even-odd preconditioned Wilson Dslash on \\texttt{HSW-lired}. Figure~\\protect\\ref{fig:wilson-machine} shows the comparison of wall-clock time for RStream+AVX implementation on three different machines. Timing is averaged over 10 runs, and the error bars show its variance.Caption not extracted",
        "filename": "wilson_avx_machine.png"
      },
      {
        "key": "025be827e94071076f8851a4ed98bf36",
        "url": "https://inspirehep.net/files/025be827e94071076f8851a4ed98bf36",
        "source": "arxiv",
        "filename": "dwf_flops_volume.png"
      },
      {
        "key": "7e577ccff178004afe06a4ebac851e24",
        "url": "https://inspirehep.net/files/7e577ccff178004afe06a4ebac851e24",
        "source": "arxiv",
        "caption": "Single-node performance  for the RStream+AVX implementation of the 4D DWF \\dslash on \\texttt{HSW-lired}. Figure~\\protect\\ref{fig:dwf-volume} shows the performance with different OpenMP threads. Figure~\\protect\\ref{fig:wilson-machine} shows the effect of AVX vectorization on different lattice volumes with one OpenMP thread. Timing is averaged over 10 runs, and the error bars show its variance.Caption not extracted",
        "filename": "dwf_flops_vec.png"
      }
    ],
    "license": [
      {
        "url": "http://arxiv.org/licenses/nonexclusive-distrib/1.0/",
        "imposing": "arXiv"
      },
      {
        "license": "CC-BY-NC-SA",
        "imposing": "SISSA"
      }
    ],
    "texkeys": [
      "Lin:2015vzg"
    ],
    "citeable": true,
    "imprints": [
      {
        "date": "2015-12-04",
        "publisher": "SISSA"
      }
    ],
    "keywords": [
      {
        "value": "operator: Dirac",
        "schema": "INSPIRE"
      },
      {
        "value": "fermion: domain wall",
        "schema": "INSPIRE"
      },
      {
        "value": "fermion: Dirac",
        "schema": "INSPIRE"
      },
      {
        "value": "lattice field theory",
        "schema": "INSPIRE"
      },
      {
        "value": "numerical methods: performance",
        "schema": "INSPIRE"
      },
      {
        "value": "benchmark",
        "schema": "INSPIRE"
      },
      {
        "value": "cluster",
        "schema": "INSPIRE"
      },
      {
        "value": "programming",
        "schema": "INSPIRE"
      }
    ],
    "abstracts": [
      {
        "value": "The application of the Dirac operator on a spinor field, the Dslash operation, is the most computation-intensive part of the lattice QCD simulations. It is often the key kernel to optimize to achieve maximum performance on various platforms. Here we report on a project to optimize the domain wall fermion Dirac operator in Columbia Physics System (CPS) using the R-Stream source-to-source compiler. Our initial target platform is the Intel PC clusters. We discuss the optimization strategies involved before and after the automatic code generation with R-Stream and present some preliminary benchmark results.",
        "source": "arXiv"
      }
    ],
    "references": [
      {
        "reference": {
          "urls": [
            {
              "value": "http://qcdoc.phys.columbia.edu/cps.html"
            }
          ],
          "label": "1"
        }
      },
      {
        "reference": {
          "misc": [
            "R-stream compiler, in Encyclopedia of Parallel Computing, pp. 1756-1765"
          ],
          "label": "2",
          "authors": [
            {
              "full_name": "Meister, B."
            },
            {
              "full_name": "Vasilache, N."
            },
            {
              "full_name": "Wohlford, D."
            },
            {
              "full_name": "Baskaran, M.M."
            },
            {
              "full_name": "Leung, A."
            },
            {
              "full_name": "Lethin, R."
            }
          ],
          "publication_info": {
            "year": 2011
          }
        }
      },
      {
        "reference": {
          "misc": [
            "Some efficient solutions to the affine scheduling problem. Part I. One-dimensional time, International Journal of Parallel Programming 21 , no. 5 313-348"
          ],
          "label": "3",
          "authors": [
            {
              "full_name": "Feautrier, P."
            }
          ],
          "publication_info": {
            "year": 1992
          }
        }
      },
      {
        "reference": {
          "misc": [
            "Lattice-based memory allocation"
          ],
          "label": "4",
          "authors": [
            {
              "full_name": "Darte, A."
            },
            {
              "full_name": "Schreiber, R."
            },
            {
              "full_name": "Villard, G."
            }
          ],
          "publication_info": {
            "year": 2005,
            "page_end": "1257",
            "page_start": "1242",
            "journal_title": "IEEE Trans.Comput.",
            "journal_volume": "54"
          }
        }
      },
      {
        "reference": {
          "misc": [
            "Memory reuse optimizations in the r-stream compiler, in Proceedings of the 6th Annual Workshop on General Purpose Processing with Graphics Processing Units (GPGPU), Houston, TX, USA, January"
          ],
          "label": "5",
          "authors": [
            {
              "full_name": "Vasilache, N."
            },
            {
              "full_name": "Baskaran, M.M."
            },
            {
              "full_name": "Meister, B."
            },
            {
              "full_name": "Lethin, R."
            }
          ],
          "publication_info": {
            "year": 2013
          }
        }
      },
      {
        "reference": {
          "misc": [
            "K and R. Lethin, Polyhedral user mapping and assistant visualizer tool for the r-stream auto-parallelizing compiler, in Proc. VISSOFT, pp. 180-184"
          ],
          "label": "6",
          "authors": [
            {
              "full_name": "Papenhausen, E."
            },
            {
              "full_name": "Wang, B."
            },
            {
              "full_name": "Langston, M.H."
            },
            {
              "full_name": "Baskaran, M."
            },
            {
              "full_name": "Henretty, T."
            },
            {
              "full_name": "Izubuchi, T."
            },
            {
              "full_name": "Johnson, A."
            },
            {
              "full_name": "Jung, C."
            },
            {
              "full_name": "Lin, M."
            },
            {
              "full_name": "Meister, B."
            }
          ],
          "imprint": {
            "publisher": "IEEE"
          },
          "publication_info": {
            "year": 2015
          }
        }
      },
      {
        "record": {
          "$ref": "https://inspirehep.net/api/literature/1409303"
        },
        "reference": {
          "misc": [
            "Grid: A next generation data parallel c++ qcd library"
          ],
          "label": "7",
          "authors": [
            {
              "full_name": "Boyle, P."
            },
            {
              "full_name": "Cossu, G."
            },
            {
              "full_name": "Yamaguchi, A."
            },
            {
              "full_name": "Portelli, A."
            }
          ],
          "publication_info": {
            "year": 2015,
            "artid": "23",
            "page_start": "23",
            "journal_title": "PoS",
            "journal_volume": "LATTICE2015"
          }
        }
      }
    ],
    "public_notes": [
      {
        "value": "7 pages, 4 figures. Proceedings of the 33rd International Symposium on Lattice Field Theory, July 14 -18, 2015, Kobe, Japan",
        "source": "arXiv"
      }
    ],
    "arxiv_eprints": [
      {
        "value": "1512.01542",
        "categories": [
          "hep-lat",
          "physics.comp-ph"
        ]
      }
    ],
    "document_type": [
      "conference paper"
    ],
    "preprint_date": "2015-12-04",
    "control_number": 1408296,
    "legacy_version": "20210519184602.0",
    "number_of_pages": 7,
    "inspire_categories": [
      {
        "term": "Lattice"
      },
      {
        "term": "Computing"
      }
    ],
    "legacy_creation_date": "2015-12-07"
  },
  "updated": "2025-08-04T17:26:10.404632+00:00"
}