Database of scalable training of neural network potentials for complex interfaces through data augmentation


JSON Export

{
  "revision": 10, 
  "id": "2619", 
  "created": "2025-03-30T18:03:32.109740+00:00", 
  "metadata": {
    "doi": "10.24435/materialscloud:w6-9a", 
    "status": "published", 
    "title": "Database of scalable training of neural network potentials for complex interfaces through data augmentation", 
    "mcid": "2025.51", 
    "license_addendum": null, 
    "_files": [
      {
        "description": "Description of the dataset", 
        "key": "README.txt", 
        "size": 15393500, 
        "checksum": "md5:02fd7bde8f16958144845121ba163d86"
      }, 
      {
        "description": "ANN training data in XSF format used for H\u2082 molecule example (Total number: 403)", 
        "key": "1_H2_xsf.tar.bz2", 
        "size": 12697, 
        "checksum": "md5:0aa065a05906aabb4a8d5c1fd992e50a"
      }, 
      {
        "description": "ANN training data in XSF format used for EC dimer example (Total number: 181,000)", 
        "key": "2_EC-EC_xsf.tar.bz2", 
        "size": 160212576, 
        "checksum": "md5:12c48fdeabada0f3483e296397c811ba"
      }, 
      {
        "description": "ANN training data in XSF format used for EC on Li surface example (Total number: 68,000)", 
        "key": "3_Li-EC-surface_xsf.tar.bz2", 
        "size": 134492502, 
        "checksum": "md5:6a1ce0f80ef1bf7899eb2a831656d8b4"
      }, 
      {
        "description": "ANN training data in XSF format used for Li-EC interface example (Total number: 80,768)", 
        "key": "4_Li-EC-interfaces_xsf.tar.bz2", 
        "size": 155118490, 
        "checksum": "md5:05f3542df4fa980c62dad03f01456a23"
      }
    ], 
    "owner": 1721, 
    "_oai": {
      "id": "oai:materialscloud.org:2619"
    }, 
    "keywords": [
      "first principles", 
      "machine learning", 
      "Li metal battery", 
      "potential energy surface", 
      "aenet", 
      "data augmentation"
    ], 
    "conceptrecid": "2618", 
    "is_last": true, 
    "references": [
      {
        "type": "Preprint", 
        "doi": "10.48550/arXiv.2412.05773", 
        "url": "https://arxiv.org/abs/2412.05773", 
        "comment": "Preprint where the data is discussed", 
        "citation": "IW Yeu, A Stuke, J L\u00f3pez-Zorrilla, JM Stevenson, DR Reichman, RA Friesner, A Urban, N Artrith, arXiv:2412.05773"
      }
    ], 
    "publication_date": "Apr 02, 2025, 18:03:37", 
    "license": "Creative Commons Attribution 4.0 International", 
    "id": "2619", 
    "description": "This database contains the reference data used for direct force training of Artificial Neural Network (ANN) interatomic potentials using the atomic energy network (\u00e6net) and \u00e6net-PyTorch packages (https://github.com/atomisticnet/aenet-PyTorch). It also includes the GPR-augmented data used for indirect force training via Gaussian Process Regression (GPR) surrogate models using the \u00e6net-GPR package (https://github.com/atomisticnet/aenet-gpr).\nEach data file contains atomic structures, energies, and atomic forces in XCrySDen Structure Format (XSF). The dataset includes all reference training/test data and corresponding GPR-augmented data used in the four benchmark examples presented in the reference paper, \u201cScalable Training of Neural Network Potentials for Complex Interfaces Through Data Augmentation\u201d.\nA hierarchy of the dataset is described in the README.txt file, and an overview of the dataset is also summarized in supplementary Table S1 of the reference paper.", 
    "version": 1, 
    "contributors": [
      {
        "email": "iy2185@columbia.edu", 
        "affiliations": [
          "Department of Chemical Engineering, Columbia University, New York, NY, USA", 
          "Columbia Center for Computational Electrochemistry, Columbia University, New York, NY, USA"
        ], 
        "familyname": "Yeu", 
        "givennames": "In Won"
      }, 
      {
        "email": "as6394@columbia.edu", 
        "affiliations": [
          "Department of Chemical Engineering, Columbia University, New York, NY, USA", 
          "Columbia Center for Computational Electrochemistry, Columbia University, New York, NY, USA"
        ], 
        "familyname": "Stuke", 
        "givennames": "Annika"
      }, 
      {
        "email": "au2229@columbia.edu", 
        "affiliations": [
          "Department of Chemical Engineering, Columbia University, New York, NY, USA", 
          "Columbia Center for Computational Electrochemistry, Columbia University, New York, NY, USA", 
          "Columbia Electrochemical Energy Center, Columbia University, New York, NY, USA"
        ], 
        "familyname": "Urban", 
        "givennames": "Alexander"
      }, 
      {
        "email": "n.artrith@uu.nl", 
        "affiliations": [
          "Columbia Center for Computational Electrochemistry, Columbia University, New York, NY, USA", 
          "Debye Institute for Nanomaterials Science, Utrecht University, 3584 CS Utrecht, The Netherlands"
        ], 
        "familyname": "Artrith", 
        "givennames": "Nongnuch"
      }
    ], 
    "edited_by": 576
  }, 
  "updated": "2025-04-02T16:03:38.014449+00:00"
}