Adaptive energy reference for machine-learning models of the electronic density of states


JSON Export

{
  "revision": 3, 
  "id": "2397", 
  "created": "2024-10-11T13:01:55.842032+00:00", 
  "metadata": {
    "doi": "10.24435/materialscloud:y6-m4", 
    "status": "published", 
    "title": "Adaptive energy reference for machine-learning models of the electronic density of states", 
    "mcid": "2024.158", 
    "license_addendum": null, 
    "_files": [
      {
        "description": "Dataset and scripts necessary to reproduce the results of the paper", 
        "key": "dataset.tar.gz", 
        "size": 5398315550, 
        "checksum": "md5:35bc9589b6102e93910f16e7db607054"
      }
    ], 
    "owner": 1382, 
    "_oai": {
      "id": "oai:materialscloud.org:2397"
    }, 
    "keywords": [
      "ERC", 
      "MARVEL", 
      "SNSF", 
      "machine learning", 
      "electronic structure", 
      "density of states", 
      "EPFL"
    ], 
    "conceptrecid": "2248", 
    "is_last": false, 
    "references": [
      {
        "type": "Preprint", 
        "doi": "10.48550/arXiv.2407.01068", 
        "url": "https://doi.org/10.48550/arXiv.2407.01068", 
        "comment": "Paper in which the data is used", 
        "citation": "W. B. How, S. Chong, F. Grasselli, K. K. Huguenin-Dumittan, M. Ceriotti, arXiv (2024)"
      }
    ], 
    "publication_date": "Oct 11, 2024, 15:32:25", 
    "license": "Creative Commons Attribution 4.0 International", 
    "id": "2397", 
    "description": "The electronic density of states (DOS) provides information regarding the distribution of electronic states in a material, and can be used to approximate its optical and electronic properties and therefore guide computational material design. Given its usefulness and relative simplicity, it has been one of the first electronic properties used as a target for machine-learning approaches going beyond interatomic potentials. A subtle but important point, well-appreciated in the condensed matter community but usually overlooked in the construction of data-driven models, is that for bulk configurations the absolute energy reference of single-particle energy levels is ill-defined. Only energy differences matter, and quantities derived from the DOS are typically independent of the absolute alignment. We introduce an adaptive scheme that optimizes the energy reference of each structure as part of training, and show that it consistently improves the quality of ML models compared to traditional choices of energy reference, for different classes of materials and different model architectures. On a practical level, we trace the improved performance to the ability of this self-aligning scheme to match the most prominent features in the DOS. More broadly, we believe that this work highlights the importance of incorporating insights into the nature of the physical target into the definition of the architecture and of the appropriate figures of merit for machine-learning models, that translate into better transferability and overall performance.\nThis record contains all the necessary data files and scripts to support the results presented in the paper with the same title.", 
    "version": 2, 
    "contributors": [
      {
        "email": "weibin.how@epfl.ch", 
        "affiliations": [
          "Laboratory of Computational Science and Modeling (COSMO), IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), 1015 Lausanne, Switzerland"
        ], 
        "familyname": "How", 
        "givennames": "Wei Bin"
      }, 
      {
        "email": "sanggyu.chong@epfl.ch", 
        "affiliations": [
          "Laboratory of Computational Science and Modeling (COSMO), IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), 1015 Lausanne, Switzerland"
        ], 
        "familyname": "Chong", 
        "givennames": "Sanggyu"
      }, 
      {
        "email": "federico.grasselli@epfl.ch", 
        "affiliations": [
          "Laboratory of Computational Science and Modeling (COSMO), IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), 1015 Lausanne, Switzerland"
        ], 
        "familyname": "Grasselli", 
        "givennames": "Federico"
      }, 
      {
        "email": "kevin.huguenin-dumittan@epfl.ch", 
        "affiliations": [
          "Laboratory of Computational Science and Modeling (COSMO), IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), 1015 Lausanne, Switzerland"
        ], 
        "familyname": "Huguenin-Dumittan", 
        "givennames": "Kevin K."
      }, 
      {
        "email": "michele.ceriotti@epfl.ch", 
        "affiliations": [
          "Laboratory of Computational Science and Modeling (COSMO), IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), 1015 Lausanne, Switzerland"
        ], 
        "familyname": "Ceriotti", 
        "givennames": "Michele"
      }
    ], 
    "edited_by": 576
  }, 
  "updated": "2024-10-25T17:07:27.247893+00:00"
}