Structure-property maps with kernel principal covariates regression


JSON Export

{
  "metadata": {
    "edited_by": 100, 
    "owner": 150, 
    "description": "Data analyses based on linear methods constitute the simplest, most robust, and transparent approaches to the automatic processing of large amounts of data for building supervised or unsupervised machine learning models. Principal covariates regression (PCovR) is an underappreciated method that interpolates between principal component analysis and linear regression, and can be used to conveniently reveal structure-property relations in terms of simple-to-interpret, low-dimensional maps. Here we introduce a kernelized version of PCovR and a sparsified extension, and demonstrate the performance of this approach in revealing and predicting structure-property relations in chemistry and materials science, showing a variety of examples including elemental carbon, porous silicate frameworks, organic molecules, amino acid conformers, and molecular materials.", 
    "keywords": [
      "machine learning", 
      "materials science", 
      "dimensionality reduction", 
      "kernel methods", 
      "MaX", 
      "SNSF", 
      "ERC", 
      "EPFL", 
      "MARVEL/DD1"
    ], 
    "is_last": true, 
    "title": "Structure-property maps with kernel principal covariates regression", 
    "status": "published", 
    "license_addendum": null, 
    "doi": "10.24435/materialscloud:9e-3j", 
    "conceptrecid": "457", 
    "_files": [
      {
        "checksum": "md5:fd7f42bcd62917a994115b7dac03dbf9", 
        "description": "Gzipped TAR archive containing all the datasets used in XYZ format", 
        "key": "datasets.tgz", 
        "size": 107648795
      }, 
      {
        "checksum": "md5:4901d18f01498450fddf70d4f1bd0d9e", 
        "description": "Map created with KPCovR for the Arginine-Dipeptide dataset at alpha=0.55 using the chemiscope.org visualizer JSON format", 
        "key": "arginine-kpcovr-0.55-chemiscope.json.gz", 
        "size": 1163153
      }, 
      {
        "checksum": "md5:8a5d0f6f04c6c26a7c3ce9b3c0668d80", 
        "description": "Map created with KPCovR for the Azaphenacenes dataset at alpha=0.65 using the chemiscope.org visualizer JSON format", 
        "key": "azaphenacenes-kpcovr-0.65-chemiscope.json.gz", 
        "size": 287647
      }, 
      {
        "checksum": "md5:500809d4a4a62b864c1dd42f2c01732c", 
        "description": "Map created with KPCovR for the AIRSS carbon dataset at alpha=0.0 using the chemiscope.org visualizer JSON format", 
        "key": "C-VII-kpcovr-0.0-chemiscope.json.gz", 
        "size": 1632157
      }, 
      {
        "checksum": "md5:1af1bd5df08b2cb21aecdd9885829a51", 
        "description": "Map created with KPCovR for the AIRSS carbon dataset at alpha=0.5 using the chemiscope.org visualizer JSON format", 
        "key": "C-VII-kpcovr-0.5-chemiscope.json.gz", 
        "size": 1634315
      }, 
      {
        "checksum": "md5:427aa3e3a939fee3a976fa475092e4bb", 
        "description": "Map created with KPCovR for the AIRSS carbon dataset at alpha=1.0 using the chemiscope.org visualizer JSON format", 
        "key": "C-VII-kpcovr-1.0-chemiscope.json.gz", 
        "size": 1631830
      }, 
      {
        "checksum": "md5:709118a8c4ec0460efda82059b0b57a0", 
        "description": "Map created with KPCovR for the NMR Chemical shielding dataset at alpha=0.5 using the chemiscope.org visualizer JSON format", 
        "key": "CSD-1000R-kpcovr-0.5-chemiscope.json.gz", 
        "size": 1082067
      }, 
      {
        "checksum": "md5:433087121bd75a693da1c51bdd91a519", 
        "description": "Map created with KPCovR for global properties of DEEM zeolites at alpha=0.5 using the chemiscope.org visualizer JSON format", 
        "key": "DEEM-global-kpcovr-0.5-chemiscope.json.gz", 
        "size": 3159070
      }, 
      {
        "checksum": "md5:196238f8be2815f22257fe791eaa2199", 
        "description": "Map created with KPCovR for local properties of DEEM zeolites at alpha=0.5 using the chemiscope.org visualizer JSON format", 
        "key": "DEEM-local-kpcovr-0.5-chemiscope.json.gz", 
        "size": 771946
      }, 
      {
        "checksum": "md5:9000a600226b8bb361eccf89b88e1613", 
        "description": "Map created with KPCovR for the QM9 dataset at alpha=0.5 using the chemiscope.org visualizer JSON format", 
        "key": "qm9-12PC-kpcovr-0.5-chemiscope.json.gz", 
        "size": 3418447
      }, 
      {
        "checksum": "md5:604a61a5e9993b2ba7b59b04a1f6306f", 
        "description": "Map created with KPCovR for the QM9 dataset at alpha=1.0 using the chemiscope.org visualizer JSON format", 
        "key": "qm9-12PC-kpcovr-1.0-chemiscope.json.gz", 
        "size": 3415861
      }
    ], 
    "references": [
      {
        "citation": "B. A. Helfrecht, R. K. Cersonsky, G. Fraux, M. Ceriotti, arXiv:2002.05076 (2020)", 
        "url": "https://arxiv.org/abs/2002.05076", 
        "type": "Preprint"
      }
    ], 
    "contributors": [
      {
        "givennames": "Benjamin A.", 
        "affiliations": [
          "Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland"
        ], 
        "familyname": "Helfrecht", 
        "email": "benjamin.helfrecht@epfl.ch"
      }, 
      {
        "givennames": "Rose K.", 
        "affiliations": [
          "Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland"
        ], 
        "familyname": "Cersonsky", 
        "email": "rose.cersonsky@epfl.ch"
      }, 
      {
        "givennames": "Guillaume", 
        "affiliations": [
          "Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland"
        ], 
        "familyname": "Fraux", 
        "email": "guillaume.fraux@epfl.ch"
      }, 
      {
        "givennames": "Michele", 
        "affiliations": [
          "Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland"
        ], 
        "familyname": "Ceriotti", 
        "email": "michele.ceriotti@epfl.ch"
      }
    ], 
    "_oai": {
      "id": "oai:materialscloud.org:1185"
    }, 
    "publication_date": "Dec 20, 2021, 10:08:22", 
    "mcid": "2021.225", 
    "version": 2, 
    "id": "1185", 
    "license": "Creative Commons Attribution 4.0 International"
  }, 
  "revision": 2, 
  "created": "2021-12-17T11:10:59.044564+00:00", 
  "id": "1185", 
  "updated": "2021-12-20T09:08:23.032840+00:00"
}