You are currently on a failover version of the Materials Cloud Archive hosted at CINECA, Italy.
Click here to access the main Materials Cloud Archive.
Note: If the link above redirects you to this page, it means that the Archive is currently offline due to maintenance. We will be back online as soon as possible.
This version is read-only: you can view published records and download files, but you cannot create new records or make changes to existing ones.

Predicting polymerization reactions via transfer learning using chemical language models


JSON Export

{
  "metadata": {
    "edited_by": 98, 
    "owner": 726, 
    "_oai": {
      "id": "oai:materialscloud.org:1780"
    }, 
    "description": "Polymers are candidate materials for a wide range of sustainability applications such as carbon capture and energy storage. However, computational polymer discovery lacks automated analysis of reaction pathways and stability assessment through retro-synthesis. Here, we report the first extension of transformer-based language models to polymerization reactions for both forward and retrosynthesis tasks. We curated a polymerization dataset for vinyl polymers covering reactions and retrosynthesis for representative homo-polymers and co-polymers. Overall, we report a forward model accuracy of 80% and a backward model accuracy of 60%. We further analyse the model performance on a set of case studies by providing polymerization and retro-synthesis examples and evaluating the model\u2019s predictions quality from a materials science perspective.", 
    "mcid": "2023.137", 
    "id": "1780", 
    "license": "MIT License", 
    "license_addendum": "CDLA-Permissive-2.0", 
    "references": [], 
    "doi": "10.24435/materialscloud:zw-be", 
    "keywords": [
      "polymerization reaction", 
      "machine learning", 
      "homopolymers", 
      "co-polymers", 
      "reactants", 
      "reagents (solvents, catalysts)", 
      "products"
    ], 
    "contributors": [
      {
        "affiliations": [
          "IBM Research Brazil - Avenida Rep\u00fablica do Chile, 330 - 11o. e 12. andares Rio De Janeiro, RJ 20031-170, Brazil"
        ], 
        "familyname": "S. Ferrari", 
        "email": "bferrari@ibm.com", 
        "givennames": "Brenda"
      }, 
      {
        "affiliations": [
          "IBM Research Europe - S\u00e4umerstrasse 4, 8803 R\u00fcschlikon, Switzerland"
        ], 
        "familyname": "Manica", 
        "email": "TTE@zurich.ibm.com", 
        "givennames": "Matteo"
      }, 
      {
        "affiliations": [
          "IBM Research Brazil - Avenida Rep\u00fablica do Chile, 330 - 11o. e 12. andares Rio De Janeiro, RJ 20031-170, Brazil"
        ], 
        "familyname": "Giro", 
        "email": "rgiro@br.ibm.com", 
        "givennames": "Ronaldo"
      }, 
      {
        "affiliations": [
          "IBM Research Europe - S\u00e4umerstrasse 4, 8803 R\u00fcschlikon, Switzerland", 
          "National Center for Competence in Research-Catalysis (NCCR-Catalysis), Switzerland"
        ], 
        "familyname": "Laino", 
        "email": "TEO@zurich.ibm.com", 
        "givennames": "Teodoro"
      }, 
      {
        "affiliations": [
          "IBM Research Brazil - Avenida Rep\u00fablica do Chile, 330 - 11o. e 12. andares Rio De Janeiro, RJ 20031-170, Brazil"
        ], 
        "familyname": "B. Steiner", 
        "email": "mathiast@br.ibm.com", 
        "givennames": "Mathias"
      }
    ], 
    "conceptrecid": "1779", 
    "version": 1, 
    "publication_date": "Sep 06, 2023, 09:31:05", 
    "is_last": false, 
    "status": "published", 
    "_files": [
      {
        "size": 2153792, 
        "checksum": "md5:e98e53c67b90a7e2ec049a93a17dd78f", 
        "description": "polymerization reactions with head and tail atoms assigned by a Python script based on polymerization mechanisms and nucleophilic index from quantum chemistry atom population of Highest Occupied Molecular Orbital", 
        "key": "hta_dataset_all_combinations.csv"
      }, 
      {
        "size": 1589715, 
        "checksum": "md5:def01c2f8f848ab7ad329372cb37898c", 
        "description": "polymerization reactions with head and tail atoms assigned by a modified version of a Python tool called Monomers to Polymers (M2P)", 
        "key": "m2p_dataset_all_combinations.csv"
      }, 
      {
        "size": 4120577643, 
        "checksum": "md5:f43e79c28fec01b7bf665b853b6359a3", 
        "description": "zip file containing the Machine Learning training models (forward and retrosynthesis) where the config files are those with yml extensions and the model weights are those with pt extensions (pickle binary - can be read via pytorch)", 
        "key": "trained_models.zip"
      }
    ], 
    "title": "Predicting polymerization reactions via transfer learning using chemical language models"
  }, 
  "id": "1780", 
  "updated": "2024-02-29T15:30:05.287721+00:00", 
  "created": "2023-05-30T12:47:22.223477+00:00", 
  "revision": 8
}