{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "# Standard library\n", "import warnings\n", "\n", "# Third-party packages used by this notebook\n", "import numpy as np\n", "import pandas as pd\n", "from sklearn import metrics\n", "from sklearn.manifold import TSNE\n", "from sklearn.preprocessing import StandardScaler\n", "import ase.io\n", "import chemiscope\n", "from pymatgen.core import Structure, Lattice, Composition\n", "\n", "# Install a blanket 'ignore' filter: warnings raised after this point are suppressed.\n", "warnings.filterwarnings('ignore')" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "# Load the dataset from the gzip-compressed JSON file (path is relative to the working directory).\n", "df = pd.read_json('topoclass.json.gz')" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | ID | \n", "subset | \n", "MAT_TYPE | \n", "TQC_TYPE | \n", "structure | \n", "MP_ID | \n", "ICSD_ID | \n", "AtomicOrbitals|HOMO_character | \n", "AtomicOrbitals|HOMO_element | \n", "AtomicOrbitals|HOMO_energy | \n", "... | \n", "BondFractions|Ho - La bond frac. | \n", "BondFractions|Au - Pd bond frac. | \n", "BondFractions|Dy - Hg bond frac. | \n", "BondFractions|Er - Yb bond frac. | \n", "BondFractions|Hg - Tm bond frac. | \n", "BondFractions|Er - Hg bond frac. | \n", "BondFractions|Be - Sc bond frac. | \n", "BondFractions|Hg - Tb bond frac. | \n", "BondFractions|Be - Lu bond frac. | \n", "BondFractions|Er - Y bond frac. | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "MAT00026906 | \n", "M/T | \n", "TI | \n", "None | \n", "{'@module': 'pymatgen.core.structure', '@class... | \n", "mp-10008 | \n", "NaN | \n", "1 | \n", "20 | \n", "-0.141411 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "
1 | \n", "MAT00020270 | \n", "M/T | \n", "TrI | \n", "None | \n", "{'@module': 'pymatgen.core.structure', '@class... | \n", "mp-1001604 | \n", "NaN | \n", "2 | \n", "16 | \n", "-0.261676 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "
2 | \n", "MAT00015322 | \n", "M/T | \n", "HSLSM | \n", "None | \n", "{'@module': 'pymatgen.core.structure', '@class... | \n", "mp-1001605 | \n", "NaN | \n", "4 | \n", "59 | \n", "-0.155138 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "
3 | \n", "MAT00025094 | \n", "M/T | \n", "TCI | \n", "None | \n", "{'@module': 'pymatgen.core.structure', '@class... | \n", "mp-1001844 | \n", "NaN | \n", "2 | \n", "7 | \n", "-0.266297 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "
4 | \n", "MAT00025479 | \n", "M/T | \n", "HSLSM | \n", "None | \n", "{'@module': 'pymatgen.core.structure', '@class... | \n", "mp-1002220 | \n", "NaN | \n", "2 | \n", "51 | \n", "-0.185623 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
35603 | \n", "MAT00038674 | \n", "M&T | \n", "TrI | \n", "LCEBR | \n", "{'@module': 'pymatgen.core.structure', '@class... | \n", "mp-696736 | \n", "28541.0 | \n", "2 | \n", "9 | \n", "-0.415606 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "
35604 | \n", "MAT00038675 | \n", "M&T | \n", "TrI | \n", "LCEBR | \n", "{'@module': 'pymatgen.core.structure', '@class... | \n", "mp-707276 | \n", "20730.0 | \n", "2 | \n", "7 | \n", "-0.266297 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "
35605 | \n", "MAT00038676 | \n", "M&T | \n", "TrI | \n", "LCEBR | \n", "{'@module': 'pymatgen.core.structure', '@class... | \n", "mp-707334 | \n", "67509.0 | \n", "2 | \n", "8 | \n", "-0.338381 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "
35606 | \n", "MAT00038677 | \n", "M&T | \n", "TrI | \n", "LCEBR | \n", "{'@module': 'pymatgen.core.structure', '@class... | \n", "mp-707897 | \n", "59327.0 | \n", "2 | \n", "8 | \n", "-0.338381 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "
35607 | \n", "MAT00038678 | \n", "M&T | \n", "TrI | \n", "LCEBR | \n", "{'@module': 'pymatgen.core.structure', '@class... | \n", "mp-9198 | \n", "79005.0 | \n", "2 | \n", "15 | \n", "-0.206080 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "0.0 | \n", "0 | \n", "
35608 rows × 4717 columns
\n", "