{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "# install unimol https://unimol.readthedocs.io/en/latest/installation.html#install\n", "import pandas as pd\n", "df = pd.read_csv('/mnt/c/project/qsar/data/A_85.csv',sep=';')" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | Molecule ChEMBL ID | \n", "Molecule Name | \n", "Molecule Max Phase | \n", "Molecular Weight | \n", "#RO5 Violations | \n", "AlogP | \n", "Compound Key | \n", "Smiles | \n", "Standard Type | \n", "Standard Relation | \n", "... | \n", "Target Type | \n", "Document ChEMBL ID | \n", "Source ID | \n", "Source Description | \n", "Document Journal | \n", "Document Year | \n", "Cell ChEMBL ID | \n", "Properties | \n", "Action Type | \n", "Standard Text Value | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "CHEMBL5184894 | \n", "NaN | \n", "None | \n", "916.22 | \n", "3 | \n", "5.74 | \n", "C-3 | \n", "CC[C@H]1OC(=O)C[C@@H](O)[C@H](C)[C@@H](O[C@@H]... | \n", "MIC | \n", "'=' | \n", "... | \n", "ORGANISM | \n", "CHEMBL5126592 | \n", "1 | \n", "Scientific Literature | \n", "Eur J Med Chem | \n", "2022 | \n", "None | \n", "Time_Lower = 16.0 hrs | Time_Upper = 20.0 hrs | \n", "NaN | \n", "NaN | \n", "
| 1 | \n", "CHEMBL5198466 | \n", "NaN | \n", "None | \n", "902.19 | \n", "3 | \n", "5.35 | \n", "C-2 | \n", "CC[C@H]1OC(=O)C[C@@H](O)[C@H](C)[C@@H](O[C@@H]... | \n", "MIC | \n", "'=' | \n", "... | \n", "ORGANISM | \n", "CHEMBL5126592 | \n", "1 | \n", "Scientific Literature | \n", "Eur J Med Chem | \n", "2022 | \n", "None | \n", "Time_Lower = 16.0 hrs | Time_Upper = 20.0 hrs | \n", "NaN | \n", "NaN | \n", "
| 2 | \n", "CHEMBL5179714 | \n", "NaN | \n", "None | \n", "976.02 | \n", "3 | \n", "5.80 | \n", "A-7 | \n", "CC[C@H]1OC(=O)C[C@@H](O)[C@H](C)[C@@H](O[C@@H]... | \n", "MIC | \n", "'=' | \n", "... | \n", "ORGANISM | \n", "CHEMBL5126592 | \n", "1 | \n", "Scientific Literature | \n", "Eur J Med Chem | \n", "2022 | \n", "None | \n", "Time_Lower = 16.0 hrs | Time_Upper = 20.0 hrs | \n", "NaN | \n", "NaN | \n", "
| 3 | \n", "CHEMBL5190735 | \n", "NaN | \n", "None | \n", "904.16 | \n", "2 | \n", "3.93 | \n", "C-4 | \n", "CC[C@H]1OC(=O)C[C@@H](O)[C@H](C)[C@@H](O[C@@H]... | \n", "MIC | \n", "'=' | \n", "... | \n", "ORGANISM | \n", "CHEMBL5126592 | \n", "1 | \n", "Scientific Literature | \n", "Eur J Med Chem | \n", "2022 | \n", "None | \n", "Time_Lower = 16.0 hrs | Time_Upper = 20.0 hrs | \n", "NaN | \n", "NaN | \n", "
| 4 | \n", "CHEMBL5199514 | \n", "NaN | \n", "None | \n", "897.13 | \n", "3 | \n", "5.03 | \n", "1-23(A-2) | \n", "CC[C@H]1OC(=O)C[C@@H](O)[C@H](C)[C@@H](O[C@@H]... | \n", "MIC | \n", "'=' | \n", "... | \n", "ORGANISM | \n", "CHEMBL5126592 | \n", "1 | \n", "Scientific Literature | \n", "Eur J Med Chem | \n", "2022 | \n", "None | \n", "Time_Lower = 16.0 hrs | Time_Upper = 20.0 hrs | \n", "NaN | \n", "NaN | \n", "
5 rows × 47 columns
\n", "| \n", " | SMILES | \n", "TARGET | \n", "
|---|---|---|
| 0 | \n", "CC[C@H]1OC(=O)C[C@@H](O)[C@H](C)[C@@H](O[C@@H]... | \n", "0.5 | \n", "
| 1 | \n", "CC[C@H]1OC(=O)C[C@@H](O)[C@H](C)[C@@H](O[C@@H]... | \n", "0.5 | \n", "
| 2 | \n", "CC[C@H]1OC(=O)C[C@@H](O)[C@H](C)[C@@H](O[C@@H]... | \n", "32.0 | \n", "
| 3 | \n", "CC[C@H]1OC(=O)C[C@@H](O)[C@H](C)[C@@H](O[C@@H]... | \n", "16.0 | \n", "
| 4 | \n", "CC[C@H]1OC(=O)C[C@@H](O)[C@H](C)[C@@H](O[C@@H]... | \n", "4.0 | \n", "