{ "cells": [ { "attachments": {}, "cell_type": "markdown", "metadata": {}, "source": [ "## PCA and VCD (Could delete since there were no matches)" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# Comput PCS and VCD features to feed into model" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "half_enantiomer_data = pd.read_csv(\"half_enantiomer_data.csv\")" ] }, { "cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [], "source": [ "# Read in pca and vcd dataframe to use as features\n", "pca_vcd_values = pd.read_csv(\"../data/vcd/pca_vcd_values.csv\")" ] }, { "cell_type": "code", "execution_count": 10, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | Molecule Name | \n", "0 | \n", "1 | \n", "2 | \n", "3 | \n", "4 | \n", "5 | \n", "6 | \n", "7 | \n", "8 | \n", "9 | \n", "10 | \n", "11 | \n", "12 | \n", "13 | \n", "14 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "(R)-(-)-Carvone | \n", "7.464317 | \n", "-43.591126 | \n", "-8.046428 | \n", "-0.574730 | \n", "-3.580254 | \n", "5.872903 | \n", "-2.689295 | \n", "0.910235 | \n", "3.263888 | \n", "1.241722 | \n", "-1.817992 | \n", "-10.064818 | \n", "-5.517172 | \n", "6.956873 | \n", "0.003187 | \n", "
1 | \n", "(1R,2S,5R)-(-)-Menthol | \n", "-15.984788 | \n", "-48.409755 | \n", "11.599679 | \n", "-6.459996 | \n", "-2.895890 | \n", "-21.817187 | \n", "7.987366 | \n", "30.168379 | \n", "-4.855940 | \n", "-27.966750 | \n", "-15.593791 | \n", "18.881794 | \n", "6.680355 | \n", "-3.869645 | \n", "-18.299473 | \n", "
2 | \n", "(-)-Menthyl chloride | \n", "-5.850617 | \n", "-48.612997 | \n", "25.383460 | \n", "-1.972609 | \n", "-9.623228 | \n", "-12.079316 | \n", "-5.014842 | \n", "9.790833 | \n", "-11.125811 | \n", "-10.948924 | \n", "12.772888 | \n", "-4.068723 | \n", "4.196934 | \n", "0.326200 | \n", "0.769741 | \n", "
3 | \n", "(-)-Borneol | \n", "0.756580 | \n", "-25.884643 | \n", "-4.987043 | \n", "6.148153 | \n", "-18.167909 | \n", "7.294051 | \n", "-16.954397 | \n", "9.166877 | \n", "10.160046 | \n", "8.512541 | \n", "22.090822 | \n", "-60.188603 | \n", "5.246429 | \n", "9.022766 | \n", "-17.823573 | \n", "
4 | \n", "(-)-Isoplegol | \n", "-12.599590 | \n", "-33.717238 | \n", "-12.966523 | \n", "-18.479083 | \n", "5.945713 | \n", "-6.208222 | \n", "-4.337392 | \n", "10.783442 | \n", "-12.640204 | \n", "1.773643 | \n", "1.927400 | \n", "6.935122 | \n", "5.856485 | \n", "8.257695 | \n", "-9.983220 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
156 | \n", "β-Cholestanol | \n", "6.415996 | \n", "-18.840982 | \n", "20.303654 | \n", "-29.238431 | \n", "-26.058052 | \n", "8.328641 | \n", "-8.520251 | \n", "19.753263 | \n", "24.650594 | \n", "37.600273 | \n", "-1.058662 | \n", "-16.200175 | \n", "37.116864 | \n", "-1.951506 | \n", "-10.766619 | \n", "
157 | \n", "Cholesterol Ethyl Carbonate | \n", "230.771312 | \n", "139.215929 | \n", "-45.562654 | \n", "-28.445263 | \n", "7.019739 | \n", "-30.857068 | \n", "18.819408 | \n", "-6.542138 | \n", "7.706800 | \n", "-5.896378 | \n", "7.642116 | \n", "-5.188079 | \n", "5.985704 | \n", "-34.834249 | \n", "-7.737224 | \n", "
158 | \n", "Cholesterol n-Caprate | \n", "181.677425 | \n", "33.151223 | \n", "72.048835 | \n", "-49.147260 | \n", "19.664893 | \n", "20.812246 | \n", "-3.977717 | \n", "5.351038 | \n", "14.182154 | \n", "-2.607771 | \n", "6.333818 | \n", "-0.251176 | \n", "-7.470138 | \n", "19.545668 | \n", "-8.373291 | \n", "
159 | \n", "Cholesterol Laurate | \n", "-130.152846 | \n", "164.035229 | \n", "61.091725 | \n", "-37.136634 | \n", "-13.847154 | \n", "14.540341 | \n", "-4.944992 | \n", "-3.105062 | \n", "2.508800 | \n", "1.700032 | \n", "5.700678 | \n", "8.617406 | \n", "-4.496284 | \n", "22.150449 | \n", "2.389079 | \n", "
160 | \n", "Cholesterol Myristate | \n", "-132.817778 | \n", "151.835799 | \n", "66.528593 | \n", "-50.454738 | \n", "7.112731 | \n", "21.576747 | \n", "6.387919 | \n", "-5.878909 | \n", "-6.011154 | \n", "7.648669 | \n", "4.893929 | \n", "7.866558 | \n", "1.410726 | \n", "11.221058 | \n", "0.188386 | \n", "
161 rows × 16 columns
\n", "\n", " | 0 | \n", "1 | \n", "2 | \n", "3 | \n", "4 | \n", "5 | \n", "6 | \n", "7 | \n", "8 | \n", "9 | \n", "10 | \n", "11 | \n", "12 | \n", "13 | \n", "14 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
Molecule Name | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
(R)-(-)-Carvone | \n", "7.464317 | \n", "-43.591126 | \n", "-8.046428 | \n", "-0.574730 | \n", "-3.580254 | \n", "5.872903 | \n", "-2.689295 | \n", "0.910235 | \n", "3.263888 | \n", "1.241722 | \n", "-1.817992 | \n", "-10.064818 | \n", "-5.517172 | \n", "6.956873 | \n", "0.003187 | \n", "
(1R,2S,5R)-(-)-Menthol | \n", "-15.984788 | \n", "-48.409755 | \n", "11.599679 | \n", "-6.459996 | \n", "-2.895890 | \n", "-21.817187 | \n", "7.987366 | \n", "30.168379 | \n", "-4.855940 | \n", "-27.966750 | \n", "-15.593791 | \n", "18.881794 | \n", "6.680355 | \n", "-3.869645 | \n", "-18.299473 | \n", "
(-)-Menthyl chloride | \n", "-5.850617 | \n", "-48.612997 | \n", "25.383460 | \n", "-1.972609 | \n", "-9.623228 | \n", "-12.079316 | \n", "-5.014842 | \n", "9.790833 | \n", "-11.125811 | \n", "-10.948924 | \n", "12.772888 | \n", "-4.068723 | \n", "4.196934 | \n", "0.326200 | \n", "0.769741 | \n", "
(-)-Borneol | \n", "0.756580 | \n", "-25.884643 | \n", "-4.987043 | \n", "6.148153 | \n", "-18.167909 | \n", "7.294051 | \n", "-16.954397 | \n", "9.166877 | \n", "10.160046 | \n", "8.512541 | \n", "22.090822 | \n", "-60.188603 | \n", "5.246429 | \n", "9.022766 | \n", "-17.823573 | \n", "
(-)-Isoplegol | \n", "-12.599590 | \n", "-33.717238 | \n", "-12.966523 | \n", "-18.479083 | \n", "5.945713 | \n", "-6.208222 | \n", "-4.337392 | \n", "10.783442 | \n", "-12.640204 | \n", "1.773643 | \n", "1.927400 | \n", "6.935122 | \n", "5.856485 | \n", "8.257695 | \n", "-9.983220 | \n", "
\n", " | Unnamed: 0 | \n", "Unnamed: 0.1 | \n", "Molecule Name | \n", "Pubchem ID # | \n", "Note | \n", "SMILES String | \n", "Other SMILES | \n", "Method | \n", "Contributor | \n", "Detection Threshold | \n", "... | \n", "5 | \n", "6 | \n", "7 | \n", "8 | \n", "9 | \n", "10 | \n", "11 | \n", "12 | \n", "13 | \n", "14 | \n", "
---|
0 rows × 32 columns
\n", "