{ "cells": [ { "cell_type": "code", "execution_count": 84, "metadata": {}, "outputs": [], "source": [ "# All notebook imports live in this first cell.\n", "import pandas as pd\n", "from sklearn.utils import shuffle\n", "from sklearn.model_selection import train_test_split,cross_val_score,GridSearchCV\n", "from sklearn.decomposition import PCA\n", "import matplotlib.pyplot as plt\n", "from mpl_toolkits.mplot3d import Axes3D\n", "import seaborn\n", "import numpy as np\n", "from sklearn.ensemble import RandomForestClassifier\n", "from sklearn.neighbors import KNeighborsClassifier\n", "from sklearn import metrics\n", "import itertools\n", "from sklearn.preprocessing import StandardScaler,MinMaxScaler\n", "from sklearn.linear_model import LogisticRegression\n", "# sklearn.externals.joblib was deprecated in scikit-learn 0.21 and removed in 0.23;\n", "# prefer the standalone joblib package and fall back only on old installs.\n", "try:\n", "    import joblib\n", "except ImportError:\n", "    from sklearn.externals import joblib" ] }, { "cell_type": "code", "execution_count": 85, "metadata": {}, "outputs": [], "source": [ "# Read the galaxy table from the LAMOST_spectra directory (path is relative to the notebook's working directory).\n", "galaxies = pd.read_csv('./LAMOST_spectra/galaxy_standardised.csv')" ] }, { "cell_type": "code", "execution_count": 86, "metadata": {}, "outputs": [], "source": [ "# Read the QSO table from the same LAMOST_spectra directory.\n", "qsos = pd.read_csv('./LAMOST_spectra/qso_standardised.csv')" ] }, { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | 0 | \n", "1 | \n", "2 | \n", "3 | \n", "4 | \n", "5 | \n", "6 | \n", "7 | \n", "8 | \n", "9 | \n", "... | \n", "2541 | \n", "2542 | \n", "2543 | \n", "2544 | \n", "2545 | \n", "2546 | \n", "2547 | \n", "2548 | \n", "2549 | \n", "type | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0.617188 | \n", "1.078200 | \n", "0.719656 | \n", "0.591135 | \n", "0.249724 | \n", "0.576590 | \n", "0.758004 | \n", "0.434611 | \n", "1.019012 | \n", "0.431297 | \n", "... | \n", "1.230564 | \n", "2.066841 | \n", "1.630086 | \n", "0.345478 | \n", "1.257950 | \n", "-0.641574 | \n", "0.866615 | \n", "0.845419 | \n", "0.875861 | \n", "2 | \n", "
1 | \n", "-0.105619 | \n", "-0.615157 | \n", "-0.151418 | \n", "-0.192431 | \n", "0.600306 | \n", "0.485535 | \n", "-0.460267 | \n", "0.562241 | \n", "0.145672 | \n", "0.118304 | \n", "... | \n", "0.952100 | \n", "1.041957 | \n", "0.870311 | \n", "1.209000 | \n", "1.210865 | \n", "0.831403 | \n", "0.682861 | \n", "1.007102 | \n", "0.998151 | \n", "2 | \n", "
2 | \n", "0.608529 | \n", "0.339985 | \n", "0.612112 | \n", "0.704888 | \n", "0.435795 | \n", "0.564308 | \n", "0.521174 | \n", "0.646109 | \n", "0.386403 | \n", "0.227294 | \n", "... | \n", "1.038180 | \n", "1.026206 | \n", "0.939450 | \n", "1.023971 | \n", "1.122343 | \n", "0.985136 | \n", "1.022401 | \n", "1.032069 | \n", "1.035573 | \n", "2 | \n", "
3 | \n", "-0.125019 | \n", "1.094082 | \n", "0.536864 | \n", "1.023426 | \n", "2.261266 | \n", "2.303743 | \n", "0.980048 | \n", "0.621883 | \n", "0.701422 | \n", "0.720067 | \n", "... | \n", "0.921314 | \n", "0.763278 | \n", "0.740817 | \n", "1.109447 | \n", "0.645768 | \n", "0.984002 | \n", "0.852604 | \n", "0.803293 | \n", "0.816611 | \n", "2 | \n", "
4 | \n", "0.646874 | \n", "0.441916 | \n", "0.839619 | \n", "0.434925 | \n", "0.544952 | \n", "0.256422 | \n", "0.467634 | \n", "0.512585 | \n", "0.236020 | \n", "0.337063 | \n", "... | \n", "1.184212 | \n", "1.159360 | \n", "0.886024 | \n", "1.422036 | \n", "1.451235 | \n", "1.154935 | \n", "1.108076 | \n", "1.149500 | \n", "1.149634 | \n", "2 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
1995 | \n", "1.358673 | \n", "2.255526 | \n", "-1.927181 | \n", "2.189852 | \n", "-1.175295 | \n", "3.158015 | \n", "1.817735 | \n", "1.476316 | \n", "-0.005982 | \n", "2.614979 | \n", "... | \n", "14.729002 | \n", "14.190329 | \n", "6.227650 | \n", "-6.466226 | \n", "-6.466477 | \n", "-6.980642 | \n", "0.129756 | \n", "0.899375 | \n", "2.892127 | \n", "3 | \n", "
1996 | \n", "4.736062 | \n", "8.493721 | \n", "4.307473 | \n", "6.376364 | \n", "6.063689 | \n", "4.828099 | \n", "7.034339 | \n", "5.206685 | \n", "1.766484 | \n", "8.031152 | \n", "... | \n", "-2.224697 | \n", "-2.945363 | \n", "-3.193636 | \n", "1.916528 | \n", "-4.198533 | \n", "-6.026858 | \n", "-2.577864 | \n", "-1.554188 | \n", "-2.068489 | \n", "3 | \n", "
1997 | \n", "2.251206 | \n", "3.835492 | \n", "2.401364 | \n", "2.064844 | \n", "1.606885 | \n", "2.835680 | \n", "2.543361 | \n", "3.106267 | \n", "3.807246 | \n", "3.216638 | \n", "... | \n", "0.240475 | \n", "0.018851 | \n", "-0.472121 | \n", "-0.058201 | \n", "-0.391158 | \n", "0.612688 | \n", "0.288732 | \n", "0.512242 | \n", "0.547362 | \n", "3 | \n", "
1998 | \n", "1.734387 | \n", "2.007688 | \n", "1.798588 | \n", "1.681123 | \n", "2.155894 | \n", "2.156851 | \n", "1.905678 | \n", "1.978067 | \n", "2.447229 | \n", "2.044550 | \n", "... | \n", "0.460327 | \n", "0.609559 | \n", "0.467800 | \n", "0.139381 | \n", "-0.047443 | \n", "0.301798 | \n", "0.392577 | \n", "0.467889 | \n", "0.384213 | \n", "3 | \n", "
1999 | \n", "2.673625 | \n", "2.610178 | \n", "4.171594 | \n", "1.135168 | \n", "1.557421 | \n", "3.336255 | \n", "1.778019 | \n", "2.815661 | \n", "3.667999 | \n", "2.136348 | \n", "... | \n", "0.758155 | \n", "-1.198771 | \n", "-1.827310 | \n", "-2.254883 | \n", "2.136604 | \n", "-1.001851 | \n", "0.965404 | \n", "0.122785 | \n", "0.576359 | \n", "3 | \n", "
4000 rows × 2551 columns
\n", "\n", " | 0 | \n", "1 | \n", "2 | \n", "3 | \n", "4 | \n", "5 | \n", "6 | \n", "7 | \n", "8 | \n", "9 | \n", "... | \n", "2541 | \n", "2542 | \n", "2543 | \n", "2544 | \n", "2545 | \n", "2546 | \n", "2547 | \n", "2548 | \n", "2549 | \n", "type | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1224 | \n", "2.891349 | \n", "1.437608 | \n", "1.346257 | \n", "1.553989 | \n", "2.882983 | \n", "2.260688 | \n", "0.524664 | \n", "1.037580 | \n", "0.385678 | \n", "2.177028 | \n", "... | \n", "1.114744 | \n", "1.451957 | \n", "-5.536831 | \n", "0.532371 | \n", "8.654653 | \n", "-0.076086 | \n", "1.326490 | \n", "0.453447 | \n", "0.754747 | \n", "3 | \n", "
1830 | \n", "3.879734 | \n", "5.009363 | \n", "6.276478 | \n", "5.035055 | \n", "5.840371 | \n", "4.358024 | \n", "5.324929 | \n", "4.972554 | \n", "2.555320 | \n", "2.953080 | \n", "... | \n", "0.675787 | \n", "0.591280 | \n", "1.069435 | \n", "0.217655 | \n", "0.115893 | \n", "0.581067 | \n", "0.514607 | \n", "0.462505 | \n", "0.649936 | \n", "3 | \n", "
964 | \n", "0.425303 | \n", "-0.773273 | \n", "1.868011 | \n", "0.401713 | \n", "2.898418 | \n", "2.085099 | \n", "1.737992 | \n", "1.282685 | \n", "1.108372 | \n", "1.779551 | \n", "... | \n", "0.595909 | \n", "0.576578 | \n", "0.345612 | \n", "0.631520 | \n", "0.907204 | \n", "-0.226944 | \n", "-0.068086 | \n", "0.521514 | \n", "0.633895 | \n", "3 | \n", "
778 | \n", "1.276239 | \n", "4.518811 | \n", "2.398222 | \n", "2.322696 | \n", "-0.104984 | \n", "1.534739 | \n", "3.207106 | \n", "2.447320 | \n", "2.416217 | \n", "3.429941 | \n", "... | \n", "0.434583 | \n", "0.189397 | \n", "-0.833621 | \n", "-1.580476 | \n", "-0.394436 | \n", "0.575719 | \n", "0.741413 | \n", "0.076439 | \n", "0.215710 | \n", "3 | \n", "
112 | \n", "3.604190 | \n", "-0.166099 | \n", "0.796164 | \n", "3.779741 | \n", "2.862189 | \n", "2.297985 | \n", "1.111864 | \n", "-4.363558 | \n", "3.344258 | \n", "-1.236573 | \n", "... | \n", "1.787055 | \n", "0.912069 | \n", "1.118230 | \n", "-0.070411 | \n", "-0.277597 | \n", "0.754682 | \n", "0.061647 | \n", "0.575771 | \n", "0.907901 | \n", "3 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
1812 | \n", "0.093733 | \n", "0.183721 | \n", "0.050577 | \n", "0.045006 | \n", "-0.053974 | \n", "0.103254 | \n", "0.218459 | \n", "0.296510 | \n", "0.321800 | \n", "0.262396 | \n", "... | \n", "1.072321 | \n", "1.172215 | \n", "0.907360 | \n", "1.556413 | \n", "0.817625 | \n", "0.919094 | \n", "1.151508 | \n", "1.290080 | \n", "1.249178 | \n", "2 | \n", "
532 | \n", "0.868472 | \n", "1.438901 | \n", "1.794490 | \n", "0.754563 | \n", "0.680179 | \n", "0.701802 | \n", "0.556087 | \n", "1.235091 | \n", "0.780536 | \n", "1.650703 | \n", "... | \n", "0.847327 | \n", "0.835260 | \n", "0.950760 | \n", "0.823709 | \n", "0.704693 | \n", "0.701405 | \n", "0.901184 | \n", "0.883823 | \n", "0.856567 | \n", "2 | \n", "
1813 | \n", "2.330337 | \n", "1.271180 | \n", "2.015320 | \n", "2.478237 | \n", "1.989256 | \n", "1.652456 | \n", "1.838835 | \n", "2.860579 | \n", "3.167940 | \n", "2.157424 | \n", "... | \n", "0.198369 | \n", "0.288275 | \n", "0.102458 | \n", "0.628728 | \n", "0.734389 | \n", "0.408767 | \n", "0.310602 | \n", "0.435959 | \n", "0.471247 | \n", "3 | \n", "
463 | \n", "2.992803 | \n", "4.520074 | \n", "1.281727 | \n", "2.560910 | \n", "0.090832 | \n", "1.549194 | \n", "1.371671 | \n", "-1.630202 | \n", "-4.321544 | \n", "-0.210890 | \n", "... | \n", "-0.179296 | \n", "-3.015679 | \n", "-2.220191 | \n", "-2.508168 | \n", "0.847879 | \n", "0.454679 | \n", "-0.945904 | \n", "-0.030512 | \n", "0.630526 | \n", "3 | \n", "
1915 | \n", "0.275238 | \n", "1.066475 | \n", "0.346207 | \n", "0.242615 | \n", "0.915270 | \n", "0.539574 | \n", "0.767515 | \n", "0.643072 | \n", "0.644822 | \n", "0.726666 | \n", "... | \n", "0.827198 | \n", "1.093432 | \n", "1.058417 | \n", "0.406138 | \n", "0.578854 | \n", "0.656705 | \n", "0.672236 | \n", "0.712788 | \n", "0.703433 | \n", "2 | \n", "
4000 rows × 2551 columns
\n", "\n", " | 0 | \n", "1 | \n", "2 | \n", "3 | \n", "4 | \n", "5 | \n", "6 | \n", "7 | \n", "8 | \n", "9 | \n", "... | \n", "2540 | \n", "2541 | \n", "2542 | \n", "2543 | \n", "2544 | \n", "2545 | \n", "2546 | \n", "2547 | \n", "2548 | \n", "2549 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
496 | \n", "0.453018 | \n", "-0.078946 | \n", "1.056244 | \n", "-0.761460 | \n", "-0.108049 | \n", "0.316049 | \n", "1.684295 | \n", "1.277893 | \n", "2.328646 | \n", "-0.490003 | \n", "... | \n", "1.023142 | \n", "0.972128 | \n", "0.877626 | \n", "0.903512 | \n", "0.225082 | \n", "0.656252 | \n", "1.250650 | \n", "0.905113 | \n", "1.123623 | \n", "1.008364 | \n", "
1241 | \n", "0.744684 | \n", "0.706419 | \n", "0.539418 | \n", "0.585637 | \n", "1.159545 | \n", "0.676108 | \n", "0.581048 | \n", "0.410185 | \n", "0.660224 | \n", "0.516061 | \n", "... | \n", "0.728807 | \n", "0.872218 | \n", "1.278320 | \n", "0.577979 | \n", "0.967569 | \n", "0.949157 | \n", "0.762882 | \n", "0.773693 | \n", "0.721741 | \n", "0.852410 | \n", "
1864 | \n", "0.549835 | \n", "0.339083 | \n", "1.420260 | \n", "0.710170 | \n", "1.010419 | \n", "0.306943 | \n", "-0.252886 | \n", "0.437769 | \n", "1.991301 | \n", "0.414019 | \n", "... | \n", "0.846816 | \n", "3.304601 | \n", "15.221448 | \n", "-6.067144 | \n", "-1.988856 | \n", "6.030686 | \n", "2.592641 | \n", "1.119804 | \n", "0.687274 | \n", "0.704317 | \n", "
571 | \n", "-7.031517 | \n", "6.187820 | \n", "-9.371308 | \n", "8.060097 | \n", "-3.906795 | \n", "2.382266 | \n", "-0.073769 | \n", "6.968823 | \n", "2.481344 | \n", "8.414966 | \n", "... | \n", "1.881450 | \n", "-0.323327 | \n", "2.411483 | \n", "-3.733856 | \n", "1.817483 | \n", "-1.802364 | \n", "3.208507 | \n", "1.380639 | \n", "1.492592 | \n", "0.997739 | \n", "
1094 | \n", "0.539701 | \n", "0.670896 | \n", "-0.184938 | \n", "0.392194 | \n", "0.096106 | \n", "0.525495 | \n", "0.418713 | \n", "0.776471 | \n", "0.828761 | \n", "0.931785 | \n", "... | \n", "0.894532 | \n", "0.855367 | \n", "0.714974 | \n", "0.750959 | \n", "0.940317 | \n", "0.995974 | \n", "1.013581 | \n", "0.925367 | \n", "0.879055 | \n", "0.889729 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
1378 | \n", "2.394843 | \n", "1.695996 | \n", "1.064526 | \n", "2.684924 | \n", "1.394738 | \n", "3.577144 | \n", "3.067955 | \n", "0.946760 | \n", "2.945100 | \n", "1.817511 | \n", "... | \n", "1.051854 | \n", "3.754546 | \n", "8.477930 | \n", "1.168571 | \n", "-6.302239 | \n", "1.473663 | \n", "-0.638889 | \n", "0.444808 | \n", "0.817370 | \n", "1.119679 | \n", "
478 | \n", "1.302975 | \n", "4.023532 | \n", "0.029693 | \n", "3.330072 | \n", "1.782232 | \n", "1.015794 | \n", "2.910030 | \n", "2.706038 | \n", "3.512573 | \n", "1.349334 | \n", "... | \n", "0.693626 | \n", "0.542258 | \n", "2.424630 | \n", "-0.655173 | \n", "0.647713 | \n", "1.220641 | \n", "1.382282 | \n", "0.817242 | \n", "0.609625 | \n", "0.833427 | \n", "
1581 | \n", "0.259939 | \n", "0.039702 | \n", "0.313820 | \n", "0.330721 | \n", "0.457388 | \n", "0.079465 | \n", "0.333012 | \n", "0.251914 | \n", "0.294523 | \n", "-0.090406 | \n", "... | \n", "1.411705 | \n", "1.464086 | \n", "1.367845 | \n", "1.287620 | \n", "1.276434 | \n", "1.035445 | \n", "1.370057 | \n", "1.555483 | \n", "1.340720 | \n", "1.450895 | \n", "
438 | \n", "1.505315 | \n", "1.813736 | \n", "1.585130 | \n", "1.981320 | \n", "1.795147 | \n", "1.644358 | \n", "1.660030 | \n", "1.656898 | \n", "1.302048 | \n", "1.976754 | \n", "... | \n", "0.591836 | \n", "1.096665 | \n", "2.010072 | \n", "0.355882 | \n", "-0.075982 | \n", "0.229903 | \n", "0.325398 | \n", "0.396209 | \n", "0.228675 | \n", "0.527300 | \n", "
409 | \n", "1.552886 | \n", "0.375319 | \n", "1.453693 | \n", "2.159667 | \n", "1.925261 | \n", "0.457191 | \n", "0.414648 | \n", "1.671543 | \n", "2.754634 | \n", "0.379460 | \n", "... | \n", "0.461849 | \n", "0.226023 | \n", "-0.802757 | \n", "0.957317 | \n", "2.737699 | \n", "1.378962 | \n", "-0.427378 | \n", "-0.353147 | \n", "0.238610 | \n", "0.332487 | \n", "
3200 rows × 2550 columns
\n", "