Advertisement
Guest User

Untitled

a guest
Jun 19th, 2017
87
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 65.60 KB | None | 0 0
  1. {
  2. "cells": [
  3. {
  4. "cell_type": "code",
  5. "execution_count": 1,
  6. "metadata": {
  7. "collapsed": true
  8. },
  9. "outputs": [],
  10. "source": [
  11. "import numpy as np\n",
  12. "import scipy as sp\n",
  13. "import pandas as pd\n",
  14. "import matplotlib.pyplot as plt\n",
  15. "from sklearn import datasets"
  16. ]
  17. },
  18. {
  19. "cell_type": "code",
  20. "execution_count": 18,
  21. "metadata": {
  22. "collapsed": true
  23. },
  24. "outputs": [],
  25. "source": [
  26. "data = datasets.load_breast_cancer()"
  27. ]
  28. },
  29. {
  30. "cell_type": "code",
  31. "execution_count": 19,
  32. "metadata": {},
  33. "outputs": [
  34. {
  35. "data": {
  36. "text/plain": [
  37. "array(['mean radius', 'mean texture', 'mean perimeter', 'mean area',\n",
  38. " 'mean smoothness', 'mean compactness', 'mean concavity',\n",
  39. " 'mean concave points', 'mean symmetry', 'mean fractal dimension',\n",
  40. " 'radius error', 'texture error', 'perimeter error', 'area error',\n",
  41. " 'smoothness error', 'compactness error', 'concavity error',\n",
  42. " 'concave points error', 'symmetry error', 'fractal dimension error',\n",
  43. " 'worst radius', 'worst texture', 'worst perimeter', 'worst area',\n",
  44. " 'worst smoothness', 'worst compactness', 'worst concavity',\n",
  45. " 'worst concave points', 'worst symmetry', 'worst fractal dimension'],\n",
  46. " dtype='<U23')"
  47. ]
  48. },
  49. "execution_count": 19,
  50. "metadata": {},
  51. "output_type": "execute_result"
  52. }
  53. ],
  54. "source": [
  55. "data.feature_names"
  56. ]
  57. },
  58. {
  59. "cell_type": "code",
  60. "execution_count": 47,
  61. "metadata": {},
  62. "outputs": [
  63. {
  64. "data": {
  65. "text/html": [
  66. "<div>\n",
  67. "<style>\n",
  68. " .dataframe thead tr:only-child th {\n",
  69. " text-align: right;\n",
  70. " }\n",
  71. "\n",
  72. " .dataframe thead th {\n",
  73. " text-align: left;\n",
  74. " }\n",
  75. "\n",
  76. " .dataframe tbody tr th {\n",
  77. " vertical-align: top;\n",
  78. " }\n",
  79. "</style>\n",
  80. "<table border=\"1\" class=\"dataframe\">\n",
  81. " <thead>\n",
  82. " <tr style=\"text-align: right;\">\n",
  83. " <th></th>\n",
  84. " <th>mean radius</th>\n",
  85. " <th>mean texture</th>\n",
  86. " <th>mean perimeter</th>\n",
  87. " <th>mean area</th>\n",
  88. " <th>mean smoothness</th>\n",
  89. " <th>mean compactness</th>\n",
  90. " <th>mean concavity</th>\n",
  91. " <th>mean concave points</th>\n",
  92. " <th>mean symmetry</th>\n",
  93. " <th>mean fractal dimension</th>\n",
  94. " <th>...</th>\n",
  95. " <th>worst radius</th>\n",
  96. " <th>worst texture</th>\n",
  97. " <th>worst perimeter</th>\n",
  98. " <th>worst area</th>\n",
  99. " <th>worst smoothness</th>\n",
  100. " <th>worst compactness</th>\n",
  101. " <th>worst concavity</th>\n",
  102. " <th>worst concave points</th>\n",
  103. " <th>worst symmetry</th>\n",
  104. " <th>worst fractal dimension</th>\n",
  105. " </tr>\n",
  106. " </thead>\n",
  107. " <tbody>\n",
  108. " <tr>\n",
  109. " <th>count</th>\n",
  110. " <td>569.000000</td>\n",
  111. " <td>569.000000</td>\n",
  112. " <td>569.000000</td>\n",
  113. " <td>569.000000</td>\n",
  114. " <td>569.000000</td>\n",
  115. " <td>569.000000</td>\n",
  116. " <td>569.000000</td>\n",
  117. " <td>569.000000</td>\n",
  118. " <td>569.000000</td>\n",
  119. " <td>569.000000</td>\n",
  120. " <td>...</td>\n",
  121. " <td>569.000000</td>\n",
  122. " <td>569.000000</td>\n",
  123. " <td>569.000000</td>\n",
  124. " <td>569.000000</td>\n",
  125. " <td>569.000000</td>\n",
  126. " <td>569.000000</td>\n",
  127. " <td>569.000000</td>\n",
  128. " <td>569.000000</td>\n",
  129. " <td>569.000000</td>\n",
  130. " <td>569.000000</td>\n",
  131. " </tr>\n",
  132. " <tr>\n",
  133. " <th>mean</th>\n",
  134. " <td>14.127292</td>\n",
  135. " <td>19.289649</td>\n",
  136. " <td>91.969033</td>\n",
  137. " <td>654.889104</td>\n",
  138. " <td>0.096360</td>\n",
  139. " <td>0.104341</td>\n",
  140. " <td>0.088799</td>\n",
  141. " <td>0.048919</td>\n",
  142. " <td>0.181162</td>\n",
  143. " <td>0.062798</td>\n",
  144. " <td>...</td>\n",
  145. " <td>16.269190</td>\n",
  146. " <td>25.677223</td>\n",
  147. " <td>107.261213</td>\n",
  148. " <td>880.583128</td>\n",
  149. " <td>0.132369</td>\n",
  150. " <td>0.254265</td>\n",
  151. " <td>0.272188</td>\n",
  152. " <td>0.114606</td>\n",
  153. " <td>0.290076</td>\n",
  154. " <td>0.083946</td>\n",
  155. " </tr>\n",
  156. " <tr>\n",
  157. " <th>std</th>\n",
  158. " <td>3.524049</td>\n",
  159. " <td>4.301036</td>\n",
  160. " <td>24.298981</td>\n",
  161. " <td>351.914129</td>\n",
  162. " <td>0.014064</td>\n",
  163. " <td>0.052813</td>\n",
  164. " <td>0.079720</td>\n",
  165. " <td>0.038803</td>\n",
  166. " <td>0.027414</td>\n",
  167. " <td>0.007060</td>\n",
  168. " <td>...</td>\n",
  169. " <td>4.833242</td>\n",
  170. " <td>6.146258</td>\n",
  171. " <td>33.602542</td>\n",
  172. " <td>569.356993</td>\n",
  173. " <td>0.022832</td>\n",
  174. " <td>0.157336</td>\n",
  175. " <td>0.208624</td>\n",
  176. " <td>0.065732</td>\n",
  177. " <td>0.061867</td>\n",
  178. " <td>0.018061</td>\n",
  179. " </tr>\n",
  180. " <tr>\n",
  181. " <th>min</th>\n",
  182. " <td>6.981000</td>\n",
  183. " <td>9.710000</td>\n",
  184. " <td>43.790000</td>\n",
  185. " <td>143.500000</td>\n",
  186. " <td>0.052630</td>\n",
  187. " <td>0.019380</td>\n",
  188. " <td>0.000000</td>\n",
  189. " <td>0.000000</td>\n",
  190. " <td>0.106000</td>\n",
  191. " <td>0.049960</td>\n",
  192. " <td>...</td>\n",
  193. " <td>7.930000</td>\n",
  194. " <td>12.020000</td>\n",
  195. " <td>50.410000</td>\n",
  196. " <td>185.200000</td>\n",
  197. " <td>0.071170</td>\n",
  198. " <td>0.027290</td>\n",
  199. " <td>0.000000</td>\n",
  200. " <td>0.000000</td>\n",
  201. " <td>0.156500</td>\n",
  202. " <td>0.055040</td>\n",
  203. " </tr>\n",
  204. " <tr>\n",
  205. " <th>25%</th>\n",
  206. " <td>11.700000</td>\n",
  207. " <td>16.170000</td>\n",
  208. " <td>75.170000</td>\n",
  209. " <td>420.300000</td>\n",
  210. " <td>0.086370</td>\n",
  211. " <td>0.064920</td>\n",
  212. " <td>0.029560</td>\n",
  213. " <td>0.020310</td>\n",
  214. " <td>0.161900</td>\n",
  215. " <td>0.057700</td>\n",
  216. " <td>...</td>\n",
  217. " <td>13.010000</td>\n",
  218. " <td>21.080000</td>\n",
  219. " <td>84.110000</td>\n",
  220. " <td>515.300000</td>\n",
  221. " <td>0.116600</td>\n",
  222. " <td>0.147200</td>\n",
  223. " <td>0.114500</td>\n",
  224. " <td>0.064930</td>\n",
  225. " <td>0.250400</td>\n",
  226. " <td>0.071460</td>\n",
  227. " </tr>\n",
  228. " <tr>\n",
  229. " <th>50%</th>\n",
  230. " <td>13.370000</td>\n",
  231. " <td>18.840000</td>\n",
  232. " <td>86.240000</td>\n",
  233. " <td>551.100000</td>\n",
  234. " <td>0.095870</td>\n",
  235. " <td>0.092630</td>\n",
  236. " <td>0.061540</td>\n",
  237. " <td>0.033500</td>\n",
  238. " <td>0.179200</td>\n",
  239. " <td>0.061540</td>\n",
  240. " <td>...</td>\n",
  241. " <td>14.970000</td>\n",
  242. " <td>25.410000</td>\n",
  243. " <td>97.660000</td>\n",
  244. " <td>686.500000</td>\n",
  245. " <td>0.131300</td>\n",
  246. " <td>0.211900</td>\n",
  247. " <td>0.226700</td>\n",
  248. " <td>0.099930</td>\n",
  249. " <td>0.282200</td>\n",
  250. " <td>0.080040</td>\n",
  251. " </tr>\n",
  252. " <tr>\n",
  253. " <th>75%</th>\n",
  254. " <td>15.780000</td>\n",
  255. " <td>21.800000</td>\n",
  256. " <td>104.100000</td>\n",
  257. " <td>782.700000</td>\n",
  258. " <td>0.105300</td>\n",
  259. " <td>0.130400</td>\n",
  260. " <td>0.130700</td>\n",
  261. " <td>0.074000</td>\n",
  262. " <td>0.195700</td>\n",
  263. " <td>0.066120</td>\n",
  264. " <td>...</td>\n",
  265. " <td>18.790000</td>\n",
  266. " <td>29.720000</td>\n",
  267. " <td>125.400000</td>\n",
  268. " <td>1084.000000</td>\n",
  269. " <td>0.146000</td>\n",
  270. " <td>0.339100</td>\n",
  271. " <td>0.382900</td>\n",
  272. " <td>0.161400</td>\n",
  273. " <td>0.317900</td>\n",
  274. " <td>0.092080</td>\n",
  275. " </tr>\n",
  276. " <tr>\n",
  277. " <th>max</th>\n",
  278. " <td>28.110000</td>\n",
  279. " <td>39.280000</td>\n",
  280. " <td>188.500000</td>\n",
  281. " <td>2501.000000</td>\n",
  282. " <td>0.163400</td>\n",
  283. " <td>0.345400</td>\n",
  284. " <td>0.426800</td>\n",
  285. " <td>0.201200</td>\n",
  286. " <td>0.304000</td>\n",
  287. " <td>0.097440</td>\n",
  288. " <td>...</td>\n",
  289. " <td>36.040000</td>\n",
  290. " <td>49.540000</td>\n",
  291. " <td>251.200000</td>\n",
  292. " <td>4254.000000</td>\n",
  293. " <td>0.222600</td>\n",
  294. " <td>1.058000</td>\n",
  295. " <td>1.252000</td>\n",
  296. " <td>0.291000</td>\n",
  297. " <td>0.663800</td>\n",
  298. " <td>0.207500</td>\n",
  299. " </tr>\n",
  300. " </tbody>\n",
  301. "</table>\n",
  302. "<p>8 rows × 30 columns</p>\n",
  303. "</div>"
  304. ],
  305. "text/plain": [
  306. " mean radius mean texture mean perimeter mean area \\\n",
  307. "count 569.000000 569.000000 569.000000 569.000000 \n",
  308. "mean 14.127292 19.289649 91.969033 654.889104 \n",
  309. "std 3.524049 4.301036 24.298981 351.914129 \n",
  310. "min 6.981000 9.710000 43.790000 143.500000 \n",
  311. "25% 11.700000 16.170000 75.170000 420.300000 \n",
  312. "50% 13.370000 18.840000 86.240000 551.100000 \n",
  313. "75% 15.780000 21.800000 104.100000 782.700000 \n",
  314. "max 28.110000 39.280000 188.500000 2501.000000 \n",
  315. "\n",
  316. " mean smoothness mean compactness mean concavity mean concave points \\\n",
  317. "count 569.000000 569.000000 569.000000 569.000000 \n",
  318. "mean 0.096360 0.104341 0.088799 0.048919 \n",
  319. "std 0.014064 0.052813 0.079720 0.038803 \n",
  320. "min 0.052630 0.019380 0.000000 0.000000 \n",
  321. "25% 0.086370 0.064920 0.029560 0.020310 \n",
  322. "50% 0.095870 0.092630 0.061540 0.033500 \n",
  323. "75% 0.105300 0.130400 0.130700 0.074000 \n",
  324. "max 0.163400 0.345400 0.426800 0.201200 \n",
  325. "\n",
  326. " mean symmetry mean fractal dimension ... \\\n",
  327. "count 569.000000 569.000000 ... \n",
  328. "mean 0.181162 0.062798 ... \n",
  329. "std 0.027414 0.007060 ... \n",
  330. "min 0.106000 0.049960 ... \n",
  331. "25% 0.161900 0.057700 ... \n",
  332. "50% 0.179200 0.061540 ... \n",
  333. "75% 0.195700 0.066120 ... \n",
  334. "max 0.304000 0.097440 ... \n",
  335. "\n",
  336. " worst radius worst texture worst perimeter worst area \\\n",
  337. "count 569.000000 569.000000 569.000000 569.000000 \n",
  338. "mean 16.269190 25.677223 107.261213 880.583128 \n",
  339. "std 4.833242 6.146258 33.602542 569.356993 \n",
  340. "min 7.930000 12.020000 50.410000 185.200000 \n",
  341. "25% 13.010000 21.080000 84.110000 515.300000 \n",
  342. "50% 14.970000 25.410000 97.660000 686.500000 \n",
  343. "75% 18.790000 29.720000 125.400000 1084.000000 \n",
  344. "max 36.040000 49.540000 251.200000 4254.000000 \n",
  345. "\n",
  346. " worst smoothness worst compactness worst concavity \\\n",
  347. "count 569.000000 569.000000 569.000000 \n",
  348. "mean 0.132369 0.254265 0.272188 \n",
  349. "std 0.022832 0.157336 0.208624 \n",
  350. "min 0.071170 0.027290 0.000000 \n",
  351. "25% 0.116600 0.147200 0.114500 \n",
  352. "50% 0.131300 0.211900 0.226700 \n",
  353. "75% 0.146000 0.339100 0.382900 \n",
  354. "max 0.222600 1.058000 1.252000 \n",
  355. "\n",
  356. " worst concave points worst symmetry worst fractal dimension \n",
  357. "count 569.000000 569.000000 569.000000 \n",
  358. "mean 0.114606 0.290076 0.083946 \n",
  359. "std 0.065732 0.061867 0.018061 \n",
  360. "min 0.000000 0.156500 0.055040 \n",
  361. "25% 0.064930 0.250400 0.071460 \n",
  362. "50% 0.099930 0.282200 0.080040 \n",
  363. "75% 0.161400 0.317900 0.092080 \n",
  364. "max 0.291000 0.663800 0.207500 \n",
  365. "\n",
  366. "[8 rows x 30 columns]"
  367. ]
  368. },
  369. "execution_count": 47,
  370. "metadata": {},
  371. "output_type": "execute_result"
  372. }
  373. ],
  374. "source": [
  375. "df = pd.DataFrame(data.data)\n",
  376. "df.columns = data.feature_names\n",
  377. "df.describe()"
  378. ]
  379. },
  380. {
  381. "cell_type": "code",
  382. "execution_count": 22,
  383. "metadata": {},
  384. "outputs": [
  385. {
  386. "data": {
  387. "text/html": [
  388. "<div>\n",
  389. "<style>\n",
  390. " .dataframe thead tr:only-child th {\n",
  391. " text-align: right;\n",
  392. " }\n",
  393. "\n",
  394. " .dataframe thead th {\n",
  395. " text-align: left;\n",
  396. " }\n",
  397. "\n",
  398. " .dataframe tbody tr th {\n",
  399. " vertical-align: top;\n",
  400. " }\n",
  401. "</style>\n",
  402. "<table border=\"1\" class=\"dataframe\">\n",
  403. " <thead>\n",
  404. " <tr style=\"text-align: right;\">\n",
  405. " <th></th>\n",
  406. " <th>mean radius</th>\n",
  407. " <th>mean texture</th>\n",
  408. " <th>mean perimeter</th>\n",
  409. " <th>mean area</th>\n",
  410. " <th>mean smoothness</th>\n",
  411. " <th>mean compactness</th>\n",
  412. " <th>mean concavity</th>\n",
  413. " <th>mean concave points</th>\n",
  414. " <th>mean symmetry</th>\n",
  415. " <th>mean fractal dimension</th>\n",
  416. " <th>...</th>\n",
  417. " <th>worst radius</th>\n",
  418. " <th>worst texture</th>\n",
  419. " <th>worst perimeter</th>\n",
  420. " <th>worst area</th>\n",
  421. " <th>worst smoothness</th>\n",
  422. " <th>worst compactness</th>\n",
  423. " <th>worst concavity</th>\n",
  424. " <th>worst concave points</th>\n",
  425. " <th>worst symmetry</th>\n",
  426. " <th>worst fractal dimension</th>\n",
  427. " </tr>\n",
  428. " </thead>\n",
  429. " <tbody>\n",
  430. " <tr>\n",
  431. " <th>mean radius</th>\n",
  432. " <td>1.000000</td>\n",
  433. " <td>0.323782</td>\n",
  434. " <td>0.997855</td>\n",
  435. " <td>0.987357</td>\n",
  436. " <td>0.170581</td>\n",
  437. " <td>0.506124</td>\n",
  438. " <td>0.676764</td>\n",
  439. " <td>0.822529</td>\n",
  440. " <td>0.147741</td>\n",
  441. " <td>-0.311631</td>\n",
  442. " <td>...</td>\n",
  443. " <td>0.969539</td>\n",
  444. " <td>0.297008</td>\n",
  445. " <td>0.965137</td>\n",
  446. " <td>0.941082</td>\n",
  447. " <td>0.119616</td>\n",
  448. " <td>0.413463</td>\n",
  449. " <td>0.526911</td>\n",
  450. " <td>0.744214</td>\n",
  451. " <td>0.163953</td>\n",
  452. " <td>0.007066</td>\n",
  453. " </tr>\n",
  454. " <tr>\n",
  455. " <th>mean texture</th>\n",
  456. " <td>0.323782</td>\n",
  457. " <td>1.000000</td>\n",
  458. " <td>0.329533</td>\n",
  459. " <td>0.321086</td>\n",
  460. " <td>-0.023389</td>\n",
  461. " <td>0.236702</td>\n",
  462. " <td>0.302418</td>\n",
  463. " <td>0.293464</td>\n",
  464. " <td>0.071401</td>\n",
  465. " <td>-0.076437</td>\n",
  466. " <td>...</td>\n",
  467. " <td>0.352573</td>\n",
  468. " <td>0.912045</td>\n",
  469. " <td>0.358040</td>\n",
  470. " <td>0.343546</td>\n",
  471. " <td>0.077503</td>\n",
  472. " <td>0.277830</td>\n",
  473. " <td>0.301025</td>\n",
  474. " <td>0.295316</td>\n",
  475. " <td>0.105008</td>\n",
  476. " <td>0.119205</td>\n",
  477. " </tr>\n",
  478. " <tr>\n",
  479. " <th>mean perimeter</th>\n",
  480. " <td>0.997855</td>\n",
  481. " <td>0.329533</td>\n",
  482. " <td>1.000000</td>\n",
  483. " <td>0.986507</td>\n",
  484. " <td>0.207278</td>\n",
  485. " <td>0.556936</td>\n",
  486. " <td>0.716136</td>\n",
  487. " <td>0.850977</td>\n",
  488. " <td>0.183027</td>\n",
  489. " <td>-0.261477</td>\n",
  490. " <td>...</td>\n",
  491. " <td>0.969476</td>\n",
  492. " <td>0.303038</td>\n",
  493. " <td>0.970387</td>\n",
  494. " <td>0.941550</td>\n",
  495. " <td>0.150549</td>\n",
  496. " <td>0.455774</td>\n",
  497. " <td>0.563879</td>\n",
  498. " <td>0.771241</td>\n",
  499. " <td>0.189115</td>\n",
  500. " <td>0.051019</td>\n",
  501. " </tr>\n",
  502. " <tr>\n",
  503. " <th>mean area</th>\n",
  504. " <td>0.987357</td>\n",
  505. " <td>0.321086</td>\n",
  506. " <td>0.986507</td>\n",
  507. " <td>1.000000</td>\n",
  508. " <td>0.177028</td>\n",
  509. " <td>0.498502</td>\n",
  510. " <td>0.685983</td>\n",
  511. " <td>0.823269</td>\n",
  512. " <td>0.151293</td>\n",
  513. " <td>-0.283110</td>\n",
  514. " <td>...</td>\n",
  515. " <td>0.962746</td>\n",
  516. " <td>0.287489</td>\n",
  517. " <td>0.959120</td>\n",
  518. " <td>0.959213</td>\n",
  519. " <td>0.123523</td>\n",
  520. " <td>0.390410</td>\n",
  521. " <td>0.512606</td>\n",
  522. " <td>0.722017</td>\n",
  523. " <td>0.143570</td>\n",
  524. " <td>0.003738</td>\n",
  525. " </tr>\n",
  526. " <tr>\n",
  527. " <th>mean smoothness</th>\n",
  528. " <td>0.170581</td>\n",
  529. " <td>-0.023389</td>\n",
  530. " <td>0.207278</td>\n",
  531. " <td>0.177028</td>\n",
  532. " <td>1.000000</td>\n",
  533. " <td>0.659123</td>\n",
  534. " <td>0.521984</td>\n",
  535. " <td>0.553695</td>\n",
  536. " <td>0.557775</td>\n",
  537. " <td>0.584792</td>\n",
  538. " <td>...</td>\n",
  539. " <td>0.213120</td>\n",
  540. " <td>0.036072</td>\n",
  541. " <td>0.238853</td>\n",
  542. " <td>0.206718</td>\n",
  543. " <td>0.805324</td>\n",
  544. " <td>0.472468</td>\n",
  545. " <td>0.434926</td>\n",
  546. " <td>0.503053</td>\n",
  547. " <td>0.394309</td>\n",
  548. " <td>0.499316</td>\n",
  549. " </tr>\n",
  550. " <tr>\n",
  551. " <th>mean compactness</th>\n",
  552. " <td>0.506124</td>\n",
  553. " <td>0.236702</td>\n",
  554. " <td>0.556936</td>\n",
  555. " <td>0.498502</td>\n",
  556. " <td>0.659123</td>\n",
  557. " <td>1.000000</td>\n",
  558. " <td>0.883121</td>\n",
  559. " <td>0.831135</td>\n",
  560. " <td>0.602641</td>\n",
  561. " <td>0.565369</td>\n",
  562. " <td>...</td>\n",
  563. " <td>0.535315</td>\n",
  564. " <td>0.248133</td>\n",
  565. " <td>0.590210</td>\n",
  566. " <td>0.509604</td>\n",
  567. " <td>0.565541</td>\n",
  568. " <td>0.865809</td>\n",
  569. " <td>0.816275</td>\n",
  570. " <td>0.815573</td>\n",
  571. " <td>0.510223</td>\n",
  572. " <td>0.687382</td>\n",
  573. " </tr>\n",
  574. " <tr>\n",
  575. " <th>mean concavity</th>\n",
  576. " <td>0.676764</td>\n",
  577. " <td>0.302418</td>\n",
  578. " <td>0.716136</td>\n",
  579. " <td>0.685983</td>\n",
  580. " <td>0.521984</td>\n",
  581. " <td>0.883121</td>\n",
  582. " <td>1.000000</td>\n",
  583. " <td>0.921391</td>\n",
  584. " <td>0.500667</td>\n",
  585. " <td>0.336783</td>\n",
  586. " <td>...</td>\n",
  587. " <td>0.688236</td>\n",
  588. " <td>0.299879</td>\n",
  589. " <td>0.729565</td>\n",
  590. " <td>0.675987</td>\n",
  591. " <td>0.448822</td>\n",
  592. " <td>0.754968</td>\n",
  593. " <td>0.884103</td>\n",
  594. " <td>0.861323</td>\n",
  595. " <td>0.409464</td>\n",
  596. " <td>0.514930</td>\n",
  597. " </tr>\n",
  598. " <tr>\n",
  599. " <th>mean concave points</th>\n",
  600. " <td>0.822529</td>\n",
  601. " <td>0.293464</td>\n",
  602. " <td>0.850977</td>\n",
  603. " <td>0.823269</td>\n",
  604. " <td>0.553695</td>\n",
  605. " <td>0.831135</td>\n",
  606. " <td>0.921391</td>\n",
  607. " <td>1.000000</td>\n",
  608. " <td>0.462497</td>\n",
  609. " <td>0.166917</td>\n",
  610. " <td>...</td>\n",
  611. " <td>0.830318</td>\n",
  612. " <td>0.292752</td>\n",
  613. " <td>0.855923</td>\n",
  614. " <td>0.809630</td>\n",
  615. " <td>0.452753</td>\n",
  616. " <td>0.667454</td>\n",
  617. " <td>0.752399</td>\n",
  618. " <td>0.910155</td>\n",
  619. " <td>0.375744</td>\n",
  620. " <td>0.368661</td>\n",
  621. " </tr>\n",
  622. " <tr>\n",
  623. " <th>mean symmetry</th>\n",
  624. " <td>0.147741</td>\n",
  625. " <td>0.071401</td>\n",
  626. " <td>0.183027</td>\n",
  627. " <td>0.151293</td>\n",
  628. " <td>0.557775</td>\n",
  629. " <td>0.602641</td>\n",
  630. " <td>0.500667</td>\n",
  631. " <td>0.462497</td>\n",
  632. " <td>1.000000</td>\n",
  633. " <td>0.479921</td>\n",
  634. " <td>...</td>\n",
  635. " <td>0.185728</td>\n",
  636. " <td>0.090651</td>\n",
  637. " <td>0.219169</td>\n",
  638. " <td>0.177193</td>\n",
  639. " <td>0.426675</td>\n",
  640. " <td>0.473200</td>\n",
  641. " <td>0.433721</td>\n",
  642. " <td>0.430297</td>\n",
  643. " <td>0.699826</td>\n",
  644. " <td>0.438413</td>\n",
  645. " </tr>\n",
  646. " <tr>\n",
  647. " <th>mean fractal dimension</th>\n",
  648. " <td>-0.311631</td>\n",
  649. " <td>-0.076437</td>\n",
  650. " <td>-0.261477</td>\n",
  651. " <td>-0.283110</td>\n",
  652. " <td>0.584792</td>\n",
  653. " <td>0.565369</td>\n",
  654. " <td>0.336783</td>\n",
  655. " <td>0.166917</td>\n",
  656. " <td>0.479921</td>\n",
  657. " <td>1.000000</td>\n",
  658. " <td>...</td>\n",
  659. " <td>-0.253691</td>\n",
  660. " <td>-0.051269</td>\n",
  661. " <td>-0.205151</td>\n",
  662. " <td>-0.231854</td>\n",
  663. " <td>0.504942</td>\n",
  664. " <td>0.458798</td>\n",
  665. " <td>0.346234</td>\n",
  666. " <td>0.175325</td>\n",
  667. " <td>0.334019</td>\n",
  668. " <td>0.767297</td>\n",
  669. " </tr>\n",
  670. " <tr>\n",
  671. " <th>radius error</th>\n",
  672. " <td>0.679090</td>\n",
  673. " <td>0.275869</td>\n",
  674. " <td>0.691765</td>\n",
  675. " <td>0.732562</td>\n",
  676. " <td>0.301467</td>\n",
  677. " <td>0.497473</td>\n",
  678. " <td>0.631925</td>\n",
  679. " <td>0.698050</td>\n",
  680. " <td>0.303379</td>\n",
  681. " <td>0.000111</td>\n",
  682. " <td>...</td>\n",
  683. " <td>0.715065</td>\n",
  684. " <td>0.194799</td>\n",
  685. " <td>0.719684</td>\n",
  686. " <td>0.751548</td>\n",
  687. " <td>0.141919</td>\n",
  688. " <td>0.287103</td>\n",
  689. " <td>0.380585</td>\n",
  690. " <td>0.531062</td>\n",
  691. " <td>0.094543</td>\n",
  692. " <td>0.049559</td>\n",
  693. " </tr>\n",
  694. " <tr>\n",
  695. " <th>texture error</th>\n",
  696. " <td>-0.097317</td>\n",
  697. " <td>0.386358</td>\n",
  698. " <td>-0.086761</td>\n",
  699. " <td>-0.066280</td>\n",
  700. " <td>0.068406</td>\n",
  701. " <td>0.046205</td>\n",
  702. " <td>0.076218</td>\n",
  703. " <td>0.021480</td>\n",
  704. " <td>0.128053</td>\n",
  705. " <td>0.164174</td>\n",
  706. " <td>...</td>\n",
  707. " <td>-0.111690</td>\n",
  708. " <td>0.409003</td>\n",
  709. " <td>-0.102242</td>\n",
  710. " <td>-0.083195</td>\n",
  711. " <td>-0.073658</td>\n",
  712. " <td>-0.092439</td>\n",
  713. " <td>-0.068956</td>\n",
  714. " <td>-0.119638</td>\n",
  715. " <td>-0.128215</td>\n",
  716. " <td>-0.045655</td>\n",
  717. " </tr>\n",
  718. " <tr>\n",
  719. " <th>perimeter error</th>\n",
  720. " <td>0.674172</td>\n",
  721. " <td>0.281673</td>\n",
  722. " <td>0.693135</td>\n",
  723. " <td>0.726628</td>\n",
  724. " <td>0.296092</td>\n",
  725. " <td>0.548905</td>\n",
  726. " <td>0.660391</td>\n",
  727. " <td>0.710650</td>\n",
  728. " <td>0.313893</td>\n",
  729. " <td>0.039830</td>\n",
  730. " <td>...</td>\n",
  731. " <td>0.697201</td>\n",
  732. " <td>0.200371</td>\n",
  733. " <td>0.721031</td>\n",
  734. " <td>0.730713</td>\n",
  735. " <td>0.130054</td>\n",
  736. " <td>0.341919</td>\n",
  737. " <td>0.418899</td>\n",
  738. " <td>0.554897</td>\n",
  739. " <td>0.109930</td>\n",
  740. " <td>0.085433</td>\n",
  741. " </tr>\n",
  742. " <tr>\n",
  743. " <th>area error</th>\n",
  744. " <td>0.735864</td>\n",
  745. " <td>0.259845</td>\n",
  746. " <td>0.744983</td>\n",
  747. " <td>0.800086</td>\n",
  748. " <td>0.246552</td>\n",
  749. " <td>0.455653</td>\n",
  750. " <td>0.617427</td>\n",
  751. " <td>0.690299</td>\n",
  752. " <td>0.223970</td>\n",
  753. " <td>-0.090170</td>\n",
  754. " <td>...</td>\n",
  755. " <td>0.757373</td>\n",
  756. " <td>0.196497</td>\n",
  757. " <td>0.761213</td>\n",
  758. " <td>0.811408</td>\n",
  759. " <td>0.125389</td>\n",
  760. " <td>0.283257</td>\n",
  761. " <td>0.385100</td>\n",
  762. " <td>0.538166</td>\n",
  763. " <td>0.074126</td>\n",
  764. " <td>0.017539</td>\n",
  765. " </tr>\n",
  766. " <tr>\n",
  767. " <th>smoothness error</th>\n",
  768. " <td>-0.222600</td>\n",
  769. " <td>0.006614</td>\n",
  770. " <td>-0.202694</td>\n",
  771. " <td>-0.166777</td>\n",
  772. " <td>0.332375</td>\n",
  773. " <td>0.135299</td>\n",
  774. " <td>0.098564</td>\n",
  775. " <td>0.027653</td>\n",
  776. " <td>0.187321</td>\n",
  777. " <td>0.401964</td>\n",
  778. " <td>...</td>\n",
  779. " <td>-0.230691</td>\n",
  780. " <td>-0.074743</td>\n",
  781. " <td>-0.217304</td>\n",
  782. " <td>-0.182195</td>\n",
  783. " <td>0.314457</td>\n",
  784. " <td>-0.055558</td>\n",
  785. " <td>-0.058298</td>\n",
  786. " <td>-0.102007</td>\n",
  787. " <td>-0.107342</td>\n",
  788. " <td>0.101480</td>\n",
  789. " </tr>\n",
  790. " <tr>\n",
  791. " <th>compactness error</th>\n",
  792. " <td>0.206000</td>\n",
  793. " <td>0.191975</td>\n",
  794. " <td>0.250744</td>\n",
  795. " <td>0.212583</td>\n",
  796. " <td>0.318943</td>\n",
  797. " <td>0.738722</td>\n",
  798. " <td>0.670279</td>\n",
  799. " <td>0.490424</td>\n",
  800. " <td>0.421659</td>\n",
  801. " <td>0.559837</td>\n",
  802. " <td>...</td>\n",
  803. " <td>0.204607</td>\n",
  804. " <td>0.143003</td>\n",
  805. " <td>0.260516</td>\n",
  806. " <td>0.199371</td>\n",
  807. " <td>0.227394</td>\n",
  808. " <td>0.678780</td>\n",
  809. " <td>0.639147</td>\n",
  810. " <td>0.483208</td>\n",
  811. " <td>0.277878</td>\n",
  812. " <td>0.590973</td>\n",
  813. " </tr>\n",
  814. " <tr>\n",
  815. " <th>concavity error</th>\n",
  816. " <td>0.194204</td>\n",
  817. " <td>0.143293</td>\n",
  818. " <td>0.228082</td>\n",
  819. " <td>0.207660</td>\n",
  820. " <td>0.248396</td>\n",
  821. " <td>0.570517</td>\n",
  822. " <td>0.691270</td>\n",
  823. " <td>0.439167</td>\n",
  824. " <td>0.342627</td>\n",
  825. " <td>0.446630</td>\n",
  826. " <td>...</td>\n",
  827. " <td>0.186904</td>\n",
  828. " <td>0.100241</td>\n",
  829. " <td>0.226680</td>\n",
  830. " <td>0.188353</td>\n",
  831. " <td>0.168481</td>\n",
  832. " <td>0.484858</td>\n",
  833. " <td>0.662564</td>\n",
  834. " <td>0.440472</td>\n",
  835. " <td>0.197788</td>\n",
  836. " <td>0.439329</td>\n",
  837. " </tr>\n",
  838. " <tr>\n",
  839. " <th>concave points error</th>\n",
  840. " <td>0.376169</td>\n",
  841. " <td>0.163851</td>\n",
  842. " <td>0.407217</td>\n",
  843. " <td>0.372320</td>\n",
  844. " <td>0.380676</td>\n",
  845. " <td>0.642262</td>\n",
  846. " <td>0.683260</td>\n",
  847. " <td>0.615634</td>\n",
  848. " <td>0.393298</td>\n",
  849. " <td>0.341198</td>\n",
  850. " <td>...</td>\n",
  851. " <td>0.358127</td>\n",
  852. " <td>0.086741</td>\n",
  853. " <td>0.394999</td>\n",
  854. " <td>0.342271</td>\n",
  855. " <td>0.215351</td>\n",
  856. " <td>0.452888</td>\n",
  857. " <td>0.549592</td>\n",
  858. " <td>0.602450</td>\n",
  859. " <td>0.143116</td>\n",
  860. " <td>0.310655</td>\n",
  861. " </tr>\n",
  862. " <tr>\n",
  863. " <th>symmetry error</th>\n",
  864. " <td>-0.104321</td>\n",
  865. " <td>0.009127</td>\n",
  866. " <td>-0.081629</td>\n",
  867. " <td>-0.072497</td>\n",
  868. " <td>0.200774</td>\n",
  869. " <td>0.229977</td>\n",
  870. " <td>0.178009</td>\n",
  871. " <td>0.095351</td>\n",
  872. " <td>0.449137</td>\n",
  873. " <td>0.345007</td>\n",
  874. " <td>...</td>\n",
  875. " <td>-0.128121</td>\n",
  876. " <td>-0.077473</td>\n",
  877. " <td>-0.103753</td>\n",
  878. " <td>-0.110343</td>\n",
  879. " <td>-0.012662</td>\n",
  880. " <td>0.060255</td>\n",
  881. " <td>0.037119</td>\n",
  882. " <td>-0.030413</td>\n",
  883. " <td>0.389402</td>\n",
  884. " <td>0.078079</td>\n",
  885. " </tr>\n",
  886. " <tr>\n",
  887. " <th>fractal dimension error</th>\n",
  888. " <td>-0.042641</td>\n",
  889. " <td>0.054458</td>\n",
  890. " <td>-0.005523</td>\n",
  891. " <td>-0.019887</td>\n",
  892. " <td>0.283607</td>\n",
  893. " <td>0.507318</td>\n",
  894. " <td>0.449301</td>\n",
  895. " <td>0.257584</td>\n",
  896. " <td>0.331786</td>\n",
  897. " <td>0.688132</td>\n",
  898. " <td>...</td>\n",
  899. " <td>-0.037488</td>\n",
  900. " <td>-0.003195</td>\n",
  901. " <td>-0.001000</td>\n",
  902. " <td>-0.022736</td>\n",
  903. " <td>0.170568</td>\n",
  904. " <td>0.390159</td>\n",
  905. " <td>0.379975</td>\n",
  906. " <td>0.215204</td>\n",
  907. " <td>0.111094</td>\n",
  908. " <td>0.591328</td>\n",
  909. " </tr>\n",
  910. " <tr>\n",
  911. " <th>worst radius</th>\n",
  912. " <td>0.969539</td>\n",
  913. " <td>0.352573</td>\n",
  914. " <td>0.969476</td>\n",
  915. " <td>0.962746</td>\n",
  916. " <td>0.213120</td>\n",
  917. " <td>0.535315</td>\n",
  918. " <td>0.688236</td>\n",
  919. " <td>0.830318</td>\n",
  920. " <td>0.185728</td>\n",
  921. " <td>-0.253691</td>\n",
  922. " <td>...</td>\n",
  923. " <td>1.000000</td>\n",
  924. " <td>0.359921</td>\n",
  925. " <td>0.993708</td>\n",
  926. " <td>0.984015</td>\n",
  927. " <td>0.216574</td>\n",
  928. " <td>0.475820</td>\n",
  929. " <td>0.573975</td>\n",
  930. " <td>0.787424</td>\n",
  931. " <td>0.243529</td>\n",
  932. " <td>0.093492</td>\n",
  933. " </tr>\n",
  934. " <tr>\n",
  935. " <th>worst texture</th>\n",
  936. " <td>0.297008</td>\n",
  937. " <td>0.912045</td>\n",
  938. " <td>0.303038</td>\n",
  939. " <td>0.287489</td>\n",
  940. " <td>0.036072</td>\n",
  941. " <td>0.248133</td>\n",
  942. " <td>0.299879</td>\n",
  943. " <td>0.292752</td>\n",
  944. " <td>0.090651</td>\n",
  945. " <td>-0.051269</td>\n",
  946. " <td>...</td>\n",
  947. " <td>0.359921</td>\n",
  948. " <td>1.000000</td>\n",
  949. " <td>0.365098</td>\n",
  950. " <td>0.345842</td>\n",
  951. " <td>0.225429</td>\n",
  952. " <td>0.360832</td>\n",
  953. " <td>0.368366</td>\n",
  954. " <td>0.359755</td>\n",
  955. " <td>0.233027</td>\n",
  956. " <td>0.219122</td>\n",
  957. " </tr>\n",
  958. " <tr>\n",
  959. " <th>worst perimeter</th>\n",
  960. " <td>0.965137</td>\n",
  961. " <td>0.358040</td>\n",
  962. " <td>0.970387</td>\n",
  963. " <td>0.959120</td>\n",
  964. " <td>0.238853</td>\n",
  965. " <td>0.590210</td>\n",
  966. " <td>0.729565</td>\n",
  967. " <td>0.855923</td>\n",
  968. " <td>0.219169</td>\n",
  969. " <td>-0.205151</td>\n",
  970. " <td>...</td>\n",
  971. " <td>0.993708</td>\n",
  972. " <td>0.365098</td>\n",
  973. " <td>1.000000</td>\n",
  974. " <td>0.977578</td>\n",
  975. " <td>0.236775</td>\n",
  976. " <td>0.529408</td>\n",
  977. " <td>0.618344</td>\n",
  978. " <td>0.816322</td>\n",
  979. " <td>0.269493</td>\n",
  980. " <td>0.138957</td>\n",
  981. " </tr>\n",
  982. " <tr>\n",
  983. " <th>worst area</th>\n",
  984. " <td>0.941082</td>\n",
  985. " <td>0.343546</td>\n",
  986. " <td>0.941550</td>\n",
  987. " <td>0.959213</td>\n",
  988. " <td>0.206718</td>\n",
  989. " <td>0.509604</td>\n",
  990. " <td>0.675987</td>\n",
  991. " <td>0.809630</td>\n",
  992. " <td>0.177193</td>\n",
  993. " <td>-0.231854</td>\n",
  994. " <td>...</td>\n",
  995. " <td>0.984015</td>\n",
  996. " <td>0.345842</td>\n",
  997. " <td>0.977578</td>\n",
  998. " <td>1.000000</td>\n",
  999. " <td>0.209145</td>\n",
  1000. " <td>0.438296</td>\n",
  1001. " <td>0.543331</td>\n",
  1002. " <td>0.747419</td>\n",
  1003. " <td>0.209146</td>\n",
  1004. " <td>0.079647</td>\n",
  1005. " </tr>\n",
  1006. " <tr>\n",
  1007. " <th>worst smoothness</th>\n",
  1008. " <td>0.119616</td>\n",
  1009. " <td>0.077503</td>\n",
  1010. " <td>0.150549</td>\n",
  1011. " <td>0.123523</td>\n",
  1012. " <td>0.805324</td>\n",
  1013. " <td>0.565541</td>\n",
  1014. " <td>0.448822</td>\n",
  1015. " <td>0.452753</td>\n",
  1016. " <td>0.426675</td>\n",
  1017. " <td>0.504942</td>\n",
  1018. " <td>...</td>\n",
  1019. " <td>0.216574</td>\n",
  1020. " <td>0.225429</td>\n",
  1021. " <td>0.236775</td>\n",
  1022. " <td>0.209145</td>\n",
  1023. " <td>1.000000</td>\n",
  1024. " <td>0.568187</td>\n",
  1025. " <td>0.518523</td>\n",
  1026. " <td>0.547691</td>\n",
  1027. " <td>0.493838</td>\n",
  1028. " <td>0.617624</td>\n",
  1029. " </tr>\n",
  1030. " <tr>\n",
  1031. " <th>worst compactness</th>\n",
  1032. " <td>0.413463</td>\n",
  1033. " <td>0.277830</td>\n",
  1034. " <td>0.455774</td>\n",
  1035. " <td>0.390410</td>\n",
  1036. " <td>0.472468</td>\n",
  1037. " <td>0.865809</td>\n",
  1038. " <td>0.754968</td>\n",
  1039. " <td>0.667454</td>\n",
  1040. " <td>0.473200</td>\n",
  1041. " <td>0.458798</td>\n",
  1042. " <td>...</td>\n",
  1043. " <td>0.475820</td>\n",
  1044. " <td>0.360832</td>\n",
  1045. " <td>0.529408</td>\n",
  1046. " <td>0.438296</td>\n",
  1047. " <td>0.568187</td>\n",
  1048. " <td>1.000000</td>\n",
  1049. " <td>0.892261</td>\n",
  1050. " <td>0.801080</td>\n",
  1051. " <td>0.614441</td>\n",
  1052. " <td>0.810455</td>\n",
  1053. " </tr>\n",
  1054. " <tr>\n",
  1055. " <th>worst concavity</th>\n",
  1056. " <td>0.526911</td>\n",
  1057. " <td>0.301025</td>\n",
  1058. " <td>0.563879</td>\n",
  1059. " <td>0.512606</td>\n",
  1060. " <td>0.434926</td>\n",
  1061. " <td>0.816275</td>\n",
  1062. " <td>0.884103</td>\n",
  1063. " <td>0.752399</td>\n",
  1064. " <td>0.433721</td>\n",
  1065. " <td>0.346234</td>\n",
  1066. " <td>...</td>\n",
  1067. " <td>0.573975</td>\n",
  1068. " <td>0.368366</td>\n",
  1069. " <td>0.618344</td>\n",
  1070. " <td>0.543331</td>\n",
  1071. " <td>0.518523</td>\n",
  1072. " <td>0.892261</td>\n",
  1073. " <td>1.000000</td>\n",
  1074. " <td>0.855434</td>\n",
  1075. " <td>0.532520</td>\n",
  1076. " <td>0.686511</td>\n",
  1077. " </tr>\n",
  1078. " <tr>\n",
  1079. " <th>worst concave points</th>\n",
  1080. " <td>0.744214</td>\n",
  1081. " <td>0.295316</td>\n",
  1082. " <td>0.771241</td>\n",
  1083. " <td>0.722017</td>\n",
  1084. " <td>0.503053</td>\n",
  1085. " <td>0.815573</td>\n",
  1086. " <td>0.861323</td>\n",
  1087. " <td>0.910155</td>\n",
  1088. " <td>0.430297</td>\n",
  1089. " <td>0.175325</td>\n",
  1090. " <td>...</td>\n",
  1091. " <td>0.787424</td>\n",
  1092. " <td>0.359755</td>\n",
  1093. " <td>0.816322</td>\n",
  1094. " <td>0.747419</td>\n",
  1095. " <td>0.547691</td>\n",
  1096. " <td>0.801080</td>\n",
  1097. " <td>0.855434</td>\n",
  1098. " <td>1.000000</td>\n",
  1099. " <td>0.502528</td>\n",
  1100. " <td>0.511114</td>\n",
  1101. " </tr>\n",
  1102. " <tr>\n",
  1103. " <th>worst symmetry</th>\n",
  1104. " <td>0.163953</td>\n",
  1105. " <td>0.105008</td>\n",
  1106. " <td>0.189115</td>\n",
  1107. " <td>0.143570</td>\n",
  1108. " <td>0.394309</td>\n",
  1109. " <td>0.510223</td>\n",
  1110. " <td>0.409464</td>\n",
  1111. " <td>0.375744</td>\n",
  1112. " <td>0.699826</td>\n",
  1113. " <td>0.334019</td>\n",
  1114. " <td>...</td>\n",
  1115. " <td>0.243529</td>\n",
  1116. " <td>0.233027</td>\n",
  1117. " <td>0.269493</td>\n",
  1118. " <td>0.209146</td>\n",
  1119. " <td>0.493838</td>\n",
  1120. " <td>0.614441</td>\n",
  1121. " <td>0.532520</td>\n",
  1122. " <td>0.502528</td>\n",
  1123. " <td>1.000000</td>\n",
  1124. " <td>0.537848</td>\n",
  1125. " </tr>\n",
  1126. " <tr>\n",
  1127. " <th>worst fractal dimension</th>\n",
  1128. " <td>0.007066</td>\n",
  1129. " <td>0.119205</td>\n",
  1130. " <td>0.051019</td>\n",
  1131. " <td>0.003738</td>\n",
  1132. " <td>0.499316</td>\n",
  1133. " <td>0.687382</td>\n",
  1134. " <td>0.514930</td>\n",
  1135. " <td>0.368661</td>\n",
  1136. " <td>0.438413</td>\n",
  1137. " <td>0.767297</td>\n",
  1138. " <td>...</td>\n",
  1139. " <td>0.093492</td>\n",
  1140. " <td>0.219122</td>\n",
  1141. " <td>0.138957</td>\n",
  1142. " <td>0.079647</td>\n",
  1143. " <td>0.617624</td>\n",
  1144. " <td>0.810455</td>\n",
  1145. " <td>0.686511</td>\n",
  1146. " <td>0.511114</td>\n",
  1147. " <td>0.537848</td>\n",
  1148. " <td>1.000000</td>\n",
  1149. " </tr>\n",
  1150. " </tbody>\n",
  1151. "</table>\n",
  1152. "<p>30 rows × 30 columns</p>\n",
  1153. "</div>"
  1154. ],
  1155. "text/plain": [
  1156. " mean radius mean texture mean perimeter mean area \\\n",
  1157. "mean radius 1.000000 0.323782 0.997855 0.987357 \n",
  1158. "mean texture 0.323782 1.000000 0.329533 0.321086 \n",
  1159. "mean perimeter 0.997855 0.329533 1.000000 0.986507 \n",
  1160. "mean area 0.987357 0.321086 0.986507 1.000000 \n",
  1161. "mean smoothness 0.170581 -0.023389 0.207278 0.177028 \n",
  1162. "mean compactness 0.506124 0.236702 0.556936 0.498502 \n",
  1163. "mean concavity 0.676764 0.302418 0.716136 0.685983 \n",
  1164. "mean concave points 0.822529 0.293464 0.850977 0.823269 \n",
  1165. "mean symmetry 0.147741 0.071401 0.183027 0.151293 \n",
  1166. "mean fractal dimension -0.311631 -0.076437 -0.261477 -0.283110 \n",
  1167. "radius error 0.679090 0.275869 0.691765 0.732562 \n",
  1168. "texture error -0.097317 0.386358 -0.086761 -0.066280 \n",
  1169. "perimeter error 0.674172 0.281673 0.693135 0.726628 \n",
  1170. "area error 0.735864 0.259845 0.744983 0.800086 \n",
  1171. "smoothness error -0.222600 0.006614 -0.202694 -0.166777 \n",
  1172. "compactness error 0.206000 0.191975 0.250744 0.212583 \n",
  1173. "concavity error 0.194204 0.143293 0.228082 0.207660 \n",
  1174. "concave points error 0.376169 0.163851 0.407217 0.372320 \n",
  1175. "symmetry error -0.104321 0.009127 -0.081629 -0.072497 \n",
  1176. "fractal dimension error -0.042641 0.054458 -0.005523 -0.019887 \n",
  1177. "worst radius 0.969539 0.352573 0.969476 0.962746 \n",
  1178. "worst texture 0.297008 0.912045 0.303038 0.287489 \n",
  1179. "worst perimeter 0.965137 0.358040 0.970387 0.959120 \n",
  1180. "worst area 0.941082 0.343546 0.941550 0.959213 \n",
  1181. "worst smoothness 0.119616 0.077503 0.150549 0.123523 \n",
  1182. "worst compactness 0.413463 0.277830 0.455774 0.390410 \n",
  1183. "worst concavity 0.526911 0.301025 0.563879 0.512606 \n",
  1184. "worst concave points 0.744214 0.295316 0.771241 0.722017 \n",
  1185. "worst symmetry 0.163953 0.105008 0.189115 0.143570 \n",
  1186. "worst fractal dimension 0.007066 0.119205 0.051019 0.003738 \n",
  1187. "\n",
  1188. " mean smoothness mean compactness mean concavity \\\n",
  1189. "mean radius 0.170581 0.506124 0.676764 \n",
  1190. "mean texture -0.023389 0.236702 0.302418 \n",
  1191. "mean perimeter 0.207278 0.556936 0.716136 \n",
  1192. "mean area 0.177028 0.498502 0.685983 \n",
  1193. "mean smoothness 1.000000 0.659123 0.521984 \n",
  1194. "mean compactness 0.659123 1.000000 0.883121 \n",
  1195. "mean concavity 0.521984 0.883121 1.000000 \n",
  1196. "mean concave points 0.553695 0.831135 0.921391 \n",
  1197. "mean symmetry 0.557775 0.602641 0.500667 \n",
  1198. "mean fractal dimension 0.584792 0.565369 0.336783 \n",
  1199. "radius error 0.301467 0.497473 0.631925 \n",
  1200. "texture error 0.068406 0.046205 0.076218 \n",
  1201. "perimeter error 0.296092 0.548905 0.660391 \n",
  1202. "area error 0.246552 0.455653 0.617427 \n",
  1203. "smoothness error 0.332375 0.135299 0.098564 \n",
  1204. "compactness error 0.318943 0.738722 0.670279 \n",
  1205. "concavity error 0.248396 0.570517 0.691270 \n",
  1206. "concave points error 0.380676 0.642262 0.683260 \n",
  1207. "symmetry error 0.200774 0.229977 0.178009 \n",
  1208. "fractal dimension error 0.283607 0.507318 0.449301 \n",
  1209. "worst radius 0.213120 0.535315 0.688236 \n",
  1210. "worst texture 0.036072 0.248133 0.299879 \n",
  1211. "worst perimeter 0.238853 0.590210 0.729565 \n",
  1212. "worst area 0.206718 0.509604 0.675987 \n",
  1213. "worst smoothness 0.805324 0.565541 0.448822 \n",
  1214. "worst compactness 0.472468 0.865809 0.754968 \n",
  1215. "worst concavity 0.434926 0.816275 0.884103 \n",
  1216. "worst concave points 0.503053 0.815573 0.861323 \n",
  1217. "worst symmetry 0.394309 0.510223 0.409464 \n",
  1218. "worst fractal dimension 0.499316 0.687382 0.514930 \n",
  1219. "\n",
  1220. " mean concave points mean symmetry \\\n",
  1221. "mean radius 0.822529 0.147741 \n",
  1222. "mean texture 0.293464 0.071401 \n",
  1223. "mean perimeter 0.850977 0.183027 \n",
  1224. "mean area 0.823269 0.151293 \n",
  1225. "mean smoothness 0.553695 0.557775 \n",
  1226. "mean compactness 0.831135 0.602641 \n",
  1227. "mean concavity 0.921391 0.500667 \n",
  1228. "mean concave points 1.000000 0.462497 \n",
  1229. "mean symmetry 0.462497 1.000000 \n",
  1230. "mean fractal dimension 0.166917 0.479921 \n",
  1231. "radius error 0.698050 0.303379 \n",
  1232. "texture error 0.021480 0.128053 \n",
  1233. "perimeter error 0.710650 0.313893 \n",
  1234. "area error 0.690299 0.223970 \n",
  1235. "smoothness error 0.027653 0.187321 \n",
  1236. "compactness error 0.490424 0.421659 \n",
  1237. "concavity error 0.439167 0.342627 \n",
  1238. "concave points error 0.615634 0.393298 \n",
  1239. "symmetry error 0.095351 0.449137 \n",
  1240. "fractal dimension error 0.257584 0.331786 \n",
  1241. "worst radius 0.830318 0.185728 \n",
  1242. "worst texture 0.292752 0.090651 \n",
  1243. "worst perimeter 0.855923 0.219169 \n",
  1244. "worst area 0.809630 0.177193 \n",
  1245. "worst smoothness 0.452753 0.426675 \n",
  1246. "worst compactness 0.667454 0.473200 \n",
  1247. "worst concavity 0.752399 0.433721 \n",
  1248. "worst concave points 0.910155 0.430297 \n",
  1249. "worst symmetry 0.375744 0.699826 \n",
  1250. "worst fractal dimension 0.368661 0.438413 \n",
  1251. "\n",
  1252. " mean fractal dimension ... \\\n",
  1253. "mean radius -0.311631 ... \n",
  1254. "mean texture -0.076437 ... \n",
  1255. "mean perimeter -0.261477 ... \n",
  1256. "mean area -0.283110 ... \n",
  1257. "mean smoothness 0.584792 ... \n",
  1258. "mean compactness 0.565369 ... \n",
  1259. "mean concavity 0.336783 ... \n",
  1260. "mean concave points 0.166917 ... \n",
  1261. "mean symmetry 0.479921 ... \n",
  1262. "mean fractal dimension 1.000000 ... \n",
  1263. "radius error 0.000111 ... \n",
  1264. "texture error 0.164174 ... \n",
  1265. "perimeter error 0.039830 ... \n",
  1266. "area error -0.090170 ... \n",
  1267. "smoothness error 0.401964 ... \n",
  1268. "compactness error 0.559837 ... \n",
  1269. "concavity error 0.446630 ... \n",
  1270. "concave points error 0.341198 ... \n",
  1271. "symmetry error 0.345007 ... \n",
  1272. "fractal dimension error 0.688132 ... \n",
  1273. "worst radius -0.253691 ... \n",
  1274. "worst texture -0.051269 ... \n",
  1275. "worst perimeter -0.205151 ... \n",
  1276. "worst area -0.231854 ... \n",
  1277. "worst smoothness 0.504942 ... \n",
  1278. "worst compactness 0.458798 ... \n",
  1279. "worst concavity 0.346234 ... \n",
  1280. "worst concave points 0.175325 ... \n",
  1281. "worst symmetry 0.334019 ... \n",
  1282. "worst fractal dimension 0.767297 ... \n",
  1283. "\n",
  1284. " worst radius worst texture worst perimeter \\\n",
  1285. "mean radius 0.969539 0.297008 0.965137 \n",
  1286. "mean texture 0.352573 0.912045 0.358040 \n",
  1287. "mean perimeter 0.969476 0.303038 0.970387 \n",
  1288. "mean area 0.962746 0.287489 0.959120 \n",
  1289. "mean smoothness 0.213120 0.036072 0.238853 \n",
  1290. "mean compactness 0.535315 0.248133 0.590210 \n",
  1291. "mean concavity 0.688236 0.299879 0.729565 \n",
  1292. "mean concave points 0.830318 0.292752 0.855923 \n",
  1293. "mean symmetry 0.185728 0.090651 0.219169 \n",
  1294. "mean fractal dimension -0.253691 -0.051269 -0.205151 \n",
  1295. "radius error 0.715065 0.194799 0.719684 \n",
  1296. "texture error -0.111690 0.409003 -0.102242 \n",
  1297. "perimeter error 0.697201 0.200371 0.721031 \n",
  1298. "area error 0.757373 0.196497 0.761213 \n",
  1299. "smoothness error -0.230691 -0.074743 -0.217304 \n",
  1300. "compactness error 0.204607 0.143003 0.260516 \n",
  1301. "concavity error 0.186904 0.100241 0.226680 \n",
  1302. "concave points error 0.358127 0.086741 0.394999 \n",
  1303. "symmetry error -0.128121 -0.077473 -0.103753 \n",
  1304. "fractal dimension error -0.037488 -0.003195 -0.001000 \n",
  1305. "worst radius 1.000000 0.359921 0.993708 \n",
  1306. "worst texture 0.359921 1.000000 0.365098 \n",
  1307. "worst perimeter 0.993708 0.365098 1.000000 \n",
  1308. "worst area 0.984015 0.345842 0.977578 \n",
  1309. "worst smoothness 0.216574 0.225429 0.236775 \n",
  1310. "worst compactness 0.475820 0.360832 0.529408 \n",
  1311. "worst concavity 0.573975 0.368366 0.618344 \n",
  1312. "worst concave points 0.787424 0.359755 0.816322 \n",
  1313. "worst symmetry 0.243529 0.233027 0.269493 \n",
  1314. "worst fractal dimension 0.093492 0.219122 0.138957 \n",
  1315. "\n",
  1316. " worst area worst smoothness worst compactness \\\n",
  1317. "mean radius 0.941082 0.119616 0.413463 \n",
  1318. "mean texture 0.343546 0.077503 0.277830 \n",
  1319. "mean perimeter 0.941550 0.150549 0.455774 \n",
  1320. "mean area 0.959213 0.123523 0.390410 \n",
  1321. "mean smoothness 0.206718 0.805324 0.472468 \n",
  1322. "mean compactness 0.509604 0.565541 0.865809 \n",
  1323. "mean concavity 0.675987 0.448822 0.754968 \n",
  1324. "mean concave points 0.809630 0.452753 0.667454 \n",
  1325. "mean symmetry 0.177193 0.426675 0.473200 \n",
  1326. "mean fractal dimension -0.231854 0.504942 0.458798 \n",
  1327. "radius error 0.751548 0.141919 0.287103 \n",
  1328. "texture error -0.083195 -0.073658 -0.092439 \n",
  1329. "perimeter error 0.730713 0.130054 0.341919 \n",
  1330. "area error 0.811408 0.125389 0.283257 \n",
  1331. "smoothness error -0.182195 0.314457 -0.055558 \n",
  1332. "compactness error 0.199371 0.227394 0.678780 \n",
  1333. "concavity error 0.188353 0.168481 0.484858 \n",
  1334. "concave points error 0.342271 0.215351 0.452888 \n",
  1335. "symmetry error -0.110343 -0.012662 0.060255 \n",
  1336. "fractal dimension error -0.022736 0.170568 0.390159 \n",
  1337. "worst radius 0.984015 0.216574 0.475820 \n",
  1338. "worst texture 0.345842 0.225429 0.360832 \n",
  1339. "worst perimeter 0.977578 0.236775 0.529408 \n",
  1340. "worst area 1.000000 0.209145 0.438296 \n",
  1341. "worst smoothness 0.209145 1.000000 0.568187 \n",
  1342. "worst compactness 0.438296 0.568187 1.000000 \n",
  1343. "worst concavity 0.543331 0.518523 0.892261 \n",
  1344. "worst concave points 0.747419 0.547691 0.801080 \n",
  1345. "worst symmetry 0.209146 0.493838 0.614441 \n",
  1346. "worst fractal dimension 0.079647 0.617624 0.810455 \n",
  1347. "\n",
  1348. " worst concavity worst concave points \\\n",
  1349. "mean radius 0.526911 0.744214 \n",
  1350. "mean texture 0.301025 0.295316 \n",
  1351. "mean perimeter 0.563879 0.771241 \n",
  1352. "mean area 0.512606 0.722017 \n",
  1353. "mean smoothness 0.434926 0.503053 \n",
  1354. "mean compactness 0.816275 0.815573 \n",
  1355. "mean concavity 0.884103 0.861323 \n",
  1356. "mean concave points 0.752399 0.910155 \n",
  1357. "mean symmetry 0.433721 0.430297 \n",
  1358. "mean fractal dimension 0.346234 0.175325 \n",
  1359. "radius error 0.380585 0.531062 \n",
  1360. "texture error -0.068956 -0.119638 \n",
  1361. "perimeter error 0.418899 0.554897 \n",
  1362. "area error 0.385100 0.538166 \n",
  1363. "smoothness error -0.058298 -0.102007 \n",
  1364. "compactness error 0.639147 0.483208 \n",
  1365. "concavity error 0.662564 0.440472 \n",
  1366. "concave points error 0.549592 0.602450 \n",
  1367. "symmetry error 0.037119 -0.030413 \n",
  1368. "fractal dimension error 0.379975 0.215204 \n",
  1369. "worst radius 0.573975 0.787424 \n",
  1370. "worst texture 0.368366 0.359755 \n",
  1371. "worst perimeter 0.618344 0.816322 \n",
  1372. "worst area 0.543331 0.747419 \n",
  1373. "worst smoothness 0.518523 0.547691 \n",
  1374. "worst compactness 0.892261 0.801080 \n",
  1375. "worst concavity 1.000000 0.855434 \n",
  1376. "worst concave points 0.855434 1.000000 \n",
  1377. "worst symmetry 0.532520 0.502528 \n",
  1378. "worst fractal dimension 0.686511 0.511114 \n",
  1379. "\n",
  1380. " worst symmetry worst fractal dimension \n",
  1381. "mean radius 0.163953 0.007066 \n",
  1382. "mean texture 0.105008 0.119205 \n",
  1383. "mean perimeter 0.189115 0.051019 \n",
  1384. "mean area 0.143570 0.003738 \n",
  1385. "mean smoothness 0.394309 0.499316 \n",
  1386. "mean compactness 0.510223 0.687382 \n",
  1387. "mean concavity 0.409464 0.514930 \n",
  1388. "mean concave points 0.375744 0.368661 \n",
  1389. "mean symmetry 0.699826 0.438413 \n",
  1390. "mean fractal dimension 0.334019 0.767297 \n",
  1391. "radius error 0.094543 0.049559 \n",
  1392. "texture error -0.128215 -0.045655 \n",
  1393. "perimeter error 0.109930 0.085433 \n",
  1394. "area error 0.074126 0.017539 \n",
  1395. "smoothness error -0.107342 0.101480 \n",
  1396. "compactness error 0.277878 0.590973 \n",
  1397. "concavity error 0.197788 0.439329 \n",
  1398. "concave points error 0.143116 0.310655 \n",
  1399. "symmetry error 0.389402 0.078079 \n",
  1400. "fractal dimension error 0.111094 0.591328 \n",
  1401. "worst radius 0.243529 0.093492 \n",
  1402. "worst texture 0.233027 0.219122 \n",
  1403. "worst perimeter 0.269493 0.138957 \n",
  1404. "worst area 0.209146 0.079647 \n",
  1405. "worst smoothness 0.493838 0.617624 \n",
  1406. "worst compactness 0.614441 0.810455 \n",
  1407. "worst concavity 0.532520 0.686511 \n",
  1408. "worst concave points 0.502528 0.511114 \n",
  1409. "worst symmetry 1.000000 0.537848 \n",
  1410. "worst fractal dimension 0.537848 1.000000 \n",
  1411. "\n",
  1412. "[30 rows x 30 columns]"
  1413. ]
  1414. },
  1415. "execution_count": 22,
  1416. "metadata": {},
  1417. "output_type": "execute_result"
  1418. }
  1419. ],
  1420. "source": [
  1421. "df.corr()"
  1422. ]
  1423. },
  1424. {
  1425. "cell_type": "code",
  1426. "execution_count": 25,
  1427. "metadata": {},
  1428. "outputs": [],
  1429. "source": [
  1430. "from sklearn.model_selection import train_test_split\n",
  1431. "\n",
  1432. "X = data.data\n",
  1433. "y = data.target\n",
  1434. "X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=0)  # fixed seed so the 70/30 split is reproducible on re-run"
  1435. ]
  1436. },
  1437. {
  1438. "cell_type": "code",
  1439. "execution_count": 27,
  1440. "metadata": {},
  1441. "outputs": [],
  1442. "source": [
  1443. "from sklearn.preprocessing import StandardScaler\n",
  1444. "\n",
  1445. "# Fit the scaler on the training split only, then reuse it for the test split.\n",
  1446. "sc = StandardScaler()\n",
  1447. "X_train_std = sc.fit_transform(X_train)\n",
  1448. "\n",
  1449. "X_test_std = sc.transform(X_test)"
  1450. ]
  1451. },
  1452. {
  1453. "cell_type": "code",
  1454. "execution_count": 42,
  1455. "metadata": {},
  1456. "outputs": [
  1457. {
  1458. "data": {
  1459. "text/plain": [
  1460. "LogisticRegression(C=1000, class_weight=None, dual=False, fit_intercept=True,\n",
  1461. " intercept_scaling=1, max_iter=100, multi_class='ovr', n_jobs=1,\n",
  1462. " penalty='l2', random_state=None, solver='liblinear', tol=0.0001,\n",
  1463. " verbose=0, warm_start=False)"
  1464. ]
  1465. },
  1466. "execution_count": 42,
  1467. "metadata": {},
  1468. "output_type": "execute_result"
  1469. }
  1470. ],
  1471. "source": [
  1472. "from sklearn.linear_model import LogisticRegression\n",
  1473. "\n",
  1474. "lr = LogisticRegression(C=1000)\n",
  1475. "lr.fit(X_train_std, y_train)  # train on standardized features: later cells predict on X_test_std"
  1476. ]
  1477. },
  1478. {
  1479. "cell_type": "code",
  1480. "execution_count": 43,
  1481. "metadata": {},
  1482. "outputs": [
  1483. {
  1484. "data": {
  1485. "text/plain": [
  1486. "array([1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1,\n",
  1487. " 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 1,\n",
  1488. " 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0,\n",
  1489. " 0, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0,\n",
  1490. " 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0,\n",
  1491. " 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0,\n",
  1492. " 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1,\n",
  1493. " 1, 1, 0, 1, 1, 1, 1, 1, 1, 0])"
  1494. ]
  1495. },
  1496. "execution_count": 43,
  1497. "metadata": {},
  1498. "output_type": "execute_result"
  1499. }
  1500. ],
  1501. "source": [
  1502. "lr.predict(X_test_std)"
  1503. ]
  1504. },
  1505. {
  1506. "cell_type": "code",
  1507. "execution_count": 44,
  1508. "metadata": {},
  1509. "outputs": [
  1510. {
  1511. "data": {
  1512. "text/plain": [
  1513. "array([1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 0,\n",
  1514. " 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1,\n",
  1515. " 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0,\n",
  1516. " 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1,\n",
  1517. " 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1,\n",
  1518. " 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0,\n",
  1519. " 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1,\n",
  1520. " 1, 1, 1, 1, 0, 1, 1, 1, 1, 0])"
  1521. ]
  1522. },
  1523. "execution_count": 44,
  1524. "metadata": {},
  1525. "output_type": "execute_result"
  1526. }
  1527. ],
  1528. "source": [
  1529. "y_test"
  1530. ]
  1531. },
  1532. {
  1533. "cell_type": "code",
  1534. "execution_count": 45,
  1535. "metadata": {},
  1536. "outputs": [
  1537. {
  1538. "data": {
  1539. "text/plain": [
  1540. "0.79532163742690054"
  1541. ]
  1542. },
  1543. "execution_count": 45,
  1544. "metadata": {},
  1545. "output_type": "execute_result"
  1546. }
  1547. ],
  1548. "source": [
  1549. "from sklearn import metrics\n",
  1550. "\n",
  1551. "predicts = lr.predict(X_test_std)  # predicted labels for the held-out split\n",
  1552. "metrics.accuracy_score(y_true=y_test, y_pred=predicts)"
  1553. ]
  1554. }
  1555. ],
  1556. "metadata": {
  1557. "kernelspec": {
  1558. "display_name": "Python 3",
  1559. "language": "python",
  1560. "name": "python3"
  1561. },
  1562. "language_info": {
  1563. "codemirror_mode": {
  1564. "name": "ipython",
  1565. "version": 3
  1566. },
  1567. "file_extension": ".py",
  1568. "mimetype": "text/x-python",
  1569. "name": "python",
  1570. "nbconvert_exporter": "python",
  1571. "pygments_lexer": "ipython3",
  1572. "version": "3.6.0"
  1573. }
  1574. },
  1575. "nbformat": 4,
  1576. "nbformat_minor": 2
  1577. }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement