Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- {
- "nbformat_minor": 1,
- "cells": [
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "from sklearn.model_selection import train_test_split\nfrom sklearn.ensemble import ExtraTreesClassifier,GradientBoostingClassifier\nfrom sklearn.svm import SVC\nfrom sklearn.ensemble import VotingClassifier\nfrom sklearn.metrics import accuracy_score\nimport numpy as np\nimport pandas as pd"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": "# The code was removed by Watson Studio for sharing."
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "df_data_1['address']=df_data_1['addr_state'].astype(str)+df_data_1['zip_code'].astype(str)"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "removal_cols=['mths_since_last_major_derog',\n 'zip_code',\n 'application_type',\n 'mths_since_last_record',\n 'addr_state',\n 'mths_since_last_delinq']\npreserve_cols=[\"emp_title\",\"emp_length\",\"address\",\"last_week_pay\"]\nstring_cols=[\"term\",\"batch_enrolled\",\"grade\",\"sub_grade\"]"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "df_final=df_data_1[preserve_cols].copy(deep=True)\nremoval_cols+=preserve_cols"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "df_data_1.drop(removal_cols,axis=1,inplace=True)"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "df_data_1.head()"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "def replace_missing_values(df):\n    \"\"\"Return a new DataFrame with the missing values of ``df`` filled in.\n\n    Columns whose dtype kind is boolean, integer, unsigned, float or complex\n    ('biufc') are filled with 0; every other column is filled with ' '.\n    \"\"\"\n    # Operate on the argument itself; the earlier version read the global\n    # df_data_1 and silently ignored whatever frame the caller passed in.\n    return df.apply(lambda col: col.fillna(0) if col.dtype.kind in 'biufc' else col.fillna(' '))"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "df_data_1=df_data_1[df_data_1['batch_enrolled']!=' ']"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "df=replace_missing_values(df_data_1)"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "df['no_funded_amnt']=df['loan_amnt']==df['funded_amnt']"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "df=pd.get_dummies(df,columns=string_cols)"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "target_col=df['home_ownership']\ndf.drop('home_ownership',axis=1,inplace=True)"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "xtrain,xtest,ytrain,ytest=train_test_split(df,target_col,test_size=0.20, random_state=42)"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": "# Fixed seeds keep the tree ensembles reproducible across kernel restarts,\n# matching the random_state=42 already used for the train/test split.\nxg_clf=ExtraTreesClassifier(n_estimators=20,random_state=42)\ng_clf=GradientBoostingClassifier(n_estimators=40,learning_rate=0.001,random_state=42)\nsvm_clf = SVC(kernel=\"rbf\")\nv_clf=VotingClassifier(estimators=[('xg',xg_clf),('gb',g_clf),('svc',svm_clf)],voting='hard')"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": "v_clf.fit(xtrain,ytrain)"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": "for clf in (xg_clf, g_clf, svm_clf, v_clf):\n clf.fit(xtrain, ytrain)\n ypred = clf.predict(xtest)\n print(clf.__class__.__name__, accuracy_score(ytest, ypred))"
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- },
- {
- "execution_count": null,
- "cell_type": "code",
- "metadata": {},
- "outputs": [],
- "source": ""
- }
- ],
- "metadata": {
- "kernelspec": {
- "display_name": "Python 3.6",
- "name": "python3",
- "language": "python"
- },
- "language_info": {
- "mimetype": "text/x-python",
- "nbconvert_exporter": "python",
- "version": "3.6.8",
- "name": "python",
- "file_extension": ".py",
- "pygments_lexer": "ipython3",
- "codemirror_mode": {
- "version": 3,
- "name": "ipython"
- }
- }
- },
- "nbformat": 4
- }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement