{ "cells": [ { "cell_type": "code", "execution_count": 3, "metadata": { "collapsed": false }, "outputs": [], "source": [ "# GraphLab Create supplies the SFrame type used below to load the loan data.\n", "import graphlab\n", "\n", "# Render GraphLab Canvas output inline in this notebook.\n", "graphlab.canvas.set_target('ipynb')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Load Loan Dataset" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "collapsed": false }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "2016-03-24 07:49:12,384 [INFO] graphlab.cython.cy_server, 176: GraphLab Create v1.8.5 started. Logging: C:\\Users\\<user>\\AppData\\Local\\Temp\\graphlab_server_1458794950.log.0\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "This non-commercial license of GraphLab Create is assigned to <redacted-email> and will expire on November 01, 2016. For commercial licensing options, visit https://dato.com/buy/.\n" ] } ], "source": [ "# Read the Lending Club loans SFrame; the path is relative to the working directory.\n", "loans = graphlab.SFrame('lending-club-data.gl/')" ] }, { "cell_type": "code", "execution_count": 5, "metadata": { "collapsed": false }, "outputs": [ { "data": { "text/html": [ "
id | \n", "member_id | \n", "loan_amnt | \n", "funded_amnt | \n", "funded_amnt_inv | \n", "term | \n", "int_rate | \n", "installment | \n", "grade | \n", "sub_grade | \n", "
---|---|---|---|---|---|---|---|---|---|
1077501 | \n", "1296599 | \n", "5000 | \n", "5000 | \n", "4975 | \n", "36 months | \n", "10.65 | \n", "162.87 | \n", "B | \n", "B2 | \n", "
1077430 | \n", "1314167 | \n", "2500 | \n", "2500 | \n", "2500 | \n", "60 months | \n", "15.27 | \n", "59.83 | \n", "C | \n", "C4 | \n", "
1077175 | \n", "1313524 | \n", "2400 | \n", "2400 | \n", "2400 | \n", "36 months | \n", "15.96 | \n", "84.33 | \n", "C | \n", "C5 | \n", "
1076863 | \n", "1277178 | \n", "10000 | \n", "10000 | \n", "10000 | \n", "36 months | \n", "13.49 | \n", "339.31 | \n", "C | \n", "C1 | \n", "
1075269 | \n", "1311441 | \n", "5000 | \n", "5000 | \n", "5000 | \n", "36 months | \n", "7.9 | \n", "156.46 | \n", "A | \n", "A4 | \n", "
1072053 | \n", "1288686 | \n", "3000 | \n", "3000 | \n", "3000 | \n", "36 months | \n", "18.64 | \n", "109.43 | \n", "E | \n", "E1 | \n", "
1071795 | \n", "1306957 | \n", "5600 | \n", "5600 | \n", "5600 | \n", "60 months | \n", "21.28 | \n", "152.39 | \n", "F | \n", "F2 | \n", "
1071570 | \n", "1306721 | \n", "5375 | \n", "5375 | \n", "5350 | \n", "60 months | \n", "12.69 | \n", "121.45 | \n", "B | \n", "B5 | \n", "
1070078 | \n", "1305201 | \n", "6500 | \n", "6500 | \n", "6500 | \n", "60 months | \n", "14.65 | \n", "153.45 | \n", "C | \n", "C3 | \n", "
1069908 | \n", "1305008 | \n", "12000 | \n", "12000 | \n", "12000 | \n", "36 months | \n", "12.69 | \n", "402.54 | \n", "B | \n", "B5 | \n", "
emp_title | \n", "emp_length | \n", "home_ownership | \n", "annual_inc | \n", "is_inc_v | \n", "issue_d | \n", "loan_status | \n", "pymnt_plan | \n", "
---|---|---|---|---|---|---|---|
\n", " | 10+ years | \n", "RENT | \n", "24000 | \n", "Verified | \n", "20111201T000000 | \n", "Fully Paid | \n", "n | \n", "
Ryder | \n", "< 1 year | \n", "RENT | \n", "30000 | \n", "Source Verified | \n", "20111201T000000 | \n", "Charged Off | \n", "n | \n", "
\n", " | 10+ years | \n", "RENT | \n", "12252 | \n", "Not Verified | \n", "20111201T000000 | \n", "Fully Paid | \n", "n | \n", "
AIR RESOURCES BOARD | \n", "10+ years | \n", "RENT | \n", "49200 | \n", "Source Verified | \n", "20111201T000000 | \n", "Fully Paid | \n", "n | \n", "
Veolia Transportaton | \n", "3 years | \n", "RENT | \n", "36000 | \n", "Source Verified | \n", "20111201T000000 | \n", "Fully Paid | \n", "n | \n", "
MKC Accounting | \n", "9 years | \n", "RENT | \n", "48000 | \n", "Source Verified | \n", "20111201T000000 | \n", "Fully Paid | \n", "n | \n", "
\n", " | 4 years | \n", "OWN | \n", "40000 | \n", "Source Verified | \n", "20111201T000000 | \n", "Charged Off | \n", "n | \n", "
Starbucks | \n", "< 1 year | \n", "RENT | \n", "15000 | \n", "Verified | \n", "20111201T000000 | \n", "Charged Off | \n", "n | \n", "
Southwest Rural metro | \n", "5 years | \n", "OWN | \n", "72000 | \n", "Not Verified | \n", "20111201T000000 | \n", "Fully Paid | \n", "n | \n", "
UCLA | \n", "10+ years | \n", "OWN | \n", "75000 | \n", "Source Verified | \n", "20111201T000000 | \n", "Fully Paid | \n", "n | \n", "
url | \n", "desc | \n", "purpose | \n", "title | \n", "zip_code | \n", "
---|---|---|---|---|
https://www.lendingclub.c om/browse/loanDetail. ... | \n",
" Borrower added on 12/22/11 > I need to ... | \n",
" credit_card | \n", "Computer | \n", "860xx | \n", "
https://www.lendingclub.c om/browse/loanDetail. ... | \n",
" Borrower added on 12/22/11 > I plan to use ... | \n",
" car | \n", "bike | \n", "309xx | \n", "
https://www.lendingclub.c om/browse/loanDetail. ... | \n",
" \n", " | small_business | \n", "real estate business | \n", "606xx | \n", "
https://www.lendingclub.c om/browse/loanDetail. ... | \n",
" Borrower added on 12/21/11 > to pay for ... | \n",
" other | \n", "personel | \n", "917xx | \n", "
https://www.lendingclub.c om/browse/loanDetail. ... | \n",
" \n", " | wedding | \n", "My wedding loan I promise to pay back ... | \n",
" 852xx | \n", "
https://www.lendingclub.c om/browse/loanDetail. ... | \n",
" Borrower added on 12/16/11 > Downpayment ... | \n",
" car | \n", "Car Downpayment | \n", "900xx | \n", "
https://www.lendingclub.c om/browse/loanDetail. ... | \n",
" Borrower added on 12/21/11 > I own a small ... | \n",
" small_business | \n", "Expand Business & Buy Debt Portfolio ... | \n",
" 958xx | \n", "
https://www.lendingclub.c om/browse/loanDetail. ... | \n",
" Borrower added on 12/16/11 > I'm trying to ... | \n",
" other | \n", "Building my credit history. ... | \n",
" 774xx | \n", "
https://www.lendingclub.c om/browse/loanDetail. ... | \n",
" Borrower added on 12/15/11 > I had recived ... | \n",
" debt_consolidation | \n", "High intrest Consolidation ... | \n",
" 853xx | \n", "
https://www.lendingclub.c om/browse/loanDetail. ... | \n",
" \n", " | debt_consolidation | \n", "Consolidation | \n", "913xx | \n", "
addr_state | \n", "dti | \n", "delinq_2yrs | \n", "earliest_cr_line | \n", "inq_last_6mths | \n", "mths_since_last_delinq | \n", "mths_since_last_record | \n", "
---|---|---|---|---|---|---|
AZ | \n", "27.65 | \n", "0 | \n", "19850101T000000 | \n", "1 | \n", "None | \n", "None | \n", "
GA | \n", "1.0 | \n", "0 | \n", "19990401T000000 | \n", "5 | \n", "None | \n", "None | \n", "
IL | \n", "8.72 | \n", "0 | \n", "20011101T000000 | \n", "2 | \n", "None | \n", "None | \n", "
CA | \n", "20.0 | \n", "0 | \n", "19960201T000000 | \n", "1 | \n", "35 | \n", "None | \n", "
AZ | \n", "11.2 | \n", "0 | \n", "20041101T000000 | \n", "3 | \n", "None | \n", "None | \n", "
CA | \n", "5.35 | \n", "0 | \n", "20070101T000000 | \n", "2 | \n", "None | \n", "None | \n", "
CA | \n", "5.55 | \n", "0 | \n", "20040401T000000 | \n", "2 | \n", "None | \n", "None | \n", "
TX | \n", "18.08 | \n", "0 | \n", "20040901T000000 | \n", "0 | \n", "None | \n", "None | \n", "
AZ | \n", "16.12 | \n", "0 | \n", "19980101T000000 | \n", "2 | \n", "None | \n", "None | \n", "
CA | \n", "10.78 | \n", "0 | \n", "19891001T000000 | \n", "0 | \n", "None | \n", "None | \n", "
open_acc | \n", "pub_rec | \n", "revol_bal | \n", "revol_util | \n", "total_acc | \n", "initial_list_status | \n", "out_prncp | \n", "out_prncp_inv | \n", "total_pymnt | \n", "
---|---|---|---|---|---|---|---|---|
3 | \n", "0 | \n", "13648 | \n", "83.7 | \n", "9 | \n", "f | \n", "0.0 | \n", "0.0 | \n", "5861.07 | \n", "
3 | \n", "0 | \n", "1687 | \n", "9.4 | \n", "4 | \n", "f | \n", "0.0 | \n", "0.0 | \n", "1008.71 | \n", "
2 | \n", "0 | \n", "2956 | \n", "98.5 | \n", "10 | \n", "f | \n", "0.0 | \n", "0.0 | \n", "3003.65 | \n", "
10 | \n", "0 | \n", "5598 | \n", "21.0 | \n", "37 | \n", "f | \n", "0.0 | \n", "0.0 | \n", "12226.3 | \n", "
9 | \n", "0 | \n", "7963 | \n", "28.3 | \n", "12 | \n", "f | \n", "0.0 | \n", "0.0 | \n", "5631.38 | \n", "
4 | \n", "0 | \n", "8221 | \n", "87.5 | \n", "4 | \n", "f | \n", "0.0 | \n", "0.0 | \n", "3938.14 | \n", "
11 | \n", "0 | \n", "5210 | \n", "32.6 | \n", "13 | \n", "f | \n", "0.0 | \n", "0.0 | \n", "646.02 | \n", "
2 | \n", "0 | \n", "9279 | \n", "36.5 | \n", "3 | \n", "f | \n", "0.0 | \n", "0.0 | \n", "1476.19 | \n", "
14 | \n", "0 | \n", "4032 | \n", "20.6 | \n", "23 | \n", "f | \n", "0.0 | \n", "0.0 | \n", "7677.52 | \n", "
12 | \n", "0 | \n", "23336 | \n", "67.1 | \n", "34 | \n", "f | \n", "0.0 | \n", "0.0 | \n", "13943.1 | \n", "
total_pymnt_inv | \n", "... | \n", "
---|---|
5831.78 | \n", "... | \n", "
1008.71 | \n", "... | \n", "
3003.65 | \n", "... | \n", "
12226.3 | \n", "... | \n", "
5631.38 | \n", "... | \n", "
3938.14 | \n", "... | \n", "
646.02 | \n", "... | \n", "
1469.34 | \n", "... | \n", "
7677.52 | \n", "... | \n", "
13943.1 | \n", "... | \n", "