In [35]: import numpy as np
import pandas as pd
import seaborn as sns

In [36]: df = pd.read_csv("Default.csv")
df.head(5)

Out[36]:   Unnamed: 0 default student balance   income
        0           1      No      No  729.53 44361.63
        1           2      No     Yes  817.18 12106.13
        2           3      No      No 1073.55 31767.14
        3           4      No      No  529.25 35704.49
        4           5      No      No  785.66 38463.50

In [37]: df.drop(['Unnamed: 0'], axis=1, inplace=True)

In [38]: df.shape

Out[38]: (10000, 4)

In [39]: import matplotlib.pyplot as plt
from scipy import stats, integrate
from sklearn.model_selection import train_test_split
from sklearn import metrics
from sklearn.linear_model import LogisticRegression
%matplotlib inline
pd.options.display.float_format = '{:.2f}'.format
plt.rcParams['figure.figsize'] = (8, 6)
plt.rcParams['font.size'] = 14

In [40]: sns.boxplot(x='default', y='income', data=df)
plt.show()

In [41]: sns.lmplot(x='balance', y='income', hue='default', data=df, aspect=1.5, fit_reg=False)
plt.show()
In [42]: df.default.value_counts()

Out[42]: default
No 9667
Yes 333
Name: count, dtype: int64

In [43]: df.student.value_counts()

Out[43]: student
No 7056
Yes 2944
Name: count, dtype: int64

In [44]: df['default 1'] = df.default.factorize()[0]

In [45]: df['student 1'] = df.student.factorize()[0]
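
pd.factorize assigns integer codes in order of first appearance, which is why 'No' becomes 0 and 'Yes' becomes 1 in both columns here. A minimal sketch verifying that behaviour on a toy Series:

codes, uniques = pd.factorize(pd.Series(['No', 'Yes', 'No', 'No']))
print(codes)    # [0 1 0 0] -- codes follow order of first appearance
print(uniques)  # Index(['No', 'Yes'], dtype='object')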

In [46]: df.head()

Out[46]:   default student balance   income  default 1  student 1
        0      No      No  729.53 44361.63          0          0
        1      No     Yes  817.18 12106.13          0          1
        2      No      No 1073.55 31767.14          0          0
        3      No      No  529.25 35704.49          0          0
        4      No      No  785.66 38463.50          0          0

In [47]: df.drop(["default", "student"], axis=1, inplace=True)

In [48]: pd.crosstab(df['default 1'], df['student 1'], rownames=['Default'], colnames=['Student'])

Out[48]: Student     0     1
         Default
         0        6850  2817
         1         206   127

In [57]: X = df[['balance']]
y = df['default 1']

In [58]: y

Out[58]: 0 0
1 0
2 0
3 0
4 0
..
9995 0
9996 0
9997 0
9998 0
9999 0
Name: default 1, Length: 10000, dtype: int64
In [59]: from sklearn.linear_model import LogisticRegression
from sklearn import metrics
logreg = LogisticRegression()
logreg.fit(X, y)
print(logreg.coef_)
print(logreg.intercept_)

y_pred = logreg.predict_proba(X)
plt.scatter(X.values, y_pred[:,1])
#plt.scatter(X.values, y)
plt.show()

[[0.00549892]]
[-10.65132824]
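
The printed coefficient and intercept define the fitted curve above: P(default=1 | balance) = 1 / (1 + exp(-(intercept + coef * balance))). A minimal sketch reproducing the first predicted probability by hand, using the values printed above:

b0, b1 = -10.65132824, 0.00549892  # intercept and coefficient printed above
balance = 729.53                   # balance of the first row
p = 1 / (1 + np.exp(-(b0 + b1 * balance)))
print(p)  # ~0.0013, matching the first entry of y_pred[:, 1] below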

In [60]: y_pred

Out[60]: array([[9.98694319e-01, 1.30568146e-03],
       [9.97887402e-01, 2.11259754e-03],
       [9.91405252e-01, 8.59474814e-03],
       ...,
       [9.97533484e-01, 2.46651596e-03],
       [8.83240365e-01, 1.16759635e-01],
       [9.99928552e-01, 7.14476480e-05]])
In [61]: y_pred[:,0]

Out[61]: array([0.99869432, 0.9978874 , 0.99140525, ..., 0.99753348, 0.88324037,
       0.99992855])
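
predict_proba returns one column per class, ordered as in logreg.classes_: column 0 is P(default=0), column 1 is P(default=1), and each row sums to 1. A quick check on the fitted model:

print(logreg.classes_)         # [0 1]
print(y_pred.sum(axis=1)[:5])  # [1. 1. 1. 1. 1.] -- each row is a probability distribution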

In [62]: X.head()

Out[62]:   balance
        0   729.53
        1   817.18
        2  1073.55
        3   529.25
        4   785.66

In [63]: # split the data into train and test sets with a 70:30 ratio
from sklearn.model_selection import train_test_split
xTrain, xTest, yTrain, yTest = train_test_split(X, y, test_size=0.30, random_state=1)  # seed value truncated in the source; 1 is a placeholder
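
Since only about 3% of the rows are defaulters, a purely random split can leave the train and test sets with somewhat different default rates. A hedged variant (not in the original notebook) passes stratify=y so both splits keep the 9667:333 class ratio:

xTrain, xTest, yTrain, yTest = train_test_split(
    X, y, test_size=0.30, random_state=1, stratify=y)  # stratified alternative; the seed is again a placeholder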

In [64]: from sklearn.linear_model import LogisticRegression
from sklearn import metrics
logreg = LogisticRegression(class_weight='balanced')
logreg.fit(X, y)
print(logreg.coef_)
print(logreg.intercept_)

[[0.005602]]
[-7.42029855]
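
class_weight='balanced' weights each class by n_samples / (n_classes * bincount(y)), i.e. inversely to its frequency, which is why the intercept moves from about -10.65 to -7.42. A sketch of the weights this implies for this data:

counts = np.bincount(y)          # [9667, 333]
weights = len(y) / (2 * counts)
print(weights)                   # ~[0.52, 15.02] -- each default counts about 15x as much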

In [65]: logreg.fit(xTrain, yTrain)

Out[65]: LogisticRegression(class_weight='balanced')

In [66]: # apply the fitted model to both the test and the train data
y_log_pred_test = logreg.predict(xTest)
y_log_pred_train = logreg.predict(xTrain)

In [67]: y_log_pred_test.shape

Out[67]: (3000,)

In [68]: y_log_pred_train.shape

Out[68]: (7000,)
In [69]: y_log_pred_test

Out[69]: array([0, 0, 0, ..., 0, 0, 0])

In [70]: conf = metrics.confusion_matrix(yTest, y_log_pred_test)
conf

Out[70]: array([[2514,  377],
       [  22,   87]])

In [77]: confusion = metrics.confusion_matrix(yTest, y_log_pred_test)
print(confusion)
# sklearn convention: rows are true labels, columns are predicted labels,
# so for this 0/1 problem the layout is [[TN, FP], [FN, TP]]
TN = confusion[0, 0]
TP = confusion[1, 1]
FP = confusion[0, 1]
FN = confusion[1, 0]
print("TP", TP)
print("TN", TN)
print("FN", FN)
print("FP", FP)

[[2514  377]
 [  22   87]]
TP 87
TN 2514
FN 22
FP 377
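
As a cross-check on the cell above, sklearn lays a binary confusion matrix out as [[TN, FP], [FN, TP]], so the four counts can also be unpacked with ravel():

TN, FP, FN, TP = metrics.confusion_matrix(yTest, y_log_pred_test).ravel()
print(TN, FP, FN, TP)  # 2514 377 22 87
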
In [79]: cmap = sns.cubehelix_palette(50, hue=0.05, rot=0, light=0.9, dark=0, as_cmap=True)
sns.heatmap(conf, cmap=cmap, xticklabels=['predicted_default_yes=0', 'predicted_default_yes=1'])

Out[79]: <Axes: >

In [80]: # print the first 15 true and predicted responses
print('True', yTest.values[0:15])
print('Pred', y_log_pred_test[0:15])

True [0 0 0 0 0 0 0 0 0 0 0 0 0 1 0]
Pred [0 0 0 0 0 0 1 0 1 0 1 1 1 1 1]

In [81]: # compare the predicted labels with the true labels of the test data
print('Accuracy_Score:', metrics.accuracy_score(yTest, y_log_pred_test))

Accuracy_Score: 0.867

In [82]: print('Classification Error:', 1 - metrics.accuracy_score(yTest, y_log_pred_test))

Classification Error: 0.133

In [83]: print('Sensitivity or Recall:', metrics.recall_score(yTest, y_log_pred_test))

Sensitivity or Recall: 0.7981651376146789


In [84]: specificity = TN / (TN + FP)
print(round(specificity, 4))

0.8696
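
Specificity is simply the recall of the negative class, so it can also be obtained directly from sklearn:

print(metrics.recall_score(yTest, y_log_pred_test, pos_label=0))  # ~0.8696, the class-0 recall in the report below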

In [85]: from sklearn.metrics import classification_report
print(classification_report(yTest, y_log_pred_test))

              precision    recall  f1-score   support

           0       0.99      0.87      0.93      2891
           1       0.19      0.80      0.30       109

    accuracy                           0.87      3000
   macro avg       0.59      0.83      0.62      3000
weighted avg       0.96      0.87      0.90      3000
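
With only 109 defaulters among the 3000 test rows, the 0.87 accuracy is driven almost entirely by the majority class; the macro-averaged recall of 0.83 is the fairer single-number summary. sklearn exposes exactly that quantity as balanced accuracy:

from sklearn.metrics import balanced_accuracy_score
print(balanced_accuracy_score(yTest, y_log_pred_test))  # mean of the two class recalls, ~0.83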

