0% found this document useful (0 votes)

42 views9 pages

ML 3

Uploaded by

yefigoh133

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

42 views9 pages

ML 3

Uploaded by

yefigoh133

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

# Upload the dataset file from the local machine into the Colab session.
from google.colab import files

# Opens the browser file picker; the result is kept in `uploaded`.
uploaded = files.upload()

Choose Files No file chosen Upload widget is only available when the cell has been executed in the current browser session. Please rerun this cell to
enable.
Saving [Link] to [Link]

import numpy as np
import pandas as pd
import plotly.express as px
import matplotlib.pyplot as plt

# Load the uploaded CSV into a DataFrame.
# NOTE(review): the real file name was replaced by "[Link]" when this text
# was extracted; substitute the name of the uploaded CSV before running.
titanic = pd.read_csv('[Link]')

# (rows, columns) of the raw dataset.
titanic.shape

(891, 12)

# Show the first five rows of the raw data.
titanic.head(5)

output PassengerId Survived Pclass Name Sex Age SibSp Parch Ticket Fare Cabin Embarked

0 1 0 3 Braund, Mr. Owen Harris male 22.0 1 0 A/5 21171 7.2500 NaN S

1 2 1 1 Cumings, Mrs. John Bradley (Florence Briggs Th... female 38.0 1 0 PC 17599 71.2833 C85 C

2 3 1 3 Heikkinen, Miss. Laina female 26.0 0 0 STON/O2. 3101282 7.9250 NaN S

3 4 1 1 Futrelle, Mrs. Jacques Heath (Lily May Peel) female 35.0 1 0 113803 53.1000 C123 S

4 5 0 3 Allen, Mr. William Henry male 35.0 0 0 373450 8.0500 NaN S

# Show five rows; the displayed row labels are non-sequential, so this is
# presumably a random sample rather than head/tail.
titanic.sample(5)

PassengerId Survived Pclass Name Sex Age SibSp Parch Ticket Fare Cabin Embarked

682 683 0 3 Olsvigen, Mr. Thor Anderson male 20.0 0 0 6563 9.225 NaN S

790 791 0 3 Keane, Mr. Andrew "Andy" male NaN 0 0 12460 7.750 NaN Q

417 418 1 2 Silven, Miss. Lyyli Karoliina female 18.0 0 2 250652 13.000 NaN S

560 561 0 3 Morrow, Mr. Thomas Rowan male NaN 0 0 372622 7.750 NaN Q

440 441 1 2 Hart, Mrs. Benjamin (Esther Ada Bloomfield) female 45.0 1 1 F.C.C. 13529 26.250 NaN S

# Feature matrix: the seven predictor columns selected from the raw data.
X = pd.DataFrame(titanic.loc[:,
    ['Pclass', 'Sex', 'Age', 'SibSp', 'Parch', 'Fare', 'Embarked']])
X

Pclass Sex Age SibSp Parch Fare Embarked

0 3 male 22.0 1 0 7.2500 S

1 1 female 38.0 1 0 71.2833 C

2 3 female 26.0 0 0 7.9250 S

3 1 female 35.0 1 0 53.1000 S

4 3 male 35.0 0 0 8.0500 S

... ... ... ... ... ... ... ...

886 2 male 27.0 0 0 13.0000 S

887 1 female 19.0 0 0 30.0000 S

888 3 female NaN 1 2 23.4500 S

889 1 male 26.0 0 0 30.0000 C

890 3 male 32.0 0 0 7.7500 Q

891 rows × 7 columns

# Target: the 'Survived' column, kept as a one-column DataFrame.
Y = pd.DataFrame(titanic.loc[:, ['Survived']])
Y
Survived

0 0

1 1

2 1

3 1

4 0

... ...

886 0

887 1

888 0

889 1

890 0

891 rows × 1 columns

# Distinct target values.
# NOTE(review): the receiver was lost in extraction; the displayed output
# array([0, 1]) matches the 'Survived' column — confirm the exact expression.
Y.Survived.unique()

array([0, 1])

# NOTE(review): the statement that creates `fig` for this cell is missing
# from the extracted text here; restore it before running.
fig.update_layout(yaxis_title = '% of Survival')

fig.show()

Sex vs. Survived

100 Survived
18.89 74.20
0
80 1
81.11
% of Survival

20 25.80

0
male female

Sex

# Percent-normalised histogram of passenger class, coloured by 'Survived'.
fig = px.histogram(titanic ,
    x = 'Pclass' ,
    color = 'Survived' ,
    nbins = 3,
    width = 400,
    height = 400,
    title = 'Pclass vs. Survived',
    text_auto = '.2f',
    barnorm = 'percent')

fig.update_layout( bargap = 0.2 , yaxis_title = '% of Survival')

fig.show()
Pclass vs. Survived

100 Survived
62.96 47.28 24.24
0
80 1
% of Survival

75.76
60

52.72
40
37.04

0
1 2 3

Pclass

# Percent-normalised, grouped histogram of fare, coloured by 'Survived'.
fig = px.histogram(titanic ,
    x = 'Fare' ,
    color = 'Survived' ,
    nbins = 5,
    width = 500,
    height = 500,
    title = 'Fare vs. Survived',
    text_auto = '.2f',
    barnorm = 'percent',
    barmode = 'group')

fig.update_layout(yaxis_title = '% of Survival')

fig.show()

Fare vs. Survived

100 Survived
100.00

0
1

80
72.00
% of Survival

63.84

40
36.16

28.00

0
0 200 400 600

Fare

# Percent-normalised, grouped histogram of age, coloured by 'Survived'.
fig = px.histogram(titanic ,
    x = 'Age' ,
    color = 'Survived' ,
    nbins = 5,
    width = 500,
    height = 500,
    title = 'Age vs. Survived',
    text_auto = '.2f',
    barnorm = 'percent',
    barmode = 'group' )

fig.update_layout(yaxis_title = '% of Survival')

fig.show()
Age vs. Survived

Survived

85.71
80 0
1

63.35
60
61.29

61.19
% of Survival

40 58.20

41.80

38.81
38.71

36.65

14.29
0
0 20 40 60 80

Age

# Family size per passenger: sum of the SibSp and Parch columns.
family_size = titanic.SibSp + titanic.Parch

family_size.unique()

array([ 1, 0, 4, 2, 6, 5, 3, 7, 10])

# Percent-normalised, grouped histogram of the derived family size,
# coloured by 'Survived'. `x` is passed as a Series, so the axis label is
# supplied through `labels`.
fig = px.histogram(titanic ,
    x = family_size ,
    color = 'Survived' ,
    nbins = 4,
    width = 500,
    height = 500,
    title = 'Family Size vs. Survived',
    text_auto = '.2f',
    barnorm = 'percent',
    barmode = 'group',
    labels = {'x' : 'Family Size' , })

fig.update_layout(yaxis_title = '% of Survival')

fig.show()

Family Size vs. Survived

100 Survived
100.00

0
1

80 82.50
% of Survival

60
60.31

40
39.69

20
17.50

0
2 7 12

Family Size
# Percent-normalised histogram of the 'Embarked' column, coloured by 'Survived'.
fig = px.histogram(titanic ,
    x = 'Embarked' ,
    color = 'Survived' ,
    width = 400,
    height = 400,
    barnorm = 'percent',
    text_auto = '.2f',
    title = 'Embarked vs. Survived')

fig.update_layout(yaxis_title = '% of Survival')

fig.show()

Embarked vs. Survived

100 Survived
33.70 38.96 55.36
0
80 1
% of Survival

60 66.30
61.04

40 44.64

0
S Q C

Embarked

# Column dtypes and non-null counts of the feature matrix.
X.info()

<class '[Link]'>
RangeIndex: 891 entries, 0 to 890
Data columns (total 7 columns):
# Column Non-Null Count Dtype
--- ------ -------------- -----
0 Pclass 891 non-null int64
1 Sex 891 non-null object
2 Age 714 non-null float64
3 SibSp 891 non-null int64
4 Parch 891 non-null int64
5 Fare 891 non-null float64
6 Embarked 889 non-null object
dtypes: float64(2), int64(3), object(2)
memory usage: 48.9+ KB

print('% of missing values')

# Mean of the per-cell null mask, scaled to a percentage per column.
X.isnull().mean()*100

% of missing values
Pclass 0.000000
Sex 0.000000
Age 19.865320
SibSp 0.000000
Parch 0.000000
Fare 0.000000
Embarked 0.224467
dtype: float64

# Average of the 'Age' column; used as the fill value for missing ages.
meanAge = X.loc[:, 'Age'].mean()

meanAge

29.69911764705882

# Replace missing ages with the mean age.
# Assign the result back instead of calling fillna(inplace=True) on the
# column selection: the chained in-place form is deprecated in pandas and
# does not modify X when Copy-on-Write is enabled.
X['Age'] = X['Age'].fillna(meanAge)

# Remaining null count per column.
X.isnull().sum()

Pclass 0
Sex 0
Age 0
SibSp 0
Parch 0
Fare 0
Embarked 2
dtype: int64

# Most frequent 'Embarked' value (first entry of the mode result); used as
# the fill value for the missing entries.
embarked_modes = X['Embarked'].mode()
modeEmbarked = embarked_modes[0]

modeEmbarked

'S'

# Replace missing 'Embarked' values with the most frequent value.
# Assign the result back instead of calling fillna(inplace=True) on the
# column selection: the chained in-place form is deprecated in pandas and
# does not modify X when Copy-on-Write is enabled.
X['Embarked'] = X['Embarked'].fillna(modeEmbarked)

# Remaining null count per column.
X.isnull().sum()

Pclass 0
Sex 0
Age 0
SibSp 0
Parch 0
Fare 0
Embarked 0
dtype: int64

# Distinct values of the categorical columns before encoding.
# NOTE(review): both receivers were lost in extraction. The displayed output
# (['S', 'C', 'Q']) matches 'Embarked' for the last line; the first line is
# presumably the 'Sex' column — confirm against the original notebook.
X.Sex.unique()
X.Embarked.unique()

array(['S', 'C', 'Q'], dtype=object)

from sklearn import preprocessing

# Fit a label encoder on the 'Sex' column, then replace the column with its
# integer codes.
label_encoder_Sex = preprocessing.LabelEncoder().fit(X['Sex'])
X['Sex'] = label_encoder_Sex.transform(X['Sex'])

X.head(5)

Pclass Sex Age SibSp Parch Fare Embarked

0 3 1 22.0 1 0 7.2500 S

1 1 0 38.0 1 0 71.2833 C

2 3 0 26.0 0 0 7.9250 S

3 1 0 35.0 1 0 53.1000 S

4 3 1 35.0 0 0 8.0500 S

# Fit a label encoder on the 'Embarked' column, then replace the column with
# its integer codes.
label_encoder_Embarked = preprocessing.LabelEncoder().fit(X['Embarked'])
X['Embarked'] = label_encoder_Embarked.transform(X['Embarked'])

X.head(5)

Pclass Sex Age SibSp Parch Fare Embarked

0 3 1 22.0 1 0 7.2500 2

1 1 0 38.0 1 0 71.2833 0

2 3 0 26.0 0 0 7.9250 2

3 1 0 35.0 1 0 53.1000 2

4 3 1 35.0 0 0 8.0500 2

# Pearson correlation of every feature column with the 'Survived' target.
X.corrwith(Y.Survived, method='pearson')

Pclass -0.338481
Sex -0.543351
Age -0.069809
SibSp -0.035322
Parch 0.081629
Fare 0.257307
Embarked -0.167675
dtype: float64
from sklearn.model_selection import train_test_split

# Hold out 25% of the rows for testing; the seed is fixed so the split is
# reproducible.
X_train, X_test, Y_train, Y_test = train_test_split(
    X,
    Y,
    test_size=0.25,
    random_state=35,
)
X_train

Pclass Sex Age SibSp Parch Fare Embarked

786 3 0 18.0 0 0 7.4958 2

636 3 1 32.0 0 0 7.9250 2

401 3 1 26.0 0 0 8.0500 2

811 3 1 39.0 0 0 24.1500 2

780 3 0 13.0 0 0 7.2292 0

... ... ... ... ... ... ... ...

249 2 1 54.0 1 0 26.0000 2

448 3 0 5.0 2 1 19.2583 0

33 2 1 66.0 0 0 10.5000 2

271 3 1 25.0 0 0 0.0000 2

713 3 1 29.0 0 0 9.4833 2

668 rows × 7 columns

from sklearn.tree import DecisionTreeClassifier

# create a DecisionTreeClassifier that splits on entropy, with a fixed seed

dtc = DecisionTreeClassifier( criterion = 'entropy' , random_state = 1 )

# train the model

dtc.fit(X_train, Y_train)

▾ DecisionTreeClassifier
DecisionTreeClassifier(criterion='entropy', random_state=1)

from sklearn import tree

# Large, high-resolution canvas for the tree drawing.
fig = plt.figure( figsize = (25 , 20) , dpi = 200.0)

# Draw the fitted tree; feature names are listed in the column order of X.
_ = tree.plot_tree( dtc,
    feature_names = ['Pclass' ,'Sex', 'Age', 'SibSp', 'Parch', 'Fare', 'Embarked'],
    class_names = ['Not Survived' , 'Survived'] ,
    filled = True)

# Predict the target for the held-out rows.
Y_pred = dtc.predict(X_test)

from sklearn.metrics import confusion_matrix , accuracy_score

# make a confusion matrix

cm = confusion_matrix(Y_test, Y_pred)

# display confusion matrix as a heatmap

fig = px.imshow(cm ,
    width = 400,
    height = 400 ,
    text_auto = True,
    color_continuous_scale = 'tealgrn')

fig.show()

# compute and display the accuracy of the decision tree model

print('The % of Accuracy is : {0:.2f} '.format(accuracy_score(Y_test , Y_pred)*100))
−0.5

100

0 113 23

0.5
60

1 27 60
40

Titanic Survival Prediction
No ratings yet
Titanic Survival Prediction
5 pages
Advanced Python for Data Scientists
No ratings yet
Advanced Python for Data Scientists
19 pages
Titanic Survival Prediction Guide
No ratings yet
Titanic Survival Prediction Guide
16 pages
Dspracticalexternak 23 Aug
No ratings yet
Dspracticalexternak 23 Aug
8 pages
Project Report
No ratings yet
Project Report
7 pages
Titanic Data Analysis in Colab
No ratings yet
Titanic Data Analysis in Colab
4 pages
Python For Data Analysis
No ratings yet
Python For Data Analysis
28 pages
Titanic Dataset Preprocessing Guide
No ratings yet
Titanic Dataset Preprocessing Guide
5 pages
Titanic Data Analysis
No ratings yet
Titanic Data Analysis
14 pages
Titanic Dataset
No ratings yet
Titanic Dataset
9 pages
Data Cleaning and Manipulation in Python
No ratings yet
Data Cleaning and Manipulation in Python
33 pages
Titanic Survival Analysis
100% (2)
Titanic Survival Analysis
13 pages
Titanic Survival Prediction Analysis
No ratings yet
Titanic Survival Prediction Analysis
15 pages
A09Ass01 - Jupyter Notebook
No ratings yet
A09Ass01 - Jupyter Notebook
8 pages
7 8 - Missing Value Handling
No ratings yet
7 8 - Missing Value Handling
4 pages
Titanic ML for Data Scientists
No ratings yet
Titanic ML for Data Scientists
36 pages
Logistic Regression on Titanic Data
No ratings yet
Logistic Regression on Titanic Data
6 pages
ML - Lab 03.ipynb Colab
No ratings yet
ML - Lab 03.ipynb Colab
4 pages
ML Dataset Performance
No ratings yet
ML Dataset Performance
11 pages
Titanic Eda
No ratings yet
Titanic Eda
17 pages
Assignment 2
No ratings yet
Assignment 2
5 pages
Data Mining
No ratings yet
Data Mining
59 pages
Assignment
No ratings yet
Assignment
14 pages
Titanic Logistic Regression Project
No ratings yet
Titanic Logistic Regression Project
35 pages
178 - NaiveBaye's.ipynb - Colab
No ratings yet
178 - NaiveBaye's.ipynb - Colab
3 pages
Decision Tree
No ratings yet
Decision Tree
2 pages
Assignment Data Science
No ratings yet
Assignment Data Science
2 pages
LOGISTIC - REGRESSION - Jupyter Notebook
No ratings yet
LOGISTIC - REGRESSION - Jupyter Notebook
18 pages
Pandas Day 4
No ratings yet
Pandas Day 4
7 pages
Titanic Survival Classification Analysis
100% (1)
Titanic Survival Classification Analysis
7 pages
Titanic Survival Prediction Model
No ratings yet
Titanic Survival Prediction Model
4 pages
Python For Machine Learning
No ratings yet
Python For Machine Learning
33 pages
The Titanic Dataset
No ratings yet
The Titanic Dataset
6 pages
Ds 9
No ratings yet
Ds 9
12 pages
Titanic
No ratings yet
Titanic
6 pages
PANDAS Groupby Continues 2
No ratings yet
PANDAS Groupby Continues 2
5 pages
Assign8.ipynb - Colab
No ratings yet
Assign8.ipynb - Colab
14 pages
9914 ML Lab3
No ratings yet
9914 ML Lab3
6 pages
Loading The Dataset: ## The Matplotlib and Seaborn Library For Result Visualization and Analysis
No ratings yet
Loading The Dataset: ## The Matplotlib and Seaborn Library For Result Visualization and Analysis
13 pages
Unit 5 Analysis With Pandas in Python
No ratings yet
Unit 5 Analysis With Pandas in Python
26 pages
Seaborn Ploting in Titanic
No ratings yet
Seaborn Ploting in Titanic
18 pages
Learneverythingai 1695069129
No ratings yet
Learneverythingai 1695069129
56 pages
Lab 5.ipynb - Colab
No ratings yet
Lab 5.ipynb - Colab
6 pages
Data Cleaning by Manish Batra 1697684636
No ratings yet
Data Cleaning by Manish Batra 1697684636
30 pages
Prac3 23bme053
No ratings yet
Prac3 23bme053
5 pages
Experiment 1
No ratings yet
Experiment 1
2 pages
Dataset Visualization Basic Ml-1
No ratings yet
Dataset Visualization Basic Ml-1
12 pages
AM19 EDA Assignment1
No ratings yet
AM19 EDA Assignment1
13 pages
Assignment ML
No ratings yet
Assignment ML
4 pages
Titanic
No ratings yet
Titanic
22 pages
Titanic PuneethRegonda
No ratings yet
Titanic PuneethRegonda
8 pages
Pyt Manual 1
No ratings yet
Pyt Manual 1
85 pages
Machine Learning Lab: Titanic PCA & ID3 Decision Tree
No ratings yet
Machine Learning Lab: Titanic PCA & ID3 Decision Tree
19 pages
Titanic Data Analysis & Modeling
No ratings yet
Titanic Data Analysis & Modeling
11 pages
3 Practical
No ratings yet
3 Practical
2 pages
Pandas Data Imputation Guide
No ratings yet
Pandas Data Imputation Guide
12 pages
Passive & Active Transport
100% (1)
Passive & Active Transport
31 pages
Oscm Assignment
No ratings yet
Oscm Assignment
2 pages
Barcode Report
No ratings yet
Barcode Report
5 pages
RSH The Role of Rented Condo Stock
No ratings yet
RSH The Role of Rented Condo Stock
92 pages
(Trending 18+!) +one Girl 50 Snake Viral Video Original Link
No ratings yet
(Trending 18+!) +one Girl 50 Snake Viral Video Original Link
5 pages
Swedish Match Debt Recapitalization Analysis
No ratings yet
Swedish Match Debt Recapitalization Analysis
6 pages
Nayara Energy Retail Outlet Application Form
No ratings yet
Nayara Energy Retail Outlet Application Form
12 pages
Course Outline Teaching Macro
No ratings yet
Course Outline Teaching Macro
3 pages
Lesson 3 Spanish Colonial Period in Philippine Literature
100% (7)
Lesson 3 Spanish Colonial Period in Philippine Literature
10 pages
Basic Numerical Ability - Sample Questions - HDFC ACE Banker
No ratings yet
Basic Numerical Ability - Sample Questions - HDFC ACE Banker
9 pages
ARES Research Report No. 7 Cased Telescoped Ammunition PDF
100% (2)
ARES Research Report No. 7 Cased Telescoped Ammunition PDF
43 pages
Molecular Weight of Carbopol and Pemulen
No ratings yet
Molecular Weight of Carbopol and Pemulen
3 pages
Jis G3455
No ratings yet
Jis G3455
21 pages
HG - G8 - Week 4
No ratings yet
HG - G8 - Week 4
4 pages
Post Market Survellianece Plan Cum Report
No ratings yet
Post Market Survellianece Plan Cum Report
3 pages
Milk Quality Assurance Katam
100% (2)
Milk Quality Assurance Katam
41 pages
Lift Brochure en v1
100% (1)
Lift Brochure en v1
28 pages
Vstep Speaking Part 1-2-3
No ratings yet
Vstep Speaking Part 1-2-3
23 pages
Embankment Construction Methodology
No ratings yet
Embankment Construction Methodology
2 pages
02 Praesidium Series Midnight Pleasure
100% (1)
02 Praesidium Series Midnight Pleasure
793 pages
CBSE 2021 Exam Mark Sheet
No ratings yet
CBSE 2021 Exam Mark Sheet
1 page
Simulation of Un-Symmetrical 2-Phase Induction Motor
No ratings yet
Simulation of Un-Symmetrical 2-Phase Induction Motor
4 pages
Diagnostic Test for English V Skills
No ratings yet
Diagnostic Test for English V Skills
4 pages
Dielectric Properties
No ratings yet
Dielectric Properties
10 pages
3design and Performance Evaluation of A Borehole Solar PV Pumping System For A South African Based Mine
No ratings yet
3design and Performance Evaluation of A Borehole Solar PV Pumping System For A South African Based Mine
6 pages
1022-Sadiq Ali
No ratings yet
1022-Sadiq Ali
1 page
Ourlog 1300
No ratings yet
Ourlog 1300
9 pages
Silent Partners Women As Public Investors During Britain's Financial Revolution, 1690-1750 1st Edition Amy M. Froide PDF Download
No ratings yet
Silent Partners Women As Public Investors During Britain's Financial Revolution, 1690-1750 1st Edition Amy M. Froide PDF Download
100 pages
IMO Olympiad Champs Maths 3
67% (3)
IMO Olympiad Champs Maths 3
280 pages
SACS Import
100% (1)
SACS Import
22 pages

ML 3

Uploaded by

ML 3

Uploaded by

from google.

colab import files

Cumings, Mrs. John Bradley

Futrelle, Mrs. Jacques Heath (Lily

4 5 0 3 Allen, Mr. William Henry male 35.0 0 0 373450 8.0500 NaN S

Hart, Mrs. Benjamin (Esther Ada F.C.C.

Pclass Sex Age SibSp Parch Fare Embarked

0 3 male 22.0 1 0 7.2500 S

1 1 female 38.0 1 0 71.2833 C

2 3 female 26.0 0 0 7.9250 S

3 1 female 35.0 1 0 53.1000 S

4 3 male 35.0 0 0 8.0500 S

... ... ... ... ... ... ... ...

886 2 male 27.0 0 0 13.0000 S

887 1 female 19.0 0 0 30.0000 S

888 3 female NaN 1 2 23.4500 S

889 1 male 26.0 0 0 30.0000 C

890 3 male 32.0 0 0 7.7500 Q

891 rows × 7 columns

891 rows × 1 columns

fig = [Link]( titanic ,

fig.update_layout(yaxis_title = '% of Survival')

Sex vs. Survived

fig.update_layout( bargap = 0.2 , yaxis_title = '% of Survival')

fig.update_layout(yaxis_title = '% of Survival')

Fare vs. Survived

fig.update_layout(yaxis_title = '% of Survival')

family_size = [Link] + [Link]

fig.update_layout(yaxis_title = '% of Survival')

Family Size vs. Survived

fig.update_layout(yaxis_title = '% of Survival')

Embarked vs. Survived

print('% of missing values')

X['Age'].fillna( meanAge , inplace = True)

X['Embarked'].fillna( modeEmbarked , inplace = True)

array(['S', 'C', 'Q'], dtype=object)

from sklearn import preprocessing

# fit the 'Sex' attribute for label encoding

Pclass Sex Age SibSp Parch Fare Embarked

Pclass Sex Age SibSp Parch Fare Embarked

X_train, X_test, Y_train, Y_test = train_test_split(X, Y,

Pclass Sex Age SibSp Parch Fare Embarked

786 3 0 18.0 0 0 7.4958 2

636 3 1 32.0 0 0 7.9250 2

401 3 1 26.0 0 0 8.0500 2

811 3 1 39.0 0 0 24.1500 2

780 3 0 13.0 0 0 7.2292 0

... ... ... ... ... ... ... ...

249 2 1 54.0 1 0 26.0000 2

448 3 0 5.0 2 1 19.2583 0

271 3 1 25.0 0 0 0.0000 2

713 3 1 29.0 0 0 9.4833 2

668 rows × 7 columns

from [Link] import DecisionTreeClassifier

# creating an object of KNeighborsClassifier class

# train the model

from sklearn import tree

fig = [Link]( figsize = (25 , 20) , dpi = 200.0)

from [Link] import confusion_matrix , accuracy_score

# make a confusion matrix

# display confusion matrix as a heatmap

# compute and display the the accuracy of the KNN model

You might also like