Professional Documents
Culture Documents
: 201803100920017
Experiment 6
Aim: Write a program that applies a decision tree classifier to the Pima Indians
Diabetes dataset.
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import seaborn as sns
from sklearn.metrics import classification_report
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier
# Train and evaluate a decision tree classifier on the diabetes dataset.

# Load the data; "diabetes.csv" is expected in the current working directory.
df = pd.read_csv("diabetes.csv")

# Normalise the headers so the lowercase lookups below succeed whether the CSV
# uses capitalised names (e.g. "Glucose", "Outcome") or lowercase ones, and so
# stray whitespace around a header cannot cause a KeyError.
# NOTE(review): assumes the file's headers match the names below once
# lowercased -- confirm against the actual CSV.
df.columns = df.columns.str.strip().str.lower()

# Quick sanity checks on the loaded frame. They are printed explicitly because
# a bare expression is only echoed by a notebook/REPL, not by a script run.
print(df.head())
print(df.isnull().sum())
print(df.dtypes)
print(df['outcome'].value_counts())

# Feature columns fed to the model; 'outcome' is the class label.
feature_columns = [
    'pregnancies',
    'glucose',
    'bloodpressure',
    'skinthickness',
    'insulin',
    'bmi',
    'diabetespedigreefunction',
    'age',
]
inputs = df[feature_columns].values
classes = df['outcome'].values

# train_test_split returns (X_train, X_test, y_train, y_test) in that order,
# so the targets are unpacked to match: x_* are features, y_* are labels.
x_train, x_test, y_train, y_test = train_test_split(
    inputs, classes, train_size=0.75, random_state=1
)

# Seed the tree as well as the split so repeated runs report the same scores.
decision_tree = DecisionTreeClassifier(random_state=1)
decision_tree.fit(x_train, y_train)

# Mean accuracy on the held-out 25% of the rows.
print(decision_tree.score(x_test, y_test))

# Per-class precision / recall / F1 on the held-out rows.
prediction = decision_tree.predict(x_test)
print(classification_report(y_test, prediction, target_names=['0', '1']))
Output: