You are on page 1 of 1

# Discard every row whose "sepal_length" value is missing.  The call has to
# stay on one logical line: a statement that ends in a bare "." and resumes
# after a blank line is a syntax error.
iris_data = iris_data.dropna(subset=["sepal_length"], axis=0)
import matplotlib.pyplot as plt

# Pairwise correlation between the columns of iris_data.
# NOTE(review): indexing corr["species"] below only works when "species" is
# already numerically encoded at this point -- confirm against the code that
# loads iris_data.
corr = iris_data.corr()

# Absolute correlation of every column with the target column.
cor_target = abs(corr["species"])

# Columns whose absolute correlation with the target is at least 0.40.
# This selection is not used anywhere else in the visible script; X below
# still keeps every non-target column.
relevant_features = cor_target[cor_target >= 0.40]

# Feature matrix: every column except the target.  The column is named by
# keyword because pandas 2.0 no longer accepts `axis` as a positional argument.
X = iris_data.drop(columns="species")

# Target vector.
Y = iris_data["species"]
from sklearn.model_selection import train_test_split
from sklearn.neighbors import KNeighborsClassifier
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score
from sklearn import metrics

# Hold out 30% of the rows as the test set.
X_train, X_test, y_train, y_test = train_test_split(X, Y, test_size=0.3)

# Nearest-neighbour classifier using k neighbours, fitted on the training
# split and then used to label the held-out rows.
k = 3
knn = KNeighborsClassifier(n_neighbors=k)
knn.fit(X_train, y_train)
knn_predict = knn.predict(X_test)

# Logistic-regression model fitted on the same training split; the visible
# script does not evaluate it.
lr = LogisticRegression()
lr.fit(X_train, y_train)

# Report KNN accuracy on the data it was fitted on and on the held-out rows.
train_accuracy = accuracy_score(y_train, knn.predict(X_train))
print("Train set Accuracy: ", train_accuracy)
test_accuracy = accuracy_score(y_test, knn_predict)
print("Test set Accuracy: ", test_accuracy)

# Bar chart of sepal length against species.  The two series get descriptive
# names instead of input/output so the builtin input() is not shadowed.
sepal_lengths = iris_data["sepal_length"]
species_labels = iris_data["species"]

# NOTE(review): one bar is drawn per row, so bars belonging to the same
# species are drawn on top of each other -- confirm whether a per-species
# aggregate was intended.
plt.bar(species_labels, sepal_lengths)
plt.xlabel("Species")
plt.ylabel("Sepal length")
plt.show()

You might also like