You are on page 1 of 2

NAME- PIYUSH VERMA

REGNO- 23MCA1104

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.datasets import load_iris
from scipy.cluster.hierarchy import dendrogram, linkage
from scipy.cluster.hierarchy import fcluster

# Fetch the Iris dataset and keep the feature matrix under the name X.
iris = load_iris()
X = iris.data
# Index the class-name array with the integer targets so that every row of X
# gets its species name as a label.
species = iris.target_names[iris.target]

# Build the hierarchical (agglomerative) merge tree using Ward linkage.
Z = linkage(X, method='ward')

# Draw the dendrogram on an explicit Axes, one leaf per sample, labelled by
# the sample's species name.
dendro_fig, dendro_ax = plt.subplots(figsize=(10, 5))
dendro_ax.set_title('Hierarchical Clustering Dendrogram')
dendro_ax.set_xlabel('Species')
dendro_ax.set_ylabel('Distance')
dendrogram(
    Z,
    labels=species,
    leaf_rotation=90.,
    leaf_font_size=8.,
    ax=dendro_ax,
)
plt.show()

output

# Turn the linkage tree into flat cluster labels by cutting it at a fixed
# distance threshold (chosen by inspecting the dendrogram).
max_d = 7  # Maximum distance to be considered
clusters = fcluster(Z, t=max_d, criterion='distance')

# Scatter the first two feature columns (labelled below as sepal length and
# sepal width), colouring each point by its flat cluster label.
scatter_fig, scatter_ax = plt.subplots(figsize=(8, 6))
first_feature, second_feature = X[:, 0], X[:, 1]
scatter_ax.scatter(first_feature, second_feature, c=clusters, cmap='viridis')
scatter_ax.set_title('Hierarchical Clustering')
scatter_ax.set_xlabel('Sepal Length (cm)')
scatter_ax.set_ylabel('Sepal Width (cm)')
plt.show()

NOTEBOOK LINK- https://colab.research.google.com/drive/1A74gzkurxoGYnsfhsRI_OXvpCCVPT0tc?usp=sharing

You might also like