You are on page 1of 37

{

"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "f1d2e05f",
"metadata": {},
"outputs": [],
"source": [
"csv_url = 'https://archive.ics.uci.edu/ml/machine-learning-databases/iris/iris.data'"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "4ea30303",
"metadata": {},
"outputs": [],
"source": [
"import pandas as pd"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "0900a5d5",
"metadata": {},
"outputs": [],
"source": [
"iris = pd.read_csv(csv_url, header = None)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "4f06783d",
"metadata": {},
"outputs": [],
"source": [
"\n",
"col_names =['Sepal_Length','Sepal_Width','Petal_Length','Petal_Width','Species']"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "e1bbf744",
"metadata": {},
"outputs": [],
"source": [
"iris = pd.read_csv(csv_url, names = col_names)"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "a3d85ab5",
"metadata": {},
"outputs": [],
"source": [
"df1=df=iris"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "74d6fe66",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Sepal_Length</th>\n",
" <th>Sepal_Width</th>\n",
" <th>Petal_Length</th>\n",
" <th>Petal_Width</th>\n",
" <th>Species</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>5.1</td>\n",
" <td>3.5</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>4.9</td>\n",
" <td>3.0</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>4.7</td>\n",
" <td>3.2</td>\n",
" <td>1.3</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>4.6</td>\n",
" <td>3.1</td>\n",
" <td>1.5</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>5.0</td>\n",
" <td>3.6</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>5.4</td>\n",
" <td>3.9</td>\n",
" <td>1.7</td>\n",
" <td>0.4</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6</th>\n",
" <td>4.6</td>\n",
" <td>3.4</td>\n",
" <td>1.4</td>\n",
" <td>0.3</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>7</th>\n",
" <td>5.0</td>\n",
" <td>3.4</td>\n",
" <td>1.5</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Sepal_Length Sepal_Width Petal_Length Petal_Width Species\n",
"0 5.1 3.5 1.4 0.2 Iris-setosa\n",
"1 4.9 3.0 1.4 0.2 Iris-setosa\n",
"2 4.7 3.2 1.3 0.2 Iris-setosa\n",
"3 4.6 3.1 1.5 0.2 Iris-setosa\n",
"4 5.0 3.6 1.4 0.2 Iris-setosa\n",
"5 5.4 3.9 1.7 0.4 Iris-setosa\n",
"6 4.6 3.4 1.4 0.3 Iris-setosa\n",
"7 5.0 3.4 1.5 0.2 Iris-setosa"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris.head(8)\n"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "ef29dc68",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Sepal_Length</th>\n",
" <th>Sepal_Width</th>\n",
" <th>Petal_Length</th>\n",
" <th>Petal_Width</th>\n",
" <th>Species</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>6.7</td>\n",
" <td>3.0</td>\n",
" <td>5.2</td>\n",
" <td>2.3</td>\n",
" <td>Iris-virginica</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>6.3</td>\n",
" <td>2.5</td>\n",
" <td>5.0</td>\n",
" <td>1.9</td>\n",
" <td>Iris-virginica</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>6.5</td>\n",
" <td>3.0</td>\n",
" <td>5.2</td>\n",
" <td>2.0</td>\n",
" <td>Iris-virginica</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>6.2</td>\n",
" <td>3.4</td>\n",
" <td>5.4</td>\n",
" <td>2.3</td>\n",
" <td>Iris-virginica</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>5.9</td>\n",
" <td>3.0</td>\n",
" <td>5.1</td>\n",
" <td>1.8</td>\n",
" <td>Iris-virginica</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Sepal_Length Sepal_Width Petal_Length Petal_Width Species\n",
"145 6.7 3.0 5.2 2.3 Iris-virginica\n",
"146 6.3 2.5 5.0 1.9 Iris-virginica\n",
"147 6.5 3.0 5.2 2.0 Iris-virginica\n",
"148 6.2 3.4 5.4 2.3 Iris-virginica\n",
"149 5.9 3.0 5.1 1.8 Iris-virginica"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"\n",
"iris.tail()"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "0c1cd0e4",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"RangeIndex(start=0, stop=150, step=1)"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"\n",
"iris.index"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "2faba46b",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Index(['Sepal_Length', 'Sepal_Width', 'Petal_Length', 'Petal_Width',\n",
" 'Species'],\n",
" dtype='object')"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris.columns"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "38725202",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"(150, 5)"
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris.shape"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "f160fe14",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Sepal_Length float64\n",
"Sepal_Width float64\n",
"Petal_Length float64\n",
"Petal_Width float64\n",
"Species object\n",
"dtype: object"
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"\n",
"iris.dtypes"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "13d18049",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Sepal_Length</th>\n",
" <th>Sepal_Width</th>\n",
" <th>Petal_Length</th>\n",
" <th>Petal_Width</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>count</th>\n",
" <td>150.000000</td>\n",
" <td>150.000000</td>\n",
" <td>150.000000</td>\n",
" <td>150.000000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>mean</th>\n",
" <td>5.843333</td>\n",
" <td>3.054000</td>\n",
" <td>3.758667</td>\n",
" <td>1.198667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>std</th>\n",
" <td>0.828066</td>\n",
" <td>0.433594</td>\n",
" <td>1.764420</td>\n",
" <td>0.763161</td>\n",
" </tr>\n",
" <tr>\n",
" <th>min</th>\n",
" <td>4.300000</td>\n",
" <td>2.000000</td>\n",
" <td>1.000000</td>\n",
" <td>0.100000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25%</th>\n",
" <td>5.100000</td>\n",
" <td>2.800000</td>\n",
" <td>1.600000</td>\n",
" <td>0.300000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>50%</th>\n",
" <td>5.800000</td>\n",
" <td>3.000000</td>\n",
" <td>4.350000</td>\n",
" <td>1.300000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>75%</th>\n",
" <td>6.400000</td>\n",
" <td>3.300000</td>\n",
" <td>5.100000</td>\n",
" <td>1.800000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>max</th>\n",
" <td>7.900000</td>\n",
" <td>4.400000</td>\n",
" <td>6.900000</td>\n",
" <td>2.500000</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Sepal_Length Sepal_Width Petal_Length Petal_Width\n",
"count 150.000000 150.000000 150.000000 150.000000\n",
"mean 5.843333 3.054000 3.758667 1.198667\n",
"std 0.828066 0.433594 1.764420 0.763161\n",
"min 4.300000 2.000000 1.000000 0.100000\n",
"25% 5.100000 2.800000 1.600000 0.300000\n",
"50% 5.800000 3.000000 4.350000 1.300000\n",
"75% 6.400000 3.300000 5.100000 1.800000\n",
"max 7.900000 4.400000 6.900000 2.500000"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris.describe()"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "3d0500e9",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(['Sepal_Length', 'Sepal_Width', 'Petal_Length', 'Petal_Width',\n",
" 'Species'], dtype=object)"
]
},
"execution_count": 14,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris.columns.values"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "ceab47a4",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Sepal_Length 5.4\n",
"Sepal_Width 3.9\n",
"Petal_Length 1.7\n",
"Petal_Width 0.4\n",
"Species Iris-setosa\n",
"Name: 5, dtype: object"
]
},
"execution_count": 15,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris.iloc[5]\n",
" "
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "8bd21833",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Sepal_Length</th>\n",
" <th>Sepal_Width</th>\n",
" <th>Petal_Length</th>\n",
" <th>Petal_Width</th>\n",
" <th>Species</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>47</th>\n",
" <td>4.6</td>\n",
" <td>3.2</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>48</th>\n",
" <td>5.3</td>\n",
" <td>3.7</td>\n",
" <td>1.5</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>49</th>\n",
" <td>5.0</td>\n",
" <td>3.3</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>50</th>\n",
" <td>7.0</td>\n",
" <td>3.2</td>\n",
" <td>4.7</td>\n",
" <td>1.4</td>\n",
" <td>Iris-versicolor</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Sepal_Length Sepal_Width Petal_Length Petal_Width Species\n",
"47 4.6 3.2 1.4 0.2 Iris-setosa\n",
"48 5.3 3.7 1.5 0.2 Iris-setosa\n",
"49 5.0 3.3 1.4 0.2 Iris-setosa\n",
"50 7.0 3.2 4.7 1.4 Iris-versicolor"
]
},
"execution_count": 16,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris[47:51]"
]
},
{
"cell_type": "code",
"execution_count": 17,
"id": "7431acf1",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Sepal_Length</th>\n",
" <th>Sepal_Width</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>5.1</td>\n",
" <td>3.5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>4.9</td>\n",
" <td>3.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>4.7</td>\n",
" <td>3.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>4.6</td>\n",
" <td>3.1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>5.0</td>\n",
" <td>3.6</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>6.7</td>\n",
" <td>3.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>6.3</td>\n",
" <td>2.5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>6.5</td>\n",
" <td>3.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>6.2</td>\n",
" <td>3.4</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>5.9</td>\n",
" <td>3.0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>150 rows × 2 columns</p>\n",
"</div>"
],
"text/plain": [
" Sepal_Length Sepal_Width\n",
"0 5.1 3.5\n",
"1 4.9 3.0\n",
"2 4.7 3.2\n",
"3 4.6 3.1\n",
"4 5.0 3.6\n",
".. ... ...\n",
"145 6.7 3.0\n",
"146 6.3 2.5\n",
"147 6.5 3.0\n",
"148 6.2 3.4\n",
"149 5.9 3.0\n",
"\n",
"[150 rows x 2 columns]"
]
},
"execution_count": 17,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris.loc[:,[\"Sepal_Length\",\"Sepal_Width\"]] "
]
},
{
"cell_type": "code",
"execution_count": 18,
"id": "2d1d3ca2",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Petal_Length</th>\n",
" <th>Petal_Width</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>1.3</td>\n",
" <td>0.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>1.5</td>\n",
" <td>0.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>5.2</td>\n",
" <td>2.3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>5.0</td>\n",
" <td>1.9</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>5.2</td>\n",
" <td>2.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>5.4</td>\n",
" <td>2.3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>5.1</td>\n",
" <td>1.8</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>150 rows × 2 columns</p>\n",
"</div>"
],
"text/plain": [
" Petal_Length Petal_Width\n",
"0 1.4 0.2\n",
"1 1.4 0.2\n",
"2 1.3 0.2\n",
"3 1.5 0.2\n",
"4 1.4 0.2\n",
".. ... ...\n",
"145 5.2 2.3\n",
"146 5.0 1.9\n",
"147 5.2 2.0\n",
"148 5.4 2.3\n",
"149 5.1 1.8\n",
"\n",
"[150 rows x 2 columns]"
]
},
"execution_count": 18,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"cols_2_4=iris.columns[2:4]\n",
"iris[cols_2_4]\n",
" "
]
},
{
"cell_type": "code",
"execution_count": 19,
"id": "da15dc11",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Sepal_Length False\n",
"Sepal_Width False\n",
"Petal_Length False\n",
"Petal_Width False\n",
"Species False\n",
"dtype: bool"
]
},
"execution_count": 19,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris.isnull().any()\n",
" "
]
},
{
"cell_type": "code",
"execution_count": 20,
"id": "50e4c6cd",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Sepal_Length 0\n",
"Sepal_Width 0\n",
"Petal_Length 0\n",
"Petal_Width 0\n",
"Species 0\n",
"dtype: int64"
]
},
"execution_count": 20,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris.isnull().sum()"
]
},
{
"cell_type": "code",
"execution_count": 21,
"id": "a1d345a1",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Sepal_Length float64\n",
"Sepal_Width float64\n",
"Petal_Length float64\n",
"Petal_Width float64\n",
"Species object\n",
"dtype: object"
]
},
"execution_count": 21,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"iris.dtypes"
]
},
{
"cell_type": "code",
"execution_count": 22,
"id": "1c0b5fb9",
"metadata": {},
"outputs": [],
"source": [
"df=iris\n",
"df['petal Length(cm)']=iris['Petal_Length'].astype(\"int\")"
]
},
{
"cell_type": "code",
"execution_count": 23,
"id": "196be98f",
"metadata": {},
"outputs": [],
"source": [
"df1=df"
]
},
{
"cell_type": "code",
"execution_count": 24,
"id": "add99d02",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Sepal_Length</th>\n",
" <th>Sepal_Width</th>\n",
" <th>Petal_Length</th>\n",
" <th>Petal_Width</th>\n",
" <th>Species</th>\n",
" <th>petal Length(cm)</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>5.1</td>\n",
" <td>3.5</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>4.9</td>\n",
" <td>3.0</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>4.7</td>\n",
" <td>3.2</td>\n",
" <td>1.3</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>4.6</td>\n",
" <td>3.1</td>\n",
" <td>1.5</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>5.0</td>\n",
" <td>3.6</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>Iris-setosa</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>6.7</td>\n",
" <td>3.0</td>\n",
" <td>5.2</td>\n",
" <td>2.3</td>\n",
" <td>Iris-virginica</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>6.3</td>\n",
" <td>2.5</td>\n",
" <td>5.0</td>\n",
" <td>1.9</td>\n",
" <td>Iris-virginica</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>6.5</td>\n",
" <td>3.0</td>\n",
" <td>5.2</td>\n",
" <td>2.0</td>\n",
" <td>Iris-virginica</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>6.2</td>\n",
" <td>3.4</td>\n",
" <td>5.4</td>\n",
" <td>2.3</td>\n",
" <td>Iris-virginica</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>5.9</td>\n",
" <td>3.0</td>\n",
" <td>5.1</td>\n",
" <td>1.8</td>\n",
" <td>Iris-virginica</td>\n",
" <td>5</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>150 rows × 6 columns</p>\n",
"</div>"
],
"text/plain": [
" Sepal_Length Sepal_Width Petal_Length Petal_Width Species \\\n",
"0 5.1 3.5 1.4 0.2 Iris-setosa \n",
"1 4.9 3.0 1.4 0.2 Iris-setosa \n",
"2 4.7 3.2 1.3 0.2 Iris-setosa \n",
"3 4.6 3.1 1.5 0.2 Iris-setosa \n",
"4 5.0 3.6 1.4 0.2 Iris-setosa \n",
".. ... ... ... ... ... \n",
"145 6.7 3.0 5.2 2.3 Iris-virginica \n",
"146 6.3 2.5 5.0 1.9 Iris-virginica \n",
"147 6.5 3.0 5.2 2.0 Iris-virginica \n",
"148 6.2 3.4 5.4 2.3 Iris-virginica \n",
"149 5.9 3.0 5.1 1.8 Iris-virginica \n",
"\n",
" petal Length(cm) \n",
"0 1 \n",
"1 1 \n",
"2 1 \n",
"3 1 \n",
"4 1 \n",
".. ... \n",
"145 5 \n",
"146 5 \n",
"147 5 \n",
"148 5 \n",
"149 5 \n",
"\n",
"[150 rows x 6 columns]"
]
},
"execution_count": 24,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df"
]
},
{
"cell_type": "code",
"execution_count": 25,
"id": "b70d717b",
"metadata": {},
"outputs": [],
"source": [
"\n",
"from sklearn import preprocessing\n",
"min_max_scaler = preprocessing.MinMaxScaler()"
]
},
{
"cell_type": "code",
"execution_count": 26,
"id": "77891624",
"metadata": {},
"outputs": [],
"source": [
"X=iris.iloc[:,:4]"
]
},
{
"cell_type": "code",
"execution_count": 27,
"id": "15518c7c",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Sepal_Length</th>\n",
" <th>Sepal_Width</th>\n",
" <th>Petal_Length</th>\n",
" <th>Petal_Width</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>5.1</td>\n",
" <td>3.5</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>4.9</td>\n",
" <td>3.0</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>4.7</td>\n",
" <td>3.2</td>\n",
" <td>1.3</td>\n",
" <td>0.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>4.6</td>\n",
" <td>3.1</td>\n",
" <td>1.5</td>\n",
" <td>0.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>5.0</td>\n",
" <td>3.6</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>6.7</td>\n",
" <td>3.0</td>\n",
" <td>5.2</td>\n",
" <td>2.3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>6.3</td>\n",
" <td>2.5</td>\n",
" <td>5.0</td>\n",
" <td>1.9</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>6.5</td>\n",
" <td>3.0</td>\n",
" <td>5.2</td>\n",
" <td>2.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>6.2</td>\n",
" <td>3.4</td>\n",
" <td>5.4</td>\n",
" <td>2.3</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>5.9</td>\n",
" <td>3.0</td>\n",
" <td>5.1</td>\n",
" <td>1.8</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>150 rows × 4 columns</p>\n",
"</div>"
],
"text/plain": [
" Sepal_Length Sepal_Width Petal_Length Petal_Width\n",
"0 5.1 3.5 1.4 0.2\n",
"1 4.9 3.0 1.4 0.2\n",
"2 4.7 3.2 1.3 0.2\n",
"3 4.6 3.1 1.5 0.2\n",
"4 5.0 3.6 1.4 0.2\n",
".. ... ... ... ...\n",
"145 6.7 3.0 5.2 2.3\n",
"146 6.3 2.5 5.0 1.9\n",
"147 6.5 3.0 5.2 2.0\n",
"148 6.2 3.4 5.4 2.3\n",
"149 5.9 3.0 5.1 1.8\n",
"\n",
"[150 rows x 4 columns]"
]
},
"execution_count": 27,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"X"
]
},
{
"cell_type": "code",
"execution_count": 28,
"id": "445f79bd",
"metadata": {},
"outputs": [],
"source": [
"\n",
"X_scaled = min_max_scaler.fit_transform(X)"
]
},
{
"cell_type": "code",
"execution_count": 29,
"id": "7bebe45c",
"metadata": {},
"outputs": [],
"source": [
"df_normalized = pd.DataFrame(X_scaled)"
]
},
{
"cell_type": "code",
"execution_count": 30,
"id": "715e5807",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>0</th>\n",
" <th>1</th>\n",
" <th>2</th>\n",
" <th>3</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>0.222222</td>\n",
" <td>0.625000</td>\n",
" <td>0.067797</td>\n",
" <td>0.041667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>0.166667</td>\n",
" <td>0.416667</td>\n",
" <td>0.067797</td>\n",
" <td>0.041667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>0.111111</td>\n",
" <td>0.500000</td>\n",
" <td>0.050847</td>\n",
" <td>0.041667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>0.083333</td>\n",
" <td>0.458333</td>\n",
" <td>0.084746</td>\n",
" <td>0.041667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>0.194444</td>\n",
" <td>0.666667</td>\n",
" <td>0.067797</td>\n",
" <td>0.041667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>0.666667</td>\n",
" <td>0.416667</td>\n",
" <td>0.711864</td>\n",
" <td>0.916667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>0.555556</td>\n",
" <td>0.208333</td>\n",
" <td>0.677966</td>\n",
" <td>0.750000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>0.611111</td>\n",
" <td>0.416667</td>\n",
" <td>0.711864</td>\n",
" <td>0.791667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>0.527778</td>\n",
" <td>0.583333</td>\n",
" <td>0.745763</td>\n",
" <td>0.916667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>0.444444</td>\n",
" <td>0.416667</td>\n",
" <td>0.694915</td>\n",
" <td>0.708333</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>150 rows × 4 columns</p>\n",
"</div>"
],
"text/plain": [
" 0 1 2 3\n",
"0 0.222222 0.625000 0.067797 0.041667\n",
"1 0.166667 0.416667 0.067797 0.041667\n",
"2 0.111111 0.500000 0.050847 0.041667\n",
"3 0.083333 0.458333 0.084746 0.041667\n",
"4 0.194444 0.666667 0.067797 0.041667\n",
".. ... ... ... ...\n",
"145 0.666667 0.416667 0.711864 0.916667\n",
"146 0.555556 0.208333 0.677966 0.750000\n",
"147 0.611111 0.416667 0.711864 0.791667\n",
"148 0.527778 0.583333 0.745763 0.916667\n",
"149 0.444444 0.416667 0.694915 0.708333\n",
"\n",
"[150 rows x 4 columns]"
]
},
"execution_count": 30,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_normalized"
]
},
{
"cell_type": "code",
"execution_count": 31,
"id": "d26880a2",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(['Iris-setosa', 'Iris-versicolor', 'Iris-virginica'], dtype=object)"
]
},
"execution_count": 31,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df2=df\n",
"df2['Species'].unique()"
]
},
{
"cell_type": "code",
"execution_count": 32,
"id": "00409d0a",
"metadata": {},
"outputs": [],
"source": [
"df_normalized = pd.DataFrame(X_scaled)"
]
},
{
"cell_type": "code",
"execution_count": 33,
"id": "85180b19",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>0</th>\n",
" <th>1</th>\n",
" <th>2</th>\n",
" <th>3</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>0.222222</td>\n",
" <td>0.625000</td>\n",
" <td>0.067797</td>\n",
" <td>0.041667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>0.166667</td>\n",
" <td>0.416667</td>\n",
" <td>0.067797</td>\n",
" <td>0.041667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>0.111111</td>\n",
" <td>0.500000</td>\n",
" <td>0.050847</td>\n",
" <td>0.041667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>0.083333</td>\n",
" <td>0.458333</td>\n",
" <td>0.084746</td>\n",
" <td>0.041667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>0.194444</td>\n",
" <td>0.666667</td>\n",
" <td>0.067797</td>\n",
" <td>0.041667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>0.666667</td>\n",
" <td>0.416667</td>\n",
" <td>0.711864</td>\n",
" <td>0.916667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>0.555556</td>\n",
" <td>0.208333</td>\n",
" <td>0.677966</td>\n",
" <td>0.750000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>0.611111</td>\n",
" <td>0.416667</td>\n",
" <td>0.711864</td>\n",
" <td>0.791667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>0.527778</td>\n",
" <td>0.583333</td>\n",
" <td>0.745763</td>\n",
" <td>0.916667</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>0.444444</td>\n",
" <td>0.416667</td>\n",
" <td>0.694915</td>\n",
" <td>0.708333</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>150 rows × 4 columns</p>\n",
"</div>"
],
"text/plain": [
" 0 1 2 3\n",
"0 0.222222 0.625000 0.067797 0.041667\n",
"1 0.166667 0.416667 0.067797 0.041667\n",
"2 0.111111 0.500000 0.050847 0.041667\n",
"3 0.083333 0.458333 0.084746 0.041667\n",
"4 0.194444 0.666667 0.067797 0.041667\n",
".. ... ... ... ...\n",
"145 0.666667 0.416667 0.711864 0.916667\n",
"146 0.555556 0.208333 0.677966 0.750000\n",
"147 0.611111 0.416667 0.711864 0.791667\n",
"148 0.527778 0.583333 0.745763 0.916667\n",
"149 0.444444 0.416667 0.694915 0.708333\n",
"\n",
"[150 rows x 4 columns]"
]
},
"execution_count": 33,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_normalized"
]
},
{
"cell_type": "code",
"execution_count": 34,
"id": "70af7c57",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(['Iris-setosa', 'Iris-versicolor', 'Iris-virginica'], dtype=object)"
]
},
"execution_count": 34,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df2=df\n",
"df2['Species'].unique()"
]
},
{
"cell_type": "code",
"execution_count": 35,
"id": "c1be0065",
"metadata": {},
"outputs": [],
"source": [
"\n",
"from sklearn import preprocessing\n",
"enc = preprocessing.OneHotEncoder()"
]
},
{
"cell_type": "code",
"execution_count": 36,
"id": "49175ccd",
"metadata": {},
"outputs": [],
"source": [
"features_df=df2.drop(columns=['Species'])"
]
},
{
"cell_type": "code",
"execution_count": 37,
"id": "dae0b47c",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Sepal_Length</th>\n",
" <th>Sepal_Width</th>\n",
" <th>Petal_Length</th>\n",
" <th>Petal_Width</th>\n",
" <th>petal Length(cm)</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>5.1</td>\n",
" <td>3.5</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>4.9</td>\n",
" <td>3.0</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>4.7</td>\n",
" <td>3.2</td>\n",
" <td>1.3</td>\n",
" <td>0.2</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>4.6</td>\n",
" <td>3.1</td>\n",
" <td>1.5</td>\n",
" <td>0.2</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>5.0</td>\n",
" <td>3.6</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>6.7</td>\n",
" <td>3.0</td>\n",
" <td>5.2</td>\n",
" <td>2.3</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>6.3</td>\n",
" <td>2.5</td>\n",
" <td>5.0</td>\n",
" <td>1.9</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>6.5</td>\n",
" <td>3.0</td>\n",
" <td>5.2</td>\n",
" <td>2.0</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>6.2</td>\n",
" <td>3.4</td>\n",
" <td>5.4</td>\n",
" <td>2.3</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>5.9</td>\n",
" <td>3.0</td>\n",
" <td>5.1</td>\n",
" <td>1.8</td>\n",
" <td>5</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>150 rows × 5 columns</p>\n",
"</div>"
],
"text/plain": [
" Sepal_Length Sepal_Width Petal_Length Petal_Width petal Length(cm)\n",
"0 5.1 3.5 1.4 0.2 1\n",
"1 4.9 3.0 1.4 0.2 1\n",
"2 4.7 3.2 1.3 0.2 1\n",
"3 4.6 3.1 1.5 0.2 1\n",
"4 5.0 3.6 1.4 0.2 1\n",
".. ... ... ... ... ...\n",
"145 6.7 3.0 5.2 2.3 5\n",
"146 6.3 2.5 5.0 1.9 5\n",
"147 6.5 3.0 5.2 2.0 5\n",
"148 6.2 3.4 5.4 2.3 5\n",
"149 5.9 3.0 5.1 1.8 5\n",
"\n",
"[150 rows x 5 columns]"
]
},
"execution_count": 37,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"features_df"
]
},
{
"cell_type": "code",
"execution_count": 38,
"id": "71128fa0",
"metadata": {},
"outputs": [],
"source": [
"enc_df=(enc.fit_transform(df2[['Species']])).toarray()\n",
" "
]
},
{
"cell_type": "code",
"execution_count": 39,
"id": "bc4dc81b",
"metadata": {},
"outputs": [],
"source": [
"enc_df = pd.DataFrame(enc_df, columns = ['Iris-Setosa','Iris-Versicolor','Iris-Virginica'])"
]
},
{
"cell_type": "code",
"execution_count": 40,
"id": "dc16ee27",
"metadata": {},
"outputs": [],
"source": [
"df_encode = features_df.join(enc_df)"
]
},
{
"cell_type": "code",
"execution_count": 41,
"id": "c5bb1aab",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Sepal_Length</th>\n",
" <th>Sepal_Width</th>\n",
" <th>Petal_Length</th>\n",
" <th>Petal_Width</th>\n",
" <th>petal Length(cm)</th>\n",
" <th>Iris-Setosa</th>\n",
" <th>Iris-Versicolor</th>\n",
" <th>Iris-Virginica</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>5.1</td>\n",
" <td>3.5</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>1</td>\n",
" <td>1.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>4.9</td>\n",
" <td>3.0</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>1</td>\n",
" <td>1.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>4.7</td>\n",
" <td>3.2</td>\n",
" <td>1.3</td>\n",
" <td>0.2</td>\n",
" <td>1</td>\n",
" <td>1.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>4.6</td>\n",
" <td>3.1</td>\n",
" <td>1.5</td>\n",
" <td>0.2</td>\n",
" <td>1</td>\n",
" <td>1.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>5.0</td>\n",
" <td>3.6</td>\n",
" <td>1.4</td>\n",
" <td>0.2</td>\n",
" <td>1</td>\n",
" <td>1.0</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>6.7</td>\n",
" <td>3.0</td>\n",
" <td>5.2</td>\n",
" <td>2.3</td>\n",
" <td>5</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>6.3</td>\n",
" <td>2.5</td>\n",
" <td>5.0</td>\n",
" <td>1.9</td>\n",
" <td>5</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>6.5</td>\n",
" <td>3.0</td>\n",
" <td>5.2</td>\n",
" <td>2.0</td>\n",
" <td>5</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>6.2</td>\n",
" <td>3.4</td>\n",
" <td>5.4</td>\n",
" <td>2.3</td>\n",
" <td>5</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>5.9</td>\n",
" <td>3.0</td>\n",
" <td>5.1</td>\n",
" <td>1.8</td>\n",
" <td>5</td>\n",
" <td>0.0</td>\n",
" <td>0.0</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>150 rows × 8 columns</p>\n",
"</div>"
],
"text/plain": [
" Sepal_Length Sepal_Width Petal_Length Petal_Width petal Length(cm) \\\n",
"0 5.1 3.5 1.4 0.2 1 \n",
"1 4.9 3.0 1.4 0.2 1 \n",
"2 4.7 3.2 1.3 0.2 1 \n",
"3 4.6 3.1 1.5 0.2 1 \n",
"4 5.0 3.6 1.4 0.2 1 \n",
".. ... ... ... ... ... \n",
"145 6.7 3.0 5.2 2.3 5 \n",
"146 6.3 2.5 5.0 1.9 5 \n",
"147 6.5 3.0 5.2 2.0 5 \n",
"148 6.2 3.4 5.4 2.3 5 \n",
"149 5.9 3.0 5.1 1.8 5 \n",
"\n",
" Iris-Setosa Iris-Versicolor Iris-Virginica \n",
"0 1.0 0.0 0.0 \n",
"1 1.0 0.0 0.0 \n",
"2 1.0 0.0 0.0 \n",
"3 1.0 0.0 0.0 \n",
"4 1.0 0.0 0.0 \n",
".. ... ... ... \n",
"145 0.0 0.0 1.0 \n",
"146 0.0 0.0 1.0 \n",
"147 0.0 0.0 1.0 \n",
"148 0.0 0.0 1.0 \n",
"149 0.0 0.0 1.0 \n",
"\n",
"[150 rows x 8 columns]"
]
},
"execution_count": 41,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_encode"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "56ec0845",
"metadata": {},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": null,
"id": "4a842adc",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.13"
}
},
"nbformat": 4,
"nbformat_minor": 5
}