Answer To: % 1. Title: 1984 United States Congressional Voting Records Database % % 2. Source Information: %...
Apoorv answered on Nov 22 2021
FBLSolution/IONOshphere_dataset.ipynb
{
"cells": [
{
"cell_type": "code",
"execution_count": 20,
"metadata": {},
"outputs": [],
"source": [
"from scipy.io import arff\n",
"import pandas as pd\n",
"\n",
"\n",
"from sklearn import model_selection \n",
"from sklearn.ensemble import BaggingClassifier \n",
"from sklearn.tree import DecisionTreeClassifier \n",
"\n",
"from sklearn.model_selection import train_test_split\n",
"from sklearn.preprocessing import MultiLabelBinarizer\n",
"from sklearn.preprocessing import LabelEncoder \n",
"\n",
"import matplotlib.pyplot as plt \n",
"\n",
"\n",
"\n",
"from scipy.io import arff\n",
"import pandas as pd\n",
"\n",
"\n",
"from sklearn import model_selection \n",
"from sklearn.ensemble import BaggingClassifier \n",
"from sklearn.tree import DecisionTreeClassifier \n",
"\n",
"from sklearn.model_selection import train_test_split\n",
"from sklearn.preprocessing import MultiLabelBinarizer\n",
"\n",
"\n",
"\n",
"from sklearn.metrics import accuracy_score\n",
"\n",
"import matplotlib.pyplot as plt \n",
"from sklearn import svm, datasets \n",
"import warnings\n",
"warnings.filterwarnings(\"ignore\")"
]
},
{
"cell_type": "code",
"execution_count": 21,
"metadata": {},
"outputs": [],
"source": [
"import os\n",
"\n",
"# Location of the ionosphere ARFF file. The default is the original author's\n",
"# local path; set the IONOSPHERE_ARFF environment variable to point at your\n",
"# own copy instead of editing this cell.\n",
"DATA_PATH = os.environ.get(\n",
"    \"IONOSPHERE_ARFF\",\n",
"    'C:/Users/avira/Downloads/ionosphere-qocpqvmv.arff',\n",
")\n",
"\n",
"# loadarff returns a (records, metadata) pair; only the records (data[0])\n",
"# are turned into a DataFrame.\n",
"data = arff.loadarff(DATA_PATH)\n",
"df = pd.DataFrame(data[0])"
]
},
{
"cell_type": "code",
"execution_count": 22,
"metadata": {},
"outputs": [],
"source": [
"# Feature matrix: every column of df except the \"class\" column.\n",
"X = df.drop(columns=[\"class\"])\n",
"# Target: the raw \"class\" column.\n",
"y = df[\"class\"]"
]
},
{
"cell_type": "code",
"execution_count": 23,
"metadata": {},
"outputs": [],
"source": [
"# Indicator-encode the \"class\" column; drop_first=True omits the indicator\n",
"# for the first level. The result assigned to y is a DataFrame, not a Series.\n",
"y = pd.get_dummies(\n",
"    data=df[\"class\"],\n",
"    drop_first=True,\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 24,
"metadata": {},
"outputs": [],
"source": [
"# Hold out 25% of the rows for testing; the fixed seed keeps the split stable.\n",
"X_train, X_test, y_train, y_test = train_test_split(\n",
"    X,\n",
"    y,\n",
"    test_size=0.25,\n",
"    random_state=42,\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 25,
"metadata": {},
"outputs": [],
"source": [
"def model_definitions_tree_depth(depth, random_state=42):\n",
"    \"\"\"Fit a bagged decision-tree ensemble and report its accuracy.\n",
"\n",
"    Trains on the notebook-level X_train / y_train and scores the fitted\n",
"    model on both that training data and the notebook-level X_test / y_test.\n",
"\n",
"    Parameters\n",
"    ----------\n",
"    depth\n",
"        Value forwarded as max_depth to the DecisionTreeClassifier used as\n",
"        the base estimator of the ensemble.\n",
"    random_state : int or None, default 42\n",
"        Seed forwarded to BaggingClassifier so repeated runs give the same\n",
"        numbers. Pass None for unseeded behaviour.\n",
"\n",
"    Returns\n",
"    -------\n",
"    tuple\n",
"        (training_accuracy, testing_accuracy) as computed by accuracy_score.\n",
"    \"\"\"\n",
"    # initialize the base classifier\n",
"    base_cls = DecisionTreeClassifier(max_depth=depth)\n",
"\n",
"    # The base estimator is passed positionally on purpose: its keyword was\n",
"    # renamed from base_estimator to estimator in scikit-learn 1.2 and the\n",
"    # old name was later removed, while the first positional slot is stable.\n",
"    model = BaggingClassifier(base_cls, random_state=random_state)\n",
"\n",
"    model.fit(X_train, y_train)\n",
"\n",
"    # accuracy_score takes (y_true, y_pred) in that order.\n",
"    y_pred = model.predict(X_train)\n",
"    training_accuracy = accuracy_score(y_train, y_pred)\n",
"    y_pred_test = model.predict(X_test)\n",
"    testing_accuracy = accuracy_score(y_test, y_pred_test)\n",
"\n",
"    return training_accuracy, testing_accuracy"
]
},
{
"cell_type": "code",
"execution_count": 34,
"metadata": {},
"outputs": [],
"source": [
"def calculate_depth_wise(tree_depth):\n",
"    \"\"\"Plot training and testing accuracy against tree depth.\n",
"\n",
"    Parameters\n",
"    ----------\n",
"    tree_depth : iterable\n",
"        Depth values; each one is passed to model_definitions_tree_depth.\n",
"\n",
"    Draws two labelled curves with pyplot and returns None.\n",
"    \"\"\"\n",
"    # Materialise once so a one-shot iterable can be both looped over and\n",
"    # used as the x-axis data afterwards.\n",
"    depths = list(tree_depth)\n",
"\n",
"    training = []\n",
"    testing = []\n",
"    for depth in depths:\n",
"        tr, te = model_definitions_tree_depth(depth)\n",
"        training.append(tr)\n",
"        testing.append(te)\n",
"\n",
"    # Label the curves and axes so the figure can be read on its own.\n",
"    plt.plot(depths, training, label=\"Training accuracy\")\n",
"    plt.plot(depths, testing, label=\"Testing accuracy\")\n",
"    plt.xlabel(\"Tree depth (max_depth)\")\n",
"    plt.ylabel(\"Accuracy\")\n",
"    plt.legend()"
]
},
{
"cell_type": "code",
"execution_count": 37,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"