ptyadana
diff --git a/‎ML - Applied Machine Learning - Algorithms/03.Support Vector Machine/01.Support Vector Machines - Hyperparameters.ipynb
Lines changed: 177 additions & 0 deletions b/‎ML - Applied Machine Learning - Algorithms/03.Support Vector Machine/01.Support Vector Machines - Hyperparameters.ipynb
Lines changed: 177 additions & 0 deletions
diff --git a/‎ML - Applied Machine Learning - Algorithms/03.Support Vector Machine/02.Support Vector Machines - Fit and evaluate a model.ipynb
Lines changed: 176 additions & 0 deletions b/‎ML - Applied Machine Learning - Algorithms/03.Support Vector Machine/02.Support Vector Machines - Fit and evaluate a model.ipynb
Lines changed: 176 additions & 0 deletions
diff --git a/‎ML - Applied Machine Learning - Algorithms/03.Support Vector Machine/img/CV.png
289 KB b/‎ML - Applied Machine Learning - Algorithms/03.Support Vector Machine/img/CV.png
289 KB
diff --git a/‎ML - Applied Machine Learning - Algorithms/03.Support Vector Machine/img/Cross-Val.png
96.2 KB b/‎ML - Applied Machine Learning - Algorithms/03.Support Vector Machine/img/Cross-Val.png
96.2 KB
diff --git a/‎ML - Applied Machine Learning - Algorithms/03.Support Vector Machine/img/c.png
30.1 KB b/‎ML - Applied Machine Learning - Algorithms/03.Support Vector Machine/img/c.png
30.1 KB
diff --git a/‎ML - Applied Machine Learning - Algorithms/Pickled_Models/SVM_model.pkl
19.9 KB b/‎ML - Applied Machine Learning - Algorithms/Pickled_Models/SVM_model.pkl
19.9 KB
@@ -0,0 +1,177 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Support Vector Machines: Hyperparameters\n",
+    "\n",
+    "Import the [Support Vector Classifier (`SVC`)](https://scikit-learn.org/stable/modules/generated/sklearn.svm.SVC.html) from `sklearn.svm` and explore its hyperparameters."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Import Support Vector Machines Algorithm"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "SVC()"
+      ]
+     },
+     "execution_count": 4,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from sklearn.svm import SVC\n",
+    "\n",
+    "# Build an estimator with no arguments and echo it as the cell result.\n",
+    "default_svc = SVC()\n",
+    "default_svc"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# get_params() returns only the constructor hyperparameters with their current\n",
+    "# (here: default) values, whereas dir() also lists dunder, private and\n",
+    "# fitted attributes that are not hyperparameters.\n",
+    "SVC().get_params()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.3"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
@@ -0,0 +1,176 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Support Vector Machines: Fit and evaluate a model\n",
+    "\n",
+    "This notebook uses the Titanic dataset from [this](https://www.kaggle.com/c/titanic/overview) Kaggle competition.\n",
+    "\n",
+    "In this section, we will fit and evaluate a simple Support Vector Machines model."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Read in Data\n",
+    "\n",
+    "![CV](img/CV.png)\n",
+    "![Cross-Val](img/Cross-Val.png)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import warnings\n",
+    "\n",
+    "import joblib\n",
+    "import pandas as pd\n",
+    "from sklearn.model_selection import GridSearchCV\n",
+    "from sklearn.svm import SVC\n",
+    "\n",
+    "# Hide Future/Deprecation warnings so they do not clutter the cell outputs.\n",
+    "for ignored_category in (FutureWarning, DeprecationWarning):\n",
+    "    warnings.filterwarnings('ignore', category=ignored_category)\n",
+    "\n",
+    "# Features and labels live in separate CSV files; the labels file is parsed\n",
+    "# with no header row (header=None).\n",
+    "train_features = pd.read_csv('../Data/train_features.csv')\n",
+    "train_labels = pd.read_csv('../Data/train_labels.csv', header=None)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Hyperparameter tuning\n",
+    "\n",
+    "![c](img/c.png)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def print_results(results):\n",
+    "    \"\"\"Report the winning parameters, then one score line per candidate.\n",
+    "\n",
+    "    `results` must expose `best_params_` and `cv_results_` (this notebook\n",
+    "    passes a fitted GridSearchCV). The spread printed after `+-` is twice\n",
+    "    the standard deviation of the test score.\n",
+    "    \"\"\"\n",
+    "    print('BEST PARAMS: {}\\n'.format(results.best_params_))\n",
+    "\n",
+    "    scores = results.cv_results_\n",
+    "    rows = zip(scores['mean_test_score'], scores['std_test_score'], scores['params'])\n",
+    "    for avg, spread, candidate in rows:\n",
+    "        line = '{} (+-{}) for {}'.format(round(avg, 3), round(spread * 2, 3), candidate)\n",
+    "        print(line)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "BEST PARAMS: {'C': 0.1, 'kernel': 'linear'}\n",
+      "\n",
+      "0.796 (+-0.115) for {'C': 0.1, 'kernel': 'linear'}\n",
+      "0.654 (+-0.06) for {'C': 0.1, 'kernel': 'rbf'}\n",
+      "0.796 (+-0.115) for {'C': 1, 'kernel': 'linear'}\n",
+      "0.661 (+-0.048) for {'C': 1, 'kernel': 'rbf'}\n",
+      "0.796 (+-0.115) for {'C': 10, 'kernel': 'linear'}\n",
+      "0.684 (+-0.07) for {'C': 10, 'kernel': 'rbf'}\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Candidates: every combination of the kernel and C values listed below.\n",
+    "parameters = {\n",
+    "    'kernel': ['linear', 'rbf'],\n",
+    "    'C': [0.1, 1, 10]\n",
+    "}\n",
+    "svc = SVC()\n",
+    "\n",
+    "# Score each candidate with 5-fold cross-validation.\n",
+    "cv = GridSearchCV(estimator=svc, param_grid=parameters, cv=5)\n",
+    "labels_1d = train_labels.values.ravel()  # flatten the label frame to a 1-D array\n",
+    "cv.fit(train_features, labels_1d)\n",
+    "\n",
+    "print_results(cv)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "SVC(C=0.1, kernel='linear')"
+      ]
+     },
+     "execution_count": 9,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Show the estimator the grid search selected as best.\n",
+    "best_svc = cv.best_estimator_\n",
+    "best_svc"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Write out pickled model"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "['../Pickled_Models/SVM_model.pkl']"
+      ]
+     },
+     "execution_count": 11,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Persist the best estimator; dump() returns the list of file names it wrote.\n",
+    "joblib.dump(value=cv.best_estimator_, filename='../Pickled_Models/SVM_model.pkl')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.3"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}