From 7eeda4bdc5f89d9b8e46153859dc6ca1c8f614fe Mon Sep 17 00:00:00 2001 From: Pooriana Date: Tue, 7 Feb 2023 20:51:17 +0330 Subject: [PATCH 1/2] Tamrin team 8 - Amini - Tizkar - Elahi --- ...n_Data_Analysis.ipynb => HW_01_Team8.ipynb | 0 ...Library_Dataset.ipynb => HW_02_Team8.ipynb | 0 Graph_Analysis.ipynb => HW_03_Team8.ipynb | 0 HW_04_Team8.ipynb | 519 ++++++++++++++++++ ..._Mining_Apriori.ipynb => HW_05_Team8.ipynb | 0 5 files changed, 519 insertions(+) rename Exploration_Data_Analysis.ipynb => HW_01_Team8.ipynb (100%) rename Preparing_Library_Dataset.ipynb => HW_02_Team8.ipynb (100%) rename Graph_Analysis.ipynb => HW_03_Team8.ipynb (100%) create mode 100644 HW_04_Team8.ipynb rename Association_Rule_Mining_Apriori.ipynb => HW_05_Team8.ipynb (100%) diff --git a/Exploration_Data_Analysis.ipynb b/HW_01_Team8.ipynb similarity index 100% rename from Exploration_Data_Analysis.ipynb rename to HW_01_Team8.ipynb diff --git a/Preparing_Library_Dataset.ipynb b/HW_02_Team8.ipynb similarity index 100% rename from Preparing_Library_Dataset.ipynb rename to HW_02_Team8.ipynb diff --git a/Graph_Analysis.ipynb b/HW_03_Team8.ipynb similarity index 100% rename from Graph_Analysis.ipynb rename to HW_03_Team8.ipynb diff --git a/HW_04_Team8.ipynb b/HW_04_Team8.ipynb new file mode 100644 index 0000000..4928620 --- /dev/null +++ b/HW_04_Team8.ipynb @@ -0,0 +1,519 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "c4485712", + "metadata": { + "heading_collapsed": true + }, + "source": [ + "# Loading libraries" + ] + }, + { + "cell_type": "code", + "execution_count": 65, + "id": "27e52151", + "metadata": { + "hidden": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "libraries loaded.\n" + ] + } + ], + "source": [ + "import numpy as np\n", + "import pandas as pd\n", + "\n", + "from collections import Counter\n", + "\n", + "import matplotlib.pyplot as plt\n", + "import seaborn as sns\n", + "\n", + "sns.set_style('white')\n", + "\n", + 
"print('libraries loaded.')" + ] + }, + { + "cell_type": "markdown", + "id": "7ebfb208", + "metadata": { + "heading_collapsed": true + }, + "source": [ + "# Loading dataset" + ] + }, + { + "cell_type": "code", + "execution_count": 66, + "id": "f951115b", + "metadata": { + "hidden": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
sepal_lengthsepal_widthpetal_lengthpetal_widthiris_name
05.93.04.21.5Iris-versicolor
16.93.14.91.5Iris-versicolor
26.62.94.61.3Iris-versicolor
34.63.21.40.2Iris-setosa
46.02.24.01.0Iris-versicolor
\n", + "
" + ], + "text/plain": [ + " sepal_length sepal_width petal_length petal_width iris_name\n", + "0 5.9 3.0 4.2 1.5 Iris-versicolor\n", + "1 6.9 3.1 4.9 1.5 Iris-versicolor\n", + "2 6.6 2.9 4.6 1.3 Iris-versicolor\n", + "3 4.6 3.2 1.4 0.2 Iris-setosa\n", + "4 6.0 2.2 4.0 1.0 Iris-versicolor" + ] + }, + "execution_count": 66, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_iris = pd.read_csv('Data/iris.txt', sep= ',', header= None) \n", + "\n", + "df_iris.columns= ['sepal_length', 'sepal_width', 'petal_length', 'petal_width', 'iris_name']\n", + "\n", + "df_iris.head()" + ] + }, + { + "cell_type": "markdown", + "id": "35b796a1", + "metadata": { + "heading_collapsed": true + }, + "source": [ + "# Finding the max absolute value of the first two dimensions" + ] + }, + { + "cell_type": "code", + "execution_count": 67, + "id": "9776c250", + "metadata": { + "hidden": true + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
sepal_lengthsepal_width
00.06-0.05
11.060.05
20.76-0.15
3-1.240.15
40.16-0.85
\n", + "
" + ], + "text/plain": [ + " sepal_length sepal_width\n", + "0 0.06 -0.05\n", + "1 1.06 0.05\n", + "2 0.76 -0.15\n", + "3 -1.24 0.15\n", + "4 0.16 -0.85" + ] + }, + "execution_count": 67, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "centred_sepal = pd.DataFrame()\n", + "\n", + "sl_mean, sw_mean = np.round(df_iris.loc[:, ['sepal_length', 'sepal_width']].mean(), 2)\n", + "\n", + "centred_sepal['sepal_length'] = df_iris['sepal_length'] - sl_mean\n", + "\n", + "centred_sepal['sepal_width'] = df_iris['sepal_width'] - sw_mean\n", + "\n", + "centred_sepal.head()" + ] + }, + { + "cell_type": "markdown", + "id": "6c93ceb3", + "metadata": { + "hidden": true + }, + "source": [ + "## Finding max value of each dimension" + ] + }, + { + "cell_type": "code", + "execution_count": 68, + "id": "564d4c99", + "metadata": { + "hidden": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "sepal_length 2.06\n", + "sepal_width 1.35\n", + "dtype: float64" + ] + }, + "execution_count": 68, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "centred_sepal.max()" + ] + }, + { + "cell_type": "markdown", + "id": "8033d8de", + "metadata": { + "hidden": true + }, + "source": [ + "## Find the index of the maximum value of each dimension" + ] + }, + { + "cell_type": "code", + "execution_count": 69, + "id": "4ae2582b", + "metadata": { + "hidden": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "sepal_length 70\n", + "sepal_width 22\n", + "dtype: int64" + ] + }, + "execution_count": 69, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "centred_sepal.idxmax()" + ] + }, + { + "cell_type": "markdown", + "id": "b58ff3dc", + "metadata": { + "hidden": true + }, + "source": [ + "## Calculate magnitude of the max_vector" + ] + }, + { + "cell_type": "code", + "execution_count": 73, + "id": "7801c7e1", + "metadata": { + "hidden": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "(2.06, 0.75, 2.19)" 
+ ] + }, + "execution_count": 73, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Take the row with the largest Euclidean norm; idxmax().max() only returned the larger of the per-column index labels.\n", + "l, w = np.round(centred_sepal.loc[centred_sepal.apply(np.linalg.norm, axis= 1).idxmax()], 2)\n", + "# Euclidean length of that (l, w) vector, rounded to 2 decimals.\n", + "magnitude = np.round(np.sqrt(l * l + w * w), 2)\n", + "l, w, magnitude" + ] + }, + { + "cell_type": "markdown", + "id": "871e2131", + "metadata": { + "hidden": true + }, + "source": [ + "## Get the magnitude of the maximum vector straightforward " + ] + }, + { + "cell_type": "code", + "execution_count": 71, + "id": "ff8df487", + "metadata": { + "hidden": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "2.19" + ] + }, + "execution_count": 71, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "np.round(centred_sepal.apply(np.linalg.norm, axis= 1).max(), 2)" + ] + }, + { + "cell_type": "markdown", + "id": "368dafdf", + "metadata": {}, + "source": [ + "# plotting centred_sepal" + ] + }, + { + "cell_type": "code", + "execution_count": 97, + "id": "6bba21a2", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "figure, axes = plt.subplots() \n", + "\n", + "plt.scatter(centred_sepal['sepal_length'], centred_sepal['sepal_width'])\n", + "# Highlight the max vector (l, w) computed in the magnitude cell instead of hard-coded coordinates.\n", + "plt.scatter(l, w, marker= 'o', color= 'k')\n", + "# Circle of radius `magnitude` centred at the origin.\n", + "sphere = plt.Circle((0, 0), magnitude, color= 'k', fill= False)\n", + "\n", + "axes.set_aspect(1) \n", + "axes.add_artist(sphere)\n", + "\n", + "plt.axvline(x = 0, color = 'k')\n", + "plt.axhline(y = 0, color = 'k')\n", + "# Arrow from the origin to the max vector; the tip now lands exactly on (l, w).\n", + "plt.arrow(0, 0, l, w, color= 'k', width= .02, length_includes_head= True)\n", + "plt.text(1, 0.5, 'r', fontsize= 12)\n", + "\n", + "plt.xlim((-2.5, 2.5))\n", + "plt.ylim((-2.5, 2.5))\n", + "\n", + "plt.xlabel('Sepal Length')\n", + "plt.ylabel('Sepal Width')\n", + "\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bf476d54", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.6" + }, + "toc": { + "base_numbering": 1, + "nav_menu": {}, + "number_sections": true, + "sideBar": true, + "skip_h1_title": false, + "title_cell": "Table of Contents", + "title_sidebar": "Contents", + "toc_cell": false, + "toc_position": {}, + "toc_section_display": true, + "toc_window_display": false + }, + "varInspector": { + "cols": { + "lenName": 16, + "lenType": 16, + "lenVar": 40 + }, + "kernels_config": { + "python": { + "delete_cmd_postfix": "", + "delete_cmd_prefix": "del ", + "library": "var_list.py", + "varRefreshCmd": "print(var_dic_list())" + }, + "r": { + "delete_cmd_postfix": ") ", + "delete_cmd_prefix": "rm(", + "library": "var_list.r", + "varRefreshCmd": 
"cat(var_dic_list()) " + } + }, + "types_to_exclude": [ + "module", + "function", + "builtin_function_or_method", + "instance", + "_Feature" + ], + "window_display": false + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/Association_Rule_Mining_Apriori.ipynb b/HW_05_Team8.ipynb similarity index 100% rename from Association_Rule_Mining_Apriori.ipynb rename to HW_05_Team8.ipynb From 0ff07d6bf3917286c8c7ff52039104c83846e5eb Mon Sep 17 00:00:00 2001 From: Pooriana Date: Tue, 7 Feb 2023 21:41:54 +0330 Subject: [PATCH 2/2] Team 8 - Amini - Tizkar - Elahi --- HW_05_Team8.ipynb => Association_Rule_Mining_Apriori.team8.ipynb | 0 HW_03_Team8.ipynb => Exploration_Data_Analysis.team8.ipynb | 0 HW_01_Team8.ipynb => Graph_Analysis.team8.ipynb | 0 HW_04_Team8.ipynb => High_Dimentional_Data.team8.ipynb | 0 HW_02_Team8.ipynb => Preparing_Library_Dataset.team8.ipynb | 0 5 files changed, 0 insertions(+), 0 deletions(-) rename HW_05_Team8.ipynb => Association_Rule_Mining_Apriori.team8.ipynb (100%) rename HW_03_Team8.ipynb => Exploration_Data_Analysis.team8.ipynb (100%) rename HW_01_Team8.ipynb => Graph_Analysis.team8.ipynb (100%) rename HW_04_Team8.ipynb => High_Dimentional_Data.team8.ipynb (100%) rename HW_02_Team8.ipynb => Preparing_Library_Dataset.team8.ipynb (100%) diff --git a/HW_05_Team8.ipynb b/Association_Rule_Mining_Apriori.team8.ipynb similarity index 100% rename from HW_05_Team8.ipynb rename to Association_Rule_Mining_Apriori.team8.ipynb diff --git a/HW_03_Team8.ipynb b/Exploration_Data_Analysis.team8.ipynb similarity index 100% rename from HW_03_Team8.ipynb rename to Exploration_Data_Analysis.team8.ipynb diff --git a/HW_01_Team8.ipynb b/Graph_Analysis.team8.ipynb similarity index 100% rename from HW_01_Team8.ipynb rename to Graph_Analysis.team8.ipynb diff --git a/HW_04_Team8.ipynb b/High_Dimentional_Data.team8.ipynb similarity index 100% rename from HW_04_Team8.ipynb rename to High_Dimentional_Data.team8.ipynb diff --git a/HW_02_Team8.ipynb 
b/Preparing_Library_Dataset.team8.ipynb similarity index 100% rename from HW_02_Team8.ipynb rename to Preparing_Library_Dataset.team8.ipynb