diff --git a/EDA.ipynb b/EDA.ipynb index bc217d904b024f1ffc1ed4920cd489a37469a527..75a3b680fa5aa28a7cac2460d0097efda94cf0c5 100644 --- a/EDA.ipynb +++ b/EDA.ipynb @@ -347,6 +347,756 @@ "cell_type": "markdown", "metadata": {}, "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### OpracowaĹ: Jakub Szczegiecki" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "import seaborn as sns\n", + "from plotnine import ggplot, aes, geom_point, geom_line, ggtitle\n", + "from sklearn.decomposition import PCA" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<style scoped>\n", + " .dataframe tbody tr th:only-of-type {\n", + " vertical-align: middle;\n", + " }\n", + "\n", + " .dataframe tbody tr th {\n", + " vertical-align: top;\n", + " }\n", + "\n", + " .dataframe thead th {\n", + " text-align: right;\n", + " }\n", + "</style>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>PROXIMITY</th>\n", + " <th>TIMESTAMP</th>\n", + " <th>MEASUREMENT</th>\n", + " <th>EPC</th>\n", + " <th>EAN</th>\n", + " <th>ITEMID</th>\n", + " <th>STYLECOLOR</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>-70.4</td>\n", + " <td>2021-10-26T09:46:33.735</td>\n", + " <td>1</td>\n", + " <td>3035684754340E0000B594FD</td>\n", + " <td>5902805533040</td>\n", + " <td>2127269</td>\n", + " <td>RH267-85J</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>-61.8</td>\n", + " <td>2021-10-26T09:46:33.747</td>\n", + " <td>1</td>\n", + " <td>303568480C2B874000B59A39</td>\n", + " <td>5902851445731</td>\n", + " <td>2217401</td>\n", + " <td>RS483-99X</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + 
" <td>-74.4</td>\n", + " <td>2021-10-26T09:46:33.751</td>\n", + " <td>1</td>\n", + " <td>303568480C357A0000B59999</td>\n", + " <td>5902851547602</td>\n", + " <td>2227511</td>\n", + " <td>SB281-90M</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>-78.0</td>\n", + " <td>2021-10-26T09:46:33.754</td>\n", + " <td>1</td>\n", + " <td>30356847541DA78000B5BA4D</td>\n", + " <td>5902805303667</td>\n", + " <td>2104706</td>\n", + " <td>RJ369-87X</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>-71.1</td>\n", + " <td>2021-10-26T09:46:33.758</td>\n", + " <td>1</td>\n", + " <td>30356847542A2B0000B5B215</td>\n", + " <td>5902805431803</td>\n", + " <td>2117629</td>\n", + " <td>RM119-93X</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>502684</th>\n", + " <td>-59.9</td>\n", + " <td>2021-10-26T10:52:08.744</td>\n", + " <td>43</td>\n", + " <td>303568458835010000B5BA58</td>\n", + " <td>5902690542769</td>\n", + " <td>2028744</td>\n", + " <td>QY337-00X</td>\n", + " </tr>\n", + " <tr>\n", + " <th>502685</th>\n", + " <td>-79.9</td>\n", + " <td>2021-10-26T10:52:08.745</td>\n", + " <td>43</td>\n", + " <td>513568458843D94000B5B5DE</td>\n", + " <td>5902690694772</td>\n", + " <td>2044040</td>\n", + " <td>QZ555-20X</td>\n", + " </tr>\n", + " <tr>\n", + " <th>502686</th>\n", + " <td>-66.8</td>\n", + " <td>2021-10-26T10:52:08.745</td>\n", + " <td>43</td>\n", + " <td>30356847541DA7C000B5BADD</td>\n", + " <td>5902805303674</td>\n", + " <td>2104707</td>\n", + " <td>RJ369-87X</td>\n", + " </tr>\n", + " <tr>\n", + " <th>502687</th>\n", + " <td>-60.8</td>\n", + " <td>2021-10-26T10:52:08.747</td>\n", + " <td>43</td>\n", + " <td>303568458835010000B5BA58</td>\n", + " <td>5902690542769</td>\n", + " <td>2028744</td>\n", + " <td>QY337-00X</td>\n", + " </tr>\n", + " <tr>\n", + " <th>502688</th>\n", 
+ " <td>-75.7</td>\n", + " <td>2021-10-26T10:52:08.748</td>\n", + " <td>43</td>\n", + " <td>303568480C34550000B5A5E7</td>\n", + " <td>5902851535883</td>\n", + " <td>2226337</td>\n", + " <td>RV167-87X</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>502689 rows Ă 7 columns</p>\n", + "</div>" + ], + "text/plain": [ + " PROXIMITY TIMESTAMP MEASUREMENT \\\n", + "0 -70.4 2021-10-26T09:46:33.735 1 \n", + "1 -61.8 2021-10-26T09:46:33.747 1 \n", + "2 -74.4 2021-10-26T09:46:33.751 1 \n", + "3 -78.0 2021-10-26T09:46:33.754 1 \n", + "4 -71.1 2021-10-26T09:46:33.758 1 \n", + "... ... ... ... \n", + "502684 -59.9 2021-10-26T10:52:08.744 43 \n", + "502685 -79.9 2021-10-26T10:52:08.745 43 \n", + "502686 -66.8 2021-10-26T10:52:08.745 43 \n", + "502687 -60.8 2021-10-26T10:52:08.747 43 \n", + "502688 -75.7 2021-10-26T10:52:08.748 43 \n", + "\n", + " EPC EAN ITEMID STYLECOLOR \n", + "0 3035684754340E0000B594FD 5902805533040 2127269 RH267-85J \n", + "1 303568480C2B874000B59A39 5902851445731 2217401 RS483-99X \n", + "2 303568480C357A0000B59999 5902851547602 2227511 SB281-90M \n", + "3 30356847541DA78000B5BA4D 5902805303667 2104706 RJ369-87X \n", + "4 30356847542A2B0000B5B215 5902805431803 2117629 RM119-93X \n", + "... ... ... ... ... 
# %% Load the raw tag-read log
# The export has no header row (header=None), so the seven column labels
# are attached right after parsing.
# NOTE(review): absolute, machine-specific path. query_main.csv is not among
# the files added next to this notebook, so it cannot simply be made
# repo-relative here -- confirm where this file is expected to live.
query_main_path = 'C:/Users/jakub/Documents/query_main.csv'
read_log_columns = ['PROXIMITY', 'TIMESTAMP', 'MEASUREMENT', 'EPC', 'EAN', 'ITEMID', 'STYLECOLOR']

df = pd.read_csv(query_main_path, sep=';', header=None).set_axis(read_log_columns, axis='columns')
df
<td>16.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>2021-10-26 09:46:33.754</td>\n", + " <td>9</td>\n", + " <td>46</td>\n", + " <td>33</td>\n", + " <td>754000</td>\n", + " <td>19.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>2021-10-26 09:46:33.758</td>\n", + " <td>9</td>\n", + " <td>46</td>\n", + " <td>33</td>\n", + " <td>758000</td>\n", + " <td>23.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>502684</th>\n", + " <td>2021-10-26 10:52:08.744</td>\n", + " <td>10</td>\n", + " <td>52</td>\n", + " <td>8</td>\n", + " <td>744000</td>\n", + " <td>3935009.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>502685</th>\n", + " <td>2021-10-26 10:52:08.745</td>\n", + " <td>10</td>\n", + " <td>52</td>\n", + " <td>8</td>\n", + " <td>745000</td>\n", + " <td>3935010.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>502686</th>\n", + " <td>2021-10-26 10:52:08.745</td>\n", + " <td>10</td>\n", + " <td>52</td>\n", + " <td>8</td>\n", + " <td>745000</td>\n", + " <td>3935010.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>502687</th>\n", + " <td>2021-10-26 10:52:08.747</td>\n", + " <td>10</td>\n", + " <td>52</td>\n", + " <td>8</td>\n", + " <td>747000</td>\n", + " <td>3935012.0</td>\n", + " </tr>\n", + " <tr>\n", + " <th>502688</th>\n", + " <td>2021-10-26 10:52:08.748</td>\n", + " <td>10</td>\n", + " <td>52</td>\n", + " <td>8</td>\n", + " <td>748000</td>\n", + " <td>3935013.0</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>502689 rows Ă 6 columns</p>\n", + "</div>" + ], + "text/plain": [ + " timestamp hour minute second microsecond delta_ms\n", + "0 2021-10-26 09:46:33.735 9 46 33 735000 0.0\n", + "1 2021-10-26 09:46:33.747 9 46 33 747000 12.0\n", + "2 2021-10-26 09:46:33.751 9 46 33 751000 16.0\n", + "3 2021-10-26 09:46:33.754 9 46 33 754000 19.0\n", + "4 2021-10-26 
# %% Timestamp features for every read
# Parse the timestamp strings once; every column below derives from this series.
timestamp1 = pd.to_datetime(df["TIMESTAMP"])

# Wall-clock components of each read, kept as plain integer columns.
hour = timestamp1.dt.hour.astype(int)
minute = timestamp1.dt.minute.astype(int)
second = timestamp1.dt.second.astype(int)
microsecond = timestamp1.dt.microsecond.astype(int)

# Milliseconds elapsed since the first row, as float.
# Computed directly on the datetimes instead of re-assembling
# "milliseconds since midnight" from hour/minute/second: that reconstruction
# drops the date, so it turns negative as soon as the data crosses midnight.
# .iloc[0] is positional, so it also works if the frame was filtered or
# re-indexed and no longer has a row labelled 0.
delta_ms = (timestamp1 - timestamp1.iloc[0]) / pd.Timedelta(milliseconds=1)

# Assemble the feature table in one step (same columns, same order as before).
timestamp = pd.DataFrame({
    'timestamp': timestamp1,
    'hour': hour,
    'minute': minute,
    'second': second,
    'microsecond': microsecond,
    'delta_ms': delta_ms,
})

timestamp
<tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>-75.210592</td>\n", + " <td>4003</td>\n", + " <td>5902805820515</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>-75.055416</td>\n", + " <td>7902</td>\n", + " <td>5902805820546</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>-75.673864</td>\n", + " <td>6780</td>\n", + " <td>5902851535869</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>-76.017081</td>\n", + " <td>11937</td>\n", + " <td>5902851535913</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>-76.254074</td>\n", + " <td>8283</td>\n", + " <td>5902975218037</td>\n", + " </tr>\n", + " <tr>\n", + " <th>...</th>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " <td>...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>71</th>\n", + " <td>-74.921590</td>\n", + " <td>7531</td>\n", + " <td>5902805820447</td>\n", + " </tr>\n", + " <tr>\n", + " <th>72</th>\n", + " <td>-75.528464</td>\n", + " <td>7237</td>\n", + " <td>5902851852638</td>\n", + " </tr>\n", + " <tr>\n", + " <th>73</th>\n", + " <td>-76.882319</td>\n", + " <td>10967</td>\n", + " <td>5902975217993</td>\n", + " </tr>\n", + " <tr>\n", + " <th>74</th>\n", + " <td>-76.228160</td>\n", + " <td>3196</td>\n", + " <td>5902975236970</td>\n", + " </tr>\n", + " <tr>\n", + " <th>75</th>\n", + " <td>-76.337086</td>\n", + " <td>6439</td>\n", + " <td>5902975236994</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "<p>76 rows Ă 3 columns</p>\n", + "</div>" + ], + "text/plain": [ + " PROXIMITY NUMBER EAN\n", + "0 -75.210592 4003 5902805820515\n", + "1 -75.055416 7902 5902805820546\n", + "2 -75.673864 6780 5902851535869\n", + "3 -76.017081 11937 5902851535913\n", + "4 -76.254074 8283 5902975218037\n", + ".. ... ... 
# %% Per-tag read statistics
# query4.csv is versioned next to this notebook, so it is read with a
# relative path instead of an absolute path on one user's machine.
# Named tag_stats rather than df so the raw read log held in `df` is not
# overwritten; cells that need df["TIMESTAMP"] stay re-runnable.
# EAN is cast to str so matplotlib treats each code as a category label
# instead of placing the 13-digit numbers on a numeric scale.
tag_stats = (
    pd.read_csv('query4.csv', sep=';')
    .assign(EAN=lambda frame: frame['EAN'].astype(str))
)
tag_stats

# %% Number of reads per tag
# Polish labels restored: the text in the diff was mis-decoded UTF-8.
fig, ax = plt.subplots()
ax.scatter(tag_stats['EAN'], tag_stats['NUMBER'], c=tag_stats['NUMBER'])
ax.set_xlabel('Tag')
ax.set_ylabel('Liczba odczytów')
ax.set_title('Liczba odczytów dla danego tagu')
ax.set_xticks([])  # 76 EAN codes are unreadable as tick labels
plt.show()  # end on show() so the cell does not echo a stray "([], [])"

# %% Reads (bars, left axis) and mean read strength (points, right axis) per tag
fig, ax_reads = plt.subplots()
ax_strength = ax_reads.twinx()

ax_reads.bar(tag_stats['EAN'], tag_stats['NUMBER'], color='darkred', alpha=0.3, width=0.5)
# Hide the EAN tick labels; the twin axis shares this x-axis, so one call is enough.
ax_reads.tick_params(axis='x', labelbottom=False)
ax_reads.set_xlabel('Tag')
ax_reads.set_ylabel('Liczba odczytów', color='darkred')

ax_strength.scatter(x=tag_stats['EAN'], y=tag_stats['PROXIMITY'], color='b')
ax_strength.set_ylim(-110, -25)
ax_strength.set_ylabel('Średnia siła odczytu', color='b')

ax_reads.set_title('Liczba odczytów i średnia siła pomiaru z podziałem na tagi')
plt.show()

# %% Per-class read statistics
# query5.csv is also versioned next to this notebook.
class_stats = pd.read_csv('query5.csv', sep=';')
class_stats

# %% Reads (bars, left axis) and mean read strength (points, right axis) per class
fig, ax_reads = plt.subplots()
ax_strength = ax_reads.twinx()

ax_reads.bar(class_stats['ClassName'], class_stats['NUMBER'], color='darkred', alpha=0.3)
# Rotate the existing category labels instead of calling set_xticklabels(),
# which raised "FixedFormatter should only be used together with FixedLocator".
ax_reads.tick_params(axis='x', labelrotation=90)
# Fixed upper limit; presumably headroom for the count label above the tallest bar.
ax_reads.set_ylim(0, 280000)
ax_reads.set_xlabel('Klasa')
# Print the exact read count just above each bar.
for class_name, read_count in zip(class_stats['ClassName'], class_stats['NUMBER']):
    ax_reads.annotate(
        f'{read_count:d}',
        (class_name, read_count),
        textcoords='offset points',
        xytext=(0, 10),
        ha='center',
        fontsize=10,
    )
ax_reads.set_ylabel('Liczba odczytów', color='darkred')

ax_strength.scatter(x=class_stats['ClassName'], y=class_stats['PROXIMITY'], color='b')
ax_strength.set_ylim(-110, -25)
ax_strength.set_ylabel('Średnia siła odczytu', color='b')

ax_reads.set_title('Liczba odczytów i średnia siła pomiaru z podziałem na klasy')
plt.show()
+-73.886521;5149;5902690542745 +-75.297758;3480;5902805219685 +-75.428973;5788;5902805219692 +-75.241095;21180;5902805385885 +-76.780842;6431;5902805458756 +-75.883087;9159;5902805716504 +-76.237238;20688;5902851547602 +-74.208092;8650;5902690694734 +-72.697246;4322;5902805219708 +-75.250195;9445;5902805431803 +-75.937224;8258;5902805444681 +-75.077195;7389;5902805820553 +-75.281615;10449;5902975218044 +-74.381076;10146;5902975302408 +-74.846588;7798;5902690542769 +-75.655436;3449;5902805219715 +-75.719736;3420;5902805444674 +-76.673707;3986;5902805444698 +-76.642385;3329;5902805444711 +-76.891586;4861;5902805458763 +-76.605848;3522;5902851414515 +-75.358942;8968;5902851445731 +-77.425064;1951;5902851535906 +-77.892417;2387;5902975236956 +-74.803037;5235;5902975302415 +-73.495835;7852;5902975309285 +-75.679136;13411;5902805162677 +-75.976042;9546;5902805532999 +-75.567014;3926;5902805533002 +-78.560146;1912;5902805533224 +-76.340889;3666;5902805533255 +-74.685312;7544;5902805820461 +-75.252176;3653;5902805820577 +-76.334626;3919;5902851457468 +-74.026573;5020;5902975302385 +-73.516268;4223;5902975309308 +-75.320198;3634;5902805162639 +-73.858554;4027;5902805303674 +-78.279402;1976;5902805431797 +-75.080143;2367;5902805431810 +-76.217731;2989;5902805458787 +-74.170812;6938;5902805820416 +-71.926733;4874;5902805820423 +-74.212993;4056;5902805820454 +-77.527480;2016;5902975302392 +-74.894652;11369;5902690694741 +-75.932590;3231;5902805303650 +-74.470013;23157;5902805385823 +-74.897840;3566;5902805533019 +-77.018357;3361;5902805716511 +-72.377993;4994;5902805820393 +-75.241835;17117;5902805820508 +-75.732196;10405;5902851414508 +-75.596670;8769;5902851445700 +-74.726766;11630;5902851535883 +-74.860896;3437;5902851852614 +-76.746779;3012;5902975217986 +-75.818346;4028;5902690694772 +-75.250458;7519;5902805303667 +-76.576883;3664;5902805303681 +-76.845064;12420;5902805533040 +-78.004046;3163;5902805533279 +-77.475953;3514;5902805716498 +-76.856280;3065;5902805716535 
+-76.370902;2959;5902805820409 +-74.921590;7531;5902805820447 +-75.528464;7237;5902851852638 +-76.882319;10967;5902975217993 +-76.228160;3196;5902975236970 +-76.337086;6439;5902975236994 diff --git a/query5.csv b/query5.csv new file mode 100644 index 0000000000000000000000000000000000000000..0906163e03296fbab7334fcf76529a152328c55e --- /dev/null +++ b/query5.csv @@ -0,0 +1,7 @@ +ďťżPROXIMITY;NUMBER;ClassName +-75.313509;10674;knitwear +-75.236090;26874;ladies'_und/socks +-74.951699;160731;t-shirts_s_s +-76.448187;38199;jeans_others +-75.847888;43547;trousers +-75.493705;222664;t-shirts