ml-course/sample_project/example-notebook.ipynb

279 lines
12 KiB
Plaintext
Raw Normal View History

2022-08-13 19:02:12 +02:00
{
"cells": [
{
"cell_type": "markdown",
"id": "e81cac73",
"metadata": {},
"source": [
"# Lets import file"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "4bc999ac",
"metadata": {},
"outputs": [],
"source": [
"import pandas as pd"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "0eec8a65",
"metadata": {},
"outputs": [],
"source": [
"df = pd.read_csv(\"heart-disease.csv\")"
]
},
{
"cell_type": "markdown",
"id": "f588239f",
"metadata": {},
"source": [
"Poglejmo kaj smo importali"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "0cec76a8",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>age</th>\n",
" <th>sex</th>\n",
" <th>cp</th>\n",
" <th>trestbps</th>\n",
" <th>chol</th>\n",
" <th>fbs</th>\n",
" <th>restecg</th>\n",
" <th>thalach</th>\n",
" <th>exang</th>\n",
" <th>oldpeak</th>\n",
" <th>slope</th>\n",
" <th>ca</th>\n",
" <th>thal</th>\n",
" <th>target</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>63</td>\n",
" <td>1</td>\n",
" <td>3</td>\n",
" <td>145</td>\n",
" <td>233</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>150</td>\n",
" <td>0</td>\n",
" <td>2.3</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>37</td>\n",
" <td>1</td>\n",
" <td>2</td>\n",
" <td>130</td>\n",
" <td>250</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>187</td>\n",
" <td>0</td>\n",
" <td>3.5</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>41</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>130</td>\n",
" <td>204</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>172</td>\n",
" <td>0</td>\n",
" <td>1.4</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>56</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>120</td>\n",
" <td>236</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>178</td>\n",
" <td>0</td>\n",
" <td>0.8</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>57</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>120</td>\n",
" <td>354</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>163</td>\n",
" <td>1</td>\n",
" <td>0.6</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" age sex cp trestbps chol fbs restecg thalach exang oldpeak slope \\\n",
"0 63 1 3 145 233 1 0 150 0 2.3 0 \n",
"1 37 1 2 130 250 0 1 187 0 3.5 0 \n",
"2 41 0 1 130 204 0 0 172 0 1.4 2 \n",
"3 56 1 1 120 236 0 1 178 0 0.8 2 \n",
"4 57 0 0 120 354 0 1 163 1 0.6 2 \n",
"\n",
" ca thal target \n",
"0 0 1 1 \n",
"1 0 2 1 \n",
"2 0 2 1 \n",
"3 0 2 1 \n",
"4 0 2 1 "
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df.head()"
]
},
{
"cell_type": "markdown",
"id": "ec647955",
"metadata": {},
"source": [
"# Lets graph our data"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "c9e4750b",
"metadata": {},
"outputs": [],
"source": [
"import matplotlib.pyplot as plt"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "a4cf20f4",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"<AxesSubplot:>"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAXcAAAD1CAYAAACrz7WZAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/YYfK9AAAACXBIWXMAAAsTAAALEwEAmpwYAAAOF0lEQVR4nO3df6zdd13H8efL1k2BGLr0tnb9YYd2YEcwmMtEiQaZuBkI3T9LuohpcEmjGQhGA538sb+azB9BTRSTBupqxC0NoGsgIrWKi1E27tiAdWW0YWO7tK53zt8mhY63f9zv9Hg4d/fe8z33Xvrp8/HPOd/P9/s95/1H8+w3357Tk6pCktSW71rrASRJk2fcJalBxl2SGmTcJalBxl2SGmTcJalB69d6AICNGzfWzp0713oMSbqkPPTQQ89W1dSofd8Rcd+5cyczMzNrPYYkXVKSfG2hfd6WkaQGGXdJapBxl6QGGXdJapBxl6QGGXdJapBxl6QGGXdJatB3xJeYLhU7D3xyrUdoypN3vWWtR5Ca5ZW7JDXIuEtSgxaNe5LDSc4neXRo/V1JHk9yMslvDazfkeRMt+/GlRhakvTilnLP/W7gD4A/eWEhyU8De4DXVNWFJJu69d3AXuA64Grgr5NcW1XPT3pwSdLCFr1yr6r7geeGln8ZuKuqLnTHnO/W9wD3VtWFqnoCOANcP8F5JUlLMO4992uBn0zyQJK/S/K6bn0r8PTAcbPdmiRpFY37Ucj1wAbg9cDrgKNJXgFkxLE16gWS7Af2A+zYsWPMMSRJo4x75T4LfLzmPQh8C9jYrW8fOG4bcHbUC1TVoaqarqrpqamRPyQiSRrTuHH/C+BNAEmuBa4AngWOAXuTXJnkGmAX8OAE5pQkLcOit2WS3AO8EdiYZBa4EzgMHO4+HvkNYF9VFXAyyVHgMeAicLuflJGk1bdo3Kvq1gV2vX2B4w8CB/sMJUnqx2+oSlKDjLskNci4S1KDjLskNci4S1KDjLskNci4S1KDjLskNci4S1KDjLskNci4S1KDjLskNci4S1KDjLskNci4S1KDjLskNWjRuCc5nOR896tLw/t+PUkl2TiwdkeSM0keT3LjpAeWJC1uKVfudwM3DS8m2Q68GXhqYG03sBe4rjvng0nWTWRSSdKSLRr3qrofeG7Ert8F3gvUwNoe4N6qulBVTwBngOsnMagkaenGuuee5G3A16vqC0O7tgJPD2zPdmuSpFW06A9kD0vyEuD9wM+O2j1irUaskWQ/sB9gx44dyx1DkvQixrly/0HgGuALSZ4EtgGfT/L9zF+pbx84dhtwdtSLVNWhqpququmpqakxxpAkLWTZV+5V9SVg0wvbXeCnq+rZJMeAP0vyAeBqYBfw4IRmlfQidh745FqP0Iwn73rLWo/Q21I+CnkP8I/AK5PMJrltoWOr6iRwFHgM+BRwe1U9P6lhJUlLs+iVe1Xdusj+nUPbB4GD/caSJPXhN1QlqUHGXZIaZNwlqUHGXZIaZNwlqUHGXZIaZNwlqUHGXZIaZNwlqUHGXZIaZNwlqUHGXZIaZNwlqUHGXZIaZNwlqUHGXZIatJRfYjqc5HySRwfWfjvJl5N8McmfJ3n5wL47kpxJ8niSG1dobknSi1jKlfvdwE1Da8eBV1fVa4CvAHcAJNkN7AWu6875YJJ1E5tWkrQki8a9qu4Hnhta+3RVXew2Pwts657vAe6tqgtV9QRwBrh+gvNKkpZgEvfcfxH4y+75VuDpgX2z3ZokaRX1inuS9wMXgY+8sDTisFrg3P1JZpLMzM3N9RlDkjRk7Lgn2Qe8Ffj5qnoh4LPA9oHDtgFnR51fVYeqarqqpqempsYdQ5I0wlhxT3IT8D7gbVX13wO7jgF7k1yZ5BpgF/Bg/zElScuxfrEDktwDvBHYmGQWuJP5T8dcCRxPAvDZqvqlqjqZ5CjwGPO3a26vqudXanhJ0miLxr2qbh2x/OEXOf4gcLDPUJKkfvyGqiQ1yLhLUoOMuyQ1yLhLUoOMuyQ1yLhLUoOMuyQ1yLhLUoOMuyQ1yLhLUoOMuyQ1yLhLUoOMuyQ1yLhLUoOMuyQ1yLhLUoMWjXuSw0nOJ3l0YO2qJMeTnO4eNwzsuyPJmSSPJ7lxpQaXJC1sKVfudwM3Da0dAE5U1S7gRLdNkt3AXuC67pwPJlk3sWklSUuyaNyr6n7guaHlPcCR7vkR4OaB9Xur6kJVPQGcAa6fzKiSpKUa95775qo6B9A9burWtwJPDxw3261JklbRpP9BNSPWauSByf4kM0lm5ubmJjyGJF3exo37M0m2AHSP57v1WWD7wHHbgLOjXqCqDlXVdFVNT01NjTmGJGmUceN+DNjXPd8H3DewvjfJlUmuAXYBD/YbUZK0XOsXOyDJPcAbgY1JZoE7gbuAo0luA54CbgGoqpNJjgKPAReB26vq+RWaXZK0gEXjXlW3LrDrhgWOPwgc7DOUJKkfv6EqSQ0y7pLUIOMuSQ0y7pLUIOMuSQ0y7pLUIOMuSQ0y7pLUIOMuSQ0y7pLUIOMuSQ0y7pLUIOMuSQ0y7pLUIOMuSQ0y7pLUoF5xT/KrSU4meTTJPUm+J8lVSY4nOd09bpjUsJKkpRk77km2Ar8CTFfVq4F1wF7gAHCiqnYBJ7ptSdIq6ntbZj3wvUnWAy8BzgJ7gCPd/iPAzT3fQ5K0TGPHvaq+DvwO8z+QfQ74t6r6NLC5qs51x5wDNk1iUEnS0vW5LbOB+av0a4CrgZcmefsyzt+fZCbJzNzc3LhjSJJG6HNb5meAJ6pqrqq+CXwc+AngmSRbALrH86NOrqpDVTVdVdNTU1M9xpAkDesT96eA1yd5SZIANwCngGPAvu6YfcB9/UaUJC3X+nFPrKoHknwU+DxwEXgYOAS8DDia5Dbm/wK4ZRKDSpKWbuy4A1TVncCdQ8sXmL+KlyStEb+hKkkNMu6S1CDjLkkNMu6S1CDjLkkNMu6S1CDjLkkNMu6S1CDjLkkNMu6S1CDjLkkNMu6S1CDjLkkNMu6S1CDjLkkNMu6S1KBecU/y8iQfTfLlJKeS/HiSq5IcT3K6e9wwqWElSUvT98r994FPVdWrgB9h/jdUDwAnqmoXcKLbliStorHjnuT7gJ8CPgxQVd+oqn8F9gBHusOOADf3G1GStFx9rtxfAcwBf5zk4SQfSvJSYHNVnQPoHjdNYE5J0jL0ift64EeBP6qq1wL/xTJuwSTZn2Qmyczc3FyPMSRJw/rEfRaYraoHuu2PMh/7Z5JsAegez486uaoOVdV0VU1PTU31GEOSNGzsuFfVPwFPJ3llt3QD8BhwDNjXre0D7us1oSRp2db3PP9dwEeSXAF8FXgH839hHE1yG/AUcEvP95AkLVOvuFfVI8D0iF039HldSVI/fkNVkhpk3CWpQcZdkhpk3CWpQcZdkhpk3CWpQcZdkhpk3CWpQcZdkhpk3CWpQcZdkhpk3CWpQcZdkhpk3CWpQcZdkhpk3CWpQb3jnmRdkoeTfKLbvirJ8SSnu8cN/ceUJC3HJK7c3w2cGtg+AJyoql3AiW5bkrSKesU9yTbgLcCHBpb3AEe650eAm/u8hyRp+fpeuf8e8F7gWwNrm6vqHED3uKnne0iSlmnsuCd5K3C+qh4a8/z9SWaSzMzNzY07hiRphD5X7m8A3pbkSeBe4E1J/hR4JskWgO7x/KiTq+pQVU1X1fTU1FSPMSRJw8aOe1XdUVXbqmonsBf4m6p6O3AM2Ncdtg+4r/eUkqRlWYnPud8FvDnJaeDN3bYkaRWtn8SLVNVngM90z/8ZuGESrytJGo/fUJWkBhl3SWqQcZekBhl3SWqQcZekBhl3SWqQcZekBhl3SWqQcZekBhl3SWqQcZekBhl3SWqQcZekBhl3SWqQcZekBhl3SWqQcZekBo0d9yTbk/xtklNJTiZ5d7d+VZLjSU53jxsmN64kaSn6XLlfBH6tqn4YeD1we5LdwAHgRFXtAk5025KkVTR23KvqXFV9vnv+H8ApYCuwBzjSHXYEuLnnjJKkZZrIPfckO4HXAg8Am6vqHMz/BQBsWuCc/UlmkszMzc1NYgx
"text/plain": [
"<Figure size 432x288 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"df.target.value_counts().plot(kind=\"bar\")"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "a7a80c15",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.4"
}
},
"nbformat": 4,
"nbformat_minor": 5
}