Files
cas-pml/SL/aufgaben/WS1/notebooks/3.1 Regression - Einfuehrung.ipynb
T

271 lines
27 KiB
Plaintext

{
"cells": [
{
"cell_type": "markdown",
"metadata": {
"tags": []
},
"source": [
"# Feature Engineering\n",
"# Klassifikation\n",
"# Regression\n",
"## Einleitung"
]
},
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"import sys\n",
"sys.path.append('./')"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {
"ExecuteTime": {
"end_time": "2020-04-08T10:06:24.890328Z",
"start_time": "2020-04-08T10:06:23.220148Z"
},
"tags": []
},
"outputs": [],
"source": [
"## prepare\n",
"import pandas as pd\n",
"import numpy as np\n",
"import matplotlib.pyplot as plt\n",
"import seaborn as sns; sns.set()\n",
"%matplotlib inline\n",
"\n",
"datapath = '../3_data'\n",
"from os import chdir; chdir(datapath)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Abgrenzung gegenüber Klassifikation\n",
"(kein Code)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Das Demo Dataset: demo_data_regr.csv"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
" X y\n",
"0 6.0 2.5\n",
"1 5.1 1.9\n",
"2 5.9 2.1\n",
"3 5.6 1.8\n",
"4 5.8 2.2\n"
]
}
],
"source": [
"demo_data = pd.read_csv('demo_data_regr.csv')\n",
"print(demo_data.head())"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {
"ExecuteTime": {
"end_time": "2020-04-08T10:06:25.476230Z",
"start_time": "2020-04-08T10:06:24.976970Z"
},
"scrolled": true
},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAhwAAAIRCAYAAAABYGSiAAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjMsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvZiW1igAAAAlwSFlzAAAPYQAAD2EBqD+naQAAOsRJREFUeJzt3Qt8VNWdwPH/nZmESYKjgaLSjy6ou0ZrQcNTK75Y9dPaViVt16Li+0ERH8Un4gupLrigaDUCbdUq2N3PpyCCxfXxae2DShXNGkUNdXVTQYTQBIeQhGRm7n7OoYl5EeYm98x95Pf9fOI4956cOf97Jvf+59xzBsu2bVsAAAAMipisHAAAQCHhAAAAxpFwAAAA40g4AACAcSQcAADAOBIOAABgHAkHAAAwjoQDAAAYFzP/Ev6nvvssk3H3+88iEcv1Ov0grHGFOTbiChbiCp6wxhbJIi5VxrKsrOoj4RDRB7S2dpdr9cViESkuLpJkskFSqYyERVjjCnNsxBUsxBU8YY0tlmVcgwYVSTSaXcLBLRUAAGAcCQcAADCOhAMAABhHwgEAAIwj4QAAAMaRcAAAAONIOAAAgHEkHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCAQAAjCPhAAAAxpFwAAAA40g4AACAcSQcABBitmVJQyoj2+ub9aN6nuvXTzalpaq6VnbuTvf4+l63FWbFDNcPAPBI2rKkfHmlVGysadtWWjJEppWNlKht++r1vW4rzGOEAwBCyO7mAq5UVNVI+YpK46MHTl7f67YiN0g4ACCEGlvSXS7g7S/kar9fXt/rtiI3SDgAIIQamlJ92p/L1/e6rcgNEg4ACKHCeKxP+3P5+l63FblBwgEAIVSQF9WTLrujtqv9fnl9r9uK3CDhAIAQsmxbr/DofCFvXfmh9vvl9b1uK3KDcSoACCm1nHR62Ug96VLNg1C3JtRoQa4u4F++fkaamlMSz1evH+n29b1uK8wj4QCAEFMX7MJYRAoH5u/ZkOMLuHr9RDwqw4YmpK5ul6RSGd+2FWZxSwUAABhHwgEAAIwj4QAAAMaRcAAAAONIOAAAgHEkHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCAQAAjCPhAAAAxpFwAAAA40g4AACAcSQcAADAOBIOAABgHAkHAAAwjoQDAACEP+HYsWOH3HXXXXLyySfLqFGjZPLkybJ+/fqsfvfxxx+XkpIS420EAAABTzhmzJghFRUV8uCDD8ry5cvl6KOPlssvv1w+/vjjHn+vsrJSHn300Zy1E0Dw2JYlDamMbK9v1o/qeRiENS6EW8zLF6+urpa1a9fKs88+K6NHj9bb7rzzTvnjH/8oq1evluuvv77b32toaJCbb75ZxowZI+vWrctxqwEEQdqypHx5pVRsrGnbVloyRKaVjZSobUtQhTUuhJ+nIxzFxcWyZMkSGTFiRNs2y7L0TzKZ3Ovv3XfffXLkkUfKOeeck6OWAggSu5uLslJRVSPlKyoDOyIQ1rjQP3g6wpFIJOSUU07psO2ll17SIx+33357t7/z8ssvy+9//3s9AvK73/3OtbbEYu7lXtFopMNjWIQ1rjDH1l/jSjalu1yU21+cG1sykohHxW/6a1xBFtbYogbi8jTh6Oztt9+WmTNnyplnnimnnnpql/1bt27VE0wfeOABPTrilkjEkuLiInFbIlEgYRTWuMIcW3+La1t1bY+/19SckmFDE+JX/S2uMAhrbAkX4/JNwvHqq6/KTTfdpFeqzJ8/v8t+27bltttuk29961t6RYubMhlbkskG1+pTGaHqpGSyUdLpjIRFWOMKc2z9Na54fs+nNrW/rm6X+E1/jSvIwhpbNMu4VJlsR0F8kXAsXbpUz8v45je/KfPmzZP8/PwuZT777DP585//rEdBVq5cqbelUin9WFpaKrNnz5azzz67121Ipdx/o6hOMlGv18IaV5hj629xFeRF9ERKdZuhM7Vd7ffz8ehvcYVBWGNLuxiX5wmHWqEyZ84cmTJlisyaNUtPGO3OQQcdpOdvtKeeq9EQlYAMHjw4Ry0G4HeWbetVG2oiZfuLc+tqDrU/iMIaF/oHTxOOTz75RO6//34544wz5Oqrr5bt27e37YvH4zJgwAD54osvZP/999ejHsOGDevw+61JRuftAKCWiE4vGymNLWlpaEpJYTwmBXnRwF+UwxoXws/ThEOtSGlpaZFXXnlF/7Q3adIk/XPRRRfJ008/LePHj/esnQCCSV2EC2MRKRz4j9u0IbkohzUuhJtlq9mY/Zy6R1Vbu8vVJbZq1YuavBWme3phjSvMsRFXsBBX8IQ1tliWcQ0aVJT1pNFwLRwGAAC+RMIBAACMI+EAAADGkXAAAADjSDgAAIBxJBwAAMA4Eg4AAGAcCQcAADCOhAMAABhHwgEAAIwj4QAAAMaRcAAAAONIOAAAgHEkHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCASC0bMuShlRGttc360f1PJdlndRpiqk2mKjXD8crrGwfHNtYzl8RAHIgbVlSvrxSKjbWtG0rLRki08pGStS2jZd1Uqcpptpgol4/HK+wSvvk2DLCASB07G5OsEpFVY2Ur6js8OnORFkndZpiqg0m6vXD8Qor20fHloQDQOg0tqS7nGDbn2jVfpNlndRpiqk2mKjXD8crrBp9dGxJOACETkNTKuv9Jso6qdMUU20wUa8fjldYNfjo2JJwAAidwngs6/0myjqp0xRTbTBRrx+OV1gV+ujYknAACJ2CvKieFNcdtV3tN1nWSZ2mmGqDiXr9cLzCqsBHx5aEA0DoWLatZ+B3PtG2zsxX+02WdVKnKabaYKJePxyvsLJ8dGwt26Yn0+mM1Nbucq2+WCwixcVFUle3S1KpjIRFWOMKc2z9PS41A19NilP3qdXQsfo0t7cTrImyTup0EpcTTttgol4T/eUXQfkbsw29FwcNKpJoNLuxC26MAQgtdUItjEWkcGD+ng09nGBNlHVSpymm2mCiXj8cr7CyfHBsuaUCAACMI+EAAADGkXAAAADjSDgAAIBxJBwAAMA4Eg4AAGAcCQcAADCOhAMAABhHwgEAAIwj4QAAAMaRcAAAAONIOAAAgHEkHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCAQAAjCPhAAAA4U84duzYIXfddZecfPLJMmrUKJk8ebKsX79+r+XffvttmTJliowePVpOOukkmTVrlq4DAPoL27KkIZWR7fXN+lE993O9yF6Y+yDmdQNmzJghNTU18uCDD8rgwYPlmWeekcsvv1yee+45OfzwwzuU/eSTT/S+733ve3LPPfdIXV2dzJ49W66//nr55S9/6VkMAJAracuS8uWVUrGxpm1backQmVY2UqK27bt6kb10yPvA0xGO6upqWbt2rU4exowZI4cddpjceeedcuCBB8rq1au7lF+5cqXep0Y1jjjiCP07d999t6xbt04+/fRTT2IAgFyxu7kgKRVVNVK+orLXn4ZN1Yvs2f2gDzwd4SguLpYlS5bIiBEj2rZZlqV/kslkl/Jnn322nHbaaXp/+/LKF198IYceemiv2xKLuZd7RaORDo9hEda4whwbcYUrrmRTussFqf2FqbElI4l41PHrmqo37P3lZmxJw33ghz7zNOFIJBJyyimndNj20ksv6ZGP22+/vUt5NarR2c9+9jMZMmSIlJSU9LodkYglxcVF4rZEokDCKKxxhTk24gpHXNuqa3v8vabmlAwbmnD8eqbq7S/95UZs23LUB172medzODpPCJ05c6aceeaZcuqpp+6z/Lx58+S1116TRx99VPLy8nr9upmMLclkg7hFZYSqk5LJRkmnMxIWYY0rzLERV7jiiuf3fMpW++vqdjl+XVP1hr2/3IwtbrgPTMWlymQ7CuKbhOPVV1+Vm266Sa9UmT9/fo9lW1pa9MoWNadjzpw5cvrpp/f59VMp9/8IVCeZqNdrYY0rzLERVzjiKsiL6EmEaoi9M7Vd7e/N8TBVb3/pLzdiK8hRH3jZZ764obZ06VK59tpr9fyMRYsWyYABA/Zatr6+Xq688ko9qVStbPnBD36Q07YCgFcs29YrFtQFqL3WlQxqv5/qRfasftAHno9wPPvss3qUQn23hlp90n5CaGfNzc1y9dVXywcffCC/+MUvZPz48TltKwB4TS2PnF42Uhpb0tLQlJLCeEwK8qJ9viCZqhfZi4a8DzxNONT3atx///1yxhln6ERi+/btbfvi8bge6VCrT/bff3/Jz8+XxYsXy1tvvSULFizQ39Ghvr+jVWsZAAg7dQEqjEWkcOA/znkuXZBM1YvshbkPPE041IoUNR/jlVde0T/tTZo0Sf9cdNFF8vTTT+vRjBdeeEFs29ZfFtZZaxkAAOA/niYcU6dO1T89qaqq6pCgAACA4PHFpFEAABBuJBwAAMA4Eg4AAGAcCQcAADCOhAMAABhHwgEAAIwj4QAAAMaRcAAAAONIOAAAgHEkHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCAQAAjCPhAAAAxpFwAAAA40g4AMAQ27KkIZWR7fXN+lE976lssiktVdW1snN3ep9lndSbbVknTNUbRhyrPWL/eAQAuChtWVK+vFIqNta0bSstGSLTykZK1LZ9V9ZUbP0dx+pLjHAAgMvsbi4ySkVVjZSvqOzwCdcPZU3F1t9xrDoi4QAAlzW2pLtcZNpfbNR+P5V1wlS9YcSx6oiEAwBc1tCUynq/H8o6YareMOJYdUTCAQAuK4zHst7vh7JOmKo3jDhWHZFwAIDLCvKiemJgd9R2td9PZZ0wVW8Ycaw6IuEAAJdZtq1XIXS+2LSuTlD7/VTWVGz9HceqI8u2+1nE3UinM1Jbu8u1+mKxiBQXF0ld3S5JpTISFmGNK8yxEZe31CoENTFQ3atXw+fqE+3eLjJ7ymakqTkl8XxVNrKPsk7qza6sqdiC0l+9kU1spvrApGz7bNCgIolGsxu76F83kAAgh9RFpTAWkcKB+Xs29HCRUWUT8agMG5rY50neab3ZlnXCVL1hxLHag1sqAADAOBIOAABgHAkHAAAwjoQDAAAYR8IBAACMI+EAAADGkXAAAADjSDgAAIBxJBwAAMA4Eg4AAGAcCQcAADCOhAMAABhHwgEAAIwj4QAAAMaRcAAAAONIOAAAgHEkHAAAwDgSDgAAEP6EY8eOHXLXXXfJySefLKNGjZLJkyfL+vXr91p+06ZNcvXVV+uyEyZMkIULF0o6nc5pmwG4y7YsaUhlZHt9s35Uz3sqm2xKS1V1rezcnd5nWSf1ZlsW4eX1+8AO8fsw5nUDZsyYITU1NfLggw/K4MGD5ZlnnpHLL79cnnvuOTn88MM7lG1padH7hg8fLv/5n/8pf/vb32TWrFkSiUTkuuuu8ywGAL2XtiwpX14pFRtr2raVlgyRaWUjJWrbviuL8PL6fZAO+fvQ0xGO6upqWbt2rdxzzz0yZswYOeyww+TOO++UAw88UFavXt2l/EsvvSSfffaZPPDAA3LkkUfK6aefrhOWX/7yl9Lc3OxJDAB6z+7mBKtUVNVI+YrKDp/u/FAW4eX1+8DuB+9DT0c4iouLZcmSJTJixIi2bZZl6Z9kMtmlvLrVcswxx8j+++/ftu3444+X+vp6+eCDD+TYY4/tdVtiMfdyr2g00uExLMIaV5hj83tc6tZI5xNs+xNtY0tGEvGob8r29/4Kc1y9fR+4FVvSR+9DU33macKRSCTklFNO6TKKoUY+br/99i7lP//8czn44IM7bFOjIcqWLVt6nXBEIpYUFxeJ2xKJAgmjsMYV5tj8Gte26toe9zc1p2TY0IRvyvb3/gpzXH19H/Q1tm0+fB+63Weez+Fo7+2335aZM2fKmWeeKaeeemqX/U1NTTpJaW/AgAH6cffu3b1+3UzGlmSyQdyiMkLVSclko6TTGQmLsMYV5tj8Hlc8P7bP/XV1u3xTtr/3V5jj6u37wK3Y4j56HzqJS5XJdhTENwnHq6++KjfddJNefTJ//vxuy8Tj8S5zNVoTjcLCwj69firl/h+B6iQT9XotrHGFOTa/xlWQF9GT4tSQcWdqu9rf2m4/lO3v/RXmuPr6PuhrbAU+fB+63We+uKG2dOlSufbaa+W0006TRYsWtY1adKZup2zbtq3DttbnBx10UE7aCsA9lm3rGfjqhNpe68x8td9PZRFeXr8PrH7wPvR8hOPZZ5+VOXPmyJQpU/QSVzVhdG/Gjh0rK1eu1JNEBw4cqLetW7dOioqK5KijjsphqwG4RS33m142Uhpb0tLQlJLCeEwK8qLdnmC/LJvR97TVMLP65NdzWSf17rsswsvr90E05O9DT0c4PvnkE7n//vvljDPO0F/mtX37dv2dHOpn586d+vaJ+v/W2yhqGeyQIUPkhhtukA8//FDfhlHf33HZZZdJfn6+l6EA6AN1Qi2MReQrA/P1Y08nWLVPzdYvGTZIP+6rrJN6sy2L8PL6fWCF+H3o6QiHWpGivszrlVde0T/tTZo0Sf9cdNFF8vTTT8v48eP1rZaf//znMnv2bPm3f/s3vTz2/PPPl2nTpnkWAwAA2DfLtkOUPvVhUkxtrXuzf9V3eqhltmpGsV8nSPVGWOMKc2zEFSzEFTxhjS2WZVyDBhVlvUrFF5NGAQBAuJFwAAAA40g4AACAcSQcAADAOBIOAABgHAkHAAAwjoQDAAAYR8IBAACMI+EAAADGkXAAAADjSDgAAIBxJBwAAMA4Eg4AAGAcCQcAADCOhAMAABhHwgEAAIwj4QBghG1Z0pDKyPb6Zv2onrtVb7IpLVXVtbJzd7rHek22wUS9/R3HNdxiXjcAQPikLUvKl1dKxcaatm2lJUNkWtlIidp2Tur1QxuQPY5r+DHCAcBVdjcXDqWiqkbKV1T2+lOrk3r90AZkj+PaP5BwAHBVY0u6y4Wj/QVE7Tddrx/agOxxXPsHEg4ArmpoSvVpvxv1+qENyB7HtX8g4QDgqsJ4rE/73ajXD21A9jiu/QMJBwBXFeRF9WS/7qjtar/pev3QBmSP49o/kHAAcJVl23plQecLSOuKA7XfdL1+aAOyx3HtHyzbpifT6YzU1u5yrb5YLCLFxUVSV7dLUqmMhEVY4wpzbF7GpVYWqMl+6v67GhJXn1LduHDsqTcjTc0pieereiN7rddsG9yvt7+/D00dV5P6e58NGlQk0Wh2YxfcGANghLpQFMYiUjgwf88Gly4cqt5EPCrDhib2eTI02QYT9fZ3HNdw45YKAAAwjoQDAAAYR8IBAACMI+EAAADGkXAAAADjSDgAAIBxJBwAAMA4Eg4AAGAcCQcAADCOhAMAABhHwgEAAIwj4QAAAMaRcAAAAONIOAAAgHEkHAAAwDgSDgAAYBwJBwAAMI6EAwAA9K+EY/HixTJlypQey/z973+XG2+8UY4//ngZP368/PjHP5atW7fmrI0AsmNbljSkMrK9vlk/qudulDXVBq+ptiWb0lJVXSs7d6dDc7ycxGVKkN4HYRYTn1i2bJksXLhQxowZ02O5G264QVKplDz55JNi27bMnj1brrnmGvn1r3+ds7YC6FnasqR8eaVUbKxp21ZaMkSmlY2UqG33uqypNngtrMfLD33ghzbAJyMcanRi6tSpMn/+fBk+fHiPZZPJpLzxxhty5ZVXytFHHy1f+9rX5KqrrpJ3331XduzYkbM2A9g7u5sTvFJRVSPlKyo7fLp0UtZUG7wW1uPlhz7wQxvgoxGODRs2SF5enqxatUoee+wx2bx5817LxuNxKSoqkpUrV8q4ceP0tueff14OO+wwSSQSfWpHLOZe7hWNRjo8hkVY4wpzbF7EpYbPO5/g25/oG1sykohHHZd1Eldv6/VCLo6Xm23wsk6nctEGzh0BSjgmTpyof7KRn58vc+fOlbvuukvferEsSw488EBZunSpRCK9PyiRiCXFxUXitkSiQMIorHGFObZcxrWturbH/U3NKRk2NOG4rJO4+lpvLuXyeLnRBi/rdCqXbeDcEYCEwwk1Z+ODDz6Q0tJSueKKKySdTstDDz0k06ZNk1/96lcycODAXtWbydiSTDa41k6VEapOSiYbJZ3OSFiENa4wx+ZFXPH82D7319XtclzWSVy9rdcLuThebrbByzqdykUb+vu5I5EoyHoUJFAJx4svvqhHM373u9+1JReLFi2S0047TU8aveSSS3pddyrl/htFdZKJer0W1rjCHFsu4yrIi+hJeWrIujO1Xe1vbYuTsk7i6mu9uZTL4+VGG7ys06lctoFzx74F6qbT+vXr9XyN9iMZ+++/v95WXV3tadsA7GHZtl4BoE7o7bWuDFD7e1PWVBu8Ftbj5Yc+8EMbENARjoMPPlh+85vfyO7du2XAgAF6W0NDg2zatEnOPvtsr5sH4B/UcsPpZSOlsSUtDU0pKYzHpCAv2u0J3klZU23w2pdtzeh5BWqoX336DvrxchKXKUF6H4Sdr0c41ByNmpoaaWpq0s/PPffctu/i+PDDD/XPjBkzdPJRVlbmcWsBtKdO6IWxiHxlYL5+7OkE76SsqTZ4TbVNrZgoGTZIP4bleDmJy5QgvQ/CzNcJx5YtW2TChAmyZs0a/VytSHn22Wf15NGLL75YLr30Ur2kVm3bb7/9vG4uAAAIwi0VteS1vUMOOUSqqqo6bDviiCP0RFEAABAcvh7hAAAA4UDCAQAAjCPhAAAA/ks41JJUAAAAownHiSeeKHfffbdUVlY6/VUAANBPOU44LrvsMlm3bp2cd955ctZZZ8nPf/5z/V0ZAAAAriUc6h9Ke+mll2TZsmUyevRoWbx4sf63TK666iq9vaWlxWmVAAAg5Ho9aXTUqFEyZ84cWbt2rTz88MPS2NiovwFUfVHXvHnzZPPmze62FAAA9M9VKuqbQJ944gl55JFH5M0335Thw4frrxj/wx/+oG+3tH5DKAAA6N8cf9NofX29vnWycuVKeeuttyQej8s3v/lNPZFUjXoot956q1x99dVy//3368QDAAD0b7HerFJpbm6WY489Vu69916dUBQWFnYpN2LECHn//ffdaicAAOhPCccFF1wg3//+9+Xwww/vsZz6h9V+9KMf9aVtAACgvyYct9xyS1blioqKetMeAAAQQny1OQAAMI6EAwAAGEfCAQAA/DeHA0Aw2JYlyaa0bKuulYIBMYnHImLZdk5fv7ElLQ1NKSmMx6QgL+rK63sdF4DeIeEAQihtWVK+vFIqNn757xyVlgyRaWUjJZqDi7Op1/c6LgC9xy0VIGTsbi7KSkVVjZSvqNT7g/j6XscFoG9IOICQUbcxOl+U21+c1f4gvr7XcQHoGxIOIGTUnIm+7Pfr63sdF4C+IeEAQkZN0OzLfr++vtdxAegbEg4gZNRqEDWRsjtqu9ofxNf3Oi4AfUPCAYSMWiKqVm10vji3ruYwvYTU1Ot7HReAvmEMEgghtUR0etlIaWzJSFNzSuL56nswcvd9FV++vrvfw+F1XAB6j4QDCCl1EU7EozJsaELq6nZJKpXJ+esXxiJSODB/zwaXkgKv4wLQO9xSAQAAxpFwAAAA40g4AACAcSQcAADAOBIOAABgHAkHAAAwjoQDAAAYR8IBAACMI+EAAADGkXAAAADjSDgAAIBxJBwAAMA4Eg4AAGAcCQcAADCOhAMAABhHwgEAAIwj4QAAAMaRcAAAgP6VcCxevFimTJnSY5mWlhZZsGCBnHTSSXLcccfJhRdeKB988EHO2ggEhW1ZkmxKS1V1rezcndbP3aq3IZWR7fXN+tGtek0IUlv9gOMFk2LiE8uWLZOFCxfKmDFjeix3zz33yGuvvSZz586Vr371q/Lwww/LlVdeKS+++KLst99+OWsv4Gdpy5Ly5ZVSsbGmbVtpyRCZVjZSorbtu3pNCFJb/YDjhdCPcGzdulWmTp0q8+fPl+HDh/dY9tNPP5Xly5fLfffdp0c4jjjiCPnJT34i+fn58t577+WszYCf2d1cOJSKqhopX1HZ60+tpuo1IUht9QOOF/rFCMeGDRskLy9PVq1aJY899phs3rx5r2XXrl2rRzFOPvnktm2JREJ++9vf9rkdsZh7uVc0GunwGBZhjStssanbKJ0vHO0vII0tGUnEo76p10R/+amtQXgfmj5eYfr76i+xRQ3E5XnCMXHiRP2TjU8++UQOPfRQefnll2XJkiV6dORrX/ua3HbbbXq0o7ciEUuKi4vEbYlEgYRRWOMKS2zbqmt73N/UnJJhQxO+qddEf/mxrX5+H+bqeIXh76u/xZZwMS7PEw4n6uvrpbq6WsrLy+WWW27RoxuPP/64nH/++bJmzRoZPHhwr+rNZGxJJhtca6fKCFUnJZONkk5nJCzCGlfYYovnx/a5v65ul2/qNdFffmprEN6Hpo9XmP6++kts0SzjUmWyHQUJVMIRi8V00vHQQw+1jWio/z/llFPkueeekyuuuKLXdadS7r9RVCeZqNdrYY0rLLEV5EX0ZD81FN6Z2q729yZGU/Wa6C8/ttXP78NcHa8w/H31t9jSLsYVqJtOBx98sE462t8+icfj+jbLpk2bPG0b4BeWbeuVBepC0V7rigO130/1mhCktvoBxwu5EKgRjrFjx0oqlZJ3331XRowYobc1NTXp1Svf/va3vW4e4BtqGeP0spF6sp+6/66GxNWn1L5eOL6sNy0NTSkpjKt6o768IAWprX7A8YJpvh7hSKfTUlNTo5MKRX1Hxze+8Q259dZbZf369fLRRx/puRzRaFTOOeccr5sL+Iq6UKiVBSXDBulHty4cqp7CWES+MjBfP/r5ghSktvoBxwsm+Trh2LJli0yYMEFPCG3105/+VMaNGyfTp0+X73//+3pOx9NPPy2DBg3ytK0AAGDvLNsmhVWTYmpr3Zuxrr7TQy2zVbO6wzSJKKxxhTk24goW4gqesMYWyzKuQYOKsl6l4usRDgAAEA4kHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCAQAAjCPhAAAAxpFwAAAA40g4AACAcSQcAADAOBIOAABgHAkHAAAwjoQDAAAYR8IBAACMI+EAAADGkXAAAADjSDgAA2zLkoZURrbXN+tH9dyLNiSb0lJVXSs7d6d7bIOT9pqIzenrZxsXAP+Ied0AIGzSliXlyyulYmNN27bSkiEyrWykRG3bd20wVdbrtgLwF0Y4ABfZ3VwQlYqqGilfUZmTT+NO2mCqrNdtBeA/JByAixpb0l0uiO0vjGq/n9pgqqzXbQXgPyQcgIsamlJ92p/rNpgqmy2vXx9A7pBwAC4qjMf6tD/XbTBVNltevz6A3CHhAFxUkBfVkxi7o7ar/X5qg6myXrcVgP+QcAAusmxbr5jofGFsXUmh9vupDabKet1WAP5j2TZ/pel0Rmprd7lWXywWkeLiIqmr2yWpVEbCIqxxmYhNrZhQkxjVvAI11K8+fef6grinDRlpak5JPF+1IbLXNjhpr4nYnL9+dnEFTVj/xsIaV5hji2UZ16BBRRKNZjd2wU1PwAB1ASyMRaRwYP6eDR5cEFUbEvGoDBua2OdJw0l7TcTm9PWzjQuAf3BLBQAAGEfCAQAAjCPhAAAAxpFwAAAA40g4AACAcSQcAADAOBIOAABgHAkHAAAwjoQDAAAYR8IBAACMI+EAAADGkXAAAADjSDgAAIBxJBwAAMA4Eg4AAGAcCQcAADCOhAMAABhHwgEAAPpXwrF48WKZMmVK1uVXrVolJSUlsmnTJqPtQvDYliUNqYxsr2/Wj+p5GJiKy0m92ZYNax/4AccWQRQTn1i2bJksXLhQxowZk1X5zZs3y7333mu8XQietGVJ+fJKqdhY07attGSITCsbKVHblqAyFZeTerMtG9Y+8AOOLYLK8xGOrVu3ytSpU2X+/PkyfPjwrH4nk8nIzTffLMccc4zx9iFY7G5OxkpFVY2Ur6gM7CdBU3E5qTfbsmHtAz/g2CLIPB/h2LBhg+Tl5enbI4899pgeudiXRYsWSUtLi0yfPl3WrVvnSjtiMfdyr2g00uExLIIQV7Ip3eVk3P6k3NiSkUQ8GrjYTMXlpN5sy/a2rU74vb96y83+8pOw9leYY4saiMvzhGPixIn6J1uVlZXyxBNPyK9//Ws9OuKGSMSS4uIicVsiUSBh5Oe4tlXX9ri/qTklw4YmAhebqbic1Jtt2b621Qm/9ldfudFffhTW/gpzbAkX4/I84XCioaFBbrrpJv2jbr+4lXBkMrYkkw3iFpURqk5KJhslnc5IWAQhrnh+bJ/76+p2BS42U3E5qTfbsr1tqxN+76/ecrO//CSs/RXm2KJZxqXKZDsKEqiE4yc/+Ykcdthh8sMf/tD1ulMp998oqpNM1Os1P8dVkBfRE+jU8HJnarva31Pb/Rqbqbic1Jtt2b621Qm/9ldfudFffhTW/gpzbGkX4wrUTafly5fLn//8ZyktLdU/V155pd7+ne98R8/rACzb1rP11cm3vdZZ/Gp/EJmKy0m92ZYNax/4AccWQRaoEY6XX365w/N33nlHr1ZZsmSJHHnkkZ61C/6ilgZOLxspjS1paWhKSWE8JgV50cCfjE3F5aTebMuGtQ/8gGOLoPJ1wpFOp6W2tlb2228/icfjMmzYsA77P//8c/341a9+VQ444ACPWgk/UiffwlhECgfm79kQkpOxqbic1Jtt2bD2gR9wbBFEvr6lsmXLFpkwYYKsWbPG66YAAICwjHDMnTu3w/NDDjlEqqqq9lp+/PjxPe4HAAD+4OsRDgAAEA4kHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCAQAAjCPhAAAAxpFwAAAA40g4AACAcSQcAADAOBIOAABgHAkHAAAwjoQDAAAYR8IBAACMI+EAAADGkXAAAADjSDjgOtuypCGVke31zfpRPfcz1b5kU1qqqmtl5+70XtvrJC6/lM0mLqf1AkBvxHr1W8BepC1LypdXSsXGmrZtpSVDZFrZSInatgS1vU7iCnNZAOgtRjjgGrubC5dSUVUj5SsqffepOdv2OokrzGUBoC9IOOCaxpZ0lwtX+wuY2h/E9jqJK8xlAaAvSDjgmoamVJ/2+7W9TuIKc1kA6AsSDrimMB7r036/ttdJXGEuCwB9QcIB1xTkRfVkw+6o7Wp/ENvrJK4wlwWAviDhgGss29YrGzpfwFpXPKj9QWyvk7jCXBYA+sKybc4o6XRGamt3uVZfLBaR4uIiqavbJalURsIi27jUygY12VDd/1dD8upTsp8vXHvam5Gm5pTE81V7I92210lc/im777ic1usH/f1vLGjCGleYY4tlGdegQUUSjWY3dsENWrhOXagKYxEpHJi/Z4OPL1yt7U3EozJsaKLHPy4ncfmlbDZxOa0XAHqDWyoAAMA4Eg4AAGAcCQcAADCOhAMAABhHwgEAAIwj4QAAAMaRcAAAAONIOAAAgHEkHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCAQAAjCPhAAAAxpFwAAAA40g4AACAcSQcAACgfyUcixcvlilTpvRY5q9//atcddVVMn78eDnhhBPkuuuuk88++yxnbQQAAAFOOJYtWyYLFy7ssUxdXZ1ceumlEo/H5ZlnnpGf/exnUltbK1dccYXs3r07Z22F/9mWJQ2pjGyvb9aP6nlPZZNNaamqrpWdu9M9ljXx+n6oN2htABA8Ma8bsHXrVrn77rvlL3/5iwwfPrzHsq+++qo0NDTIAw88oJMO5T/+4z/k1FNPlbfffluPeABpy5Ly5ZVSsbGmbVtpyRCZVjZSorbd67ImXt8P9QatDQCCyfMRjg0bNkheXp6sWrVKjj322B7LqoSivLy8LdlQIpE9ISSTSeNthf/Z3VwQlYqqGilfUdnh07iTsiZe3w/1Bq0NAILL8xGOiRMn6p9sHHLIIfqnvSVLlugEZOzYsX1qRyzmXu4VjUY6PIZFEOJSt0Y6XxDbXxgbWzKSiEcdlzXx+rmo180+MxVbWN+LvUFcwRPW2KIG4vI84egLNY9j6dKlcscdd8igQYN6XU8kYklxcZGrbVMSiQIJIz/Hta26tsf9Tc0pGTY04bisidfPZb1u9Jmp2ML6XuwL4gqesMaWcDGuQCYctm3Lww8/LI8//rj86Ec/2ufKln3JZGxJJhtca5/KCFUnJZONkk5nJCyCEFc8P7bP/XV1uxyXNfH6uajXzT4zFVtY34u9QVzBE9bYolnGpcpkOwoSuISjpaVFZs6cKS+88IJ+vOSSS1ypN5Vy/42iOslEvV7zc1wFeRE9iVEN8Xemtqv9rW13UtbE6+eyXjf6zFRsYX0v9gVxBU9YY0u7GFfgbjrdcsst8t///d+yYMEC15INhIdl23rFhLoAtte6kkLt701ZE6/vh3qD1gYAweXrEY50Oq2/Z2O//fbTE0NXrFgha9as0UnHuHHjpKbmy09arWUAtTxzetlIaWxJS0NTSgrjMSnIi3Z7QfyybEbPQVC3BdQn9b5cPJ28vh/qDVobAASTr0c4tmzZIhMmTNBJhqJuoyjqezjU9vY/rWUARV0AC2MR+crAfP3Y0wVR7VOrK0qGDdKPblw8nby+H+oNWhsABI+vRjjmzp3b4blaAltVVdX2/IknnvCgVQAAINQjHAAAIBxIOAAAgHEkHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCAQAAjCPhAAAAxpFwAAAA40g4AACAcSQcAADAOBIOAABgHAkHAAAwjoQDAAAYR8IBAACMI+EAAADGkXAAAADjSDhcZluWJJvSUlVdKzt3p/VzuEMdy4ZURrbXN+vHno6tk7IAAPNiOXiNfiNtWVK+vFIqNta0bSstGSLTykZK1LY9bVt/Orb0AwD4DyMcLrG7ucgpFVU1Ur6ikk/YOTq29AMA+BMJh0saW9JdLnLtL3ZqP8wfW/oBAPyJhMMlDU2pPu2HO8eWfgAAfyLhcElhPNan/XDn2NIPAOBPJBwuKciL6omJ3VHb1X6YP7b0AwD4EwmHSyzb1qsgOl/sWldHqP0wf2zpBwDwJ8aXXaSWXE4vGymNLRlpak5JPD8mBXkRLnKuHtu0noehbo2o0Yrujq2TsgCA3CDhcJm6qCXiURk2NCF1dbsklcp43aRQHdvCWEQKB+bv2dBDAuGkLADAPG6pAAAA40g4AACAcSQcAADAOBIOAABgHAkHAAAwjoQDAAAYR8IBAACMI+EAAADGkXAAAADjSDgAAIBxJBwAAMA4Eg4AAGAcCQcAADCOhAMAABhHwgEAAIwj4QAAAMaRcAAAAONIOAAAQP9KOBYvXixTpkzpsUxdXZ3ceOONMnbsWBk3bpzMnj1bGhsbc9bGILAtSxpSGdle36wf1XM36kw2paWqulZ27k67UqeptpqKzQ9tBYCgiolPLFu2TBYuXChjxozpsdx1112nE4ynnnpKksmkzJo1SxoaGmTevHk5a6ufpS1LypdXSsXGmrZtpSVDZFrZSInatm/qNFmviTb4oa0AEGSej3Bs3bpVpk6dKvPnz5fhw4f3WLaiokLeeOMNnVwcc8wxcsIJJ8i9994rzz//vK6nv7O7uSgqFVU1Ur6islefyE3UabJeE23wQ1sBIOg8H+HYsGGD5OXlyapVq+Sxxx6TzZs377Xs+vXrZciQIXLEEUe0bVO3VSzLkrfeekvOOuusXrcjFnMv94pGIx0ec0XdFuh8UWx/cWxsyUgiHvW8TpP1mmiDH9oatPeiacQVLGGNK8yxRQ3E5XnCMXHiRP2TDTWKMXTo0A7b8vPz5YADDpAtW7b0ug2RiCXFxUXitkSiQHJpW3Vtj/ubmlMybGjC8zpN1muiDX5oa9Dei7lCXMES1rjCHFvCxbg8TzicUHM3VILR2YABA2T37t29rjeTsSWZbBC3qIxQdVIy2SjpdEZyJZ4f2+f+urpdntdpsl4TbfBDW4P2XjSNuIIlrHGFObZolnGpMtmOggQq4YjH49Lc3Nxlu0o2CgsL+1R3KuX+G0V1kol696YgL6InMqph/s7UdrXfaXtM1GmyXhNt8ENbg/ZezBXiCpawxhXm2NIuxhWom04HH3ywbNu2rcM2lYDs2LFDDjzwQOnvLNvWqybURbC91tUUar8f6jRZr4k2+KGtABB0gRrhUN+9oVazVFdXy7Bhw/Q2tWpFGT16tMet8we1RHN62UhpbElLQ1NKCuMxKciL9umi+GWdGT1fQd1CUJ/q+3qhNdFWU7H5oa0AEGS+HuFIp9NSU1MjTU1N+vmxxx4ro0aNkh//+MdSWVkp69atk7vuukvOPfdcOeigg7xurm+oi2BhLCJfGZivH924KKo61EqMkmGD9KNbF1oTbTUVmx/aCgBB5euEQ608mTBhgqxZs0Y/V8tfH330UTnkkEPk4osvlhtuuEFOPvlkueeee7xuKgAACMotlblz53Z4rhKLqqqqDtsGDx4sjzzySI5bBgAAQjvCAQAAwoGEAwAAGEfCAQAAjCPhAAAAxpFwAAAA40g4AACAcSQcAADAOBIOAABgHAkHAAAwjoQDAAAYR8IBAACMI+EAAADGWbbNv7GtDkEm4+5hiEYjkk5nJGzCGleYYyOuYCGu4AlrbNEs4opELP0vuWeDhAMAABjHLRUAAGAcCQcAADCOhAMAABhHwgEAAIwj4QAAAMaRcAAAAONIOAAAgHEkHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCAQAAjCPhAAAAxpFw9MLf//53ufnmm+X444+X0tJSueqqq+R///d/91q+rq5ObrzxRhk7dqyMGzdOZs+eLY2NjRL0uFatWiUlJSVdfjZt2iR+9cknn+jYVqxYEfj+chpXkPpr69at3bZ1b/EFpc+cxhWkPlu5cqWcddZZMmLECPn2t78tL7744l7L7t69W/fRCSecoN+3qu9qa2vFr5zE9tZbb3XbZ3/5y1/EL1Rbumuj+vnXf/1XY30Wc6n9/co111wjmUxGlixZIkVFRfLwww/LJZdcIi+//LIUFBR0KX/dddfpk99TTz0lyWRSZs2aJQ0NDTJv3jwJclxVVVX65P7ggw922D5o0CDxo5aWFrnpppv0se9JUPrLaVxB6q8PP/xQBgwYIK+++qpYltW2fb/99gt0nzmNKyh99vzzz+tjfvvtt8tJJ50kv/nNb2TGjBly8MEH64tTZ/fcc4+sX79efvrTn0p+fr7cfffdug+XLl0qfuM0NtVn//RP/yTPPvtsh+3777+/+IVq95/+9KcO2/7nf/5Hrr32Wpk2bVq3v+NKn9lwZMeOHfaMGTPsqqqqtm0ffPCBfeSRR9rvvPNOl/Jvv/223vfRRx+1bfvjH/9ol5SU2J9//rkd1LiUK664wp4zZ44dFAsWLLAvuugiHdPy5cu7LROU/nIaV9D6a8mSJfZ3v/vdrMoGqc+cxBWUPstkMvZpp51mz507t8P2yy67zF60aFGX8qpPjjrqKPu1115r2/bxxx/rPlR9GeTYlLvvvtueOnWqHSS7du3Scd52223d7nerz7il4pDKUhcsWCBHHnmkfq6GlNSnKpXt/vM//3OX8iojHDJkiBxxxBFt29QnFvXpRg29BTWu1ky+fVx+9uabb8p//dd/ydy5c3ssF5T+chpX0PrLSVuD1GdO+yAIfaZu523evFm++93vdtj+i1/8Qq6++uou5Vv7RN26bXXYYYfJQQcdpN/PQY4tKH3W2aJFi/QI4a233irdcavPSDj64M4779T3s9QQ23333SeFhYXd3rMdOnRoh21qOOqAAw6QLVu2SFDj+uKLL3Rs6mSv/hgnTJigh+LUH6jfqCH2W265Re64444ufRHk/nISV5D6S9m4caNOei+44AL5xje+IZMnT5Y//OEPge8zJ3EFpc9a26NuYV1++eX63PGDH/xAfvvb33ZbXsVUXFysby21d+CBB8rnn38uQY5N+etf/yoff/yxlJWVyYknniiXXnqpVFZWil+1fricOnWq/psx2WckHH1w8cUXy/Lly+U73/mOnv+wYcOGLmVU1qhOfp2pjlOTcIIal/qjUmzbln//93+XhQsX6njOP/982b59u/iJuveo7ll2/pTSnSD1l5O4gtRfqVRKn7DVBVfdU1Zzio477jg9ifn1118PbJ85jSsofVZfX68f1adjdc544okn9IVWJUdB7q/exKYS3J07d+oERX0QKC8vl6985Sty4YUXykcffSR+pOaaqDlE55133l7LuNVnTBrtg9ZbDWoU4J133tGTZ9SJob14PC7Nzc1dfld1UncjB0GJa8yYMfoPTmW9rZPfHn30UTn11FP1jHt1EvXL7HL1CXH16tVZlQ9KfzmNKyj9pcRiMT2LPhqN6v5Qvv71r+sLsBrKVp8yg9hnTuMKSp/l5eXpRzUCMGnSJP3/Rx99tLz//vvy5JNPOuqv7ianByk2NdKmbjGoOFp/V61sUeWfeeYZvcrDb9S55Nxzz217T3bHrT5jhKMXw0/qVoP6tNIqEonoi/S2bdu6lFdzIDpvVx23Y8cOPRwV1LhaZ8q3n2mv3niHHHKIHn7zCzVSo5b7qpO0Gg1onVWuZlhfccUVge0vp3EFpb9aqVVSnU+A//Iv/9JtW4PSZ07jCkqfqfv4Suv8r1bq3NHd8l3VX6pvOl/AVB+21hXU2JREItGWbLSeR9Wcjq0+6rP2q6Y+/fTTfY6SutVnJBwOqaFMtSSq/XCaWpaoMtjuJgqp7wVQ97iqq6vbtr3xxhv6cfTo0RLUuNRExfHjx3dYiqmGH//v//5vr5NMvTB//nxZs2aNzuJbfxS1nEuN4AS1v5zGFZT+UtQn/lGjRnX53oL33nuv27YGpc+cxhWUPjvmmGN0IqVGQzvPV1HLQztTfaKW37ef0KvmSqgLsupLP3Eam5qPo5J/dRFvpT7EqQv7P/uoz1qpUdLBgwfLUUcd1WM51/rMlTU1/YxaqnbmmWfab7zxhl5GqpaTjh071t68ebOdSqXsbdu22Y2NjW3Lqn74wx/akyZN0stLX3/99R6XHwUlrs8++8weM2aMfc0119gbN260Kysr7UsuucQ+/fTT7aamJtvP2i8fDXJ/OYkrSP2VTqft733ve/ZZZ51lv/nmm3q56/33329//etf1+/LoPaZ07iC1GePPfaYXVpaaq9evdqurq62y8vL9TLKdevW6f0qrvr6+rby6twyceJEvV/12bnnnmtfeOGFth85iW3nzp36vTd58mT73XfftT/88MO282hNTY3tNzNnztTvqe6Y6DMSjl5IJpN6rfWJJ55ojxw5Uq/JVicE5dNPP+3yfQjbt2+3r732Wvu4446zx48fr3/XbyeM3sT13nvv2Zdeeqk9evRoe9SoUTpGdZL0u/ZxBLm/nMYVpP5SJ2eVMKj34ogRI+zzzjtPX6SD3mdO4wpSnz3xxBP6gnTMMcfYZ599tv3KK6+07VNxPfLIIx2+92HWrFk6oVI/6mJWW1tr+5WT2FRSovpp3Lhx9rHHHqvPo+2/38hvHzJvuOGGbveZ6DNL/acvQzIAAAD7whwOAABgHAkHAAAwjoQDAAAYR8IBAACMI+EAAADGkXAAAADjSDgAAIBxJBwAAMA4Eg4AvqH+MSj174eof0yqu3+dUv2Lm+rfffj973/vSfsA9B4JBwDfUP+665w5c/Q/jvXQQw912Pfuu+/KvHnz5NJLL5VTTjnFszYC6B2+2hyA78ycOVOee+45eeqpp+T444+XZDIpkyZNkuLiYvnVr37V4Z//BhAMJBwAfGfXrl1yzjnn6H/ae/Xq1XLHHXfI2rVrdRJy6KGHet08AL1AwgHAlyoqKuSCCy6QkpISef/992XhwoXyrW99y+tmAegl5nAA8KXS0lK56KKLdLJx+umnk2wAAUfCAcCXGhsb9WoUy7Lk9ddfl08//dTrJgHoAxIOAL5077336iTj0UcflUwmIzfffLOk02mvmwWgl0g4APjOCy+8ICtWrJDrr79e30655ZZb9JyO8vJyr5sGoJeYNArAV/72t7/JueeeKyNGjJAnn3xSIpE9n4uuuuoq+dOf/iTLli3T8zsABAsJBwDfUN8uOnnyZNm0aZOsWrVKDjrooLZ9NTU1+htIBw4cKCtXrtSPAIKDWyoAfGPBggXy3nvv6fkb7ZMNZciQIfpbSNW8DvUIIFgY4QAAAMYxwgEAAIwj4QAAAMaRcAAAAONIOAAAgHEkHAAAwDgSDgAAYBwJBwAAMI6EAwAAGEfCAQAAjCPhAAAAxpFwAAAAMe3/Aag1Wtn1XLxDAAAAAElFTkSuQmCC",
"text/plain": [
"<Figure size 600x600 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"plt.figure(figsize=(6,6))\n",
"ax = sns.scatterplot(x='X', y='y', data=demo_data)\n",
"ax.set(xlabel='X', ylabel='y');"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Das Fallstudien Dataset: melb_data_prep.csv"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"<class 'pandas.core.frame.DataFrame'>\n",
"RangeIndex: 18393 entries, 0 to 18392\n",
"Data columns (total 24 columns):\n",
" # Column Non-Null Count Dtype \n",
"--- ------ -------------- ----- \n",
" 0 Rooms 18393 non-null int64 \n",
" 1 Type 18393 non-null int64 \n",
" 2 Price 18393 non-null float64\n",
" 3 Distance 18393 non-null float64\n",
" 4 Bathroom 18393 non-null float64\n",
" 5 Car 18393 non-null float64\n",
" 6 logLandsize 18393 non-null float64\n",
" 7 logBuildingArea 18393 non-null float64\n",
" 8 YearBuilt 18393 non-null float64\n",
" 9 CouncilArea 18393 non-null int64 \n",
" 10 Lattitude 18393 non-null float64\n",
" 11 Longtitude 18393 non-null float64\n",
" 12 Propertycount 18393 non-null float64\n",
" 13 Method_S 18393 non-null int64 \n",
" 14 Method_SP 18393 non-null int64 \n",
" 15 Method_VB 18393 non-null int64 \n",
" 16 Regionname_Northern_Metropolitan 18393 non-null int64 \n",
" 17 Regionname_South_Eastern_Metropolitan 18393 non-null int64 \n",
" 18 Regionname_Southern_Metropolitan 18393 non-null int64 \n",
" 19 Regionname_Victoria 18393 non-null int64 \n",
" 20 Regionname_Western_Metropolitan 18393 non-null int64 \n",
" 21 month 18393 non-null int64 \n",
" 22 year 18393 non-null int64 \n",
" 23 day_of_week 18393 non-null int64 \n",
"dtypes: float64(10), int64(14)\n",
"memory usage: 3.4 MB\n",
"None\n"
]
}
],
"source": [
"data = pd.read_csv('melb_data_prep.csv')\n",
"print(data.info())"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Vorbereiten der Daten"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"## read and prep data\n",
"from bfh_cas_pml import prep_data, prep_demo_data\n",
"X_train, X_test, y_train, y_test = prep_data(\n",
" 'melb_data_prep.csv', 'Price', seed = 1234)\n",
"\n",
"X_demo, y_demo = prep_demo_data('demo_data_regr.csv', 'y')"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "teaching",
"language": "python",
"name": "teaching"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.13.0"
},
"toc": {
"base_numbering": "3.1",
"nav_menu": {},
"number_sections": true,
"sideBar": true,
"skip_h1_title": false,
"title_cell": "3.1 Regression - Einführung",
"title_sidebar": "Contents",
"toc_cell": true,
"toc_position": {
"height": "calc(100% - 180px)",
"left": "10px",
"top": "150px",
"width": "206.2px"
},
"toc_section_display": true,
"toc_window_display": true
},
"toc-autonumbering": true,
"varInspector": {
"cols": {
"lenName": 16,
"lenType": 16,
"lenVar": 40
},
"kernels_config": {
"python": {
"delete_cmd_postfix": "",
"delete_cmd_prefix": "del ",
"library": "var_list.py",
"varRefreshCmd": "print(var_dic_list())"
},
"r": {
"delete_cmd_postfix": ") ",
"delete_cmd_prefix": "rm(",
"library": "var_list.r",
"varRefreshCmd": "cat(var_dic_list()) "
}
},
"position": {
"height": "321.85px",
"left": "787px",
"right": "20px",
"top": "115px",
"width": "350px"
},
"types_to_exclude": [
"module",
"function",
"builtin_function_or_method",
"instance",
"_Feature"
],
"window_display": false
}
},
"nbformat": 4,
"nbformat_minor": 4
}