{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# CS 307: Week 05" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Regularization" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import numpy as np\n", "import pandas as pd\n", "from sklearn.datasets import make_regression\n", "from sklearn.linear_model import LinearRegression\n", "from sklearn.linear_model import Lasso\n", "from sklearn.linear_model import Ridge\n", "from sklearn.preprocessing import StandardScaler" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "# simulate a regression dataset: 100 samples, 20 features, fixed seed for reproducibility\n", "X, y = make_regression(n_samples=100, n_features=20, noise=0.1, random_state=42)" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "array([[-0.92216532, 1.87679581, 0.75698862, 0.27996863, 0.72576662,\n", " 0.48100923, 1.35563786, -1.2446547 , 0.4134349 , 0.86960592,\n", " 0.65436566, -1.12548905, 2.44575198, 0.12922118, 0.22388402,\n", " 1.49604431, -0.7737892 , -0.05558467, 0.10939479, -1.77872025],\n", " [-0.08310557, -1.4575515 , -1.40631746, -0.1601328 , -0.79602586,\n", " 1.07600714, 0.76005596, -0.75215641, 0.08243975, -1.50472037,\n", " -1.87517247, 0.67134008, 0.21319663, -0.75196933, 0.02131165,\n", " 1.34045045, -0.30920908, 0.11502608, -0.31905394, 0.31917451]])" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# view the first two rows of X\n", "X[0:2]" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "array([ 108.81742028, -250.567936 , 1.86765761, 127.84318259,\n", " 34.15127975])" ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# view the first five values of y\n", "y[0:5]" ] }, { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | 0 | \n", "1 | \n", "2 | \n", "3 | \n", "4 | \n", "5 | \n", "6 | \n", "7 | \n", "8 | \n", "9 | \n", "10 | \n", "11 | \n", "12 | \n", "13 | \n", "14 | \n", "15 | \n", "16 | \n", "17 | \n", "18 | \n", "19 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "-0.922165 | \n", "1.876796 | \n", "0.756989 | \n", "0.279969 | \n", "0.725767 | \n", "0.481009 | \n", "1.355638 | \n", "-1.244655 | \n", "0.413435 | \n", "0.869606 | \n", "0.654366 | \n", "-1.125489 | \n", "2.445752 | \n", "0.129221 | \n", "0.223884 | \n", "1.496044 | \n", "-0.773789 | \n", "-0.055585 | \n", "0.109395 | \n", "-1.778720 | \n", "
1 | \n", "-0.083106 | \n", "-1.457551 | \n", "-1.406317 | \n", "-0.160133 | \n", "-0.796026 | \n", "1.076007 | \n", "0.760056 | \n", "-0.752156 | \n", "0.082440 | \n", "-1.504720 | \n", "-1.875172 | \n", "0.671340 | \n", "0.213197 | \n", "-0.751969 | \n", "0.021312 | \n", "1.340450 | \n", "-0.309209 | \n", "0.115026 | \n", "-0.319054 | \n", "0.319175 | \n", "
2 | \n", "0.810808 | \n", "-1.662492 | \n", "-0.134309 | \n", "-0.308034 | \n", "-0.209222 | \n", "-1.683438 | \n", "-1.748532 | \n", "1.126705 | \n", "1.304340 | \n", "0.793489 | \n", "-1.105705 | \n", "0.779661 | \n", "1.310309 | \n", "1.395684 | \n", "-0.805870 | \n", "-0.410814 | \n", "1.032546 | \n", "-0.214921 | \n", "-0.562168 | \n", "-1.090966 | \n", "
3 | \n", "0.536653 | \n", "-0.756795 | \n", "-1.046911 | \n", "0.455888 | \n", "0.268592 | \n", "1.528468 | \n", "0.718953 | \n", "1.501334 | \n", "0.996048 | \n", "1.185704 | \n", "1.328194 | \n", "2.165002 | \n", "-0.643518 | \n", "0.927840 | \n", "0.507836 | \n", "-0.250833 | \n", "-1.421811 | \n", "0.556230 | \n", "0.057013 | \n", "-0.322680 | \n", "
4 | \n", "1.532739 | \n", "-0.401220 | \n", "0.519347 | \n", "1.451144 | \n", "0.183342 | \n", "2.189803 | \n", "0.401712 | \n", "0.012592 | \n", "0.690144 | \n", "-0.108760 | \n", "0.024510 | \n", "0.959271 | \n", "2.153182 | \n", "-0.767348 | \n", "-0.808298 | \n", "-0.773010 | \n", "0.224092 | \n", "0.497998 | \n", "0.872321 | \n", "0.097676 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
95 | \n", "-0.114736 | \n", "-0.334501 | \n", "-0.792521 | \n", "2.122156 | \n", "-0.707669 | \n", "0.443819 | \n", "0.865755 | \n", "-0.653329 | \n", "-1.200296 | \n", "0.504987 | \n", "-1.260884 | \n", "1.032465 | \n", "-1.519370 | \n", "-0.484234 | \n", "0.774634 | \n", "0.404982 | \n", "-0.474945 | \n", "0.917862 | \n", "1.266911 | \n", "1.765454 | \n", "
96 | \n", "-0.599375 | \n", "0.622850 | \n", "-1.594428 | \n", "-1.534114 | \n", "0.115675 | \n", "1.179297 | \n", "0.046981 | \n", "-0.142379 | \n", "-0.450065 | \n", "0.005244 | \n", "0.711615 | \n", "1.277677 | \n", "0.332314 | \n", "-0.748487 | \n", "0.067518 | \n", "0.514439 | \n", "-1.067620 | \n", "-1.124642 | \n", "1.551152 | \n", "0.120296 | \n", "
97 | \n", "-0.152470 | \n", "-1.331233 | \n", "0.133541 | \n", "-0.006071 | \n", "-0.290275 | \n", "0.267392 | \n", "0.956702 | \n", "0.507991 | \n", "-0.785989 | \n", "0.708109 | \n", "0.388579 | \n", "0.838491 | \n", "0.081829 | \n", "-0.098890 | \n", "0.321698 | \n", "-2.152891 | \n", "-1.836205 | \n", "2.493000 | \n", "0.919076 | \n", "-1.103367 | \n", "
98 | \n", "-1.379618 | \n", "0.513085 | \n", "-0.971657 | \n", "1.188913 | \n", "-0.881875 | \n", "-0.163067 | \n", "0.862393 | \n", "0.516178 | \n", "0.953125 | \n", "-0.626717 | \n", "0.800410 | \n", "0.708304 | \n", "0.351448 | \n", "1.070150 | \n", "-0.744903 | \n", "0.431923 | \n", "0.725096 | \n", "0.754291 | \n", "-0.026521 | \n", "-0.641482 | \n", "
99 | \n", "-2.848543 | \n", "-1.119670 | \n", "0.771699 | \n", "0.076822 | \n", "-0.428115 | \n", "1.500760 | \n", "-1.739714 | \n", "1.160827 | \n", "-0.362441 | \n", "1.148766 | \n", "-0.046921 | \n", "-1.282992 | \n", "0.996267 | \n", "-0.493757 | \n", "0.850222 | \n", "0.346504 | \n", "-1.294681 | \n", "0.477041 | \n", "-1.556582 | \n", "-0.467701 | \n", "
100 rows × 20 columns
\n", "