From 5fb44475ff4ccd63c27e0fc298d11a48500a1794 Mon Sep 17 00:00:00 2001 From: Abhimanyu22 Date: Mon, 29 Oct 2018 09:49:50 +0000 Subject: [PATCH 1/6] Done --- __pycache__/__init__.cpython-36.pyc | Bin 164 -> 154 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 178 -> 168 bytes .../__pycache__/build.cpython-36.pyc | Bin 650 -> 657 bytes q01_load_data/build.py | 13 ++++++++++--- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 184 -> 174 bytes .../test_q01_load_data.cpython-36.pyc | Bin 3979 -> 3969 bytes 6 files changed, 10 insertions(+), 3 deletions(-) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index ebbd53a2d5f8e74c1825d49e211ea6c89bbb6b24..5e39e7483ff47586cf1ae23031b1c4c055038ce3 100644 GIT binary patch delta 53 zcmZ3&IE#_Pn3tF9{P}Cq6FJNk-Sso_b5r#llQJ@M6Z0xdjg0ie^NX^J3lfu4^^@~c JQYU6v0RY_C5{&== delta 63 zcmbQmxP+0zn3tD})qh^pL=JQ9K>dvT+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAXRq0+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX*AZXm z;W$fKcyc{XQZk*-y4~<1K}Ex0U5pBd{+KDTvs21XJ?Hkco&t#ICIPq zM{CT<--K$%5JL?Z%<(H3ld@B~rC0jKF&*O?&-fF1g@*KU0|=oZZhS42j@9f*G@(ou zyvSpv6D>ABwxriCkp?e$<4KY5I92yeJ%U~!JJyn}Mg0KmaN9QDV>T^v!IInQj9nDz zDi;f_*qs!Qi7s-MWZC{w7ITqmRe!-*f6IncV1Xcj2zsysGOG9R0Q~v{9~_6)kx`5G Z{6F-qY`oLF;HylWW2;pAjt8Mb=r1#TPT2qe diff --git a/q01_load_data/build.py b/q01_load_data/build.py index e4cd8e3..1b6f17d 100644 --- a/q01_load_data/build.py +++ b/q01_load_data/build.py @@ -1,10 +1,17 @@ -# Default imports import pandas as pd from sklearn.model_selection import train_test_split - path = 'data/house_prices_multivariate.csv' +def load_data(path, test_size=0.33, randomst=9): + df = pd.read_csv(path) + X = df.iloc[:,:-1] + y = df['SalePrice'] + X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=randomst, train_size=0.67) + + return df, X_train, X_test, y_train, y_test + + + -# Write your solution here diff --git a/q01_load_data/tests/__pycache__/__init__.cpython-36.pyc b/q01_load_data/tests/__pycache__/__init__.cpython-36.pyc index 133357e0803cc77a9fa179800aad36162ab7db97..2c6b4ce786ef4e7ed1db707d3f1c54addcbd52f0 100644 GIT binary patch delta 53 zcmdnNxQ>y-n3tD}@4~g{i5%vN(fS$rxvBb&Ng0{BiFuW!Mn?MK`9;~q1&PV2`pNkz IsS~sO0LI%A9RL6T delta 63 zcmZ3-xPy_yn3tD})qh^pL=JQ9RQ-(n+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX)_{M=N1$E1wR+{C=fQX?b%@cg3e;)2BFRQ=@q Kl+;a3-Mj$xD-y#1 delta 66 zcmZpa@0RB<=H=!3=|3-OBga`r?R@=={M=Oi#H5T&eV6>?(%jU%l4AYzqSVU7lKfo# V#GD+3f};Ga)Z~)l&EFWic>(+j7*YTL From 31103ab6b68338e7e9284dc832dacc654962d825 Mon Sep 17 00:00:00 2001 From: Abhimanyu22 Date: Mon, 29 Oct 2018 10:59:27 +0000 Subject: [PATCH 2/6] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 190 -> 180 bytes .../__pycache__/build.cpython-36.pyc | Bin 636 -> 679 bytes q02_Max_important_feature/build.py | 16 +++++++++++++--- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 196 -> 186 bytes ...st_q02max_important_feature.cpython-36.pyc | Bin 1735 -> 1725 bytes 5 files changed, 13 insertions(+), 3 deletions(-) diff --git a/q02_Max_important_feature/__pycache__/__init__.cpython-36.pyc b/q02_Max_important_feature/__pycache__/__init__.cpython-36.pyc index 93c9119e93bd10425c9a680002a7f8007ca6fad4..3ca4e50ad1b978aded6709d24c5eaf684e07705a 100644 GIT binary patch delta 53 zcmdnTxP_6!n3tF9{P}Cq6FJNk6ZJFlb5r#llQJ@M6Z0xdjg0ie^NX^J3lfu4^^@~c JQYU7G008SM67>K8 delta 63 zcmdnOxQ~&;n3tD})qh^pL=JQ9Z2gS<+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX5UuLzo}Hatqj(8kJwyf%3oAJUg7E`#^b$m9B}=>2sOx;uGYb($JdA%p z_D6*Lp&a^}fOz*Lg4TGl;k_z~dawFD%iro|YiTKdx&M3ohyefK-BaA}FskoN1cWJQ ze5*nSTtzA~r4@oz6tsAvbf|ke(tRCML?QKVQ4j3Eh9p~otp5Q?|AD>WAVJ?x3qun! zcl7P1yA&|?8P%Anff=+g!$uH(ga%vD;2O-B&#=W=a2+(z1U%ubYuQM476%U;021lt zv~bQxd1~C5t!gjH6{S}fIoV%{@)4QZOe$OJ<+|IbCyPxSY<04<@?x6(0r!EOo_>zb zi_DI8PtPwhlV8opX%SFE+%d&zj90c`f(uL7q9Gk=%f>T`rfi;r=T4{t-tvcRQ52H>aJ@1 zmvqOGK_2vs%FAtB-VvNyK0&uB;Ah|uvPAj8^RV+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX4n3tF9{P}Cq8#xX!D%R*{ Date: Wed, 31 Oct 2018 16:57:12 +0000 Subject: [PATCH 3/6] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 179 -> 169 bytes .../__pycache__/build.cpython-36.pyc | Bin 892 -> 931 bytes q03_polynomial/build.py | 18 ++++++++++++++---- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 185 -> 175 bytes .../test_q03_polynomial.cpython-36.pyc | Bin 1393 -> 1383 bytes 5 files changed, 14 insertions(+), 4 deletions(-) diff --git a/q03_polynomial/__pycache__/__init__.cpython-36.pyc b/q03_polynomial/__pycache__/__init__.cpython-36.pyc index aa42922819662c41fcd07685edf2a72bf7ac881e..478bd965fa60a3044b6563639b918970a263800a 100644 GIT binary patch delta 53 zcmdnYxRQ~>n3tF9{P}Cq6FJNk!}K%qb5r#llQJ@M6Z0xdjg0ie^NX^J3lfu4^^@~c JQYU740s!S363GAn delta 63 zcmZ3M~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX*v`wAmlf>F&Og4 zxT-0FAc88wX&Zq%7(uxikcB*KIa5*A;T=jO6Q1xzP&=;~@A4ks z;@f;jbVWZBoez}n%H5ja6*?k=-Ub_z)6Yw_n%ukm^Ww+dt4EsMX&yhAq&ca6f|aYEr|}SvXVQ1Pc&MkV~xV6BE`z$-=?* z-l_IcjfbOnrQ~y+Ch}we))R7~rR3c-Pt;7v@p&3o8;X^K$Oa-d@wk$PyGfz74RRIh ziL8ueX)fe@-I&!*1C3?tyh)AqUyY59)7<*=Ycg;xD~oqh^FYVBD6(S|KtWaUs4Ucc zoE1W2Rd2qSXuR1p hYOSdoa0_!bc!-u~N**`=RP7)HG@#w<2?r4Q{{fZ!nZf`7 literal 892 zcmZ`%OK;Oa5cc|!r&FQ|khmelC6~CUx2i&*qV`gi0++G^SsU**-FE%x>^dmOIfW~K zfjfW6S56WCfD^M$QhLFbKhMmrX6E~5_6LLB^N&C1Z`W~tIrp9b?N|8ea|G^iqMVda zLagm7H}$C3*q-v!fCi22t5({kZQ=;RgC+SC&<^d=9_`bR_j!kRzY#j%y${YPTwzvc zMCz`}8IL(L44vKcT+OpQl}sHAW=aqmql1*)h`5l2P%;x37@p#v!Fw^q3tHyc*Jn0C zbd{GHFM>>jj?+>ZIb$H15#vP9R+iAJi;y7I=4m0?=n;PU0Kp(l?sAX&Q~!yxa1B{_ z#x-8$@PN0zyT-4`k}TbYU-{QT7FTjI{(s5w?cR&{Zhgj0MX~h6g80gsKEu4|i2J9-)7S72!mPRAzJ=nom W-8sZer4lb~V-5KbY2)kd`hNjy-~ELE diff --git a/q03_polynomial/build.py b/q03_polynomial/build.py index 26d8971..ba09723 100644 --- a/q03_polynomial/build.py +++ b/q03_polynomial/build.py @@ -1,11 +1,21 @@ -# Default imports +import pandas as pd +import numpy as np from greyatomlib.advanced_linear_regression.q01_load_data.build import load_data from sklearn.preprocessing import PolynomialFeatures from sklearn.pipeline import make_pipeline from sklearn.linear_model import LinearRegression -# We have already loaded the data for you -data_set, X_train, X_test, y_train, y_test = load_data('data/house_prices_multivariate.csv') +data_set, X_train, X_test, y_train, y_test = load_data('data/house_prices_multivariate.csv', 0.33, 9) + +def polynomial(power = 5, randomst=9): + cols = data_set.corr().nlargest(5, 'SalePrice')['SalePrice'].index + poly_model = make_pipeline(PolynomialFeatures(degree=power, include_bias=False), LinearRegression()) + poly_model.fit(X_train[cols[1:]], y_train) + + return poly_model + +polynomial() + + -# Write your solution here diff --git a/q03_polynomial/tests/__pycache__/__init__.cpython-36.pyc b/q03_polynomial/tests/__pycache__/__init__.cpython-36.pyc index 6e2087691199f0bc7e5f879b594cb46948bbd2d5..d0d65732c969b967dca254e1682969270701fa7e 100644 GIT binary patch delta 53 zcmdnVxSo;2n3tF9{P}Cq6FJNkWArofb5r#llQJ@M6Z0xdjg0ie^NX^J3lfu4^^@~c JQYU8l0|4l065#*< delta 63 zcmZ3_xRa5?n3tD})qh^pL=JQ9H2sYH+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAXN_T7WacL3RhAkV>4)bRWfvDDCa3Br Y=clA@KE^1;#ClQb_D{XdPnmld0aa!hiU0rr delta 78 zcmaFP^^uFyn3tC;Gh$wp-bT(zjM|0z8Tq-X`iV&ynffmI$)&lec_qdA=|!oPi6!~D i`iVI?3I#>^S*gh-#hdpqN-?p{nmKc(<>uSWJ&XV Date: Wed, 31 Oct 2018 17:21:43 +0000 Subject: [PATCH 4/6] Done --- q04_ridge/__pycache__/__init__.cpython-36.pyc | Bin 174 -> 164 bytes q04_ridge/__pycache__/build.cpython-36.pyc | Bin 975 -> 907 bytes q04_ridge/build.py | 21 ++++++++++++++---- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 180 -> 170 bytes .../__pycache__/test_q04_ridge.cpython-36.pyc | Bin 2080 -> 2096 bytes 5 files changed, 17 insertions(+), 4 deletions(-) diff --git a/q04_ridge/__pycache__/__init__.cpython-36.pyc b/q04_ridge/__pycache__/__init__.cpython-36.pyc index 43421366bedf944488ce2a27f63ac34969d0db1a..dd2d3463d678850ad927ad219d33507e78eb9869 100644 GIT binary patch delta 53 zcmZ3-xP+0zn3tF9{P}Cq6FJNk1NAfVb5r#llQJ@M6Z0xdjg0ie^NX^J3lfu4^^@~c JQYU7)0081z614yT delta 63 zcmZ3&xQ>y-n3tD})qh^pL=JQ9X#I@*+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAXjCLDXlwN8MqN2+o33 zgq@f=UkIqw7Lnwi2j!0($~T&*facql-|k1;U;owaL}5G}G#dU+UmVFKY;nJ(gLr;{ z7pDvIKFtA&R6Gq=kc(|(!(PFnmjA(iwZI80NIZy=VS(c$pVW8S)M8;829l@32AXhH xP%^@UP?#c&SwAWa$vG1>Raf%gLRGa{%ka!WkFTg7m#WQ07AzMoF^SFLmUc&mD#A%kGM zQXFWqapm6Ma4opc)|L1NuB-~fFm>3;Kko!FN2yDFlv`_y8x@-I6-uCZpIBf^8 z`$Ey&Z3uVf!08uqMwFNPDo}PqHe>^5b_2PiLd~4s>0COU3+JG5dM9n{h8~mWR^qlC zl3Of(w%~Iytx@pBOeN5Hvue32N|{9MSGfP4)SLx}naZAGR)~(2b?3-;s8CO9b?(tr z38^}F-Jgkzo{=e0vcn z6*onxWI9K&&Qw*T*>ZWO#wr&xCEEk?;4V&d+emL|hy_E4AcPT&NRNP%_MD_+jP+wj z%T-aYaj1Fwle|3cT+B*d6?!5eIPM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAXN_T7WacL3RhAkV>4)bRWfvDDCa3Br z=clA@e#)55D9^&cz`zE?&OltO0VGNoQW%>VW0-3hYnf`9C+9LxW@G^(Vdh(m@sm|q z6(*ao2r}|b4hOQ*SojI*pTyEE#8Si!G`L6%M2Le3iOC~wiZ|b8%x08jW?*1o17c?&E>;5)B@8Ky&5SWjwT!h)lT(=|i!c{) z1BGv~7UdSF8bT Date: Wed, 31 Oct 2018 17:28:30 +0000 Subject: [PATCH 5/6] Done --- q05_lasso/__pycache__/__init__.cpython-36.pyc | Bin 174 -> 164 bytes q05_lasso/__pycache__/build.cpython-36.pyc | Bin 975 -> 905 bytes q05_lasso/build.py | 20 +++++++++++++++--- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 180 -> 170 bytes .../__pycache__/test_q05_lasso.cpython-36.pyc | Bin 2080 -> 2070 bytes 5 files changed, 17 insertions(+), 3 deletions(-) diff --git a/q05_lasso/__pycache__/__init__.cpython-36.pyc b/q05_lasso/__pycache__/__init__.cpython-36.pyc index 1005306dfd1495f17293e8f96d1fe442f494d410..628f92779d54bcba01bfa10f36bfc2234f3863be 100644 GIT binary patch delta 53 zcmZ3-xP+0zn3tF9{P}Cq6FJNk1NAfVb5r#llQJ@M6Z0xdjg0ie^NX^J3lfu4^^@~c JQYU7)0081z614yT delta 63 zcmZ3&xQ>y-n3tD})qh^pL=JQ9X#I@*+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAXJWOSY9* zE{xZy#gU7k%E+mF3Z3dHVRt?=}eh zI$S+@cm4HvIKqImS>Rg!Ex6jL4g74Q!eg_95p$!oN~0nR!p%o$ZUSmm#yz5ySPGY6 yq^pAup|NC~@jPuzB?Ol}UDxstLRYuhTky>3M7+}ft#q4*ZCD=mj1>YG@&5vCIC{_k delta 549 zcmYjMzi-qq7>%7czb-lMPJ#g;QBg#dg^03rs49kvi47!*g><-Qx4kG%g6*qxQYwb) z0s^E{Bt|9{{tZSJcCSo`|9}ZQt*ZKypFcmp_vG(=@GIDSoTl-&S6}gG*KvM3*A_DU z6SL);_2$kND&k^5(Fy>EMbuw`*9a###Y21pk7!Io8l3|?UVqp@eX;?MdlW&C*W?D!4 z2UEqQ(*CkPGhYOjMx_nK>1FCv2{NxV5?r!JIJsi2vnRK|JL0A>{yWG|YR+)C?eW|flpv0zK0YMzs_+-O8yu$hwG9(;IDOpI-4wzQ1{h9Chk7=aPIKr!h)!h9@J z^Qcj^;LTE4dG`~(Jkq`(6|K3Mh%t&oYQ~&Oro_M~#K=NoVQj(X_n*85w+yGlU0%~g T$@ZYRNgJMk&{Sf}op}EN=}e2> diff --git a/q05_lasso/build.py b/q05_lasso/build.py index fb30d50..d8a601c 100644 --- a/q05_lasso/build.py +++ b/q05_lasso/build.py @@ -1,14 +1,28 @@ -# Default imports from sklearn.linear_model import Lasso import pandas as pd import numpy as np from sklearn.metrics import mean_squared_error from greyatomlib.advanced_linear_regression.q01_load_data.build import load_data -np.random.seed(9) # We have already loaded the data for you data_set, X_train, X_test, y_train, y_test = load_data('data/house_prices_multivariate.csv') +np.random.seed(9) + +def lasso(al=0.01): + + lasso_model = Lasso(alpha=al, normalize=True, random_state=9) + lasso_model.fit(X_train, y_train) + + y_pred_train = lasso_model.predict(X_train) + y_pred_test = lasso_model.predict(X_test) + + rmse_train = mean_squared_error(y_train, y_pred_train)**0.5 + rmse_test = mean_squared_error(y_test, y_pred_test)**0.5 + + return rmse_train, rmse_test + +lasso(0.01) + -# Write your solution here diff --git a/q05_lasso/tests/__pycache__/__init__.cpython-36.pyc b/q05_lasso/tests/__pycache__/__init__.cpython-36.pyc index 88694349bfe01743507f538dd58873ee81a6ec3c..cb6cbc29436ca8230de2b6503a09c6d17c5c28ce 100644 GIT binary patch delta 53 zcmdnOxQda(n3tF9{P}Cq6FJNk!}T-rb5r#llQJ@M6Z0xdjg0ie^NX^J3lfu4^^@~c JQYU740RZKw63qYr delta 63 zcmZ3*xP_6!n3tD})qh^pL=JQ9ME#8X+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX Date: Wed, 31 Oct 2018 17:35:45 +0000 Subject: [PATCH 6/6] Done --- q05_lasso/__pycache__/build.cpython-36.pyc | Bin 905 -> 905 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 185 -> 175 bytes .../__pycache__/build.cpython-36.pyc | Bin 702 -> 726 bytes q06_cross_validation/build.py | 13 ++++++++++--- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 191 -> 181 bytes .../test_q06_cross_validation.cpython-36.pyc | Bin 2091 -> 2081 bytes 6 files changed, 10 insertions(+), 3 deletions(-) diff --git a/q05_lasso/__pycache__/build.cpython-36.pyc b/q05_lasso/__pycache__/build.cpython-36.pyc index 5910febe507b6b5f5a9424e558695b353f18d301..dc3169fb88251a00eea7dfaaed3f14c027edad88 100644 GIT binary patch delta 14 VcmeBV?__5+=H=xI+{oI(3;-7o0}B8E delta 14 VcmeBV?__5+=H=zm-N@R)3;-5e0_Ok# diff --git a/q06_cross_validation/__pycache__/__init__.cpython-36.pyc b/q06_cross_validation/__pycache__/__init__.cpython-36.pyc index fa7d8bff4b4367609876242346df0325d2410dff..ac1de307606719eae063c95b0eede4b8460c1f0c 100644 GIT binary patch delta 53 zcmdnVxSo;2n3tF9{P}Cq6FJNkWArofb5r#llQJ@M6Z0xdjg0ie^NX^J3lfu4^^@~c JQYU8l0|4l065#*< delta 63 zcmZ3_xRa5?n3tD})qh^pL=JQ9H2sYH+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX7&QbUW1i;01ufqCqzw30%_UMWUNp~MT4 zU2FcnjK)ol&-X&2*4R`RMajuL{)p8fg_^ADS?-9NGo TW)pD&c2j{x2tI_Q4^_x7>1xrc&e?Ke z)KWOzmZE76=SJ76a(4R+*L(ed6!-`X!0c|nVLnNW=%j9aY?YEelfsFyRn8>XyIB0*|7T&d&(4r_(Wr~?lFiWy$e@UdXuy5|i*H%{ diff --git a/q06_cross_validation/build.py b/q06_cross_validation/build.py index e39b93b..958f926 100644 --- a/q06_cross_validation/build.py +++ b/q06_cross_validation/build.py @@ -1,13 +1,20 @@ -# Default imports from sklearn.model_selection import cross_val_score import numpy as np from greyatomlib.advanced_linear_regression.q01_load_data.build import load_data -np.random.seed(9) # We have already loaded the data for you data_set, X_train, X_test, y_train, y_test = load_data('data/house_prices_multivariate.csv') +np.random.seed(9) + +def cross_validation(model, X, y): + + model.fit(X_train, y_train) + scores = cross_val_score(model, X, y, scoring='neg_mean_squared_error', cv=5) + neg_mse = scores.mean() + + return neg_mse + -# Write your solution here diff --git a/q06_cross_validation/tests/__pycache__/__init__.cpython-36.pyc b/q06_cross_validation/tests/__pycache__/__init__.cpython-36.pyc index ca3f5cd76d3a5d9abb66f9d0edaf0d9dac4ec0bc..b11cd3d1e257ad07a9690721a8db1f7725be8dd7 100644 GIT binary patch delta 53 zcmdnbxRsH^n3tF9{P}Cq6FJNklk_w4b5r#llQJ@M6Z0xdjg0ie^NX^J3lfu4^^@~c JQYU7G0s!l`68QiC delta 63 zcmdnWxSx^3n3tD})qh^pL=JQ99Q};^+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAXiwhEyQ}vVc MQ&KnkGu>eY02$5`oB#j- delta 66 zcmZ1|uv&n_n3tF9r~kaDjT|ye+O_%_`MIh3iAfom`Y!p&rManjCB^#bMX8mECHcAf Wi8(n61x5K;smUe9n_ZdiumS+$GZ$+B