From c99866c71cdf60bf890022cbed4888077b2c54de Mon Sep 17 00:00:00 2001 From: psicktrick Date: Thu, 29 Nov 2018 10:27:03 +0000 Subject: [PATCH 1/5] Done --- __pycache__/__init__.cpython-36.pyc | Bin 0 -> 154 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 172 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 970 bytes q01_missing_value/build.py | 16 ++++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 178 bytes .../test_q01_imputation.cpython-36.pyc | Bin 0 -> 2327 bytes 6 files changed, 16 insertions(+) create mode 100644 __pycache__/__init__.cpython-36.pyc create mode 100644 q01_missing_value/__pycache__/__init__.cpython-36.pyc create mode 100644 q01_missing_value/__pycache__/build.cpython-36.pyc create mode 100644 q01_missing_value/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q01_missing_value/tests/__pycache__/test_q01_imputation.cpython-36.pyc diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..1d37ed440c375005e9a3ab24ecc775170666e3df GIT binary patch literal 154 zcmXr!<>h)>{y&-l2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU+(%D`MIh31;v@k z*(F6lLO(peD7&~IF*#K~IX@*;KP@$}q_ikCJ~b~rGcPr@C^IiTzMv>SD>b=9KR!M) cFS8^*Uaz3?7Kcr4eoARhsvXFJVjyM!0FfgpC;$Ke literal 0 HcmV?d00001 diff --git a/q01_missing_value/__pycache__/__init__.cpython-36.pyc b/q01_missing_value/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..22b4ca393bd7a79c2cf65f162563a108471bd5de GIT binary patch literal 172 zcmXr!<>h)>{y&-l2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CUy=G5`MIh31;v@k z*(F6lLO(peD7&~IF*#K~IX@*;KP@$}q_ikCJ~b~rGcPr@C^IiTzMv>SD>b=9ztF%i sJ~y+t7$jDfm{XdnA0MBYmst`YuUAlci^C>2KczG$)edB3F%UBV0PnFd5C8xG literal 0 HcmV?d00001 diff --git a/q01_missing_value/__pycache__/build.cpython-36.pyc b/q01_missing_value/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..3f6043dd2fb5755622908dd960dec56e9824a9b8 GIT binary patch literal 970 zcmYjP&1w`u5bo~z-N`0M1RO-ksDNapqN9~HU&JB0VdjEu0+(bK6(J?=mf#2Jw zIe(`_%2RCN;8?aETu_1ZcQBt(h8bq$Dy&hBzn}@Qp5xbOjxTNGfFksXv^XPc=#sQ# z;==Xj$g28EFoGI?5?I^fHQVKYA1=C_uFE|i)V_CjKCE9y*uJ$LHwa5z7A%LT6FxVBZ=(Oj7)vyw)h)4b)nTUo{;s6=O)PVl7bTx z6+oK`!Nl13tcDTkm>4qHG?+q)u(XQ=02-aBfQvfL9=7mBaJO{=|66c#6s~H%`u_>Oso50ve5;z4J;dGC7Z3dqkJTtz~vdMGf=%(mM+%p}Ia0}!$Ip6N~Jc0*9CnBqExYWo0 E0D+$ds{jB1 literal 0 HcmV?d00001 diff --git a/q01_missing_value/build.py b/q01_missing_value/build.py index 7dc4d18..a6ea383 100644 --- a/q01_missing_value/build.py +++ b/q01_missing_value/build.py @@ -1,3 +1,4 @@ +# %load q01_missing_value/build.py # Default imports import pandas as pd @@ -8,3 +9,18 @@ # Write your code here: +def imputation(df): + num_features = [a for a in range(len(df.dtypes)) if df.dtypes[a] in ['int64', 'float64']] + num_data = df.iloc[:,num_features] + num_data.fillna(num_data.mean(), inplace = True) + + cat_features = df.columns.difference(df.columns[num_features]) + cat_data = df.loc[:,cat_features] + for column in list(cat_features): + cat_data[column].fillna(cat_data[column].mode()[0], inplace=True) + + return num_data, cat_data +x,y = imputation(housing_data) +y.isnull().sum() + + diff --git a/q01_missing_value/tests/__pycache__/__init__.cpython-36.pyc b/q01_missing_value/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..7164506e725de1b87b9e8f4647e714da7353b08f GIT binary patch literal 178 zcmYL?JqiLb5QVc~A;KQS#!+lVJi#^=78XOuj%(b_kC{aANM6a-&Lh}pQiu<}kH>4? zvaTnu>t`==o<+Y@xok2#%4)?{OsnQDLYe=1BOIL}@T^rILl*2@=-Ep}pj=CEAQ@92 xB-?3A6twNo2X`VB;XGfU(adGL$RQC#;>dugt&WH@e|wBq#Our+69XU_b5-+brHr~Q8T`;UKq|7(ko-^khz zzR5i(nuFnl(}GNCLMgVL!bx22aFyKW z^_qsDXwbyZUtuMuc^x+g5PfVPE z&Of}!<<4a@E)a|}Yl3e^28OhQ_Q)aTG zXk4>;(Ia+O3@g0b*ij)=s*45*Z4834H(x#c`C57tMjOZ!AbGbTCH z(U;)$P_e0adM7$9E0CW!_l28}wsqXL*BZGU=mV(@lbNtCT)uT?+SA1^#+>j zXx>C~0}VpG8Y_G6fa}#+*;}%LnQ0j~AHj!#2Vjd#=mIj+#9fd&M|luJkeim_bDoPH z&ZEccI>}0DAT{e~$cE>E6#F$i+sd_sL~dJ6d|8*t)Ag`P!e%8*9WZn#7{h z)#ZMGsOyXYTA1IyObM4w`}gQk4_8O8-UfGtSESxWvz9KB?h5zrm4WYV!!rLI_}(z? z*dR?MgkPH4Fioc=uL^AU(iESEW<+h^DX*cqiDnDUduTAVuAQg<{X@Uru?e(L3EdQ?{U nz$Cr%1}cFy;e-2Mb}$>XgH+q2JtuTFY2f??0r6Gn literal 0 HcmV?d00001 From 5f2d3bf613c20fe313b8ccd34b75eb84a8dbc535 Mon Sep 17 00:00:00 2001 From: psicktrick Date: Fri, 30 Nov 2018 03:53:18 +0000 Subject: [PATCH 2/5] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 174 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 641 bytes q02_outlier_removal/build.py | 24 ++++++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 180 bytes .../test_q02_outlier_removal.cpython-36.pyc | Bin 0 -> 1790 bytes 5 files changed, 24 insertions(+) create mode 100644 q02_outlier_removal/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_outlier_removal/__pycache__/build.cpython-36.pyc create mode 100644 q02_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_outlier_removal/tests/__pycache__/test_q02_outlier_removal.cpython-36.pyc diff --git a/q02_outlier_removal/__pycache__/__init__.cpython-36.pyc b/q02_outlier_removal/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..71d6440cb8c16fa2d0628b3e2b3f2d7205c4f63d GIT binary patch literal 174 zcmYL?F$w}P5Jj_KA;KQS#u05rJb{gc#TLVojBDK8Oq?W&NAgOx;w5Y}TZkXtnEE}KjkWf`?o(_(v9GR%LyD>!mb;Dgm|lq}e@w87V!K(iq@P#u#H vl54CZ66+fD!Y9%Z&hrIwik&4vp`I^w2Z+|$h&c1N$9UDVNgb_+(~wbLT%|Df literal 0 HcmV?d00001 diff --git a/q02_outlier_removal/__pycache__/build.cpython-36.pyc b/q02_outlier_removal/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..07437c2de5ddc9d5858691115132e66453bdc846 GIT binary patch literal 641 zcmZ8fO>fgc5Z(1h;#f^v$|<)VxL87U1&C9{hd}BjR7gP-Ss-iiOdKbU*V$c1O_fMU z;mQx;%)i+yCocQ|PK=`B zj(qBXv*n44F1X-<4;|>{{(vPO1kn4+5+C@8Md2^%Vpq3^AdHBO5=C{E>7@rfN zFBJ;gyHvwsxeJ4#G^2^A(T0~oi5%apDDI6!iEmYrVa8iJGLO7f_KI8&3D#^%+Q7*j zaKG^lU-KykZ_78%%|qj?`If(CpH4R})sfTZ4%pghapn!!w5?=|2iKG#)&7<3j!P-b z(C`q@G@>#^iPkF%ZL9}M)-40zP2^bz z#>sKj%#n_gj!~FKp-zteHKj{YHpJ51r@k|Fk52aILp+gljB8zFGefPj_*$x&u0@7% zCIRDpeTr3HR7mVqp4LiENm;x&f0W9`lm)6(;at)l@#m%};jCWSqyI7o?QMnxj34um zAM#VK?$avj*iJ1f5ZXF5*np-6>28eGDxJti(~kCFAEfQ5cWpcQci@DmY;ZA`(3JR$ O9vai_3 quantile_values[feature]].index) +# return df + +def outlier_removal(df): + numeric_features = df.select_dtypes(include = ['float64', 'int64']) + quantile_values = numeric_features.quantile(0.95) + for feature in list(numeric_features): + df = df[df[feature]<=quantile_values[feature]] + return df + +len(outlier_removal(housing_data)) + + + + + + + + diff --git a/q02_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc b/q02_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..a07400ff6b4b2cb1e1f019e87a86bc5b67b0df6c GIT binary patch literal 180 zcmYL?F$w}P5Jj_KA;KQS#u05rJb{gcg~brEqsHCM#L2AUk-U-k?}vZC{rA^DJ;wfG8&?bc zCwOa#Ml#8BHs>+t+amlyYIZlL-H~vqYEq3k_Zk)m! zD;jP^X8Fal-w=WU86l5q4u#Rtj@*q7vQsF~8+yveIEAasY*%Ov$~-%%L~h+2ilJjY z4f(`+MDq`(dKmW4$>^w@!)T$i^w=Pq3p@Wh`@fm04&b*l~xoMFU zH-zSlmoF~?;4X^{?wM#(sz?C}plE1BnT}pBL?MNazQd^Rm6*fp-RP{WP?T^HiyDb` z^ssI3G$MSipBLJQA_d!ho0%ij46VO)7SeiYslfUZ8Yu3p$Fv^JKjaO_YYYc9LplrU zv@L8 zQXtzTv0;+TOIhXQ_mYH8hUSYJ;F#(TnNP@kM&^=v?U8sDK_*da>LK8PkH1#^cG$N; zRb+;WR#ao$YGk7B;~(q4sj^%)CsR8s=rA|+rilYQyJb=z=EYfp($J`$xOd?sv|=@^ edX}4tvccC)SKrXInp)}M?& Date: Fri, 30 Nov 2018 04:03:12 +0000 Subject: [PATCH 3/5] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 171 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 532 bytes q03_skewness_log/build.py | 10 ++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 177 bytes .../test_q03_skewness_log.cpython-36.pyc | Bin 0 -> 2202 bytes 5 files changed, 10 insertions(+) create mode 100644 q03_skewness_log/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_skewness_log/__pycache__/build.cpython-36.pyc create mode 100644 q03_skewness_log/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_skewness_log/tests/__pycache__/test_q03_skewness_log.cpython-36.pyc diff --git a/q03_skewness_log/__pycache__/__init__.cpython-36.pyc b/q03_skewness_log/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..72c9f354d7ac11adbb3d6e9507ea23d6aaf16cf8 GIT binary patch literal 171 zcmXr!<>h)>{y&-l2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CUlIBl`MIh31;v@k z*(F6lLO(peD7&~IF*#K~IX@*;KP@$}q_ikCJ~b~rGcPr@C^IiTzMv>SD>b=9ztF%q tzBoIzJTJAlI6fyoT|YiPGcU6wK3=b&@)n0pZhlH>PO2Tq#$q65006wjFRuUq literal 0 HcmV?d00001 diff --git a/q03_skewness_log/__pycache__/build.cpython-36.pyc b/q03_skewness_log/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..bdafbdbb03f34047e91628182c4e0cd883e02fc4 GIT binary patch literal 532 zcmYjN%}N6?5Kgk&?Y6cay!i;dbp5$W5k;o}7dV4a}E(nHj$M=D6E!e|?gNH6`SmY#oO0GYox#Ac&wPnbMR}_huza1Am8U z1A=iRf;CN>A{32xlE%;+x7GwJ*)8csKiE%t)P{Njufw-p!3|H0;ziZZ^*l#ie*#1o z7Z~~y!H_XsqV7If`+GnP`{ygV$+AtBZL*%P*pe>UlT#0dY3oW|7xQxkJZ;_b5^hwH zLocwbk~S#ok#bIvhidLPZf`b5ha$t3ss>WuZ^LK&^FFqq>8l6RTFgo~ Qb?&`(hsHE!?J$o10M_4vKmY&$ literal 0 HcmV?d00001 diff --git a/q03_skewness_log/build.py b/q03_skewness_log/build.py index f008d0f..3493378 100644 --- a/q03_skewness_log/build.py +++ b/q03_skewness_log/build.py @@ -1,3 +1,4 @@ +# %load q03_skewness_log/build.py from scipy.stats import skew import pandas as pd import numpy as np @@ -6,3 +7,12 @@ # Write code here: +def skewness_log(data): + data['GrLivArea'] = np.log(data['GrLivArea']) + sv1 = skew(data['GrLivArea']) + data['SalePrice'] = np.log(data['SalePrice']) + sv2 = skew(data['SalePrice']) + return sv1, sv2 +data.head() + + diff --git a/q03_skewness_log/tests/__pycache__/__init__.cpython-36.pyc b/q03_skewness_log/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..0b7c3b4ee94dab5bd18ab3eb0c5638076ad031f9 GIT binary patch literal 177 zcmYL?F$%&!6ht>*Awmvf;}_D3cmf*>3&Bs=jB!n}yYAl*Jd#(k6)$0@L>$Nf9oEWLAd#1aptG@cG=4P+g{`JY9U;XYA z@(WpcJXqg>p}znjh@csn(3nzOJDC%^!WCZTP5jum-~6mGX~s=Tq`Mc0#+=42>C4uf ze(l8VxU)?}Qv^?m2qc}maaTAyBx)_dHi>8zd@i-Q$F&?Rocc>wkL8nGYR$4@1Si%; z(hSQi<7%X*GMTLjZg}4)p5|ML-cQib@q;Grz|glqND@;)Vnja*>jA0NCn*_ zbGQ|NT6rHj8)WVxWMJPLC^WY~F?;*|w-A|;B7`8ziOh`-uZU~mcDgTfSVf+KBoT#~ zsXAP1sm%SyCC@51lX>J+o|f6L@(`k*i0ZmF(=^*7Ts-!2MGi41MW}D7A~BceXxX6$RRH?6Yle@lsXhem=`9T zaFgtYBMa{76OnrYw89iej%vfCFcOPvEqd@;ZT{W;BWssnyN;Ve+*dCU_mScf5)~C+YrOB{{R&8*pA@Xaulv=N;7?d5J$xopw zWeo~u_ys{ZW8oAi*eon_(5IR?!ozkn_m0|+KNzhyo_+Vy4~MrGSYorQpRH0w6i_WE zr6P~pldYp;&F9c~F4cs&n@tK`w6jE=ZIH^dx!d|7Y;INTt{1nij5%_@z(zQEL zuL{aMHJBcSnTQ)xo(rxkXDTZHn=;Kr{qt$2IsSx=ZIf{TRV^6&gyVL8z;=sLLnpBW duy9%1=ebh_x9Z3~#LKKtUFZf~+I8A6{sP~!N&x@> literal 0 HcmV?d00001 From 08bfc0b5743f9f687172bb8e43d07be08ddbdbea Mon Sep 17 00:00:00 2001 From: psicktrick Date: Fri, 30 Nov 2018 04:15:11 +0000 Subject: [PATCH 4/5] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 172 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 552 bytes q03_skewness_sqrt/build.py | 9 +++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 178 bytes .../test-q03_skewness_sqrt.cpython-36.pyc | Bin 0 -> 2073 bytes 5 files changed, 9 insertions(+) create mode 100644 q03_skewness_sqrt/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_skewness_sqrt/__pycache__/build.cpython-36.pyc create mode 100644 q03_skewness_sqrt/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_skewness_sqrt/tests/__pycache__/test-q03_skewness_sqrt.cpython-36.pyc diff --git a/q03_skewness_sqrt/__pycache__/__init__.cpython-36.pyc b/q03_skewness_sqrt/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..58a3e4ab9113a386e67b8c4156dd5bccd4a82b3f GIT binary patch literal 172 zcmXr!<>h)>{y&-l2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CUy=G5`MIh31;v@k z*(F6lLO(peD7&~IF*#K~IX@*;KP@$}q_ikCJ~b~rGcPr@C^IiTzMv>SD>b=9ztF%q uzBoIzJTJAlIKH^Bs6;TZlX-=vg$jV|MW&i;7IWRZ? literal 0 HcmV?d00001 diff --git a/q03_skewness_sqrt/__pycache__/build.cpython-36.pyc b/q03_skewness_sqrt/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..881f52e7ca5cc31ab7451536762204c59ea51d01 GIT binary patch literal 552 zcmY*V%}N6?5Kgk&y8ZLuP4ESJ>1ul|q9}NgA`}#Yu*6NO+itUIlC4zgN#DXJ@DY5K zTs`>;o}4VD)WCc*nJ<%XW(J*3^XLoRe_({Z(as?dpMjY^07o3>XpSkyJ|;P#LFGeQ z6T!63gEvg~c*tw-h(?@@QMdjBb*PJ7XlCMh^s>*HWwF&PlfBd|Q_!nU0O;)k%v=Ik zG{tMsJ4A2ZlOeLidw+k$8#dUm;f4(>maOrbOuTw+L>pK7I$NG=!DxFMju)CX#w-^% zI!gs@Z$luufg@5uzYA@(AKxeVga&4L;-UYEbRE*axA9Xk7qK!~Ie4fC*T~n@-r=m2_OZ81P a$`0&R&xiAZm$^9g#m1|(afBn%4F3R=7mZE; literal 0 HcmV?d00001 diff --git a/q03_skewness_sqrt/build.py b/q03_skewness_sqrt/build.py index 4bdb0e4..ab6e904 100644 --- a/q03_skewness_sqrt/build.py +++ b/q03_skewness_sqrt/build.py @@ -1,3 +1,4 @@ +# %load q03_skewness_sqrt/build.py # Default imports from scipy.stats import skew import pandas as pd @@ -7,4 +8,12 @@ # Write your Solution Here: +def skewness_sqrt(df): + df['GrLivAreaSqr'] = np.sqrt(df['GrLivArea']) + sv1 = skew(df['GrLivAreaSqr']) + df['SalePriceSqr'] = np.sqrt(df['SalePrice']) + sv2 = skew(df['SalePriceSqr']) + return sv1, sv2 + + diff --git a/q03_skewness_sqrt/tests/__pycache__/__init__.cpython-36.pyc b/q03_skewness_sqrt/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..2d7f9b53b38444049cedef0e45ebb35d9c90c5b7 GIT binary patch literal 178 zcmYL?F$%&!5Jfj&Awmvf;|OU*Jb_IL3yUFa#<<4pZe}I~kK~nX#Y@=erVu~8$LBY{ z$n(W({2WcnbJ8zaD!YWtl4?_$WwyT?p60*a2 literal 0 HcmV?d00001 diff --git a/q03_skewness_sqrt/tests/__pycache__/test-q03_skewness_sqrt.cpython-36.pyc b/q03_skewness_sqrt/tests/__pycache__/test-q03_skewness_sqrt.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..dab91ec2bf72bb6c73958c8f2984c9c643201793 GIT binary patch literal 2073 zcmc&#-EJF26rR~1d*j$q!cR-8s;rO#S`=bvu0R!ORZ3I|SrtJ=T9CGb=h)d~f1H`w zlvw4;eHp|n@FaV|1&9mZ@BrMDb9PO!9=KJmj3_R$_&=w55|csT;c0J2z>h&9KQC*hijhOnA5gF04%W zk5R69NAG-ZqLU#bd z6bd59hH(a<;%pd=RDOg&x+kCRMoS0LHOPjp>?ao%cSdLBb=t7(6A>K3q6s&%Jw6UD zkh=26P zF}%DZu+Q06bk2dLT6j~dWGJE9bZ}PQxCH+!+*`O_r_M3;?bk|u<~q-wF-<*xWALPncfJdFx4EVA3pM0I`X(O^el(57}8_$@y=@zGTP_j-a&H(N)AKU3bDe$sIRb_-dXQS50y(G Date: Fri, 30 Nov 2018 04:27:49 +0000 Subject: [PATCH 5/5] Done --- q04_encoding/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 167 bytes q04_encoding/__pycache__/build.cpython-36.pyc | Bin 0 -> 764 bytes q04_encoding/build.py | 10 ++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 173 bytes .../__pycache__/test_q04_encoding.cpython-36.pyc | Bin 0 -> 1731 bytes 5 files changed, 10 insertions(+) create mode 100644 q04_encoding/__pycache__/__init__.cpython-36.pyc create mode 100644 q04_encoding/__pycache__/build.cpython-36.pyc create mode 100644 q04_encoding/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q04_encoding/tests/__pycache__/test_q04_encoding.cpython-36.pyc diff --git a/q04_encoding/__pycache__/__init__.cpython-36.pyc b/q04_encoding/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..3aef6126d9207f95f6038ec3e49651fc11198ecf GIT binary patch literal 167 zcmXr!<>h)>{y&-l2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CUm^M#`MIh31;v@k z*(F6lLO(peD7&~IF*#K~IX@*;KP@$}q_ikCJ~b~rGcPr@C^IiTzMv>SD>b=9ztF%0 lC=OHx6x5H8&&lE61@;mbnqw#}rR0)^mV_2ez$n(N<6T*DB{_7<=Cr-$ zLHZ7T5?y=BEA-Tn+du>}ni-SVd^Al3 z6%FusB9sK>9g4j`<;a>WsGx$?OhmVILvN^K8*;r4LyDtDRkBBVp_5|gzV~uqZo**i zLcf?9^KXqkpD{B*Kh$-SS1`+bEF0_m)Ph9FQaGe*4L%Vmrt`*?I51`B+O(c^!l#v1 z*oNP(0dxDdZNU0i7~Rbx&&0fVRB73_%AV_gbN5WbPhy@T-k(qTm2M&LY*Q^A&T^T5 z(Pn8o>?03vl+S^?-arYeZWMrNR9$vP2d??omxma~Gz{jKeIvy|xANJ2Xd8cE12sY) z)0FPf7j&1J=jbEFwBt%}Yj)8sp4g=XZqz|%0KqG;79j`5KEq`Y<**%URbJ^neDah3 kMj19}z#RBIP|pz9XGg6Ty@c0cGwc{uMkj1c_u?%33x%oGE&u=k literal 0 HcmV?d00001 diff --git a/q04_encoding/build.py b/q04_encoding/build.py index a52c57f..836af89 100644 --- a/q04_encoding/build.py +++ b/q04_encoding/build.py @@ -1,3 +1,4 @@ +# %load q04_encoding/build.py # Default imports import pandas as pd from sklearn.preprocessing import LabelEncoder @@ -7,4 +8,13 @@ # Write your code here: +def encoding(df): + columnsToEncode = list(df.select_dtypes(include=['category','object'])) + le = LabelEncoder() + df['LotShape_Label'] = le.fit_transform(df['LotShape']) + df=pd.concat([df, pd.get_dummies(df['GarageType'])], axis=1); + df.drop('GarageType', axis=1, inplace = True) + return df + +housing_data diff --git a/q04_encoding/tests/__pycache__/__init__.cpython-36.pyc b/q04_encoding/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..2ea428ef28dd6f04f5358150e858f2149639b9ef GIT binary patch literal 173 zcmXr!<>h)>{y&-l2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CUs3uQ`MIh31;v@k z*(F6lLO(peD7&~IF*#K~IX@*;KP@$}q_ikCJ~b~rGcPr@C^IiTzMv>SD>b=9ztF%0 rC=OHx6x1(CEiNh6kB`sH%PfhH*DI*J#bJ}1pHiBWY6r5j7>F4F97Zrl literal 0 HcmV?d00001 diff --git a/q04_encoding/tests/__pycache__/test_q04_encoding.cpython-36.pyc b/q04_encoding/tests/__pycache__/test_q04_encoding.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..4e8e498c39b42e30e1b3bc649db6ea0592e444e3 GIT binary patch literal 1731 zcmaJ>&yU+g6rS;q#PKFkyOf0$sI@>nSXyl=;DUruQCU`%NPI)X0t8Dk)K~?-n@C=_r95r2ZQjhpa1#s509}w+1ArR z{~^9wqLEDUg3WotIr&cEB(8L&S9o(j@$HyjbmrZp%Ne+{Kz3F<=|N9+WgvSplsi*@ zpCuvq5aP_vF_V2cc**1d_{vTC(m7%AaE&{$m^Z;w(B_fQFkU;CBT#0Q%*!dx4yRxy zbx{a4)eFd$Ln(|H871=aFw^Hr__fgAm+A`zBIzBgC;7Q`gC~_aITZ^?!egPt6rNt7 z-#ZZne5>*dGTQv=p=}@Hs}IlsOSoi-Be`^5vKBagJ?YC1etiOo-;V4dh_LBX^+%WW zW*igHLm2~nAK|M%LSvZWEB-5g!DfzeUvSCy*$Q_+TDSgBoISR3iD1m_jTNO^lUd$7 z`UTM&kP#A5&!IFrx-So+-^kPr>7^kqWtl1G-gEB|YYf&_A0cGqoo`z!5ctqoG zO!YDB?`(8h&0)0Ad3I)yl(W$fl{(W4k--T0htULtsTHJ9PV*8#VMo%1s%BWo==p(%dF8rTuAhO@%Ti;LCg41RlN~eS=e4WjVcz&Ninlqa@Z1 zf9`ngV$|}}4RsPGqApByE{Ym-B&(>bOf(lJJB_B6$eR(ddrhjMcE*kh@uPOg5RBFg z&};T?mVTK@-^RHXEJv^({twuz6&t|RcsiFBaD)zu2W4cOnLG1lzT~DuqS}&-GhTjk zjTR3|WKj0eq*9RrY-QO(k8&M7TZmE$9es&WUnwz%X9v+mRinJ%G8VfX-Pduqxz)<) zv3^`?Bgzb#JGS#6)6=TfqzXEejkA!AmsJWHe?l3P-X?kDQ6VvJ>3fB_w=HvRfi{y} zy@!A`!DoEP9lreFb?RPSa)Y^zRPJn;n>o^x?nWT~c>Oybnl*KE`QW>4f;3$nC=gW1 zwM5|R2wMH17T(2$Y99>>h2)`j(KNnY{06MIx3Sv5_i>G;`-1W1-8W*ip<`@DkftSa zo2E^ert?bH1^N9nrNiFNs39g(x5&Ih<~=gkoLi41tB73!uc`Qe2R{Bfb~GL|L0#sC zs#R26(rNXg-oihP|5Ke8vb}7&c}W+uu}38d@E(?_y_n03D|saSZJk(_>@NRRR1