From 790544565234022d01b8b39f114df376bc898c9e Mon Sep 17 00:00:00 2001 From: ramyakrishnan86 Date: Tue, 16 Oct 2018 18:10:07 +0000 Subject: [PATCH 1/4] Done --- __pycache__/__init__.cpython-36.pyc | Bin 159 -> 159 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 170 -> 179 bytes .../__pycache__/build.cpython-36.pyc | Bin 655 -> 568 bytes q01_outlier_removal/build.py | 12 ++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 185 -> 185 bytes .../test_q01_outlier_removal.cpython-36.pyc | Bin 1835 -> 1839 bytes 6 files changed, 12 insertions(+) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index 2e5da7da778c48a9c58d7d055bbdb642fcb66418..7f94ce1399c668e184df67322066dbb2a5b70358 100644 GIT binary patch delta 55 zcmbQwIG>Tjn3tEUSo2u)L=H>kjQreG{i4L&%EauV%;Jo^#5@Z#{qX#v?BasNTjn3tDpxuj9lL=H>k(BjmhV*SLVjLhPU)a>HYq@u*!#JtSJJpH`X^7ypO KoYdlpDb@hqK@$xC diff --git a/q01_outlier_removal/__pycache__/__init__.cpython-36.pyc b/q01_outlier_removal/__pycache__/__init__.cpython-36.pyc index 2f9a42a105b2b26ec10c60ac4d11fa03f7624d22..682b4cdc84a83f70986663e7a87a33ab7663b0e5 100644 GIT binary patch delta 57 zcmZ3*xS5f|n3tEUMDtkmL=JP+1pSQs+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QQpl01v4Xq5uE@ delta 48 zcmdnYxQda(n3tF9Mtoz`L=JPAaQ%$@+*JL`1G>54qhgWr GHTez4w@?@W delta 394 zcmZ9Ize>bF5XN`1n==U)@7i!afY+G9_7FrXu@JPfk$Agk{%+iC;EJflbvAOGwY_iP zgIKNaU@cZo4uU~u=Yx;m%*U|r?Adnrec$_tUoXE_?$aY9gxJ_e*wqV4Lpa<(KoY{O zCENpg+Vd8A*7H&D;!?=>AvEzb^1#&mTl`9_U$N;`;1M@ec zd|dvy2ybOB!YC7q@K{u-mSuRRWFqFeT0g+a#BKj%j6z_%sUhraN{!Z^Fqx@#Ky9@$ bYNbu>$u?T!%yP-=OdMF~ssV~)c`#(Zq77Sf diff --git a/q01_outlier_removal/build.py b/q01_outlier_removal/build.py index ec278ba..5ea8165 100644 --- a/q01_outlier_removal/build.py +++ b/q01_outlier_removal/build.py @@ -1,3 +1,4 @@ +# %load q01_outlier_removal/build.py # Default imports import pandas as pd @@ -6,3 +7,14 @@ # Write your Solution here: +def outlier_removal(df): + df = df.drop(df[(df['ApplicantIncome']>df['ApplicantIncome'].quantile(0.95)) | + (df['CoapplicantIncome']>df['CoapplicantIncome'].quantile(0.95)) | + (df['LoanAmount']>df['LoanAmount'].quantile(0.95))].index) + + return df + +# outlier_removal(loan_data) +# loan_data.head() + + diff --git a/q01_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc b/q01_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc index 5a057ffb73694628cef3ed87e03ee3a17f7410bc..2c7fe5d9e7c32991411c72c088018bdfd7772b79 100644 GIT binary patch delta 55 zcmdnVxRa5?n3tEUO!HXuL=H>kjQreG{i4L&%EauV%;Jo^#5@Z#{qX#v?BasNk(BjmhV*SLVjLhPU)a>HYq@u*!#JtSJJpH`X^7ypO KoYdlpDWL%AQxjVN diff --git a/q01_outlier_removal/tests/__pycache__/test_q01_outlier_removal.cpython-36.pyc b/q01_outlier_removal/tests/__pycache__/test_q01_outlier_removal.cpython-36.pyc index 4c0b6c7431c6a14108ba9d55dd44059612f144a5..fdf2a8efba79d3a487969708d0ab9fd6b433aab8 100644 GIT binary patch delta 71 zcmZ3@x1NvFn3tEUO!HXu$%&k+IQY_2OVUbnayD*vV^q$_&rQ`YO3bZH%r43-&d5v5 bvoO;S&o9a@E=WvH)lbe(N!_f##LWr-eYzOR delta 67 zcmZ3_x0;XBn3tE!Sjs4B??ld3EL`cSB^!6UF)D`^rxq3KCnjZN7H6bp7ndd#CFUmP XWhUn7=cSg%r)B1(7H?Kz;${T^<4YF0 From b41442855871576122516b32107068f126ee0d3a Mon Sep 17 00:00:00 2001 From: ramyakrishnan86 Date: Tue, 16 Oct 2018 19:00:51 +0000 Subject: [PATCH 2/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 181 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 1359 bytes q02_data_cleaning_all/build.py | 26 +++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 187 bytes .../test_q02_data_cleaning.cpython-36.pyc | Bin 0 -> 3409 bytes 5 files changed, 25 insertions(+), 1 deletion(-) create mode 100644 q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all/__pycache__/build.cpython-36.pyc create mode 100644 q02_data_cleaning_all/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc diff --git a/q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..43306728db48313f6f52974fdf25e67224184684 GIT binary patch literal 181 zcmYL?F$w}P5Jj_KA;KPH8%GqxLc|l;SXfvLV>0Z<%_i$47JDQw;vsCkg_YSt{O}&1 z-~3fs&QkR}tDN_!Uy5AznK;QZ>Zq#X@K7?&e|;{{gpNU|8>kf<8&7_-hEtF>_M{nf zFbpo#HYTf4xE7Al29LdjE9(Te#S#rALhYEm^)-@nfM~rPmdcl6u0MpvYSmpTd^yZ9uSvYk^%ztP(iB}K_%Erkysfd%N;veXFZ;&?W{Ug za!Rkg^jmP@V{qo|E2sSmoOqt3C~#mbzh}Rn|GeLO&-3|U(7*WN_n&`D5&9Dyd@x6k zpxbvKIO13#veTGgftJxS78qo5D0#HSyM}jbQ<8Oib5ekgRj=xkqYg{daWx==Zk(!< zYDk6{iEKII*%p(r7%xBIIWM*mjE70sU_Ww( zNll%wj@m{^2e$lK)vTN_FdWt^r=&2{h^oG3>h;H*IW|)@)3h;y%hJhO)0HljU|R5L zX|H|$eSn`my}@u@8ASLB=o$1U(CuBYI^-}1?mXi0+h~K=5SumP$pW9DEndc36lM>D zOwZ6V+3R$RcotTKd57kEH0VP#@6ck827QPY9opNYK_8;M4(;#Jpbyc0haT3JZyIV$u43i1y>EUTH_NZ-wTFw%9z83!2FwN_VS_f`T3X{MJpU$CD92v~vK=4=Fd2K468g?y|&!7mEWX2D z8EG#y(+|F!{ZyMP+ptp1O1KY7cmWJ$36;Gt0%8kg+?aYPN;i9X|1%ouoOV?mqRy0> zy;w=br%mez|H8&_r#%IMq7gog?%{tL%!}wWGWP(R-1f0;t&eK!lZLrVpRp!n#phfa z%_`xu1|rB{NyB}rR~6h8>4to0ui$MNJq=+})CvVIg107yW6f<4ZGdT_)u}0|N6AhhMpl(KT;R1w4VHK3+E6!8Avne zU>ICztR$;3auZp^29HAwSJnw`t2G)*gxWEA>l-BJAh9F?MC)xrTn^)FzVCy%JFce( Gl2Kn?QZ&5) literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc b/q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..4702bb6cc01cc3fa94746dc9ee352e342c8f5c04 GIT binary patch literal 3409 zcmd6p-EQ1O6o5Up*Y^JAr)k>ILQNr+jLL2sBq$O>MQy1fRY9U4Dud*@p4pAJUVAe$ zj@VVX+CBwuz>Dw@bIVm;fh*3jlk8@b=7-+IE1xqS&zza_`OKd4MYCCx-rv9eT+_6F zw3*9-_CvVEpCG74Nuv1#w4Ue#!#4=_8HqWl_!VfIw31i@+qa8;D{%%@ze+Sl`Za1# zh+k**euFx+I?d0I?iv>l0E-+qR#Hy`g2FdE_V z2N$mL5N`1d1S^2~Iwe$ptN8{ss0kWSQ44g1+SCDU(JHNhwrQO!~yg34!ml?&V&g%GvU(AO*82ZLK$tl zy#o5t5uP#q0K5veJe}7;@dgUyT?+J1-8jLCeRJXp3@8B*0Py*_036Ic^dAEUuWftCp{{s&VT~2!B#YMTfXK}kdM{MKb#4ahT(Ug_4AgRPm zDC>ElPm8p(h>h;NH?h&>Bxa9}oy}X|D|b=6$JyLB``H|~i=WMXLzk1D1-panFbz6> zE_i1ph0vOms+8@buC(J6OLAFMI=;hMNCPatt3`E=g&@?@ zJR9Bz7BSX3DS^!fE^`+ni;Nr;s5 aP09UREOrDYKu2$o@>c`xkQGS&E%F~Sk)T`v literal 0 HcmV?d00001 From 6a7b94f1382102ac9a0c39b154bce8e3d37d0e71 Mon Sep 17 00:00:00 2001 From: ramyakrishnan86 Date: Tue, 16 Oct 2018 19:36:50 +0000 Subject: [PATCH 3/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 183 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 1053 bytes q02_data_cleaning_all_2/build.py | 16 ++++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 189 bytes .../q02_test_data_cleaning_2.cpython-36.pyc | Bin 0 -> 4764 bytes 5 files changed, 16 insertions(+) create mode 100644 q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all_2/__pycache__/build.cpython-36.pyc create mode 100644 q02_data_cleaning_all_2/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all_2/tests/__pycache__/q02_test_data_cleaning_2.cpython-36.pyc diff --git a/q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..cb92068cd089c09e8795debc1eeee5af7d6c9ddc GIT binary patch literal 183 zcmYL?F$%&!5Jfj&Awmw4#*qkOA>s*aEG#UBVRuN@YZGdT_)u}0|N0ncL(dSYAE}F0T2FqvfpdtR45S%! zFbpm|B(`Uc54tO3z_n-G`7_?qwfVD66h)4OEU E7k45u=l}o! literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all_2/__pycache__/build.cpython-36.pyc b/q02_data_cleaning_all_2/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..9381ebd53b6adff7e91ddb762d4ff97ab3d1ed71 GIT binary patch literal 1053 zcma)4PjAyO6t|N!X|s0i214S>iC)?Hp2I-fgb5x^@ zB|R3f<|jnf7(PJ#))l;k_WRg$7}Ye21*bBRGXT0-sYSw7qS-vxW>1i~_3$*Yo zx6kep)qDJBk6DX_Y-Q#y8y6dk#sqzMy!5p*cj1oz5MA24{uZhce2swKLTB5D2z+?q zEZnIF`L_3o|B6e-6$xHbr4r6aIN`a4q%KHnhm|q4iIL6$7t?4b%|%whsm>df=hnkK5yq&v!Uk;GK$T^VO7Cu`%3-ho0}q*0ocQujUMwXG-@26C6ca(L@>_3|?pxRKEc*03hyoyhm1LnR1oH(Jx8{$6t_I zgF^qH!xLaJR5Y#VsY;3yN#*lr!^2FS7CDXiFwPi7xn8xa*E+8iF2iC}}gGTqzW&93co4+L_07(OS&AzsH1u(}6Wf8F>wm5dgu30uUpI?Ymedais~#C$?@PHoCbg8G^iOV$3`0cf21eTok72j z_S@higDcgBQ>tUdsuec(I?cNJH^e$POmi#ESSk2R8@n!16E|@ix1mIBuy78Vx6usbB1YuV(Eu!6*r1Q4ya32`-yulc?Y=I;0~ IeUOa$0?1J{Pyhe` literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all_2/tests/__pycache__/q02_test_data_cleaning_2.cpython-36.pyc b/q02_data_cleaning_all_2/tests/__pycache__/q02_test_data_cleaning_2.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..3aabcd962cecda8ce303693e64ab713e17085af0 GIT binary patch literal 4764 zcmd5=O_LKv7@n^rlh6HLSP&Rdz*v}&MG+A!wg4%rtZ0cA)JWAZqMOPirRHlb-PTow=)~}iR?1F+u8@?UZe{F@)YHD%%Gz0}XZ&0% zZ|7Bos?7p1`>I`}#b$|QNv^Mfo~1=um%;K$+Fr7k?G<~~UbEL}imuRAx<=Rg#uH;) zyF&6?N^_&H*qd~P6o&cFxlY5UZr}xb&NfsPC#tYb*ol0PGKbMt_|o;Es&5T zqjw(PsrsQCIBiCW*ND6@a5{kmrliu~FYU}X`1rxyfeN3t3wLRo280F?cWU<9cPwmE z7ImE+MqTGe_RI|$*y+&^yL%gM?t`Fma%_#LM0>5+I!+Fh21$`Llqr%SCX{KU9m)*J zlLC}xOpTo-OJo`T=g10Kg)&dp$U2k-vOzYXERqxCB$Oqx1>~I)Ye?GNNuC-w2>fBk zOt|mB&9^~BN~HGHU({DhQ;YOhDp9wTK6Dg1nfSk}Z7O}VD+NAb)EUAJ3=q9@_kIRO zBT6hFx6?v`tPA9_b>DkQ1JKF_%RoDZjYZz&9B8}uqT~8P_i0epgu$u5D-4{PKNPkE z&Hm|C_rn&gGPl)rpEHl|2X1ivTJ=%Lp7XZbpw&i5C`{j;$0M%+^Ss9>=QxFJ7B-1)Y!N7B>j^u%KE`n zusmRuH3pGIVI>sEd@Pnh6KAFlV+hE%ph--F3N+M?O~dH@F$-u&7|kRL7ARncV3Cp5 z)SE^#Mbs#b_L;Cgt={|gfC4acE9$nXwHq>v(Wt|Mm=DY2*3-5d5SLr%3}1sa(WjTK zZrA}!rNg!mM63(EoDs{hWj^2!0v>@gQ;~k`AO%8e6Jaz$Mn!5DF+_F@Ck*^_S&dmd zMBt^V1jb!-@I5E~z&RK+M+y|Rq-tvK%VU%IU#xeHR<;hq5*ZjMbG?9V!asHb#Yq%s zMC=rZBN+VXI1D22hk%i!@aCcvBG^01VfQeHA`PL`qg zcaTZoOeY2tcN}Dz8Zi>#B~>5%hE9ZQ#@>~Q@WS_9ScuJxF0kUf3NJE@1H%x*-UD5v z_7!+^uCp}3CXU=b}f+={R)h*h{bt{P3%Ov9CuSK8D^muyu&ZKvZkzfAAK z>;ztf#=~&@BK54}`9y9-?K`k%?7C6d^1Wx38C%K9)U9MCMoIyyy>on|nsexEVu*vw zf06M5Je-K+Ce1eCV1YPz5RsMV6u6s(BLg^h5b9&0cBR`eX(YILWaqIfh1jp-6wWSU pJ+A23Cn#ztkjrT#3-e|?n_q!*D;yzBwJ^H09B8Jxu5ONN{so|IB{l#6 literal 0 HcmV?d00001 From c3667663877a86389a7f6d659dcb24def576855a Mon Sep 17 00:00:00 2001 From: ramyakrishnan86 Date: Tue, 16 Oct 2018 19:42:24 +0000 Subject: [PATCH 4/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 183 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 1213 bytes q03_logistic_regression/build.py | 16 ++++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 189 bytes .../test_q03_logistic_regression.cpython-36.pyc | Bin 0 -> 2303 bytes 5 files changed, 16 insertions(+) create mode 100644 q03_logistic_regression/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_logistic_regression/__pycache__/build.cpython-36.pyc create mode 100644 q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_logistic_regression/tests/__pycache__/test_q03_logistic_regression.cpython-36.pyc diff --git a/q03_logistic_regression/__pycache__/__init__.cpython-36.pyc b/q03_logistic_regression/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..20c81b8a1fdc01dc7e8577540ce90f1da18cee67 GIT binary patch literal 183 zcmXr!<>e~TJQmFW1dl-k3@`#24nSPY0whuxf*CX!{Z=v*frJsnuN3`^{M=OiqQu2#XCH{U=0bS>+Lb?5Q{zlBkJg+MKe zxP=isZEmLyc97v5?xr60YV2}94RBCnkB4akH)`zjX4=B78V9_cc5nw-3{6*PSRveH z-RUZA&}L-=Zm@36waoL>$7{HU*Kr?j-~sEfb=GGaY*4wU?vkY~+WunUO^S}KVdoY) zwT^~JuN*5PD3SCyCY(uNdWYF0DO3`_XA{YaBFO}>t8pgIXXYhJiIT}D;JVpN@r21p zvNXFU9HOoTcRah5W@wwI9yRMWJyn`SeihMu%xb?uxdN;(Dwi=9Z* z>M+#7Nu(r6g!TcjLg`?>Bmfw~D~#MY;MoM!n`nPttASfa=7qxFEV%*oev$D7G&Pna zos&zM6c>VsmoLU2GI?3#Bxd6{qYM=Nb84pC;@F^MHf6CIUp?E29?6f-W(lXGe6H6Y z$@XFGVg-U_`=}42Z8uTVmYcu~x3r%d-xS);Dc&e9;l!mFfex@{Y+NHIwMw|Z%<)9P zoG686c`Y06E>kH3N5w@gpWcP`=R{>GPtHb<^tIg8=<39%$YexV8 literal 0 HcmV?d00001 diff --git a/q03_logistic_regression/build.py b/q03_logistic_regression/build.py index cdbd506..3c40150 100644 --- a/q03_logistic_regression/build.py +++ b/q03_logistic_regression/build.py @@ -1,3 +1,4 @@ +# %load q03_logistic_regression/build.py # Default Imports import pandas as pd from sklearn.preprocessing import StandardScaler @@ -16,3 +17,18 @@ # Write your solution code here: +def logistic_regression(X_train,X_test,y_train,y_test): + + scale = StandardScaler() + scale.fit(X_train[['ApplicantIncome','CoapplicantIncome','LoanAmount']]) + + log_reg = LogisticRegression() + log_reg.fit(X_train,y_train) + + y_pred = log_reg.predict(X_test) + conf_matrix = confusion_matrix(y_test,y_pred) + + return conf_matrix +# logistic_regression(X_train,X_test,y_train,y_test) + + diff --git a/q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc b/q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..81080038089c570cc2756295eb879b7fda1df07d GIT binary patch literal 189 zcmXr!<>e~TJQmFW1dl-k3@`#24nSPY0whuxf*CX!{Z=v*frJsnuPptH{M=OiqQuC2mvVWl0J>@U#X?IfM*lB{Un*<(DN9xG??&I-6r_(awA3y!+S=L|H z+ymd%BWU_}5ZvNKT9j11O>O9H>7*`o3643kk$TjtbXPW0pZb;FkV|Qcwm|oIQ!b}% z+OF)r?4(`VC6*w=6}~hjbXBYlZ}Apip4ypuz&8++w=}yqj%{#-4MQ56L-bB z*qFM{-I=w0X{8@Mv3Q$z-demP+^Iu1Ir-iSyJrxGbr_P;|3PT8$Fu;w!A# zLXUl!vn(1Z!IRj)yr{^kMFsE0`jj@G;_$(DX9QfwxY3IT*Lnm^?|=|h3IKk>?Y9KREKC;)Xse_q>W!yuB?#^5glh5{FL&!$(0HQBakr^Fq^PS*Haw;;=LRaB> zstKZ8W?Bnn_D>2XOGk<wTL>NSJjikr zq|C&}!JtaV;*8L_OpR)Tuh3Rq=+p`d%tS42fmVKgV<_iN^#)9hVBY# z;f<)(dy1;sgAOo0jnP`9MQk#8{K5EL^|*lJj9Ke59EbK4YWyOjeumM>{TYl4!0{YN zg^a4XG(QGRLjEXpUOFjzeFGfZ?}MYF?iP5_Sg0&A`R2dEPZ?&;2wo*ham-s?0Z&4DUfxl^5zO!FYss-cofXBIV%%Q~9VQ&q^|; z&1aEOEXk+`3cy91;|l{Qh#&H*g890vl>XOsTE9h@H6{;IL)vq13v{2Xk#*9w{{eIf BnGyg1 literal 0 HcmV?d00001