From 5f7ff527eba3052a76f984f8e9711e33c2a41177 Mon Sep 17 00:00:00 2001 From: nemkothari Date: Fri, 9 Nov 2018 09:34:25 +0000 Subject: [PATCH 1/4] Done --- __pycache__/__init__.cpython-36.pyc | Bin 159 -> 154 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 170 -> 174 bytes .../__pycache__/build.cpython-36.pyc | Bin 655 -> 607 bytes q01_outlier_removal/build.py | 10 +++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 185 -> 180 bytes .../test_q01_outlier_removal.cpython-36.pyc | Bin 1835 -> 1834 bytes 6 files changed, 9 insertions(+), 1 deletion(-) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index 2e5da7da778c48a9c58d7d055bbdb642fcb66418..6a06b88f3ad3a20931015dc34182b5e22aefdfef 100644 GIT binary patch delta 52 zcmbQwIE#_Pn3tDpYRJ>*i5%t%?)n+|xvBbjskzztB^ilDnfl@RMcKs#iOH$@$@wX% H6H}}Kx*rk@ delta 57 zcmbQmIG>Tjn3tDpxuj9lL=JORAN|nc)S_bj#H5VO;*8Yn;?ks|#N5QZ%)~tXywvje Mw9K5;;)(Ir0Qch)egFUf diff --git a/q01_outlier_removal/__pycache__/__init__.cpython-36.pyc b/q01_outlier_removal/__pycache__/__init__.cpython-36.pyc index 2f9a42a105b2b26ec10c60ac4d11fa03f7624d22..f249e6dd31b29cdbd64769e022c64f73dd8e8ac9 100644 GIT binary patch delta 52 zcmZ3*xQ>y-n3tDpYRJ>*i5%t%(fS$rxvBbjskzztB^ilDnfl@RMcKs#iOH$@$@wX% H6QlhB!vPXX delta 48 zcmZ3-xQda(n3tF9Mtoz`L=JPAaQ%$@+*JL_-&R^({ z=wIR*WXO^q(5XjtF@hd(kCfg$>hY*|ySwGD)BEoWM#vr6iVWAEFvD8}AV4*#={U1G zleC=x+t50fc{_y+CL31gki+zr)H9%8$b9yIIeZMkWjm!L$itZ4=#wB$y@ zfe2S|c9Q7h&kqzOB0&mtL~_g{%y5RVCN28d&>M;?%rybFPu4WyYO+sSbaa!d{&CsJ zA^wNMYSbZabLcu>EYHVy{8;ZDI;WN3rav~qcCvnPWcia!TE3EcknoWzEu~vZDnM)vi$}3s`_gEDmX4=B`iqn+ERsH ziN?#Nmm#FiId5Aj`s(uao5l{kR?;Kg*(Mll`6t?3ecRlsEGM>c5b_@-O6#-SdR6-RJOj#l~&m2yDwre|8i^6pL1ZH;r z50h7>F8u*aJcofR5_aCFJb&+dFYh_e=kwVQ`K`Xo2>D5N7Q^?~X#NQT5TJ_GRM0Mi zY)fkJXNo@C@iX-E9iIg{&>W9aM-{;~i z^?I~1y$&vQy2|79vPZ2{A{N$39byj7*jPvn;u`tAae8Tvk>Yb6Y5SeHIf{S1uRdbI ziYswlod|ysjIG`}(}^~C9Qs=NAlt@?wG-Z_!P`G%b@}vJWBQ<^a7b^=6<5`HFBKfx zo4ELg*-JNYfI#TMxcBL!ak~Yct;$$hu7UfQS%_07I5c>zF3H>^K?)l`cn2QfS)9Ju T80eLFiN783CBihD(f#~4xYMeW diff --git a/q01_outlier_removal/build.py b/q01_outlier_removal/build.py index ec278ba..0cd3f90 100644 --- a/q01_outlier_removal/build.py +++ b/q01_outlier_removal/build.py @@ -1,8 +1,16 @@ +# %load q01_outlier_removal/build.py # Default imports import pandas as pd +import numpy as np loan_data = pd.read_csv('data/loan_prediction_uncleaned.csv') loan_data = loan_data.drop('Loan_ID', 1) +def outlier_removal(loan_data): + df= loan_data.quantile(.95) + loan_data = loan_data.drop(loan_data [loan_data['ApplicantIncome'] > df['ApplicantIncome']].index) + loan_data = loan_data.drop(loan_data [loan_data['CoapplicantIncome'] > df['CoapplicantIncome']].index) + loan_data = loan_data.drop(loan_data [loan_data['LoanAmount'] > df['LoanAmount']].index) + return loan_data + -# Write your Solution here: diff --git a/q01_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc b/q01_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc index 5a057ffb73694628cef3ed87e03ee3a17f7410bc..1c1c4193535d74e34061bce42f11b7577d081779 100644 GIT binary patch delta 52 zcmdnVxP_6!n3tDpddSo0i5%t%iTWA&xvBbjskzztB^ilDnfl@RMcKs#iOH$@$@wX% H6H`I~$axZW delta 57 zcmdnOxRa5?n3tDpxuj9lL=JP+H2u)x)S_bj#H5VO;*8Yn;?ks|#N5QZ%)~tXywvje Mw9K5;;)(I000(>%<^TWy diff --git a/q01_outlier_removal/tests/__pycache__/test_q01_outlier_removal.cpython-36.pyc b/q01_outlier_removal/tests/__pycache__/test_q01_outlier_removal.cpython-36.pyc index 4c0b6c7431c6a14108ba9d55dd44059612f144a5..7946ac60a6519f9b89379222415cc2f280ce1f40 100644 GIT binary patch delta 68 zcmZ3@w~CL`n3tDpddSo0lM^{taqy+5mZX*Dm-q-GbFCKV;- ZCgx=(=IQ69mdB@M=A;&HmS^H-1po|o7gYcN From 85020720715f704d8fd6e7580f94540c93e35e47 Mon Sep 17 00:00:00 2001 From: nemkothari Date: Fri, 9 Nov 2018 10:05:08 +0000 Subject: [PATCH 2/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 176 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 1178 bytes q02_data_cleaning_all/build.py | 20 +++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 182 bytes .../test_q02_data_cleaning.cpython-36.pyc | Bin 0 -> 3404 bytes 5 files changed, 19 insertions(+), 1 deletion(-) create mode 100644 q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all/__pycache__/build.cpython-36.pyc create mode 100644 q02_data_cleaning_all/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc diff --git a/q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..ffaa7f1b039200b5601289fe8ad11582eb54ee4a GIT binary patch literal 176 zcmYL?F$w}P5Jj_KA;KQS#u05rJb{gZg~$++VRzglvnH|dARfXi*@~C2GFylr-sAI| zzpU%Yeg8hHlGmVLs!}$EG%B)cr>52Rq2e(A^*KQ+o*71S4G7%>L` literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all/__pycache__/build.cpython-36.pyc b/q02_data_cleaning_all/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..17814509988ce110e35ee130d8e8c303b1295a86 GIT binary patch literal 1178 zcmaJ>y>8q%5GEz9q}9r6Cx>&+DSXBu%{IIFX%F{iWF#fKMf0)*b98)F3P z-$3*~peUkPpzLbK8D^;TN}plS!A(uQ4ZeEtRqQAWhj*hahS?Y6D#?<;7l=ufW+_H2 zEVt-rgR?1{mfJL>(Z+*y%BI)09f*(V_-~ZmVz-Yg{XDgj4J!Q&+Cv-M<0a}n5dSaH;Y0K%?E@2Zs0;Q` z2|y`cd5T`|!|OTPAnNS_MKrkZFzUQA?g9t({N7iQV~G3|<$sAfag`)=M8l2Ok2*w0 zd#Df1q#JcWsUz?r_#^0}KJLeT;;dcN#of3|UWSg$BOBJIB`b__V4neR5tof11f@@==q84o>wGFwJtq|5H za&3KWlntp_Hw-**h(Zz@R5fKbBu&F4g&mxU4XCOc<-25)EIq4R&E+z8$CynjuHDY1 z$$|osT3@!6#Vd=STfDZ>^L%Iu8^Qwm!ba;)23UaMEmHgN<&W9otghHXvT9YEGotw7 zq*g2400oNzYJ!egLK0p;BP|t!tk5-$svT*I^ZO5ndh(%(Ty;c<#c9h0oi}T{^4xe*4C@F4H{z3)OTRD5#>sf3P@^z zYXbg;+7W<;M4oK2J9-73tmND=DRRvOR0zcm1lr%B_BAneCHU$58<6Jb_aEe6U7h&= zNWs4X*;p|`b9Yz9!&Pz!)%W00sZ$3|IbLt5A7N|bpP{T)uwUG9>RnJf_#R-60eR{r K1O5=l+y4VQ)lIkn literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all/build.py b/q02_data_cleaning_all/build.py index b56e2bc..1fd08ea 100644 --- a/q02_data_cleaning_all/build.py +++ b/q02_data_cleaning_all/build.py @@ -1,3 +1,4 @@ +# %load q02_data_cleaning_all/build.py # Default Imports import sys, os sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname('__file__')))) @@ -9,6 +10,23 @@ loan_data = pd.read_csv('data/loan_prediction_uncleaned.csv') loan_data = loan_data.drop('Loan_ID', 1) loan_data = outlier_removal(loan_data) +loan_data.columns +def data_cleaning (housing_data): + missinglist = list(housing_data.columns[housing_data.isnull().any()]) + cate=[] + num=[] + for k in missinglist : + if (str(housing_data[k].dtypes) == 'object' ): + housing_data[k].fillna(housing_data[k].mode()[0], inplace =True) + cate.append(k) + else: + housing_data[k].fillna(housing_data[k].mean(), inplace =True) + num.append(k) + X=housing_data.drop('Loan_Status',1) + y=housing_data['Loan_Status'] + X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.25, random_state=9) + return X ,y, X_train, X_test, y_train, y_test +data_cleaning(loan_data) + -# Write your solution here : diff --git a/q02_data_cleaning_all/tests/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..047f6a5b91e7c261af5e3953b296edbb81ad9c4e GIT binary patch literal 182 zcmYL?F$w}P5Jj_KA;KQS#u05rJb{gZg~bq(VK)~7q<_oFU BGj9L@ literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc b/q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..d19378278947e9ac66019fe3a04eb495cf58f7f4 GIT binary patch literal 3404 zcmd6pOK;mo5P-QPMN&^c;y7`WHf&l4P?1WBduR(3MT#U13NR7roxB3 zyEG~xJt=>om;QtPrM(tC_%HO-8Pc|7+3};fm;z^(%iYtd@%*1(eyVBO z-`dP&LHhyR;!hA%qa@Zm0$Pvt#PAG)eMW316|VwqlU8CYu|2!!w_+!$dR3w^GN@5| zLcBVw4;s{=)rk)63ab}=HtJt3uj#eC1#i(?@|M}c;L1cBtPHMBG;ftH&OBXvqR|?y zztw1+856_1PRTQ^-PnWuX! zNTak59j!i-y*!Qs-WNj_j&I|DZkz?FKje%?p^UQB&(mTGqn%LfdiGO%z4>U5fYA__ zKe%v}2XKq0AXov+(~5 zjV^(k%W4VTdo;WK5ZA{Gmv!KN2)Eb(AvH-RA zn5Au9nS#YVWg^wTG~R?^|L%0RvxIe1mb}j7cEF?V&l!I$hC#@>VMZB1??*yLA$+qw zXF?$OA3=EM~kPy!$T;PZ02&eM{F8wvO2Fi2@2T#Wkfd62M| zcimBzLr}8)v2cjpb*hDvE0; zu7h|7yE|vIL$i2ZX5oGHf8e2^%Sn&CxF|RGEN-{wh;3Y)*d=8(nzB+B&o%{6tb4@tD5g88O>vCH+&zPht^-L!63ZJLbW!c-vm{tTGW7w3L&lku2b0-RXS?#o8#4SrSLD zI;Yfdot=C4{kgKd^D2*G%CRC+m9kxwly;P2H7<)v$8$IfsE?I*wJ6N75QH+CXG4Ay zW^zm;91}6el7{1dB>xnIXGJ1~+Fn^@ZKaGL9eK4Miz>s1KCeD)-!FVU36XNXDY<`( W#g4!P=;#en{%W8dvI5D!Mg9X9lb;R% literal 0 HcmV?d00001 From 5d9f9546a945ce7e0d1867d2e841c15e220f454f Mon Sep 17 00:00:00 2001 From: nemkothari Date: Sat, 10 Nov 2018 17:39:41 +0000 Subject: [PATCH 3/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 178 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 1105 bytes q02_data_cleaning_all_2/build.py | 21 +++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 184 bytes .../q02_test_data_cleaning_2.cpython-36.pyc | Bin 0 -> 4759 bytes 5 files changed, 20 insertions(+), 1 deletion(-) create mode 100644 q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all_2/__pycache__/build.cpython-36.pyc create mode 100644 q02_data_cleaning_all_2/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all_2/tests/__pycache__/q02_test_data_cleaning_2.cpython-36.pyc diff --git a/q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..8067a4c8977512172204578e21298a87143f5002 GIT binary patch literal 178 zcmYL?F$w}P5Jj_KA;KQS#*wuZ@dP#s78XNDhTUH$s}B?Y2TxZH17aLh6FbREpeO&ot8{4t7#8Rk|um z_zV{O0pH>+3)Ej=#dZ2%iVz}Ej_<=c_u=b}DC&NC_~YFd$Fja#3y+8LbNti<0W2Vy zMM=Bbw1caiIk`(+Vtk#<%YEt-i<4OZ&IO?%4`*F)!Mm_g_IcRaT(cf}bcyz8MEi6= zm%)eNqebrl*|&z_CC0M$hD1leDi$XhXGK~}(J&Bom8D$9lIP--WoM7gj&UYf5touf znpCMM;<{-6;V??nsrFwP_sgA2g0u-%*ggTGscsuT^$h_C*w6vT!bjRXE?``kkfJ&iZDA%GAq7VdM=yQsN~8gy^8mWf<5`7IM^{97i{kOihI?S`q< zZkY&XKpMO0OdRaj(jN6*@B+A`{%a;>%7J!wcxg;UrD(Vdb;3+zXtd9>NxYkvnV93Q z=#3O5m(@JplAK|G{X}GSUMT5eLr{0vhg6+Kzscf_Cqqw~zG)BpUvs7H67+OmMm;YhNvSA4B~- z93P9Ej|-lki0YWhbo^Gx6IHT=j}rkL2Vk12Dot=MrjjdVhM<&U#*=FN{^@#rXO3bF z6t9nu>NJBI0arnUHw+i}g)F+2etFvR9MgzarHHA_>eCI_0# sWrU*a8yFZ^HeiZu4`2aS(WZmVTtJ=iXNFpty#WbGkM!&=Vn9~OFC@=9Z~y=R literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all_2/build.py b/q02_data_cleaning_all_2/build.py index e20ff7b..e0eee15 100644 --- a/q02_data_cleaning_all_2/build.py +++ b/q02_data_cleaning_all_2/build.py @@ -1,3 +1,4 @@ +# %load q02_data_cleaning_all_2/build.py # Default Imports import pandas as pd import numpy as np @@ -8,6 +9,24 @@ loan_data = loan_data.drop('Loan_ID', 1) loan_data = outlier_removal(loan_data) X, y, X_train, X_test, y_train, y_test = data_cleaning(loan_data) +def data_cleaning_2(X_train, X_test, y_train, y_test): + col=['Gender', 'Married', 'Dependents', 'Education', 'Self_Employed', 'Property_Area'] + allcolumn = X_train.columns.values + + df=pd.get_dummies(X_train , columns=col ) + X_train = pd.concat([X_train,df], axis=1) + X_train = X_train.drop(col,axis=1) + X_train = X_train.drop(allcolumn,axis=1) + X_train = X_train.drop('Dependents_3+',axis=1) + + df1=pd.get_dummies(X_test , columns=col ) + X_test = pd.concat([X_test,df1], axis=1) + X_test = X_test.drop(col,axis=1) + X_test = X_test.drop(allcolumn,axis=1) + X_test = X_test.drop('Dependents_3+',axis=1) + + return X_train ,X_test,y_train,y_test + + -# Write your solution here : diff --git a/q02_data_cleaning_all_2/tests/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all_2/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..f5d200efaf132095395229cff78f99e2516c4470 GIT binary patch literal 184 zcmYL?F$w}P5Jj_KA;KQS#*wuZ@dP#s78XNDhTXVHX3fOHgLnw9WGi06%4{Kic#qF- z{;IBL_rv?7N?xOWsY=-vWKv|+Ud^lBL#1*4>qF3SAcz!t&YeyUj+}ZKv>`BT2|Tw> zvNM>dO(fzt;*j`ECc|afpw(HU@uZ`REo$$vflQJG5M6W`aWUMU({*5b^|Tr9rJ%kM CKQsaW literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all_2/tests/__pycache__/q02_test_data_cleaning_2.cpython-36.pyc b/q02_data_cleaning_all_2/tests/__pycache__/q02_test_data_cleaning_2.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..6d3cf9da66cfa13556e2088b6c747dc8f73493bb GIT binary patch literal 4759 zcmd5=TaVL56!tBSbKCnaEEI5Qfu^DfS$d%qDiAjzRcTeIKrWIonc1v^V}}_VH4%LZ zFZ}_P`qcOSn?BEL)rb6rKJ^?s$vWF?x(PfG%V$o;Cv@zFM;+hwoAwS=l_sjNO%R2iOPS4RJ9z1MP_@*g;cn!44r}rb zZS>CKJ5?`me7nOaaT}o<_;%#Sz?4)P{H2xs1|Q$QJ&@tkR`E9NP@hmg<=H1D}DsSjFNV_9g&u(2pOoC9rlUPO*3RFC>)MQEIQyF$aM`9osM z(CnY6x)-!*)u-*}LAd8IxB4hx&w0mb&}t(f6lSjJ^3ZL-6gL^=9A~e?f);e7`r^`# zJz)~I<9YT@H3U|8{1mkVO?E1st~fpIfju79I&_WWFeKHGdplEDuFM9Qm;?lhC*d?G z=}AbY0G)YExLO~m(5m<4m}^3JoyZGKFz<+RlLV$8gl5|b8+&FmW`43oS>2xnRsgKB z!XT(fYzYODo`@CD#Hp#n7y|NbXp+z%0}Zt!(=d8}%mUgF2C|q16BIB(Fvd`6sV%LQ zA#$jrX{HQMsrSC!rvNP647(j_?gq?cG>n*^@L{^#eA;n*;&2oF;4X98^yx*j8$@8F zbl4W+hk1^dvtlJN%KQAj&qMHID)h%TQXrHL5n3Z)RAhD$L*&MALc>p&<%Gop1YVd* zVA4e!-?NhsoPj}eq(G9FWJT_Mb!0OCi}kM2$~ItFA`1g$j_b26_{WZ+IF161h@Aj& z2!kITg+T=V5HQjdUR#tx1bat0>>lJ$=nzF+%7y+QF5isFA$<9*FgXN!H<{F-ci`74 zV?+;RCW;xx`2X&l;8qSWxR^U9SQ7+}a|L#C6eS@^Lz-?vq8{f7t?oX8s5-a_&3ae9 zPlv=t5MgE}0c4B)R6$3%JI*6!(g<<|W(c8qkYhzI_Fp?*N6jDXV%)@hKSg$M`5`S3 z=u$X~GP8-y^x^Yw%nUmRC?Y>5rnX2BOO2@Z1>lXSnLB``ffnRu@CZ6Ez}4Ve;>L)> zH}vcfX3ozF@52Fsqh3w%a&_Loz7Mk~D-2n|ob{Gi$&FY!%wT2)n*H(AuBUjJJIJJP zrW1pSI|(u^g=neplBo}VLnp#DWAD;Lc;R~vEW~C;7g%v#h8G#efnkVY?}08d@ymx; zN_m#0#4qAn3X}H@z#2Kx^?8kD0%?9)et~bt16zm|bpHujHnHL}5QmU5b9FQx3OG=_ zv>wLXxdTfYs9s(chHd+>2)1pJx9xU7A`kVVZR2h(dBRq)=eSW~CsCY2@ji+VP+UOq zF$zqT3tI*fmnl^ydaDYTbf8W7i3Tw&y;p%-Bj+rfwxG2~q}7t(!+js@VsQC5AY-{1;i* z$8(7=-lSOuoGB0+&meN~5e4pM;j{pb9EAK>$lcg&SZpM?d1Pm?E5*dGlN8R*V?D0u m*e57zD3Hr(Bn#tOGMit6b4wf{4Y@eFlsssLydiImYyJhzg(K(y literal 0 HcmV?d00001 From afd8d90f60450e29afd56a59cc22700695e6249a Mon Sep 17 00:00:00 2001 From: nemkothari Date: Sat, 10 Nov 2018 18:11:42 +0000 Subject: [PATCH 4/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 178 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 1277 bytes q03_logistic_regression/build.py | 18 +++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 184 bytes ...est_q03_logistic_regression.cpython-36.pyc | Bin 0 -> 2298 bytes 5 files changed, 17 insertions(+), 1 deletion(-) create mode 100644 q03_logistic_regression/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_logistic_regression/__pycache__/build.cpython-36.pyc create mode 100644 q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_logistic_regression/tests/__pycache__/test_q03_logistic_regression.cpython-36.pyc diff --git a/q03_logistic_regression/__pycache__/__init__.cpython-36.pyc b/q03_logistic_regression/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..7d7eb09b7ec059ca52b1e6a63a60dfaf7eadd3c8 GIT binary patch literal 178 zcmXr!<>i_h@-&(O2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU-9}G`MIh3d8xVC z`6U^NMVb2H`9;~q1&PV2`pNkzsrotj>6yhPnaS}*sp&_2c6+^D;}~L z(&WwIDyy;j%mcl~n+{vD`&mfVNQ<;dhpdwg-r#NC;p=>37MukOlr6F4&xkx>_ylzu zw~#41?qaiYqG`^kVkZd|TmjNLl7qC=Y4VN_6fetE=76pyGQSwvhd85Jr5^!n%8?c+ zSFz%myrBZ12BVtBiQqI(^MUob2gEy{o?DNes1 zOpbDWYtw|nmlg0Tv$)h$^KPg-fKB5f)v*Rkc_CG%Y&FIQ%tUi8lr6SfGtsGaOLG%~ z!b@-%F91*gAYthmMm&)kPbd?P9iOD0kyUqasfoM%^3Us9F!-%E8> z7Bu1gL^2ND_|tJ{j5o-&MEv-N}#C6<)yN;J( z)v{Ck|8`2LhrA?A_nufe?euSoIE zJXU05RTZZ!wjW8&eM9zO6EGzUgHH_}E6ciSThXy%-3m*&8-+V!3oujN13E{7zqFHB T+F_|eoBrOOZCVv~{0;mYwi$hr literal 0 HcmV?d00001 diff --git a/q03_logistic_regression/build.py b/q03_logistic_regression/build.py index cdbd506..44fe044 100644 --- a/q03_logistic_regression/build.py +++ b/q03_logistic_regression/build.py @@ -1,3 +1,4 @@ +# %load q03_logistic_regression/build.py # Default Imports import pandas as pd from sklearn.preprocessing import StandardScaler @@ -11,8 +12,23 @@ loan_data = loan_data.drop('Loan_ID', 1) loan_data = outlier_removal(loan_data) X, y, X_train, X_test, y_train, y_test = data_cleaning(loan_data) + + X_train, X_test, y_train, y_test = data_cleaning_2(X_train, X_test, y_train, y_test) +def logistic_regression(X_train, X_test, y_train, y_test ): + scaler = StandardScaler() + li= ['ApplicantIncome','CoapplicantIncome','LoanAmount'] + X_train[li] = scaler.fit_transform(X_train[li]) + X_test[li] = scaler.fit_transform(X_test[li]) + lr= LogisticRegression(random_state=9) + lr.fit(X_train,y_train) + y_pred= lr.predict(X_test) + cnf_matrix = confusion_matrix(y_test, y_pred) + return cnf_matrix + + + + -# Write your solution code here: diff --git a/q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc b/q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..568425ec50fbe57b31becf81e585710cf37c0640 GIT binary patch literal 184 zcmXr!<>i_h@-&(O2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU#a>T`MIh3d8xVC z`6U^NMVb2H`9;~q1&PV2`pNkzsrotj>6yhPnaS}*sp&^-EHVON#a5<1_OzOXB183My}L*yQG?l;)(`fvhhEVg>*!;xwKB literal 0 HcmV?d00001 diff --git a/q03_logistic_regression/tests/__pycache__/test_q03_logistic_regression.cpython-36.pyc b/q03_logistic_regression/tests/__pycache__/test_q03_logistic_regression.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..4f051414c4cfe60b435ed863069d31ffe4542955 GIT binary patch literal 2298 zcmbtVQE%He5Edm_Rvg<&+ca5*VbcQSK|o-)=~IVoXpsd)fFLg`u!1Y9vLfTir6h-> zg4*bw+`q6NvA?m`{R6!Yd&pnd)9$3iwbKM$HwiqRj?|I&-N)mDPN((j)4zWH!?UbE zt+@xjtw+%G?;yCviL@xGdYjtN+tNv0>Jl7tWFz&cSLv>7ratv6y&;#<7Hxs<@upl( z+q7NTec4I7v`Z{OhAVt&O6aOs9p2(CzC5)-Z;92)=3)QbqqpfDx<>EPb-E#Zu_o?{ zb+IvZpSv?_`@NNZ_Qc|C-g#&7j&P?A-Q?s)E9{;_9M(}tO8=?QW{+tBdWSQ^qF4%+ zCD{NBD+`8b7fpF#WFl0gM4F#5d2WLvu-}pSAkij?VPK$y)=8d$xjPW%xR8>mfgXu? zvV|V|GG|#dQi3P3fq7ApRf`JVi}e|89^&x959b72$GFkU2iJN8P49pZRSE!p!tHk! zb-2S_=w0669`p^~I=?nB#yrguRY%aAGgg}k+fwsGDP zPByJ6ECvhBeIMKF*3`jF!ZPlWLU-pbh{;#`Zy;nNcmUBCsmP2Dw)sx*BsmiqXrZfc zJ=FwJE;Fr#GW(|mlcgg?7TTq&g*+}@#O^mst-`dw$NiH$75z-4uXA(4RMP(`SFiPm z#iAeQTmZBmqydo5hp>_U>AeThHRF8)$mmK&H%#e`#^n}HyYByJ7T#^xqQ=-Q$0w6- zZa}>EaYqYDL5EdRz651HDRoNl_{|dF9GyEbYw~c0Jr~EUkR|}G7D5L+53<|@DKqg& zFsL%II3sl4XGOKaS7@s)bZP|!CZQI$Kr6q#F_a6ZdIP4_kPv|6;U`0K>1T!r@(asR zg~%7606l@I#vVGH7#Ar!M@aiP z8^7EM#(4qE6&DksA_UtyY?P}tQxEh(rVYztQQC1@HmbjA^Wyi?#dShbLw5zW@J7_? zJw;X7K?fM0#%L|lA~u;k{$%{FdR)M9#;o-jjzfD2<$aM+FJN?Xe+J_Ma6AW6A){(8 z&5r?-kUt8Ymrlyw+yKY+$Ka@_y9Hh})+mcizWc8*RGyB)X6Z*!#!?YQWh;u(oEH-H zb`)X#sYeu^X0?W569wjCj{j9o@ersM2vjsyGoSbkc)iLReonm+14`)99&v?dq4bL^ zF&MGJVCWuP7Gq}eR3@)_*A%DA;?+C7w_Ee#@_ve#l)YC)BDumNPxt?qr)c-W7jl9= z{`bD_M^|pd3qK7Ewo&h|s_@Mu!z<8K<%Rl6FdpG`w^ZGRNO`!sR6Z)nvyzNy^I2pR xOET(#0&vmh_|gCh;)lGdV7@LZrT=Z6*6$H!jmd-5koMf$0^KKTWSw;Fe*pIMm&5=7 literal 0 HcmV?d00001