From aa067888f361fda5b571fce030acd615bf2aac52 Mon Sep 17 00:00:00 2001 From: soham009 Date: Mon, 31 Dec 2018 23:06:05 +0000 Subject: [PATCH 1/4] Done --- __pycache__/__init__.cpython-36.pyc | Bin 159 -> 152 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 170 -> 172 bytes .../__pycache__/build.cpython-36.pyc | Bin 655 -> 561 bytes q01_outlier_removal/build.py | 12 ++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 185 -> 178 bytes .../test_q01_outlier_removal.cpython-36.pyc | Bin 1835 -> 1832 bytes 6 files changed, 12 insertions(+) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index 2e5da7da778c48a9c58d7d055bbdb642fcb66418..438a7bbc848271c2abb82237d3671872dda47e4f 100644 GIT binary patch delta 50 zcmbQwID?VHn3tF9$O5gHi5%u~uKF4IxvBca`5B411_qY;;rT_`#RZAUsrt$JDX9}v FtO0%M5Jmt1 delta 57 zcmbQiIG>Tjn3tDpxuj9lL=JORAN|nc)S_bj#H5VO;*8Yn;?ks|#N5QZ%)~tXywvje Mw9K5;;)$`=0QYSZdH?_b diff --git a/q01_outlier_removal/__pycache__/__init__.cpython-36.pyc b/q01_outlier_removal/__pycache__/__init__.cpython-36.pyc index 2f9a42a105b2b26ec10c60ac4d11fa03f7624d22..5a3d28bbf6e3c3ebbd8c4b2c0619fdb91cf95eea 100644 GIT binary patch delta 50 zcmZ3*xQ3C#n3tF9$O5gHi5%u~k@^|=xvBca`5B411_qY;;rT_`#RZAUsrt$JDX9~q F{Q-t%5QG2# delta 48 zcmZ3(xQda(n3tF9Mtoz`L=JPAaQ%$@+*JLQN diff --git a/q01_outlier_removal/__pycache__/build.cpython-36.pyc b/q01_outlier_removal/__pycache__/build.cpython-36.pyc index 8248a1626e901c868c177407620fc7ec379db180..dd704474319239ad892dfa5bb2d5332009550af3 100644 GIT binary patch delta 322 zcmeBY-N?de%*)GlWPw(U-bBu>R7M5{1~wpe2IAr%AW_4R1;jNBDU6a(GK(>VshKgG z1t`W076XznF(;537O*IgM2G^}Ks~iU*DR*;yNl309;sUYPRM^S2G zN_=v0*)7f-pc~>-5=#<`Sb*xliotdv5u8AYTO2mI`6;D2sdmgjUNIuLcW^NBQ?mVN5&i{F`V){Io{T~?Z5;e3$~tQuP7Tw(Of6CB!f^-oKT%eT=t%3ZO#1~vW*}lM-wBbr8=hQT#S;?7PR>< DNyKZG diff --git a/q01_outlier_removal/build.py b/q01_outlier_removal/build.py index ec278ba..5ea8165 100644 --- a/q01_outlier_removal/build.py +++ b/q01_outlier_removal/build.py @@ -1,3 +1,4 @@ +# %load q01_outlier_removal/build.py # Default imports import pandas as pd @@ -6,3 +7,14 @@ # Write your Solution here: +def outlier_removal(df): + df = df.drop(df[(df['ApplicantIncome']>df['ApplicantIncome'].quantile(0.95)) | + (df['CoapplicantIncome']>df['CoapplicantIncome'].quantile(0.95)) | + (df['LoanAmount']>df['LoanAmount'].quantile(0.95))].index) + + return df + +# outlier_removal(loan_data) +# loan_data.head() + + diff --git a/q01_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc b/q01_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc index 5a057ffb73694628cef3ed87e03ee3a17f7410bc..4bcc5669e18717db38de3f0c5462f59b26b45cca 100644 GIT binary patch delta 50 zcmdnVxQUU&n3tF9*aEGXi5%u~@%kD0xvBca`5B411_qY;;rT_`#RZAUsrt$JDX9}v FLII1U5U>CM delta 57 zcmdnQxRa5?n3tDpxuj9lL=JP+H2u)x)S_bj#H5VO;*8Yn;?ks|#N5QZ%)~tXywvje Mw9K5;;)$`L00#yW;s5{u diff --git a/q01_outlier_removal/tests/__pycache__/test_q01_outlier_removal.cpython-36.pyc b/q01_outlier_removal/tests/__pycache__/test_q01_outlier_removal.cpython-36.pyc index 4c0b6c7431c6a14108ba9d55dd44059612f144a5..c3dc8be5bb2e5c2791ed7c25205cd7f8638d2411 100644 GIT binary patch delta 66 zcmZ3@w}Ow;n3tF9*aEGXlM^{taqy+5mZX*DV5uLT WUzA;3keHmRpPZkPx>m-q-GbFCKV;- ZCgx=(=IQ69mdB@M=A;&HmSy5*1po`=7f}EJ From 7097d83adde4b6c694cdc8921a99f1a79077dfe4 Mon Sep 17 00:00:00 2001 From: soham009 Date: Mon, 31 Dec 2018 23:07:40 +0000 Subject: [PATCH 2/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 174 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 1352 bytes q02_data_cleaning_all/build.py | 26 +++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 180 bytes .../test_q02_data_cleaning.cpython-36.pyc | Bin 0 -> 3402 bytes 5 files changed, 25 insertions(+), 1 deletion(-) create mode 100644 q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all/__pycache__/build.cpython-36.pyc create mode 100644 q02_data_cleaning_all/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc diff --git a/q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..6a3e32500d45e298b9dc19ec11c40775fab702fa GIT binary patch literal 174 zcmXr!<>flEKr4m;2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU(xy*`MIh3#rYYD zxdsN7`r-LS*~JBk$*KCu`6;RTIr-_C#U+`^@kOcWMXANbnfZC~1x5K;smUe!g$73P xDTyVC@yR)G6py^b3<5GMCuy3|Fh^fQ zcOO7-#IZtTr!m0-Es{klFv#ps@??v54e!?Gq-gh+qyn9)j_#797R%JJ?vY+Q&ee(T zlRieGSPXcv#bhXki%)pTt8D_~z8FRu@9^#~h}`1%B^n*wfM4h$RFux75|oZ`7HfzMQIX**Myhyhw&K^aX zpP@yz*ZCIlBCd$@7A^N^)Q4!C#%#*^Y(VYsk1#+;NtFl(jYr2AYn(QdpW zy_Z7G=r_7i^$MUto2uPz`lGO#oIHzZ_4GUGd~H{@grlGkGWN4{a~Q+-$CH~5s8K>X zySkC@L^!t0@LE&n!L3ncGguMw8B~fVy%`(`{u(!{tq!?m*FuE?iclE_6l*R*#%nN6wr^a+reZRMi=cMrKuu1eq~}&ZP@#SsTQ9`aPu`w?MPq@}wwzy7B<2Vl3_QRWY$b9yp65*@D#S*!pdwRet3`1 zZ~n5bC(rxrs7l_0eyK{?7GzXp)m}}j-9x2e{_CTm<3J$X>CiMQIB+^kuML4=OW?V6 zlAXasZ6XoJ5&Og^G8rz-0%jKvX)|0)L45(n Cq%o}k literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc b/q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..ae6bee63e4c5728482486e6d823b942aafbc5030 GIT binary patch literal 3402 zcmd6pOK;mo5P-QPMN&^c;y7`WHf&l4P>@QFduRg`MT#U13NR7rpkxB zyEG~xJt@DUr(XL%`YZO@lm9|bogr;YmQz2Piz#qsx!j%I`8cbYFPqKUUw_@#9BsdyD=o3s*JiS5}%zZE-4)vFSXkwJ~x z6XMlbebAr|txj}kS6IF1vr)gYyr$Rk7Q97o$y;U%gDVqlurjzh(Y#f*IP-MvsYYwG z{!XKHW=st4Iwdc(c4Hs*r){^1a(-k&J_-bb_Cl7+IAYxAEXnqQcwdJ>(BGti4E!)= zK^mof=xFts?B#JB@V*$baC{pFbmJ^Y{UK*G3T2d~ex4Rn80~~&&$FN5>#fK81dN8b z{NaVGJcL_31HlSlo=yqX-)Wvf4Qhf0RMY}pp*D3uTeM1Rplw>G4bTp4(iZ3{U7(Ag zYjg?RTvkiy-s9QrhqyjoxU2*BBe=yT2&qXjA-|Eg+CZ1aTSCd2Hi2!x7G|D%`l>c5 zz9cMQZgVupZ4l#IPksd$l2I49`qS=+BA#-~fcR7G>hkD7T(wY2Ob)_ob<@ci*j?%;&ywE*yhEFT~bz~DJx|`Hi?)}){8=) z7HMY@8{PR}Vx!AR%pRRMo43GM?xOgBvw2|l?i{y^pUne9my@0ayMyd74LW`~7rm=Zf;qn>>ms$BIZ*%63su+EI$NxGX9i&*3bfKGxmUqAbTk5Q=D?4f#!& z$uW&^OvD^Z8jk;w{BsbV6^Rrodu5fil`?{K Date: Mon, 31 Dec 2018 23:09:16 +0000 Subject: [PATCH 3/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 176 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 1046 bytes q02_data_cleaning_all_2/build.py | 17 +++++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 182 bytes .../q02_test_data_cleaning_2.cpython-36.pyc | Bin 0 -> 4757 bytes 5 files changed, 17 insertions(+) create mode 100644 q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all_2/__pycache__/build.cpython-36.pyc create mode 100644 q02_data_cleaning_all_2/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_data_cleaning_all_2/tests/__pycache__/q02_test_data_cleaning_2.cpython-36.pyc diff --git a/q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..cd7452da1e90ed3e1d539c925bdfce1cb291c0b5 GIT binary patch literal 176 zcmXr!<>flEKr4m;2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU$Ocb`MIh3#rYYD zxdsN7`r-LS*~JBk$*KCu`6;RTIr-_C#U+`^@kOcWMXANbnfZC~1x5K;smUe!g$73P zDTyVC@yR)G6pt>(DRQ literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all_2/__pycache__/build.cpython-36.pyc b/q02_data_cleaning_all_2/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..9c746d3b44e807753f4f8fc11378e6ecaef6c798 GIT binary patch literal 1046 zcma)4PjAyO6t|N!X|s0S214S>iE?PmI3Z1FRX3qYV?r9zCTl42Vz*0i?96ed6}6{v z<-#}M$XD`})4l>Hp2I-fgbEx8W}*AQ)m; zAcAY{5g)WCg1kW**!g@B<`Ic7;&|3%!4)Pg-kQa%!NMyK?1;B&tl{)YNLEOjbjT{{ zk~J2w<|jnf89qe4)-}9^4tm&j7&SCW1*bBTQvkZEG9u$T(L7fdRD68mP7H*iGAT4? zS!yyRlSA4ytxWx8<8ruY?4b8gm!a`yKHLc(qbqke+(I>iZxGO1=zRMKfe$ad zg+B=(-}V6sUvtU0Cea(Jb;cQqcX;6-X-d-CWmQUDVx)7(#U$Cy3!&z4s`FN>f@?ER zMw-)iJ+ls8#8bvlT4R}bVo%YvXn}*CsUPkvOZSy9u&JGjdE2<(+jLuFuOA4 zCSg^cXS}qYENoDoYtxHtbetGXGigIGcxh}j{|$fv0P)A;eX=U6oa-!2eo?YG{f6{9 z6#54loB@kLsm^FV9KIYJDgB`=XvznvVjQ|T%}N6oHJ@r;mae0PRx_TO!TE4Axib_A z6(ZRjoK~4&{bFvrcfFfk*WNV{$Xmnkc`=Uh27ZL~1HgJ4HY})QwA4-5+6Hhg<~nxv z7#^QfqjHg*_W!}D|5r}^nvwQgq|yIJdY;^y@S8Zki_?TAv&4;btDbn5stsJDEk3q* uuG?@*cbr&t!sTA4S(p8m*Z_xZZsm$qg1>UH>k>6_6Sr|2O4J7HVek_Yh%$2k literal 0 HcmV?d00001 diff --git a/q02_data_cleaning_all_2/build.py b/q02_data_cleaning_all_2/build.py index e20ff7b..e7a6258 100644 --- a/q02_data_cleaning_all_2/build.py +++ b/q02_data_cleaning_all_2/build.py @@ -1,3 +1,4 @@ +# %load q02_data_cleaning_all_2/build.py # Default Imports import pandas as pd import numpy as np @@ -11,3 +12,19 @@ # Write your solution here : +def data_cleaning_2(X_train, X_test, y_train, y_test): + + CCL=['Gender', 'Married', 'Dependents', 'Education', 'Self_Employed', 'Property_Area'] + X_train=pd.get_dummies(X_train,columns=CCL, drop_first=True) + X_test=pd.get_dummies(X_test,columns=CCL, drop_first=True) + + numeric_column=['ApplicantIncome', 'CoapplicantIncome', 'LoanAmount'] + for c in numeric_column: + X_train[c] = np.sqrt(X_train[c]) + X_test[c] = np.sqrt(X_test[c]) + return X_train, X_test, y_train, y_test + +# data_cleaning_2(X_train, X_test, y_train, y_test) + + + diff --git a/q02_data_cleaning_all_2/tests/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all_2/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..ec956e4a9d160c0df71e553da2fa651cd046e7e3 GIT binary patch literal 182 zcmYL?F$w}P5Jj_KA;KO+3ujp?K^9M7V__o=baP(Q)e#`;OnM{TwrD6~kIUMqBorTQuB6eW+8(((XCrPNA9 z8s9S!-gN{Us89nH%hU-SyY4Z^cm0OF3suF5Dr^&ULeFK~=ByRGbUdh9YOrvx<9QBm zh&HSD&f_~3FK~Rj%^7v;p&R&i$B%#+E!V|MEAurzet2&{;L}#&9&0n7GCve{)ms0S z2W`f~u6>6y$NqsoclP? z2^b9-HG$kt3kfnW&@1Kx_a*Z|D``9f?Kn1;c}EDK?f#37B z*Pbv4+wnYmw-N#;B6^D2p(eZKc2}OA_P`zwY8^Tza1ct$Aidow9G7PUOiTd+MN@DV zl;jk|6M(KfraM&|q@Y#r`j~0T_MDCvnqb@=CQKTbeh`{1C#>(AjfnTj7Nyj|9Pm6~ zl~fKPMd3>*kn&ipfF{pO9mWt)Y(tZn1_Crxk4?kq{V@w@K^Vp&7EDmU0KpVPwV7&a z%`_#Uj)s{qJGIvP=70jQZ!_$+nYkBmle4hH{g@Ba73Q6__EU=0T2?*~owGXcaYou#0eG^Zf+b!NrHN zK%h(DEXvF#GSi38zcDlX0-(s;n3(D!K`b$%>gRwrqGs*@mIPXmo55q~zyQ~RZ;2Zt z3g6JPBbd23E4&W}1de(m!OM+#1N#BYqO5Ra1#{M0VkJ9b1SK@1(Pbad%PYIH@dN~bM7Uh_xkT^b$V z4bgZwj$fvqcU+G~dr<2x>>0aG7_>b1d3nZGvOIMwS&os?fNI@2K2p^_bSN>z!R5cq zxIUgrgwZC=GT=mk+IRwyjSeVqHw$M4aNr=x6G^&}+wjOpaP!E|V^<2XU&kq&U&MM` n(eaN_R8b(8(@2)a&3HDy1m{)+LK>tny3`zK2H7B6 Date: Mon, 31 Dec 2018 23:10:56 +0000 Subject: [PATCH 4/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 176 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 1206 bytes q03_logistic_regression/build.py | 16 ++++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 182 bytes .../test_q03_logistic_regression.cpython-36.pyc | Bin 0 -> 2296 bytes 5 files changed, 16 insertions(+) create mode 100644 q03_logistic_regression/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_logistic_regression/__pycache__/build.cpython-36.pyc create mode 100644 q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_logistic_regression/tests/__pycache__/test_q03_logistic_regression.cpython-36.pyc diff --git a/q03_logistic_regression/__pycache__/__init__.cpython-36.pyc b/q03_logistic_regression/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..41652e9e3875daa3a973085152d1dffc65e26199 GIT binary patch literal 176 zcmXr!<>flEKr4m;2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU$Ocb`MIh3#rYYD zxdsN7`r-LS*~JBk$*KCu`6;RTIr-_C#U+`^@kOcWMXANbnfZC~1x5K;smUe!g$Bm) iSmgEN<1_OzOXB183My}L*yQG?l;)(`fvhbCVg>*L+Awqg literal 0 HcmV?d00001 diff --git a/q03_logistic_regression/__pycache__/build.cpython-36.pyc b/q03_logistic_regression/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..e49c76efdd9fdb98ae28c3b43292dbae5b242b99 GIT binary patch literal 1206 zcmbtTyKdVs6eaccE6&4q(zTmA*lscvD2fJ2hX6r_W@tbJ5Ezkhlu)8V$w6HxllmhC zy7ZU0b_%+6?9@xuMw1{zflA=j(Ye&+<>Apzr_=oT<;Cd_2chri-sJ&)3nTvufgy$k zA{d^Quo9ct*l@OR5|_9&c7&Js#ILa{f}}wjHTFa^X^~cqebG)jq=OO1mn$r&FzNE{ zy7FiDPs@4_wRMK!-w{yLM$qo ze_Fr$uS((eqLy!J1&UJ^8h1Bp^P7dW!<5W4KGArtx-d(vny_ZVx(P<|+64E)05~1I b203SfzcK#Hw;%+#{r83gYvTa-@WA~ILrZ9~ literal 0 HcmV?d00001 diff --git a/q03_logistic_regression/build.py b/q03_logistic_regression/build.py index cdbd506..3c40150 100644 --- a/q03_logistic_regression/build.py +++ b/q03_logistic_regression/build.py @@ -1,3 +1,4 @@ +# %load q03_logistic_regression/build.py # Default Imports import pandas as pd from sklearn.preprocessing import StandardScaler @@ -16,3 +17,18 @@ # Write your solution code here: +def logistic_regression(X_train,X_test,y_train,y_test): + + scale = StandardScaler() + scale.fit(X_train[['ApplicantIncome','CoapplicantIncome','LoanAmount']]) + + log_reg = LogisticRegression() + log_reg.fit(X_train,y_train) + + y_pred = log_reg.predict(X_test) + conf_matrix = confusion_matrix(y_test,y_pred) + + return conf_matrix +# logistic_regression(X_train,X_test,y_train,y_test) + + diff --git a/q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc b/q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..131f5101045a18595d6f14ea55d20726bf51ca44 GIT binary patch literal 182 zcmXr!<>flEKr4m;2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU&;Cz`MIh3#rYYD zxdsN7`r-LS*~JBk$*KCu`6;RTIr-_C#U+`^@kOcWMXANbnfZC~1x5K;smUe!g$Bm) oSmgCfQj1H9_2c6+^D;}~XGkzA0HpL+s!|I{p$G7x@G-k z%{=gJJ%y%!2f-~)q(w>D+th~MmQLbQm*AKqYe}8fOWl=?#G_uR*W^Odq)pK4ydf8p z7HySwPqvc|?GQ_l!4hAX5V|au2lsfBFHUUGn_{`N)v-UW)BE%RU7-)@DqRzvSP>7! zs#u%2$L`eHy0+3!o?E=d+wUyi7VgBM>zsUV1)U3s!#WB`;r$@A*<)IO-sa4(Fp`3$ zaoPvN(wrgOK~t6+84DFEk!0sgUfAFW>I=?m^pwrguOX%a95Ag}k)}wsGDP zPS&jnECvhBe4p5>*2KX~!ZPlWLU$J~i18QuZy;nNxDV0iiAat1H~E(TJU$mGXo0J6 zJ=FkFEHbTyGW%yalZ7Ki8rX%ag*+)-#O^msEyJ|GU-wS4MD%oa%98Ev-QJIx`dJTI zBzjTC1pxbA5&-9H0Nd!DZ9fig8SfduMVB(XV@h{8DmHN1ZU2YU;O@f)HAZeZ9vMHm z1MlvK9nGZ#9hNEi9F*CVR0+YuH-+Chx^Q6Dcz23C7bh&2#s{Y6Li;@P)6Dn@GtsHv zFY_=zBXF*BqFUf9uvG^-wS)pwP>Fk>6<^*N%B54i2Gc4?2tcy?(U4sEnIeMh!eUe+ z@);;VPN1o=2M#C3MZ(U|(LNd75rwB&t)N&(fw`FBf0}!6sN1=)jiwZsd#a9JB3Wj?yEeOT;Y+Y`~S;RxO3?XIYFQO zdtZ;j8~5R*pBe^RtM*sc_ePxJ1!&6hLOmrI5Am{FDDOg~JltF=8y4h6K}NLkA~cG{ wDXoJ7aM8x-$^Z)DhrB9bzAY<-_jQ%lZxLpV$%E98*38=k-6Jbxm2~WX0O;730ssI2 literal 0 HcmV?d00001