From 63e18301e624826e1436e82d4af48366707f52ed Mon Sep 17 00:00:00 2001 From: nemkothari Date: Sun, 12 Aug 2018 18:34:07 +0000 Subject: [PATCH 1/5] Done --- __pycache__/__init__.cpython-36.pyc | Bin 165 -> 148 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 179 -> 162 bytes .../__pycache__/build.cpython-36.pyc | Bin 568 -> 446 bytes q01_load_data/build.py | 11 +++++++++-- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 185 -> 168 bytes .../tests/__pycache__/tests.cpython-36.pyc | Bin 1577 -> 1560 bytes 6 files changed, 9 insertions(+), 2 deletions(-) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index b4b72099455159189764a0ad76aa1fabbc62e96a..991934475fd6f193f4bbfed7a3794f6d16abd0dd 100644 GIT binary patch delta 52 zcmZ3=IE9hJn3tC;w6-96B8RzxqkcwyZmND>YHoIZNk(E(rha&SQFd`bVsff}a(+tc H!~#YHoIZNk(E(rha&SQFd`bVsff}a(+tc H!~$mksx%R} delta 69 zcmZ3)xS5f|n3tDJb=ID!i5%vJ3HqVMsYS*5iAfom#TlvD#idC_iMfe+nTdJ&E~&-Y YCHV#V`30$Y@dZWsS*gh-#S`P50V>oP6951J diff --git a/q01_load_data/__pycache__/build.cpython-36.pyc b/q01_load_data/__pycache__/build.cpython-36.pyc index e27baf631ae2be11ac2de9e6f21754e2497753d8..ec61f07a0b9088c57c6b995a105a71a1dc32712e 100644 GIT binary patch delta 255 zcmdnNvX7b5n3tEUtF|Ee=R{6_St|wxh7yJ>#u|oZ##+W2#w?~3#uTPZ#uVmWM#hQN zwvth-!6k_$skc~*L6j!rE%xO6oYLI9;>kUXG9FP}MX8A?@u?NbsX4dUic<3ub5k{$ zZm|?3mSo&wN=aMEP{aeY;g^qoMt*LpeqL&Bc791lVo|1kcz#iKaY15os(x~QO6p{7 zM!iJdLIcD2oP3~pDTyVCEI@t596*ABiHlKyQHH6A56ISJzQtCMn3s}RTm+H>i-D~` aB6xukw>WHa^HWN5Qtg<4ykZc+!2|&A?nGAr delta 365 zcmYjNF;2rU6t$BE(uxi&NJy2CV9L^fIua@d#0UdoL7?b2Hngb|8#@sN6)}_xR6PJQ zH()?qfE)M#9D<4OcEQqn{_p?y?QehiAB|?O-EI|cpI1Ng=K0<+A*3QXost=Src=u3 zHpxBaG5-}aPABvF=*0%6f{JGp?QXf<;R0boq$$bC3}r;mB5DI6AGpSVPTq+Qu>N}! zUmC7W41?jw4Efm90}Ta~BPin&ZpM{Vu~fWFm6kcrDibRx8JP609P#y@7I>``6$erd^i}lR~mu@V@&L;~|Cq9}Yxd7XSbN diff --git a/q01_load_data/build.py b/q01_load_data/build.py index 69d7209..dc3c28f 100644 --- a/q01_load_data/build.py +++ b/q01_load_data/build.py @@ -1,5 +1,12 @@ +# %load q01_load_data/build.py import pandas as pd - def q01_load_data(path): - "write your solution here" + 'write your solution here' + df= pd.read_excel(path) + df.rename(columns={'State':'state'}) + df['total']= df['Jan'] + df['Feb'] + df['Mar'] + + return df + + diff --git a/q01_load_data/tests/__pycache__/__init__.cpython-36.pyc b/q01_load_data/tests/__pycache__/__init__.cpython-36.pyc index 2a2dfc72b54611f7a4f5a7734a9c697f606c0089..abb4e899c1d88274bf060557294718c6cdeab7ba 100644 GIT binary patch delta 52 zcmdnVxPpYHoIZNk(E(rha&SQFd`bVsff}a(+tc H!~#zMwt^A{ delta 69 zcmZ3%xRa5?n3tD}ZT6n1i5%vJY5JkXsYS*5iAfom#TlvD#idC_iMfe+nTdJ&E~&-Y YCHV#V`30$Y@dZWsS*gh-#S`N_0Vp{c4FCWD diff --git a/q01_load_data/tests/__pycache__/tests.cpython-36.pyc b/q01_load_data/tests/__pycache__/tests.cpython-36.pyc index 76e04c8a5e2c476c2fba795d8bae25fd09cc88ed..5763a0b8f29a54af22247953c38d31008e842eb4 100644 GIT binary patch delta 55 zcmZ3nA2AR#B cXP4v`=;s%t=EWBj Date: Mon, 13 Aug 2018 18:47:08 +0000 Subject: [PATCH 2/5] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 180 -> 163 bytes .../__pycache__/build.cpython-36.pyc | Bin 626 -> 625 bytes q02_append_row/build.py | 13 +++++++++++-- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 186 -> 169 bytes .../tests/__pycache__/tests.cpython-36.pyc | Bin 1355 -> 1338 bytes 5 files changed, 11 insertions(+), 2 deletions(-) diff --git a/q02_append_row/__pycache__/__init__.cpython-36.pyc b/q02_append_row/__pycache__/__init__.cpython-36.pyc index de0cf6163be25541da218f6f8a0c4d005729c09c..d366be243ff8494cb23462e1bca19f840302ff78 100644 GIT binary patch delta 52 zcmdnOxR{Z{n3tC;w6-96B8Ry`fPO}PZmND>YHoIZNk(E(rha&SQFd`bVsff}a(+tc H!~z!ps=g7t delta 69 zcmZ3?xP_6!n3tE!c-Ee%i5%vJiTa_%sYS*5iAfom#TlvD#idC_iMfe+nTdJ&E~&-Y YCHV#V`30$Y@dZWsS*gh-#S`OQ04~`XB>(^b diff --git a/q02_append_row/__pycache__/build.cpython-36.pyc b/q02_append_row/__pycache__/build.cpython-36.pyc index 508826776138177582df97d666bb284c1e1484b0..9537b191fdbcf43bb13174d58ecf6fba9fb36c73 100644 GIT binary patch delta 314 zcmYk1u}Z{16h$+WY%&|NvWoShc4-V^D>jOtpp6ScEW(hPnCxa|;v~TZ6YT7^2n+s$ zzhgO_pP-dkIY}iCF7F-gz3{%RFUviiOx)SW<9!P|_ZeJuuZIWbV$^_zP3$#jO}#md zNgRUKu(cZN*6_zS-RJDZ2g->>UNc_KeGq!t0~eA;87Fk*BMA+|P-a;(1q-6a=eWWb z5;Lm6Jai--Y!dY*8y5xT#2+cEz*QO|l0-?yaUME49!c>O+8Pa2BzZUFRHuITu7gxC z8gR;%qDryMf;%CXWr1TF#DdVx8#vqdwAFwJ?1HU+Ou3_P-%)mfIl-lLH$UL=sE0%A YKiSqyp%W%Zozv6)o6^>Tz!ZA$54d?(u>b%7 delta 320 zcmYj~y-ve06oq3aP12}^RssnY$eN)keDe08Hil$5VwhK*@?P4EcD&CAgU%sVR^yV!e$PtMA@ zup<9qZz*X-!h2rJQ1PO!C}&|#BxyDW&(jDbJ$lQyBq?Q>+(oX0mSt&M)uo04>+S?q z=uD!LXfV|-5`r)sb+jW;m1~Hz#51p{Cdw8`$@Ce5r_3F`DI6 zVVs5~xkbF*VDiyawxZAG5=rAw<3;JLOY?+Zm<04PH0x^t~ i?6zOv{P;KgYx*YxlWBika$FbW6d0#mBR&|wp8W&Q8(!G} diff --git a/q02_append_row/build.py b/q02_append_row/build.py index af3701d..ba4df74 100644 --- a/q02_append_row/build.py +++ b/q02_append_row/build.py @@ -1,11 +1,20 @@ +# %load q02_append_row/build.py import pandas as pd import sys, os #sys.path.append(os.path.join(os.path.dirname(os.curdir))) from greyatomlib.pandas_guided_project.q01_load_data.build import q01_load_data - def q02_append_row(path): - "write your solution here" + #'write your solution here' + df_final =q01_load_data(path) + sum_row=df_final[['Jan','Feb','Mar','total']].sum() + df_sum=pd.DataFrame(data=sum_row).T + df_sum=df_sum.reindex(columns=df_final.columns) + df=df_final.append(df_sum,ignore_index=True) + #df_final.sum(numeric_only=True) + #df_final.append(df_final.sum(numeric_only=True).T, ignore_index=True) + return df + diff --git a/q02_append_row/tests/__pycache__/__init__.cpython-36.pyc b/q02_append_row/tests/__pycache__/__init__.cpython-36.pyc index dab3ecac755f4882f0d0d63dd70ab57f6fb428f8..f9ca2d88d4563e31e6568a32b0739840fa001436 100644 GIT binary patch delta 52 zcmdnRxRQ~>n3tC;w6-96B8Ry`n0`inZmND>YHoIZNk(E(rha&SQFd`bVsff}a(+tc H!~!n>t@;tv delta 69 zcmZ3H49?sYS*5iAfom#TlvD#idC_iMfe+nTdJ&E~&-Y YCHV#V`30$Y@dZWsS*gh-#S`Pb078KoegFUf diff --git a/q02_append_row/tests/__pycache__/tests.cpython-36.pyc b/q02_append_row/tests/__pycache__/tests.cpython-36.pyc index 742ee79571b722fe1fcab2f42f1dbcae23a14bd1..3041098423077cdedb0ebbeccd70db318d6434f5 100644 GIT binary patch delta 55 zcmX@jwTp|xn3tC;w6-96Bga`rg<$=R{M=Oiywu$6{F02sqD=kp{G#mQg2d!h{p9?V K)Xi*6uFL@Y*%EXB delta 72 zcmdnRb()LAn3tDJY{8zWjT~ng4O8?(i&Kk=^%IjaGK(`(vx`fUiV|}Z^D-0j^j%Vm cvrF;|^z#c+^WqDN^0QKtONuvtWprf*0G;$2#Q*>R From 6276af051b545a0767ad9551c2205c33cb5763f8 Mon Sep 17 00:00:00 2001 From: nemkothari Date: Tue, 21 Aug 2018 20:00:57 +0000 Subject: [PATCH 3/5] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 182 -> 165 bytes .../__pycache__/build.cpython-36.pyc | Bin 888 -> 679 bytes q03_scrape_clean/build.py | 15 +++++++++++++-- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 188 -> 171 bytes .../tests/__pycache__/tests.cpython-36.pyc | Bin 1396 -> 1379 bytes 5 files changed, 13 insertions(+), 2 deletions(-) diff --git a/q03_scrape_clean/__pycache__/__init__.cpython-36.pyc b/q03_scrape_clean/__pycache__/__init__.cpython-36.pyc index e99e1734469b0d74feccbb92229a5c70c95d8904..79fddca935afd2d582670a303a5633ec5740f3e1 100644 GIT binary patch delta 52 zcmdnSxRjB@n3tC;w6-96B8Ry`kbXvfZmND>YHoIZNk(E(rha&SQFd`bVsff}a(+tc H!~!<}tI`p~ delta 69 zcmZ3=xQ&s+n3tE!a@L-xi5%vJ$@-zisYS*5iAfom#TlvD#idC_iMfe+nTdJ&E~&-Y YCHV#V`30$Y@dZWsS*gh-#S`P*05Q86GXMYp diff --git a/q03_scrape_clean/__pycache__/build.cpython-36.pyc b/q03_scrape_clean/__pycache__/build.cpython-36.pyc index cdec2c4c90379271521fc76a792f2606530a2690..a0f8e1f142f090a2e530c64911a9e3230b9b0140 100644 GIT binary patch literal 679 zcmZ8ev5wR*5Vaj|lHFsE6%rCOXxlUdbS*-M=qQfjKuDnoCNq1RY!c^eM{p=tEtGr+ zzvPzc#2-*G$s%#Wmfw3blgt|@C(Gqxr-%2yIAcHAttCmH(y^}yfB~;r#wQk;m^jFS ziDf2HRI@6?fH0acCY!B>_ofSJcLc-DOB^~>Lz_E%uQ3V6r z^GfddH6J+ehwNGmf;zEpf^;whK<<;41Nlx*%m!J7!we+Mz6;LA2ttTT{x3rl#AjwS zzd0IVRBsaDqe9nx)7mU5+pbmxetGb=Egi!8+$o24tvBlz4Vto0+5JQ1P|%yd=_K-^ zgKTb4LB4fO?PG(NJz8gdaDmQCho4<0%UTycG}x*JlhDgfxh;Lk%~LO6lZCL!Tl|#G ziMP}VjSmm}gPA1_`}=je)eWXCHaqRM%9QClZFaV!nbSf8rk!d*+5Dm}0U_^i<$iHg-k8_&px;JG2-4n6$Y|x#Y-)2MaT!&N4Hs795Z7#m^cIeT~lrMK&gg`HCiZ GB>n(CL$PlF literal 888 zcmZWn&2H2%5Vn(SHccto6KW-dB5svX1L}2Ef#AfUm#UY&EZ)qtn>2}C+W~g9J#FE} zgYXVKiLXdVeE=>!G0yT+l|=J-G9G{P%{YfUJL%}hx5-b=*mrj4iO7FRX5JD2175QU z@7G`w^lLZ?`!$+G7*vBQ#*lE>V?wyK=Kkdj0tm0!Bn5uL_M;o(W5)&6>z|NtK=zu< zd?v80;w!f1SKJ0wxZ+i`=D_#ZRj{Hep6e5t$FtyfH12o!zbHgsIOPuh&xLr8RYMp; za!oa=#FENY0P&a+M+)@C$s?WVa`%HSEoKYZ>CDKwv!!gaIcn5i`^`4N@jiFMg7%u$ z-1z8n_q3%$keygz(PZ*0d)1&W3-PyMpXQrBAu|sMR;;4&La_E_!{b|?Ip%pas#+9C zF8}zI=`BjVeV3ma)Fv0Rd1>Z&VY-3LTI z!k=({`TTHd3M~{)iyG3iEz{+a($=J2cj~@EolR6u2#o0;Y4@)P8QQ#n!s0BsLdoY(;}^Ae5>XE*8cv z6uMZ>d><~ha_U(_7k0Y#)JDnHApL`9FZ$VRASJYHoIZNk(E(rha&SQFd`bVsff}a(+tc H!~!1xuMQF1 delta 69 zcmZ3@xQCI$n3tF9*up(g6FJNcGxbA@Q;UlA6O%GBi!)NQi%XM=5_1#tG86OkT~dp) ZOY#f!^9xe*;tPuMvr>~wiYLbV003Ch8Q%Z^ diff --git a/q03_scrape_clean/tests/__pycache__/tests.cpython-36.pyc b/q03_scrape_clean/tests/__pycache__/tests.cpython-36.pyc index 8529c871c1d09e03d187c6dc0d0810c3df16d3e3..aaf0393f0b6a7ccf73d6cdfd949f333ae5b4f55c 100644 GIT binary patch delta 55 zcmeyu^_Yvpn3tC;w6-96BgYp;g;4#B{M=Oiywu$6{F02sqD=kp{G#mQg2d!h{p9?V K)Xlm~?#uubHWL^C delta 72 zcmaFN^@WSWn3tC;bkUxujT~PX4b${Pi&Kk=^%IjaGK(`(vx`fUiV|}Z^D-0j^j%Vm cvrF;|^z#c+^WqDN^0QKtONuwkFu5}W0LpC|s{jB1 From 986dfb9d5c8e5efd8827de24a579b63bbb95eb3d Mon Sep 17 00:00:00 2001 From: nemkothari Date: Wed, 22 Aug 2018 19:24:21 +0000 Subject: [PATCH 4/5] Done --- .../__pycache__/build.cpython-36.pyc | Bin 446 -> 446 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 177 -> 160 bytes q04_mapping/__pycache__/build.cpython-36.pyc | Bin 877 -> 635 bytes q04_mapping/build.py | 13 ++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 183 -> 166 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1685 -> 1668 bytes 6 files changed, 12 insertions(+), 1 deletion(-) diff --git a/q01_load_data/__pycache__/build.cpython-36.pyc b/q01_load_data/__pycache__/build.cpython-36.pyc index ec61f07a0b9088c57c6b995a105a71a1dc32712e..1cc8f40a2580accb032213e3c600cb8d483e8eb2 100644 GIT binary patch delta 90 zcmdnTypNgHn3tDp?nKr{jJGDfP-5hr%*|Nj$j`vQpvioTtspTkC9$}O1IR4`i52mp a5_~}JEe@O9{FKt1R68ahuNXvdFaZGG>JqmA delta 90 zcmdnTypNgHn3tEUYa;6-#;A!elo)v?b2An>@-Z+lXfoeoD@e>sNh~hn0CI~!VnsZt Z1TT<#i^C>2KczG$)s6|sD+Uo9OaQU45*+{l diff --git a/q04_mapping/__pycache__/__init__.cpython-36.pyc b/q04_mapping/__pycache__/__init__.cpython-36.pyc index ee0618f2c89597e870d478c12dab4aec6d95e7c7..a7e56715249651e2e03839c4128fc173930ee63b 100644 GIT binary patch delta 52 zcmdnUxPXzvn3tC;w6-96B8RzxuYN{;ZmND>YHoIZNk(E(rha&SQFd`bVsff}a(+tc H!~#bEsUQ)s delta 69 zcmZ3$xRH^=n3tE!W7eLii5%vJar&XfsYS*5iAfom#TlvD#idC_iMfe+nTdJ&E~&-Y YCHV#V`30$Y@dZWsS*gh-#S`Nl0WpplE&u=k diff --git a/q04_mapping/__pycache__/build.cpython-36.pyc b/q04_mapping/__pycache__/build.cpython-36.pyc index 8283165768b4bf279030f79c34448f8435bb4125..032325f610c79bbbb7a2665c43b32436db1a0b70 100644 GIT binary patch delta 427 zcmYjNyGjE=6rIQJW?f&wO1rcHA-+lph?N#1gdnU%n9NMfCc87^%qAG!kRr8(33umK+T<*E&z`6Ip{RqCi=x}{Kx_q5pzrm;IVdet>PFWyTwVXG59y zw}?&}S5gm+B9u3%WPI@gch6RD_l`P$o0alCYYqU6T!pX-H=wRMU0<<*B7za4LnkdZ t6JwDyu`foMnph;%;u|#&OYbuMA8eKj;c+I}DCJG$lqqkN*F&@he*nbRcrX9} literal 877 zcmZuv&2H2%5VoD)Zd+6#4n=^p*S%~?L5Rbu0>PQfs+VwxoY?IqP3+WmXj7%9?Ykfz z1Mv@+eep2#~E!~E?B1IRpHKeBLMh- z4*-1)!k_`I@hvg9A_E4?8$5=eqRKP=8dm`$%)5gK=UpI>{==TLou>*JEIA?8*;ndBqhN`1%`CuIS&NlT*!=PH4U= z^@?BUE?2anqNF1E$n}MhZ6cvxS*v8l3!{^k3PyEy-j$5A2X}IL^g3&xv!yss@~*7e zyzOngsA-ckdNOf*0O;n$R^WV5%YxSW1dL6bC8x{#5aO&)^IX|LyHaO+$~}}NEwi!W zlx2nfVneD;-*W3|1A%aL-P;|_O;!rVuWe*x#>&FjuoO_Cu|%}i6I56ac+LVFwA8F# zZq%`j*;#g03RYHoIZNk(E(rha&SQFd`bVsff}a(+tc H!~%B!tXvVu delta 69 zcmZ3+xSf&1n3tF9@$NlQ6FJNcQ}jcNQ;UlA6O%GBi!)NQi%XM=5_1#tG86OkT~dp) ZOY#f!^9xe*;tPuMvr>~wiYLaq0{~&`8Ug?S diff --git a/q04_mapping/tests/__pycache__/test.cpython-36.pyc b/q04_mapping/tests/__pycache__/test.cpython-36.pyc index 7f7c96e914a8d9dd0deb7c46cab1b7ff9ad3e05a..09edd36d348eb81bd414ebf171be66302470175a 100644 GIT binary patch delta 55 zcmbQr+rrCX%*)FaT3Zmkk>fd|g1>%7er~FMUTSW3eo01RQKo))eo=ODL1J>MesX?F K>ShI|QWgN}loD?M delta 72 zcmZqSoyyB$%*)H=vv*I_MvmuQb`iV&ynZ+5Y*~O(vMTxnId6|iM`Yx%( b*(Lb}`uPQ^dGQ5B`B|ySCB>WhnMzpzm$DiZ From 7e5cd85f583481d5aa80b37de2f6f167457e59d1 Mon Sep 17 00:00:00 2001 From: nemkothari Date: Mon, 27 Aug 2018 19:36:22 +0000 Subject: [PATCH 5/5] Done --- q04_mapping/__pycache__/build.cpython-36.pyc | Bin 635 -> 796 bytes q04_mapping/build.py | 13 ++++--- .../__pycache__/__init__.cpython-36.pyc | Bin 192 -> 175 bytes .../__pycache__/build.cpython-36.pyc | Bin 808 -> 1231 bytes q05_replace_missing_values/build.py | 35 ++++++++++++++++-- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 198 -> 181 bytes .../tests/__pycache__/tests.cpython-36.pyc | Bin 1741 -> 1724 bytes 7 files changed, 39 insertions(+), 9 deletions(-) diff --git a/q04_mapping/__pycache__/build.cpython-36.pyc b/q04_mapping/__pycache__/build.cpython-36.pyc index 032325f610c79bbbb7a2665c43b32436db1a0b70..0242141ce0daeb302dae378ae0ed7ac0ca3fcde4 100644 GIT binary patch delta 549 zcmY*WO=}x55S6sr53lXUDLus02ScFXLsCL-C4_`R4~4b|{q3AaLt+& z+-ncP^wvMnza;3XKcUB7I=iPsTdhM%reyWR}ikX1&O8cvnH zRZY!i`Dk6V7ie~YP?06A>5gt0daNesdFXjH13Dy2jwc%u@V>I8zav{-d%*ENxU2b& zBJs}&VgMmT&;brHcG`s=^l#!J*?P5y{XTdj*lfBvn&nBQVLYv5rR})59$#hJBuY-G z^OGF(+WEGL2`(24BSNWEvC1pQbD3!o*ve>K39gdr)8=irEHJql9klaa$=rD_^}>0t zrJ00|l^`OcCCqVp5w~6|l?bNzrnWA)mFY@b5mv<<619I$ACFqaQ1I)yN;OstGg+2N ze)EHvgZ)SP{z=@()4=&`epsc(A zZ@^3N0$y3@Gq7+*3~;CW?)y&mS)X6LFV^X`T8*=}<@qNN@mHUI>BD{5pKv7DzbtlMMf(?<_HjU0!voW zsUsZ0ge$x!2S`N)+agm|u@zW_FZzSJ3)`nL9SzqWu8SETkF{|WSCM0!EKiM>=GlCv zjJx33Tt=>;g@_wka*@cpRAzDT!_#tMyooBMuHRv2H_aqhXzMa5Q_TzG&(O_8UA+<= z){I{4`PM-bfj|Q@fHs7n+o+=r;}u*9Uh1HJq@$i4>hM2oqBOzLEEn@k_U-qS0fJo< H&?bBXC8k(o diff --git a/q04_mapping/build.py b/q04_mapping/build.py index da75afe..24c1c43 100644 --- a/q04_mapping/build.py +++ b/q04_mapping/build.py @@ -4,12 +4,16 @@ import numpy as np #sys.path.append(os.path.join(os.path.dirname(os.curdir))) from greyatomlib.pandas_guided_project.q02_append_row.build import q02_append_row +path1 = 'data/excel-comp-data.xlsx' +path2 = 'data/scraped.csv' + def q04_mapping(path1,path2): - df_clean = pd.read_excel(path1) df_scrap =pd.read_csv(path2) - mapping ={'United States of America':'US'} - df_clean.insert(loc=6, column='abbr' ,value ='nan') - df_clean['abbr'].map(mapping) + df_clean = pd.read_excel(path1) + mapping = pd.Series(df_scrap['US'].values,index=df_scrap['United States of America']).to_dict() + #df_clean.insert(loc=6, column='abbr' ,value ='nan') + df_clean['abbr'] = df_clean['state'].map(mapping) + df_clean = df_clean[['account','name','street','city','state','postal-code','abbr','Jan','Feb','Mar']] return df_clean @@ -18,4 +22,3 @@ def q04_mapping(path1,path2): - diff --git a/q05_replace_missing_values/__pycache__/__init__.cpython-36.pyc b/q05_replace_missing_values/__pycache__/__init__.cpython-36.pyc index f50c1d5e3fce9c03c9a40722e1899cfd21d8ee70..7f93d401d4782d582098b009a39e23015790a3f4 100644 GIT binary patch delta 52 zcmX@WxSo;2n3tC;w6-96B8Ry`jDALbZmND>YHoIZNk(E(rha&SQFd`bVsff}a(+tc H#DV|-u{IIx delta 69 zcmZ3_cz}_^n3tE!f7YI;i5%vJx%#2SsYS*5iAfom#TlvD#idC_iMfe+nTdJ&E~&-Y YCHV#V`30$Y@dZWsS*gh-#S`NL06s+-aR2}S diff --git a/q05_replace_missing_values/__pycache__/build.cpython-36.pyc b/q05_replace_missing_values/__pycache__/build.cpython-36.pyc index 6a32964667ab0d808d5677d1ae67893cfb4e2b10..862dea1a8bac42ed713648b87b1a50c58180faf3 100644 GIT binary patch literal 1231 zcmZ`&%WfMt6y;-PG#*(-8gvl{UKm9;T10Zw$0{gV6!0Q|g`!GOlwAy{A#IO5FO#EG zGREk_+2%jmU*fi_{6befq>D5uT8?;Mb48we&z;XFlkB%2UjO`SM93fHy~SXEgKfWu zP(;y+2pTjKJm^S7LB}G7W>r#;#E25bMXDmPr(%`7CL&WKl|qlzp30#26$>6xoLm7IaIQjbGnq1bex>dGxX=d##R_z3jC;ZqJXut+go&iQ3|_QF`lQ z>)*LZu2x2jWKp!6rgu>zYb_Gn8?Ad06=lD>8Fwvmec?(w{#-VWpX!z4XVOeZj&(|; zMoX2Wc98`uG)g2(T&b-~Udd{str+!fuF9f!yq4WGc5x^B%g^rBQ_ypshb{)Is5I^w zA+al)i{FWPfd2jY)BLin^}NybRoh=mQ_g>E&6VwBq30gmypxTRHow@EN~^px?OGT8 z{QBg}+~}@CT3(md;>7$O(|ollD>dtOZhU?6MgI47o;14;L1>2Oh&`l7)I5Y=P#?we z+VdQ^eGa211K7Qzie54EY48|4<~_v+lC$QMcR3NFryt~;s@UfY1RN#{k)3&%_;sb@ z4LZTjmLh$j8*Q!Dj=fk+x#M8T;0qzfPa2rz7}e0Id+`yXZoKI*pxW1KKSsc25Crw4 z*a(HluhXD-$Nzp4q8e+sf+UGtU@PPNeAR2Lej^c0&x1h5ayW#c8i>zc?OEp`MIjdPJ zmboa7^QzRxZJsO(yIdc3l+6v(f+xAX$=iuL3n=3L# z3tW?h$30-Yd&b{m0$}_NSzvIV_r_@B@sRhwdKleT2T=7NsxV8me)`eKT1-||VgyqO|iAQ_hz~mB)b#G^^*&cJLf_e3@NJ#R@utw+B5sg!E4CJ2H>p(m#vzgB8Z6 zY&w^AF0O1dHLPSxGL^m)_NuOQT4|v&ZK{RHYny7OIJ4QTkzDY*a(aF8GP~_>C#h!H z4J#U9(`h3Mp6Hc3`u|7mob~_$A`w0Udje(-A&-Zyx07^4a~i0o)GIRp#(8#S9jPom zof)xWbyXH}n*6iBWbfZfx`w))npV<`+R$osE7=Q=Tb2H+vf@o4USr5?yR<&;j2sXj G`}i-#^WbCv diff --git a/q05_replace_missing_values/build.py b/q05_replace_missing_values/build.py index 97d9755..18b7be0 100644 --- a/q05_replace_missing_values/build.py +++ b/q05_replace_missing_values/build.py @@ -1,13 +1,40 @@ +# %load q05_replace_missing_values/build.py import pandas as pd import numpy as np import sys import os #sys.path.append(os.path.join(os.path.dirname(os.curdir))) -from greyatomlib.pandas_guided_project.q04_mapping.build import q04_mapping - +from greyatomlib.pandas_guided_project.q02_append_row.build import q02_append_row path1 = 'data/excel-comp-data.xlsx' path2 = 'data/scraped.csv' -def q05_replace_missing_values(path1,path2): + +def q04_mapping(path1,path2): + df_scrap =pd.read_csv(path2) + df_clean = pd.read_excel(path1) + mapping = pd.Series(df_scrap['US'].values,index=df_scrap['United States of America']).to_dict() + #df_clean.insert(loc=6, column='abbr' ,value ='nan') + df_clean['abbr'] = df_clean['state'].map(mapping) + df_clean = df_clean[['account','name','street','city','state','postal-code','abbr','Jan','Feb','Mar']] + return df_clean + +def update_vals(row): + if str(row.state) == 'Mississipi' and str(row.abbr) == 'nan': + row.abbr = 'MS' + elif str(row.state) == 'Tenessee' and str(row.abbr) == 'nan' : + row.abbr = 'TN' + + return row + +def q05_replace_missing_values (path1,path2): + + df_final = q04_mapping(path1,path2) + df_final= df_final.apply(update_vals,axis=1) + return df_final + + + + + + -#print(q05_replace_missing_values(path1,path2).shape) \ No newline at end of file diff --git a/q05_replace_missing_values/tests/__pycache__/__init__.cpython-36.pyc b/q05_replace_missing_values/tests/__pycache__/__init__.cpython-36.pyc index 03391a7d73977c58beb60b2c9e2dcb47994c3aa6..6334cc15d0b5a314b359da3cb92c3863af077391 100644 GIT binary patch delta 52 zcmX@cxRsH^n3tC;w6-96B8Ry`l72>hZmND>YHoIZNk(E(rha&SQFd`bVsff}a(+tc H#DXvYv~m&z delta 69 zcmdnWc#M(5n3tC;e(#>Bi5%vJ#rmPesYS*5iAfom#TlvD#idC_iMfe+nTdJ&E~&-Y YCHV#V`30$Y@dZWsS*gh-#S`Ph08WG%yZ`_I diff --git a/q05_replace_missing_values/tests/__pycache__/tests.cpython-36.pyc b/q05_replace_missing_values/tests/__pycache__/tests.cpython-36.pyc index 3b9d62a38f2709ee27852c154007b83f7dde0610..dd327e6adc6d7e2607b1d8ad2a787908dd45a9b7 100644 GIT binary patch delta 55 zcmX@hyN8#MesX?F K>SlYUJ{ADtF%m}r delta 72 zcmdnPdzP2On3tDp?!G-y8#&mR3=8x_i&Kk=^%IjaGK(`(vx`fUiV|}Z^D-0j^j%Vm cvrF;|^z#c+^WqDN^0QKtONuw^G4-(k0G%8fJ^%m!