From d1001d2ea48a07fd89229bc95f869ed29f0416d2 Mon Sep 17 00:00:00 2001 From: nitikagoel01 Date: Tue, 4 Jul 2017 18:59:26 +0000 Subject: [PATCH] Done --- build.py | 21 ++++++++++++++------- build.pyc | Bin 0 -> 2055 bytes tests/__init__.pyc | Bin 0 -> 170 bytes tests/test_get_categorical_variables.pyc | Bin 0 -> 2751 bytes 4 files changed, 14 insertions(+), 7 deletions(-) create mode 100644 build.pyc create mode 100644 tests/__init__.pyc create mode 100644 tests/test_get_categorical_variables.pyc diff --git a/build.py b/build.py index 35cdd2a..dcda46c 100644 --- a/build.py +++ b/build.py @@ -1,25 +1,32 @@ +import pandas as pd + def get_categorical_variables(df): - return [] + categorical_data = list(df[['country', 'new_user', 'source', 'converted']]) + return categorical_data def get_numerical_variables(df): - return [] + numerical_data = list(df[['age', 'total_pages_visited']]) + return numerical_data def get_numerical_variables_percentile(df): - pass + return df.describe() def get_categorical_variables_modes(df): - pass - + return df[get_categorical_variables(df)].mode() def get_missing_values_count(df): - pass + return pd.DataFrame(df.isnull().sum()) def plot_histogram_with_numerical_values(df): - pass + plt.hist(df['age'], color='r', bins=50) + plt.hist(df['total_pages_visited'], color='b', bins=50) + plt.xlabel('age') + plt.ylabel('total_pages_visited') + plt.show() def plot_facet_box(df): diff --git a/build.pyc b/build.pyc new file mode 100644 index 0000000000000000000000000000000000000000..4a68884f1785c5454f8c620896f8eedff864bfc9 GIT binary patch literal 2055 zcmcgtO>fgc5M3uunik53KtK>572=Rf2yjLS3B-Xzkjw!A2W#!!I-731mUo@DQW1yp zSNR3}0C+QL)3j1=kT@QX*Xx~qGjE>Tzqhx3{QCAK7bm|Ku5WPqk1z`VNLV4hMnbj3 zPdF{1+U&H2irI;U>af!hs>@DSs10^DgzB-=qjf$FHnFDpgWouh;8LtE&bK)I4onc@ zh(jV6!l+mjvFIO1;(H{HXn_tUjl%|P?wT^xhoJ|*)ca}UbscCi@0vQ-fkNf3oMTk0 z0YwWjj5R(CC~hF5cEb%^av5~tYLiQwDjDPeV}gzU0B>YC^>7i;8&?i%tU08`ybhzRF;+dR4nrTy6*{D=5$CctGPByZ@zB#I zMf4zACWr<&LHFUTCa7qgOAWm}4rC=F+@i@Y08oWnpU#apr-?{tNlrpS`3%=!%4Vk5 zk$}61MF}{Iw}elXJb`~_0iUWyC&S-@19D7-I2K?6jgJ>~r5Bac_NuO14GqeFt_0V%%Ys&cYhkK!lKs_VmWhm28yi%*JA{{l$3p5JX2b5W#zFGPdR-p1@=gF&dhgR)_ucGTjOu$-9|(0eiv7f_eoNR82q2 z#p``MNB7gja&MNIAvsr9V{@ns?hjI12RH5r`mDLZD^t7Pz==yE14e?#iGULN3l|@` ne^8Oky)UTb6DkTRD2WP$kZmM{)$r80?QT0x_m+0!yO`Y<1tKad literal 0 HcmV?d00001 diff --git a/tests/test_get_categorical_variables.pyc b/tests/test_get_categorical_variables.pyc new file mode 100644 index 0000000000000000000000000000000000000000..9d085d73ea343615189666cf312ff46b51fd0f84 GIT binary patch literal 2751 zcmc&$OK;Oa5FR^^HatXmKg2^IBywp32W|))?#mpTgQ&P>msCbf2bnzTFK8IRXH-#4@4){oOCzI}i5E|I-o3)d$YZU~X$KagBx9LO+` zfO;r-D8rVdEg81Owq&a#wk==a(N%RxY**D~N#PL4D3G)xUq!x%yc_no#74i1<+Gpo z^#jcOGQ?}^{JL@WmAeLQZIBvo21!}$*ve&P5mR4F+>XDo=lsI@I5FOCmQ|LRJl-)? zX5Q!4O{3x3Pchs>2rCQ%F<>jhkdbkMNJ5>o84@iW?wgaYL>v7Mo=mt7k>Oa!a3us5 zAR3C!XP~nSy(KK>&gLU^^E6e~^>GmuF2ii_p&Z*mk@;-fY?d~^|6uU8thU|6Bo_Rpc3@Mp zIx4HxeX>_8@VZLIo%I8c%y25>xdE?DKKYw?8-3?{F;sU7LV}gxOmJTR4%7P*4*!K- zC5}+f5_cIo<0$H}J&?H#(!|lg<2 z$j1|lS}1&$TLrYw%4tC6PWM69Isg%c^QJ)cus|lM7SS{0>+{Nto8oAQ(1#aF#64{A zZ$!*Q&dhX7*M^g0VB{9wHMgeYF-`|}kd8}uWS@@c9933IbOBBVym(KUH;hynQa>=LkaTQ`K;4 zbXx)u!64e|C#Fb^(>lRnDKf%2r>>PXY0R%GTG?>5j2gcAo`puLJABlz@tC{Oh*yGB KVHe%|O!y0gCYad( literal 0 HcmV?d00001