import pandas as pd
import numpy as np

# Default location of the German credit data set, relative to the working dir.
path = 'data/GermanData.csv'

# Names assigned, in order, to the 21 columns of the loaded file.
_COLUMN_NAMES = [
    'account_status',
    'month',
    'credit_history',
    'purpose',
    'credit_amount',
    'savings_account/bonds',
    'employment',
    'installment_rate',
    'personal_status/sex',
    'guarantors',
    'residence_since',
    'property',
    'age',
    'other_installment_plans',
    'housing',
    'number_of_existing_credits',
    'job',
    'liable',
    'telephone',
    'foreign_worker',
    'good/bad',
]


def q01_load_data_and_add_column_names(path=path):
    """Load the credit CSV, name its columns and recode the target column.

    Args:
        path: Location of the CSV file. Defaults to the module-level
            ``path`` constant so the function can still be called with no
            arguments, as it could before the parameter was introduced.

    Returns:
        A ``pandas.DataFrame`` whose columns are renamed to the 21 names in
        ``_COLUMN_NAMES`` and whose ``'good/bad'`` column holds ``0`` where
        the loaded value was ``1`` and ``1`` for every other value.

    Raises:
        ValueError: Propagated from pandas when the file does not contain
            exactly 21 columns (length mismatch on column assignment).
    """
    # NOTE(review): read_csv uses the first row of the file as a header, and
    # that header is then replaced below. If the file has no header row, the
    # first record is silently dropped -- confirm against the data file and
    # pass header=None if so.
    df = pd.read_csv(path)
    df.columns = _COLUMN_NAMES

    # Recode the target: original label 1 becomes 0, anything else becomes 1.
    df["good/bad"] = np.where(df["good/bad"] == 1, 0, 1)

    return df