Systematic loading and testing of individual files for the ASHRAE energy predictor competition.
%%time
# Build the `csvs` lookup once; the loading cells below index it by dataset
# name ('train', 'test', 'building', 'weather_train', 'weather_test').
# get_csvs() is defined elsewhere — presumably it maps names to CSV paths; confirm.
csvs = get_csvs()
Load the core of the training dataset (the meter readings).
%%time
df_meter_train = get_meter_data(csvs['train'], nrows=N_TRAIN)
display(df_meter_train.head(), df_meter_train.info())
%%time
df_meter_test = get_meter_data(csvs['test'], nrows=N_TEST)
display(df_meter_test.head(), df_meter_test.info())
# Inspect missing values in the training meter frame for 'meter_reading'.
# get_nan_stats() is defined elsewhere — presumably the second argument is a
# column name; confirm against the helper.
get_nan_stats(df_meter_train, 'meter_reading')
%%time
# Keep the result of show_nans() in a variable so later cells can reuse it,
# then echo it as the cell's final expression.
# show_nans() is defined elsewhere; its return type is not visible here.
meter_train_nans = show_nans(df_meter_train)
meter_train_nans
%%time
# Load the building table from the 'building' entry of `csvs` and preview
# its first rows. get_building_data() is defined elsewhere.
df_building = get_building_data(csvs['building'])
df_building.head()
%%time
# Load the training weather table from the 'weather_train' entry of `csvs`
# and preview its first rows. get_weather_data() is defined elsewhere.
df_weather_train = get_weather_data(csvs['weather_train'])
df_weather_train.head()
%%time
# Load the test weather table with the same helper used for the training weather.
# NOTE(review): unlike the train weather cell, no preview is displayed here —
# confirm whether a `.head()` was intended.
df_weather_test = get_weather_data(csvs['weather_test'])
%%time
# Load everything through the single load_all() entry point (defined elsewhere).
# Presumably this bundles the tables that the earlier cells load one by one —
# TODO confirm what structure `ashrae_data` has.
ashrae_data = load_all()