# データの読み込み
# Read the raw train/test CSVs from the `Input` directory (defined elsewhere
# in this file).
train = pd.read_csv(os.path.join(Input, "train.csv"))
test = pd.read_csv(os.path.join(Input, "test.csv"))

# Stack both splits into one frame, tagging every row with its origin in the
# "ind" column so the splits can be recovered after the shared preprocessing.
df_data = pd.concat(
    [train.assign(ind="train"), test.assign(ind="test")], sort=False
)
df_data["date_time"] = pd.to_datetime(df_data["date_time"])
df_data = df_data.set_index("date_time")

# Recover the splits from the combined frame. A non-inplace drop() returns a
# fresh frame, which avoids the SettingWithCopyWarning that an in-place drop on
# a boolean-mask selection raises.
# The original bare `df_data.reset_index()` call discarded its result (a no-op)
# and is removed; df_data deliberately stays indexed by date_time because the
# later code slices it with date strings.
train = df_data[df_data["ind"].eq("train")].drop(columns=["ind"])
test = df_data[df_data["ind"].eq("test")].drop(columns=["ind"])

# Feature lists per target.
# The original wrote `not in ('target_carbon_monoxide')`; without a trailing
# comma that is a plain string, so `not in` was a substring test rather than a
# membership test. An explicit inequality expresses the intended exclusion.
# NOTE(review): CO_features still contains the other two target columns, unlike
# the benzene/NOx lists which exclude all three - confirm this is intentional.
CO_features = [
    feature for feature in train.columns if feature != "target_carbon_monoxide"
]
benzene_features = [
    feature
    for feature in train.columns
    if feature
    not in ("target_benzene", "target_carbon_monoxide", "target_nitrogen_oxides")
]
# Same columns as benzene_features; kept as an independent list object.
NOx_features = list(benzene_features)
# 学習データを2010-03-10 18:00:00〜2010-12-31 23:00:00の期間とし、X*_train / y*_train に入力する
# Per-target feature matrices (X*) and target series (y*) taken from `train`;
# copies are made so later edits do not touch `train` itself.
X1, y1 = train[CO_features].copy(), train["target_carbon_monoxide"].copy()
X2, y2 = train[benzene_features].copy(), train["target_benzene"].copy()
X3, y3 = train[NOx_features].copy(), train["target_nitrogen_oxides"].copy()

# Training window, expressed once as a label slice over the date_time index
# (label slices include both endpoints).
train_period = slice("2010-03-10 18:00:00", "2010-12-31 23:00:00")

X1_train, y1_train = X1[train_period], y1[train_period]
X2_train, y2_train = X2[train_period], y2[train_period]
X3_train, y3_train = X3[train_period], y3[train_period]
# 検証データを2011-01-01 00:00:00以降とし、X*_valid / y*_valid に入力する
# Validation window: every row from this timestamp to the end of the frames
# currently bound to X1..y3 (open-ended label slice on the date_time index).
valid_period = slice("2011-01-01 00:00:00", None)

X1_valid, y1_valid = X1[valid_period], y1[valid_period]
X2_valid, y2_valid = X2[valid_period], y2[valid_period]
X3_valid, y3_valid = X3[valid_period], y3[valid_period]
# testデータを2011-01-01 01:00:00以降とし、X*_test / y*_test に入力する
# Rebind X1..y3 to the combined train+test frame (df_data); from here on these
# names no longer refer to the train-only copies.
X1, y1 = df_data[CO_features].copy(), df_data["target_carbon_monoxide"].copy()
X2, y2 = df_data[benzene_features].copy(), df_data["target_benzene"].copy()
X3, y3 = df_data[NOx_features].copy(), df_data["target_nitrogen_oxides"].copy()

# Test window: every row of the combined frame from this timestamp onward.
# NOTE(review): rows are chosen by timestamp, not by the "ind" tag, so any test
# row stamped before 01:00 would be left out - confirm against the test CSV.
test_period = slice("2011-01-01 01:00:00", None)

X1_test, y1_test = X1[test_period], y1[test_period]
X2_test, y2_test = X2[test_period], y2[test_period]
X3_test, y3_test = X3[test_period], y3[test_period]