ad

yul19079 · Feb 2, 2024 · 6137c1b · 6137c1b
1 parent 9743440
commit 6137c1b
Show file tree

Hide file tree

Showing 37 changed files with 2,068 additions and 1,953 deletions.
diff --git a/GenDs2.py b/GenDs2.py
@@ -0,0 +1,99 @@
+# get data
+import pandas as pd
+import numpy as np
+import tensorflow as tf
+
+from sklearn.preprocessing import StandardScaler,MinMaxScaler
+raw_data = pd.read_pickle("./data/raw_feature.pkl")
+X_train = pd.read_pickle("./data/X_train.pkl")
+y_train = pd.read_pickle("./data/y_train.pkl")
+X_test = pd.read_pickle("./data/X_test.pkl")
+y_test = pd.read_pickle("./data/y_test.pkl")
+def apply_sin(X,axis,range):
+    """Apply sin function on some time features"""
+    X = X.copy()
+    X[:,axis,:] = np.sin(X[:,axis,:]*2*np.pi/range)
+    return X
+def apply_cos(X,axis,range):
+    """same for cos"""
+    X = X.copy()
+    X[:,axis,:] = np.cos(X[:,axis,:]*2*np.pi/range)
+    return X
+def create_rolling_window(matrix,t):
+    """This function is used for create X for lstm"""
+    matrix_shape = matrix.shape
+    return_length = matrix_shape[0] - t 
+    dataset = tf.data.Dataset.from_tensor_slices(matrix)
+    windows = dataset.window(t,shift = 1,drop_remainder=True)
+    windows = windows.take(return_length)
+    windows = windows.flat_map(lambda window: window.batch(t))
+
+
+    return windows
+def create_result_ds(matrix,delay):
+    """Creat Y target """
+    dataset = tf.data.Dataset.from_tensor_slices(matrix)
+    dataset = dataset.skip(delay)
+    return dataset
+
+
+def combine_ds(X_train,ds1,ds2):
+    """zip two dataset and returns a batch dataset"""
+    combined_ds = tf.data.Dataset.zip(((X_train,ds1),ds2))
+    combined_ds = combined_ds.batch(batch_size=32)
+    return combined_ds
+def gen_train_ds(X_train,y_train,step_len):
+
+    X = create_rolling_window(y_train,step_len)
+    X_train_ds = create_result_ds(X_train,step_len)
+    y = create_result_ds(y_train,step_len)
+
+    train_ds = combine_ds(X_train_ds,X,y)
+    return train_ds
+
+def gen_test_ds(X_test,y_test,step_len):
+
+    X = create_rolling_window(y_test,step_len)
+    y = create_result_ds(y_test,step_len)
+    X_test_ds = create_result_ds(X_test,step_len)
+
+    test_ds = combine_ds(X_test_ds,X,y)
+    return test_ds
+
+# preprocess data
+"""Normalize the original data"""
+std = StandardScaler()
+
+train_shape = y_train.shape
+test_shape = y_test.shape
+y_train = std.fit_transform(np.reshape(y_train,(-1,y_train.shape[-2]*y_train.shape[-1])))
+y_train = y_train.reshape(train_shape)
+y_test = std.transform(np.reshape(y_test,(-1,y_test.shape[-2]*y_test.shape[-1])))
+y_test = y_test.reshape(test_shape)
+
+
+X_train = X_train[:,1:,:].astype(np.float64)
+X_test = X_test[:,1:,:].astype(np.float64)
+
+X_train = apply_sin(X_train,2,24)
+X_train = apply_sin(X_test,2,24)
+
+
+X_train = X_train/X_train.max()
+X_test = X_test/X_test.max()
+
+
+
+
+# gen dataset
+time_step = 48
+train_ds = gen_train_ds(X_train,y_train,step_len=time_step)
+test_ds = gen_test_ds(X_test,y_test,step_len=time_step)
+
+class GenDs(object):
+    def gen_train(time_step = 48):
+        train_ds = gen_train_ds(X_train,y_train,step_len=time_step)
+        return train_ds,std
+    def gen_test(time_step = 48):
+        test_ds = gen_test_ds(X_test,y_test,step_len=time_step)
+        return test_ds
diff --git a/GenFeature.py b/GenFeature.py
@@ -0,0 +1,26 @@
+import pandas as pd
+import numpy as np
+spatio_data_file = "./data/SpatialFeatures.csv"
+raw_spatio_feature = pd.read_csv(spatio_data_file)
+def get_feauture_by_name(data,name):
+    feature = data[name]
+    feature = feature.fillna(0).to_numpy()
+    feature = feature/feature.max()
+    feature = feature.reshape(16,8)
+    feature = feature[::-1,:]
+    return feature
+
+def get_feature_list(data,name_list):
+    result_array = np.empty((len(name_list),16,8))
+    for i in range(len(name_list)):
+        result_array[i] = get_feauture_by_name(data,name_list[i])
+
+    return result_array
+
+
+feature_list = ["BikeLane_miles","AADT","Pop_Density","StationNum"]
+def gen_features(feature_list = feature_list):
+    feature_array = get_feature_list(raw_spatio_feature,feature_list)
+
+
+    return feature_array
diff --git a/ModelPerformance.py b/ModelPerformance.py
@@ -20,19 +20,25 @@ def compare_result(predict,real):
     # assert(np.array_equal(predict_flatten.reshape(original_shape), predict))
 
     print(mean_squared_error(predict_flatten,real_flatten))
+
+    return (mean_squared_error(predict_flatten,real_flatten))
 def plot_result(predict,real,batch =0,in_out = 0):
 
-    vmin = min(predict[batch].min(), real[batch].min())
-    vmax = max(predict[batch].max(), real[batch].max())
+    # vmin = min(predict[batch].min(), real[batch].min())
+    vmin = 0
+    vmax = max(predict[batch,in_out].max(), real[batch,in_out].max())
 
     cmap = 'viridis'
     fig, axs = plt.subplots(1, 3)
 
     axs[0].set_title("predict")
-    axs[0].imshow(predict[batch,in_out,:,:],cmap = cmap,vmin = vmin,vmax = vmax)
+    predict_fig = axs[0].imshow(predict[batch,in_out,:,:],cmap = cmap,vmin = vmin,vmax = vmax)
     axs[1].set_title("real")
-    axs[1].imshow(real[batch,in_out,:,:],cmap = cmap,vmin = vmin,vmax = vmax)
+    real_fig = axs[1].imshow(real[batch,in_out,:,:],cmap = cmap,vmin = vmin,vmax = vmax)
     axs[2].set_title("diff")
-    axs[2].imshow(np.abs(predict[batch,in_out,:,:] - real[batch,in_out,:,:]), cmap = cmap,vmin = vmin,vmax = vmax)
-
+    diff_matrix  = np.abs(predict[batch,in_out,:,:] - real[batch,in_out,:,:])
+    diff_fig = axs[2].imshow(diff_matrix, cmap = cmap,vmin = vmin,vmax = vmax)
+    plt.colorbar(predict_fig,ax=axs)
+    # plt.colorbar(real_fig,ax = axs)
+    print(diff_matrix.mean(),diff_matrix.shape)
     plt.show()
diff --git a/TrainingData.h5 b/TrainingData.h5
diff --git a/__pycache__/GenDs.cpython-310.pyc b/__pycache__/GenDs.cpython-310.pyc
diff --git a/__pycache__/GenDs.cpython-311.pyc b/__pycache__/GenDs.cpython-311.pyc
diff --git a/__pycache__/GenDs.cpython-38.pyc b/__pycache__/GenDs.cpython-38.pyc
diff --git a/__pycache__/GenDs2.cpython-311.pyc b/__pycache__/GenDs2.cpython-311.pyc
diff --git a/__pycache__/GenFeature.cpython-310.pyc b/__pycache__/GenFeature.cpython-310.pyc
diff --git a/__pycache__/GenFeature.cpython-311.pyc b/__pycache__/GenFeature.cpython-311.pyc
diff --git a/__pycache__/ModelPerformance.cpython-310.pyc b/__pycache__/ModelPerformance.cpython-310.pyc
diff --git a/__pycache__/ModelPerformance.cpython-311.pyc b/__pycache__/ModelPerformance.cpython-311.pyc
diff --git a/base.h5 b/base.h5
diff --git a/cnn.h5 b/cnn.h5