Case study of prediction performance in the Yangtze River Estuary

[1]:

import h5py
import scipy
import numpy as np
import torch

[2]:

def load(path):
    path = path + "/with_imputation"
    preds = []
    for i in range(10):
        preds.append(np.load(path+"/prediction_{}.npy".format(i)))
    return np.stack(preds, axis=1)

[3]:

base_dir = "../log_bak/prediction/Yangtze/"
prediction_xg_wo = torch.from_numpy(np.load(base_dir+"XGBoost/without_imputation/prediction_0.npy", allow_pickle=True))
prediction_our = torch.from_numpy(load(base_dir+"STIMP"))
prediction_predrnn_wo = torch.from_numpy(np.load(base_dir+"PredRNN/without_imputation/prediction_0.npy", allow_pickle=True))

[4]:

label = np.load("../data/Yangtze/trues.npy")
label_masks = np.load("../data/Yangtze/true_masks.npy")
index = [46*i for i in range(306//46)]
label_masks = label_masks.squeeze()
label = label.squeeze()
label = torch.from_numpy(label)
label_masks = torch.from_numpy(label_masks)
import pandas as pd
date = pd.date_range(start='2016-02-02', end='2022-02-10', freq='8D')

Fig 5f: Predicted Chl_a of XGBoost, STIMP and PredRNN at Position 1

[5]:

#XGBoost
from copy import deepcopy
import seaborn as sns
import matplotlib.pyplot as plt
n=500

index = [46*i for i in range(306//46)]
tmp  = deepcopy(label[index].reshape(276,-1))
tmp_mask  = deepcopy(label_masks[index].reshape(276,-1))
tmp[~tmp_mask.bool()]=np.nan
plt.scatter(date, tmp[:,n], c='red', s=10,label="Observed")

predict = deepcopy(prediction_xg_wo[index].reshape(276,1, 4572))
predict = predict[:,0,n]

plt.plot(date, predict, label="PredRNN")

# plt.legend()
plt.xticks(fontsize=16)
# plt.yticks([])
plt.ylim(-0.5,1.5)
plt.yticks([-0.4,0.4,1.4], fontsize=16)
plt.ylabel("Chl_a (Log(ug/L))", fontsize=20)
plt.show()

../../_images/analysis_Yangtze_13-prediction-yangtze-estuary-case-study_6_0.png

[7]:

#STIMP
plt.scatter(date, tmp[:,n], c='red', s=10,label="Observed")
predict = deepcopy(prediction_our[index].transpose(1,2).reshape(276,10,4572))
predict = predict[:,:,n]
mean = predict.mean(1)
std = predict.std(1)

plt.plot(date, mean, label="STImp")
plt.fill_between(date, mean-std, mean+std, alpha=0.3)

plt.xticks(fontsize=16)
# plt.yticks([])
plt.ylim(-0.5,1.5)
plt.yticks([-0.4,0.4,1.4], fontsize=16)
# plt.ylabel("Chl_a (Log(ug/L))", fontsize=20)
plt.show()

../../_images/analysis_Yangtze_13-prediction-yangtze-estuary-case-study_7_0.png

[6]:

#PredRNN
plt.scatter(date, tmp[:,n], c='red', s=10,label="Observed")
predict = deepcopy(prediction_predrnn_wo[index].reshape(276,4572))
predict = predict[:,n]
plt.plot(date, predict, label="STImp")

plt.xticks(fontsize=16)
# plt.yticks([])
plt.ylim(-0.5,1.5)
plt.yticks([-0.4,0.4,1.4], fontsize=16)
# plt.ylabel("Chl_a (Log(ug/L))", fontsize=20)
plt.show()

../../_images/analysis_Yangtze_13-prediction-yangtze-estuary-case-study_8_0.png

Fig 5f: Predicted Chl_a of XGBoost, STIMP and PredRNN at Position 2

[9]:

n=4000

index = [46*i for i in range(306//46)]
tmp  = deepcopy(label[index].reshape(276,-1))
tmp_mask  = deepcopy(label_masks[index].reshape(276,-1))
tmp[~tmp_mask.bool()]=np.nan
plt.scatter(date, tmp[:,n], c='red', s=10,label="Observed")

predict = deepcopy(prediction_xg_wo[index].reshape(276,1, 4572))
predict = predict[:,0,n]

plt.plot(date, predict, label="PredRNN")

# plt.legend()
plt.xticks(fontsize=16)
# plt.yticks([])
plt.ylim(-0.5,1.5)
plt.yticks([-0.4,0.4,1.4], fontsize=16)
plt.ylabel("Chl_a (Log(ug/L))", fontsize=20)
plt.show()

../../_images/analysis_Yangtze_13-prediction-yangtze-estuary-case-study_10_0.png

[10]:

#STIMP
plt.scatter(date, tmp[:,n], c='red', s=10,label="Observed")

predict = deepcopy(prediction_our[index].transpose(1,2).reshape(276,10,4572))
predict = predict[:,:,n]
mean = predict.mean(1)
std = predict.std(1)

plt.plot(date, mean, label="STImp")
plt.fill_between(date, mean-std, mean+std, alpha=0.3)

# plt.legend()
plt.xticks(fontsize=16)
# plt.yticks([])
plt.ylim(-0.5,1.5)
plt.yticks([-0.4,0.4,1.4], fontsize=16)
# plt.ylabel("Chl_a (Log(ug/L))", fontsize=20)
plt.show()

../../_images/analysis_Yangtze_13-prediction-yangtze-estuary-case-study_11_0.png

[11]:

#PredRNN
plt.scatter(date, tmp[:,n], c='red', s=10,label="Observed")

predict = deepcopy(prediction_predrnn_wo[index].reshape(276,4572))
predict = predict[:,n]

plt.plot(date, predict, label="STImp")

# plt.legend()
plt.xticks(fontsize=16)
# plt.yticks([])
plt.ylim(-0.5,1.5)
plt.yticks([-0.4,0.4,1.4], fontsize=16)
# plt.ylabel("Chl_a (Log(ug/L))", fontsize=20)
plt.show()

../../_images/analysis_Yangtze_13-prediction-yangtze-estuary-case-study_12_0.png