forked from ML4ITS/mtad-gat-pytorch
mtad_gat.py
79 lines (66 loc) · 3.01 KB
import torch
import torch.nn as nn
from modules import (
    ConvLayer,
    FeatureAttentionLayer,
    TemporalAttentionLayer,
    GRULayer,
    Forecasting_Model,
    ReconstructionModel,
)


class MTAD_GAT(nn.Module):
    """MTAD-GAT model class.

    :param n_features: Number of input features
    :param window_size: Length of the input sequence
    :param out_dim: Number of features to output
    :param kernel_size: Size of kernel to use in the 1-D convolution
    :param feat_gat_embed_dim: Embedding dimension (output dimension of linear transformation)
           in feature-oriented GAT layer
    :param time_gat_embed_dim: Embedding dimension (output dimension of linear transformation)
           in time-oriented GAT layer
    :param use_gatv2: Whether to use the modified attention mechanism of GATv2 instead of standard GAT
    :param gru_n_layers: Number of layers in the GRU layer
    :param gru_hid_dim: Hidden dimension in the GRU layer
    :param forecast_n_layers: Number of layers in the FC-based Forecasting Model
    :param forecast_hid_dim: Hidden dimension in the FC-based Forecasting Model
    :param recon_n_layers: Number of layers in the GRU-based Reconstruction Model
    :param recon_hid_dim: Hidden dimension in the GRU-based Reconstruction Model
    :param dropout: Dropout rate
    :param alpha: Negative slope used in the LeakyReLU activation function
    """

    def __init__(
        self,
        n_features,
        window_size,
        out_dim,
        kernel_size=7,
        feat_gat_embed_dim=None,
        time_gat_embed_dim=None,
        use_gatv2=True,
        gru_n_layers=1,
        gru_hid_dim=150,
        forecast_n_layers=1,
        forecast_hid_dim=150,
        recon_n_layers=1,
        recon_hid_dim=150,
        dropout=0.2,
        alpha=0.2,
    ):
        super(MTAD_GAT, self).__init__()

        self.conv = ConvLayer(n_features, kernel_size)
        self.feature_gat = FeatureAttentionLayer(n_features, window_size, dropout, alpha, feat_gat_embed_dim, use_gatv2)
        self.temporal_gat = TemporalAttentionLayer(n_features, window_size, dropout, alpha, time_gat_embed_dim, use_gatv2)
        self.gru = GRULayer(3 * n_features, gru_hid_dim, gru_n_layers, dropout)
        self.forecasting_model = Forecasting_Model(gru_hid_dim, forecast_hid_dim, out_dim, forecast_n_layers, dropout)
        self.recon_model = ReconstructionModel(window_size, gru_hid_dim, recon_hid_dim, out_dim, recon_n_layers, dropout)

    def forward(self, x):
        # x shape (b, n, k): b - batch size, n - window size, k - number of features
        x = self.conv(x)  # 1-D convolution over the time dimension, shape preserved: (b, n, k)
        h_feat = self.feature_gat(x)  # feature-oriented GAT: attention across the k features, (b, n, k)
        h_temp = self.temporal_gat(x)  # time-oriented GAT: attention across the n timestamps, (b, n, k)

        h_cat = torch.cat([x, h_feat, h_temp], dim=2)  # (b, n, 3k)

        _, h_end = self.gru(h_cat)
        h_end = h_end.view(x.shape[0], -1)  # Hidden state for last timestamp

        predictions = self.forecasting_model(h_end)  # forecast for the next timestamp
        recons = self.recon_model(h_end)  # reconstruction of the input window

        return predictions, recons
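

# Usage sketch (illustrative, not part of the upstream file): a minimal smoke
# test of the forward pass. The dimensions below are made up, and the expected
# output shapes assume Forecasting_Model returns one prediction per window,
# (b, out_dim), and ReconstructionModel reconstructs the full window,
# (b, n, out_dim).
if __name__ == "__main__":
    b, n, k = 8, 100, 25  # batch size, window size, number of features
    model = MTAD_GAT(n_features=k, window_size=n, out_dim=k)

    x = torch.randn(b, n, k)  # a batch of sliding windows
    predictions, recons = model(x)

    print(predictions.shape)  # expected: torch.Size([8, 25])
    print(recons.shape)       # expected: torch.Size([8, 100, 25])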