4 changes: 4 additions & 0 deletions README.md
@@ -65,3 +65,7 @@ You can specify arguments for training, or it will follow the default sets in th

### Testing ###
Use the `testing/test_physics_metrics.py` for now.
Please make sure that training and testing are configured with the same NN model:
```
cp training/models.py testing
```
230 changes: 230 additions & 0 deletions testing/models.py
@@ -0,0 +1,230 @@
"""
Save models here
"""
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.autograd import Function
import torch_geometric.nn as pyg_nn
import torch_geometric.utils as pyg_utils
import math
from math import pi


class GNNStack(torch.nn.Module):
    def __init__(self, input_dim, hidden_dim, output_dim, args):
        super(GNNStack, self).__init__()
        # eta and phi are passed to the conv layers separately, so they are
        # stripped from the per-node feature vector
        input_dim = input_dim - 2

        conv_model = self.build_conv_model(args.model_type)
        self.convs = nn.ModuleList()
        self.convs.append(conv_model(input_dim, hidden_dim))
        assert args.num_layers >= 1, 'Number of layers must be >= 1'
        for _ in range(args.num_layers - 1):
            self.convs.append(conv_model(hidden_dim, hidden_dim))

        # post-message-passing classification head
        self.post_mp = nn.Sequential(
            nn.Linear(hidden_dim, hidden_dim), nn.ReLU(), nn.Dropout(args.dropout),
            nn.Linear(hidden_dim, hidden_dim), nn.ReLU(),
            nn.Linear(hidden_dim, hidden_dim), nn.ReLU(), nn.Dropout(args.dropout),
            nn.Linear(hidden_dim, hidden_dim), nn.ReLU(),
            nn.Linear(hidden_dim, hidden_dim), nn.ReLU(),
            nn.Linear(hidden_dim, output_dim),
        )
        self.lamb = args.lamb
        self.grlparam = args.grlparam
        self.grl = GradientReverseLayer(self.grlparam)
        # domain-adaptation head, fed through the gradient reversal layer
        self.post_da = nn.Sequential(
            nn.Linear(hidden_dim, hidden_dim), nn.ReLU(), nn.Dropout(args.dropout),
            nn.Linear(hidden_dim, hidden_dim), nn.ReLU(),
            nn.Linear(hidden_dim, hidden_dim), nn.ReLU(), nn.Dropout(args.dropout),
            nn.Linear(hidden_dim, hidden_dim), nn.ReLU(),
            nn.Linear(hidden_dim, output_dim),
        )

self.dropout = args.dropout
self.beta_one = nn.parameter.Parameter(torch.rand(1))
self.num_layers = args.num_layers


    def build_conv_model(self, model_type):
        if model_type == 'GraphSage':
            return GraphSage
        elif model_type == 'Gated':
            return Gated_model
        else:
            raise ValueError('Unknown model_type: {}'.format(model_type))

def forward(self, data):
        num_feature = data.num_feature_actual[0].item()
        original_x = data.x[:, 0:num_feature]
        train_mask = data.x[:, num_feature]
        train_default = data.x[:, (num_feature + 1):]

        # where train_mask == 1, replace the original features with the
        # default (masked) values; otherwise keep the originals
        x = torch.transpose(original_x, 0, 1) * (1 - train_mask) + \
            torch.transpose(train_default, 0, 1) * train_mask
        x = torch.transpose(x, 0, 1)

edge_index = data.edge_index
eta_pos = 0
phi_pos = 1
eta = x[:, eta_pos]
phi = x[:, phi_pos]
        # drop eta and phi from the node features; they are passed to each
        # conv layer separately
        x = x[:, 2:]

# x = self.before_mp(x)

for layer in self.convs:
x = layer(x, edge_index, eta, phi)
# x = self.batchnorm(x)
x = F.relu(x)
x = F.dropout(x, self.dropout, training=self.training)

x_cl = self.post_mp(x)
x_da = self.grl(x)
x_da = self.post_da(x_da)

x_cl = torch.sigmoid(x_cl)
x_da = torch.sigmoid(x_da)

return x_cl, x_da

    def loss(self, pred, label, domain_discriminant, domain_label):
        # BCE on the classifier output plus a lambda-weighted BCE term on the
        # domain-discriminator output
        loss = nn.BCELoss()
        eps = 1e-10
        # clamp so both predictions stay strictly inside (0, 1) for BCELoss
        temp = loss(pred.clamp(eps, 1 - eps), label)
        temp_da = loss(domain_discriminant.clamp(eps, 1 - eps), domain_label)
        return temp + self.lamb * temp_da
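
    # Usage sketch (illustrative values; assumes `args` is the argparse namespace
    # from the training script, providing model_type, num_layers, dropout, lamb
    # and grlparam, and `batch` is a graph batch with the x layout expected above):
    #
    #     model = GNNStack(input_dim=num_feature, hidden_dim=64, output_dim=1,
    #                      args=args)
    #     pred, domain_pred = model(batch)      # both sigmoid outputs in (0, 1)
    #     total_loss = model.loss(pred, label, domain_pred, domain_label)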


class GraphSage(pyg_nn.MessagePassing):

    def __init__(self, in_channels, out_channels, reducer='mean',
                 normalize_embedding=True):
        super(GraphSage, self).__init__(aggr='mean')
        # message input: [x_j | global mean | log(node count)] -> 2 * in_channels + 1
        self.lin = torch.nn.Linear(2 * in_channels + 1, out_channels)
        # update input: [aggregated message | x | global mean | log(node count)]
        self.agg_lin = torch.nn.Linear(
            out_channels + 2 * in_channels + 1, out_channels)

        self.normalize_emb = normalize_embedding

def forward(self, x, edge_index, eta, phi):
        # eta and phi are accepted so both conv types share the same call
        # signature, but GraphSage does not use them
num_nodes = x.size(0)
return self.propagate(edge_index, size=(num_nodes, num_nodes), x=x)

    def message(self, x_j, edge_index, size, x_i, x):
        # global context: mean over all node features plus the log node count
        self.node_count = torch.tensor(
            size[0], dtype=torch.float32, device=x.device)
        x_g = torch.mean(x, dim=0)
        log_count = torch.log(self.node_count)
        log_count = log_count.repeat(x_i.size()[0], 1)
        x_g = x_g.repeat(x_i.size()[0], 1)
        x_j = torch.cat((x_j, x_g, log_count), dim=1)
        x_j = self.lin(x_j)
        return x_j

def update(self, aggr_out, x):
x_g = torch.mean(x, dim=0)
x_g = x_g.repeat(x.size()[0], 1)
log_count = torch.log(self.node_count)
log_count = log_count.repeat(x.size()[0], 1)
aggr_out = torch.cat((aggr_out, x, x_g, log_count), dim=-1)
aggr_out = self.agg_lin(aggr_out)
aggr_out = F.relu(aggr_out)
if self.normalize_emb:
aggr_out = F.normalize(aggr_out, p=2, dim=-1)

return aggr_out
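
# Shape note for GraphSage (E edges, N nodes, F = in_channels): message() builds
# [x_j | global mean x_g | log N] of width 2F + 1, matching self.lin, and
# update() builds [aggregated message | x | x_g | log N] of width
# out_channels + 2F + 1, matching self.agg_lin.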

class GradientReverseFunction(Function):
    """Identity in the forward pass; negates (and scales) gradients in backward."""

    @staticmethod
    def forward(ctx, x, coeff=1.0):
        ctx.coeff = coeff
        return x * 1.0

    @staticmethod
    def backward(ctx, grad_output):
        # reversed gradient for x, no gradient for coeff
        return grad_output.neg() * ctx.coeff, None


class GradientReverseLayer(nn.Module):
    def __init__(self, coeff):
        super(GradientReverseLayer, self).__init__()
        self.coeff = coeff

    def forward(self, x):
        return GradientReverseFunction.apply(x, self.coeff)
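
# Sanity-check sketch for the gradient reversal layer (plain CPU tensors, no
# other dependencies): the forward pass is the identity, the backward pass
# negates and scales gradients by `coeff`.
#
#     grl = GradientReverseLayer(coeff=0.5)
#     x = torch.ones(3, requires_grad=True)
#     grl(x).sum().backward()
#     assert torch.allclose(x.grad, torch.full((3,), -0.5))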

class Gated_model(pyg_nn.MessagePassing):
    def __init__(self, in_channels, out_channels, normalize_embedding=True):
        super(Gated_model, self).__init__(aggr='mean')
        # message input: x_j, x_i and the global mean x_g (3 * in_channels),
        # plus d_eta, d_phi and delta_R (3 scalars) and the log node count (+1)
        new_x_input = 3 * in_channels + 3 + 1
        self.x_dim = new_x_input
        self.lin_m2 = torch.nn.Linear(new_x_input, 1)
        # update also appends x and x_g (2 * in_channels) and the log node count (+1)
        self.lin_m5 = torch.nn.Linear(new_x_input + 2 * in_channels + 1, 1)
        self.lin_m5_g1 = torch.nn.Linear(in_channels, out_channels)
        self.lin_m5_g2 = torch.nn.Linear(new_x_input, out_channels)

def forward(self, x, edge_index, eta, phi):
num_nodes = x.size(0)
x = torch.cat((x, eta.view(-1, 1)), dim=1)
x = torch.cat((x, phi.view(-1, 1)), dim=1)
return self.propagate(edge_index, size=(num_nodes, num_nodes), x=x)

    def message(self, x_j, x_i, edge_index, size, x):
        self.node_count = torch.tensor(
            size[0], dtype=torch.float32, device=x.device)
        # eta and phi were appended as the last two columns in forward()
        dif_eta_phi = x_j[:, -2:] - x_i[:, -2:]

        # wrap phi differences larger than pi back by multiples of 2 * pi
        indices = dif_eta_phi[:, 1] > pi
        temp = torch.ceil(
            (dif_eta_phi[:, 1][indices] - pi) / (2 * pi)) * (2 * pi)
        dif_eta_phi[:, 1][indices] = dif_eta_phi[:, 1][indices] - temp

        # per-edge (eta, phi) separation: |d_eta| + |d_phi|
        delta_r = torch.sum(torch.sqrt(dif_eta_phi ** 2), dim=1).reshape(-1, 1)

        # strip the appended eta/phi columns before building the message
        x = x[:, 0:-2]
        x_i = x_i[:, 0:-2]
        x_j = x_j[:, 0:-2]
        x_g = torch.mean(x, dim=0)
        log_count = torch.log(self.node_count)
        log_count = log_count.repeat(x_i.size()[0], 1)
        x_g = x_g.repeat(x_i.size()[0], 1)
        x_j = torch.cat((x_j, x_i, x_g, dif_eta_phi,
                         delta_r, log_count), dim=1)
        # learned gate in (0, 1) that scales each neighbour message
        M_1 = self.lin_m2(x_j)
        M_2 = torch.sigmoid(M_1)
        x_j = x_j * M_2
        return x_j

def update(self, aggr_out, x):
x = x[:, 0:-2]
x_g = torch.mean(x, dim=0)
log_count = torch.log(self.node_count)
log_count = log_count.repeat(x.size()[0], 1)
x_g = x_g.repeat(x.size()[0], 1)
        aggr_out_temp = aggr_out
        aggr_out = torch.cat((aggr_out, x, x_g, log_count), dim=1)
        # learned gate: blend a linear transform of the node features with a
        # linear transform of the aggregated messages
        aggr_out = torch.sigmoid(self.lin_m5(aggr_out))
        aggr_out = F.relu(aggr_out * self.lin_m5_g1(x) +
                          (1 - aggr_out) * self.lin_m5_g2(aggr_out_temp))
        return aggr_out
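

# Minimal smoke-test sketch. Assumptions: the node-feature layout below
# (original features | train_mask | default features) mirrors what the training
# dataloader produces, and the sizes are illustrative only.
if __name__ == "__main__":
    from types import SimpleNamespace

    num_nodes, num_feature = 5, 6          # eta, phi + 4 additional features
    args = SimpleNamespace(model_type='Gated', num_layers=2, dropout=0.1,
                           lamb=0.1, grlparam=1.0)
    model = GNNStack(input_dim=num_feature, hidden_dim=16, output_dim=1, args=args)

    x = torch.cat([torch.rand(num_nodes, num_feature),            # original features
                   torch.zeros(num_nodes, 1),                     # train_mask: keep originals
                   torch.zeros(num_nodes, num_feature)], dim=1)   # default (masked) values
    edge_index = torch.tensor([[0, 1, 2, 3, 4],
                               [1, 2, 3, 4, 0]], dtype=torch.long)
    data = SimpleNamespace(x=x, edge_index=edge_index,
                           num_feature_actual=torch.tensor([num_feature]))

    pred, domain_pred = model(data)
    print(pred.shape, domain_pred.shape)   # expected: torch.Size([5, 1]) twice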