CCST_edited.py

import os
import sys
import matplotlib
matplotlib.use('Agg')
#matplotlib.use('TkAgg')
import matplotlib.pyplot as plt
import datetime

from sklearn import metrics
from scipy import sparse

import numpy as np
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch_geometric.nn import GCNConv, ChebConv, DeepGraphInfomax, TAGConv, GraphConv
from torch_geometric.data import Data, DataLoader

def get_graph(adj, X):
    # create sparse matrix
    row_col = []
    edge_weight = []
    rows, cols = adj.nonzero()
    edge_nums = adj.getnnz()
    for i in range(edge_nums):
        row_col.append([rows[i], cols[i]])
        edge_weight.append(adj.data[i])

    edge_index = torch.tensor(np.array(row_col), dtype=torch.long).T
    edge_attr = torch.tensor(np.array(edge_weight), dtype=torch.float)

    graph_bags = []
    graph = Data(x=torch.tensor(X, dtype=torch.float), edge_index=edge_index, edge_attr=edge_attr)  
    graph_bags.append(graph)

    return graph_bags

class Encoder(nn.Module):
    def __init__(self, in_channels, hidden_channels, GNN_type):
        super(Encoder, self).__init__()

        if GNN_type == 'GraphConv':
            self.conv = GraphConv(in_channels, hidden_channels)  # first param is input, 2nd param is output
            self.conv_2 = GraphConv(hidden_channels, hidden_channels)
            self.conv_3 = GraphConv(hidden_channels, hidden_channels)
            self.conv_4 = GraphConv(hidden_channels, hidden_channels)
        if GNN_type == 'ChebConv':
            self.conv = ChebConv(in_channels, hidden_channels, 3)
            self.conv_2 = ChebConv(hidden_channels, hidden_channels, 2)
            self.conv_3 = ChebConv(hidden_channels, hidden_channels, 2)
            self.conv_4 = ChebConv(hidden_channels, hidden_channels)
        if GNN_type == 'TAGConv':
            self.conv = TAGConv(in_channels, hidden_channels)
            self.conv_2 = TAGConv(hidden_channels, hidden_channels)
            self.conv_3 = TAGConv(hidden_channels, hidden_channels)
            self.conv_4 = TAGConv(hidden_channels, hidden_channels)
        if GNN_type == 'GCNConv':
            self.conv = GCNConv(in_channels, hidden_channels)
            self.conv_2 = GCNConv(hidden_channels, hidden_channels)
            self.conv_3 = GCNConv(hidden_channels, hidden_channels)
            self.conv_4 = GCNConv(hidden_channels, hidden_channels)
#           self.linear_1 = Linear(hidden_channels, hidden_channels)
#           self.conv_5 = GCNConv(hidden_channels, hidden_channels)
#           self.conv_6 = GCNConv(hidden_channels, hidden_channels)
        #self.prelu = nn.Tanh(hidden_channels)
        self.GNN_type = GNN_type
        self.prelu = nn.PReLU(hidden_channels) # hidden_channels is the output of last layer above

    def forward(self, data):

        x, edge_index, edge_weight = data.x, data.edge_index, data.edge_attr

        #if self.GNN_type == 'TAGConv' or self.GNN_type == 'GCNConv' or self.GNN_type == 'ChebConv':
        x = self.conv(x, edge_index, edge_weight=edge_weight)
        x = self.conv_2(x, edge_index, edge_weight=edge_weight)
        x = self.conv_3(x, edge_index, edge_weight=edge_weight)
        x = self.conv_4(x, edge_index, edge_weight=edge_weight)
#        x = self.linear_1(x)
#        x = self.conv_5(x, edge_index, edge_weight=edge_weight)
#        x = self.conv_6(x, edge_index, edge_weight=edge_weight)
        x = self.prelu(x)

        return x


class my_data():
    def __init__(self, x, edge_index, edge_attr):
        self.x = x
        self.edge_index = edge_index
        self.edge_attr = edge_attr

def corruption(data):
    x = data.x[torch.randperm(data.x.size(0))]
    return my_data(x, data.edge_index, data.edge_attr)

def train_DGI(args, data_loader, in_channels):
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
    DGI_model = DeepGraphInfomax(
        hidden_channels=args.hidden,
        encoder=Encoder(in_channels=in_channels, hidden_channels=args.hidden, GNN_type = args.GNN_type),
        summary=lambda z, *args, **kwargs: torch.sigmoid(z.mean(dim=0)),
        corruption=corruption).to(device)
    DGI_optimizer = torch.optim.Adam(DGI_model.parameters(), lr=1e-5) #6
    DGI_filename = args.model_path+'DGI'+ args.model_name  +'.pth.tar'
    if args.load:
        DGI_model.load_state_dict(torch.load(DGI_filename))
    else:
	start_time = datetime.datetime.now()
        min_loss=10000
        if args.retrain==1:
            DGI_load_path = args.model_load_path+'DGI'+ args.model_name+'.pth.tar'
            DGI_model.load_state_dict(torch.load(DGI_load_path))
        print('Saving init model state ...')
        torch.save(DGI_model.state_dict(), args.model_path+'DGI_init'+ args.model_name  + '.pth.tar')
        print('training starts ...')
        for epoch in range(args.num_epoch):
            DGI_model.train()
            DGI_optimizer.zero_grad()

            DGI_all_loss = []

            for data in data_loader:
                data = data.to(device)
                pos_z, neg_z, summary = DGI_model(data=data)

                DGI_loss = DGI_model.loss(pos_z, neg_z, summary)
                DGI_loss.backward()
                DGI_all_loss.append(DGI_loss.item())
                DGI_optimizer.step()

            if ((epoch+1)%100) == 0:
                print('Epoch: {:03d}, Loss: {:.4f}'.format(epoch+1, np.mean(DGI_all_loss)))
                if np.mean(DGI_all_loss)<min_loss:
                    min_loss=np.mean(DGI_all_loss)
                    torch.save(DGI_model.state_dict(), DGI_filename)
                    save_tupple=[pos_z, neg_z, summary]

        end_time = datetime.datetime.now()

#        torch.save(DGI_model.state_dict(), DGI_filename)
        print('Training time in seconds: ', (end_time-start_time).seconds)
        DGI_model.load_state_dict(torch.load(DGI_filename))
        print("debug loss")
        DGI_loss = DGI_model.loss(pos_z, neg_z, summary)
        print("debug loss latest tupple %g"%DGI_loss.item())
        DGI_loss = DGI_model.loss(save_tupple[0], save_tupple[1], save_tupple[2])
        print("debug loss min loss tupple %g"%DGI_loss.item())

    return DGI_model