RLSolver/rlsolver/methods/seq2seq/main.py at main · Open-Finance-Lab/RLSolver · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
import torch
import torch.nn as nn
import torch.optim as optim
import random
import numpy as np
import tqdm
from util import load_data_from_txt
SEED = 1234

random.seed(SEED)
np.random.seed(SEED)
torch.manual_seed(SEED)
torch.cuda.manual_seed(SEED)
torch.backends.cudnn.deterministic = True

from config import GPU_ID
from rlsolver.methods.util import calc_device
DEVICE = calc_device(GPU_ID)
data_type = "torch"
DATA_PATH = '../../data/syn_BA/BA_100_ID0.txt'
BATCH_SIZE = 2**5
data= load_data_from_txt(DATA_PATH)
src = data['adj_matrix']

NUM_NODES = src.shape[0]

def cal_obj(adj_matrix,x):
    delta_x = x * 2 - 1
    XA = torch.matmul(delta_x, adj_matrix)
    energy_x = -0.25 * (XA * delta_x).sum(dim=1)+0.25*torch.sum(adj_matrix)
    return energy_x
#input_dim:输入的解向量的维度

class Solver(nn.Module):
    def __init__(self, input_dim, hidden_dim, n_layers, dropout):
        super().__init__()
        self.input_dim = input_dim
        self.hidden_dim = hidden_dim
        self.n_layers = n_layers
        self.rnn = nn.LSTM(input_dim, hidden_dim, n_layers, dropout=dropout)
        self.fc_out = nn.Linear(hidden_dim, input_dim)
        self.dropout = nn.Dropout(dropout)
        self.sigmoid = torch.nn.Sigmoid()

    def forward(self, input, hidden, cell):
        input = input.unsqueeze(0)
        output, (hidden, cell) = self.rnn(input, (hidden, cell))
        prediction = self.fc_out(output.squeeze(0))
        prediction = self.sigmoid(prediction)

        prediction = (prediction - 0.5) * 0.999999 + 0.5
        return prediction, hidden, cell

def init_weights(m):
    for name, param in m.named_parameters():
        nn.init.uniform_(param.data, -0.08, 0.08)

def count_parameters(model):
    return sum(p.numel() for p in model.parameters() if p.requires_grad)

def sample_from_prob(prob):
    prob=prob.detach()
    sample = 1-torch.bernoulli(prob)
    return sample

def get_return(value,prob,sample):
    sample = sample.detach()
    log_prob = torch.sum((sample * prob + (1 - sample) * (1 - prob)).log(),dim=1)
    objective = (log_prob * value.detach()).mean()
    return objective

def train_fn(model, src,sample, optimizer,sol):
    model.train()
    obj1 = cal_obj(src, sample)
    hidden = torch.zeros(1, BATCH_SIZE, 256, device=DEVICE)
    cell = torch.zeros(1, BATCH_SIZE, 256, device=DEVICE)
    for i in range(2000):
        optimizer.zero_grad()
        output,hidden,cell = model(sample,hidden.detach(), cell.detach())
        sample = sample_from_prob(output)
        obj = cal_obj(src,sample)
        if i ==1999:
            print(obj.max())
        obj = (torch.sum(src)/2+obj)/2
        value = obj-obj.mean()
        loss = get_return(value,output,sample)
        loss.backward()
        torch.nn.utils.clip_grad_norm_(model.parameters(), clip)
        optimizer.step()
        loss.detach()
    return loss

sol=1


input_dim = NUM_NODES
output_dim = NUM_NODES

hidden_dim = 256
n_layers = 1
encoder_dropout = 0.5
decoder_dropout = 0.5
device = DEVICE
sample = torch.randint(0,2,(BATCH_SIZE,NUM_NODES),device=DEVICE,dtype=torch.float)
model = Solver(
    output_dim,
    hidden_dim,
    n_layers,
    decoder_dropout,
).to(device)

model.apply(init_weights)
optimizer = optim.Adam(model.parameters())
n_epochs = 10000
clip = 1.0
best_valid_loss = float("inf")
teacher_forcing_ratio = 0.5
print(f"The model has {count_parameters(model):,} trainable parameters")


for epoch in tqdm.tqdm(range(n_epochs)):
    train_loss = train_fn(
        model,
        src,
        sample,
        optimizer,
        sol
    )

    if (epoch %100) ==0 :
        print(f"\tTrain Loss: {train_loss:7.3f} ")
        # print(f"\tValid Loss: {valid_loss:7.3f}")

model.load_state_dict(torch.load("tut1-model.pt"))