-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathevaluate.py
More file actions
65 lines (56 loc) · 2.54 KB
/
evaluate.py
File metadata and controls
65 lines (56 loc) · 2.54 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
import os
import torch
from env import VectorizedVRP
import numpy as np
from runner import Runner
from torch.utils.data import DataLoader
from network.model import PPO, Policy
import argparse
from env import utils
torch.multiprocessing.set_sharing_strategy('file_system')
def run():
step = 0
while True:
results = runner.run()
if results is None:
print("Exiting...")
break
if __name__ == "__main__":
parser = argparse.ArgumentParser()
parser.add_argument('--device', type=str, default='cpu', choices=['cuda', 'cpu'])
parser.add_argument('--n-envs', type=int, default=1)
parser.add_argument('--n-steps', type=int, default=16)
parser.add_argument('--hidden-dim', type=int, default=256)
parser.add_argument('--egde-dim', type=int, default=128)
parser.add_argument('--gamma', type=float, default=0.995)
parser.add_argument('--lam', type=float, default=0.95)
parser.add_argument('--seed', type=int, default=0)
parser.add_argument('--accumulation-iteration', type=int, default=1)
parser.add_argument('--data-folder', type=str, default='dataset/data_cvrp')
parser.add_argument('--min-extend-nodes', type=int, default=256)
parser.add_argument('--min-extend-tours', type=int, default=4)
parser.add_argument('--ent-coef', type=float, default=0.01)
parser.add_argument('--vf-coef', type=float, default=0.5)
parser.add_argument('--max-grad-norm', type=float, default=0.5)
parser.add_argument('--clip-range', type=float, default=0.2)
parser.add_argument('--imitation-rate', type=float, default=0.1)
parser.add_argument('--lr', type=float, default=3e-4)
parser.add_argument('--eps', type=float, default=1e-5)
parser.add_argument('--max-steps', type=int, default=64)
parser.add_argument('--max-count', type=int, default=200)
parser.add_argument('--reward-norm', type=int, default=100)
parser.add_argument('--round-int', action='store_true')
parser.add_argument('--algo', type=str, default='HGS', choices=['VNS', 'HGS'])
parser.add_argument('--model-path', type=str)
args = parser.parse_args()
print("Running:", args)
utils.set_seed(args.seed)
env = VectorizedVRP(args)
policy = Policy(3, args.hidden_dim, 2, args.egde_dim)
ppo = PPO(policy, args)
policy.load_state_dict(torch.load(args.model_path))
policy.eval()
name = "_".join(os.path.normpath(args.data_folder).split(os.sep))
log_name = f"{name}_{args.algo}_{args.imitation_rate}/seed_{args.seed}"
runner = Runner(env, policy, log_name, args)
run()