-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathlaunch.py
89 lines (78 loc) · 3.83 KB
/
launch.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
#!/usr/bin/python
# encoding: utf-8
import numpy as np
import ipdb
import logger
from datetime import datetime
import sys
from util import get_objects,set_global_seeds,arg_parser
import envs as all_envs
import agents as all_agents
import functionApproximation as all_FA
import os
def str2bool(str=""):
str = str.lower()
if str.__contains__("yes") or str.__contains__("true") or str.__contains__("y") or str.__contains__("t"):
return True
else:
return False
def common_arg_parser():
"""
Create an argparse.ArgumentParser for run.py.
"""
parser = arg_parser()
parser.add_argument('-seed',type=int, default=123)
parser.add_argument('-environment', type=str, default="Env")
parser.add_argument('-data_path',type=str,default="./data/")
parser.add_argument('-data_name',type=str,default="name")
parser.add_argument('-agent',type=str,default="training methods")
parser.add_argument('-FA',type=str,default="function approximation")
parser.add_argument('-CDM', dest='CDM', type=str, default='CDM', help="type of CDM")
parser.add_argument('-T', dest='T', type=int, default=3, help="time_step")
parser.add_argument('-ST', dest='ST', type=eval, default="[10,30,60,120]", help="evaluation_time_step")
parser.add_argument('-gpu_no', dest='gpu_no', type=str, default="0", help='which gpu for usage')
parser.add_argument('-latent_factor', dest='latent_factor', type=int, default=10, help="latent factor")
parser.add_argument('-learning_rate', dest='learning_rate', type=float, default=0.01, help="learning rate")
parser.add_argument('-training_epoch', dest='training_epoch', type=int, default=30000, help="training epoch")
parser.add_argument('-rnn_layer', dest='rnn_layer', type=int, default=1, help="rnn_layer")
parser.add_argument('-inner_epoch', dest='inner_epoch', type=int, default=50, help="rnn_layer")
parser.add_argument('-batch', dest='batch', type=int, default=128, help="batch_size")
parser.add_argument('-gamma', dest='gamma', type=float, default=0.0, help="gamma")
parser.add_argument('-clip_param', dest='clip_param', type=float, default=0.2, help="clip_param")
parser.add_argument('-restore_model', dest='restore_model', type=str2bool, default="False", help="")
parser.add_argument('-num_blocks', dest='num_blocks', type=int, default=1, help="")
parser.add_argument('-num_heads', dest='num_heads', type=int, default=1, help="")
parser.add_argument('-dropout_rate', dest='dropout_rate', type=float, default=0.0, help="")
return parser
def main(args):
# arguments
print(args)
arg_parser = common_arg_parser()
args, unknown_args = arg_parser.parse_known_args(args)
args.model = "_".join([args.agent,args.FA,str(args.T)])
# initialization
set_global_seeds(args.seed)
os.environ["CUDA_VISIBLE_DEVICES"] = str(args.gpu_no)
# logger
logger.configure("./log"+args.data_path.split("/")[-2]+"/"+"_".join([args.model,datetime.now().strftime("%Y%m%d_%H%M%S"),args.data_path.split("/")[-2],str(args.learning_rate),str(args.T),str(args.ST),str(args.gamma)]))
logger.log("Training Model: "+args.model)
# environments
envs = get_objects(all_envs)
env = envs[args.environment](args)
# ipdb.set_trace()
# policy network
args.user_num = env.user_num
args.item_num = env.item_num
args.utype_num = env.utype_num
# ipdb.set_trace()
args.saved_path = os.path.join(os.path.abspath("./"),"saved_path_"+args.data_path.split("/")[-2]+"_"+str(args.FA)+"_"+str(args.learning_rate)+"_"+str(args.agent)+"_"+str(args.seed))
nets = get_objects(all_FA)
print(nets)
fa = nets[args.FA].create_model(args)
# return
logger.log("Hype-Parameters: "+str(args))
# # agents
agents = get_objects(all_agents)
agents[args.agent](env, fa, args).train()
if __name__ == '__main__':
main(sys.argv)