nflubis committed on
Commit
c395f7f
1 Parent(s): 64a1ea2

Upload model and config file

Browse files
Files changed (2) hide show
  1. reward_best.model +3 -0
  2. rl_config.json +27 -0
reward_best.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:586eb00007fcade60200c0422841106a164204f2b023c6b0bdb08ca14c73f4dc
3
+ size 9449481
rl_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "train_path": "../data/norm-multi-woz/train_dials.json",
3
+ "valid_path": "../data/norm-multi-woz/val_dials.json",
4
+ "test_path": "../data/norm-multi-woz/test_dials.json",
5
+ "sv_config_path": "sys_config_log_model/2020-05-12-14-51-49-actz_cat/config.json",
6
+ "sv_model_path": "sys_config_log_model/2020-05-12-14-51-49-actz_cat/19-model",
7
+ "rl_config_path": "sys_config_log_model/2020-05-12-14-51-49-actz_cat/rl-2020-05-18-10-50-48/rl_config.json",
8
+ "rl_model_path": "sys_config_log_model/2020-05-12-14-51-49-actz_cat/rl-2020-05-18-10-50-48/rl_model",
9
+ "ppl_best_model_path": "sys_config_log_model/2020-05-12-14-51-49-actz_cat/rl-2020-05-18-10-50-48/ppl_best.model",
10
+ "reward_best_model_path": "sys_config_log_model/2020-05-12-14-51-49-actz_cat/rl-2020-05-18-10-50-48/reward_best.model",
11
+ "record_path": "sys_config_log_model/2020-05-12-14-51-49-actz_cat/rl-2020-05-18-10-50-48",
12
+ "record_freq": 200,
13
+ "sv_train_freq": 0,
14
+ "use_gpu": true,
15
+ "nepoch": 10,
16
+ "nepisode": 0,
17
+ "tune_pi_only": false,
18
+ "max_words": 100,
19
+ "temperature": 1.0,
20
+ "episode_repeat": 1.0,
21
+ "rl_lr": 0.01,
22
+ "momentum": 0.0,
23
+ "nesterov": false,
24
+ "gamma": 0.99,
25
+ "rl_clip": 5.0,
26
+ "random_seed": 38
27
+ }