SimingSiming
committed on
Commit
•
de4cbd0
1
Parent(s):
883d985
Update README.md
Browse files
README.md
CHANGED
@@ -23,23 +23,23 @@ model-index:
|
|
23 |
This is a trained model of a **Q-Learning** agent playing **FrozenLake-v1** .
|
24 |
|
25 |
|
26 |
-
n_training_episodes = 200000 # Total training episodes
|
27 |
-
learning_rate = 0.8 # Learning rate
|
28 |
|
29 |
# Evaluation parameters
|
30 |
-
n_eval_episodes = 100 # Total number of test episodes
|
31 |
|
32 |
-
# Environment parameters
|
33 |
-
env_id = "FrozenLake-v1" # Name of the environment
|
34 |
-
max_steps = 100 # Max steps per episode
|
35 |
-
gamma = 0.99 # Discounting rate
|
36 |
-
eval_seed = [] # The evaluation seed of the environment
|
37 |
|
38 |
-
# Exploration parameters
|
39 |
-
epsilon = 1.0 # Exploration rate
|
40 |
-
max_epsilon = 1.0 # Exploration probability at start
|
41 |
-
min_epsilon = 0.05 # Minimum exploration probability
|
42 |
-
decay_rate = 0.00005 # Exponential decay rate for exploration prob
|
43 |
|
44 |
```
|
45 |
|
|
|
23 |
This is a trained model of a **Q-Learning** agent playing **FrozenLake-v1** .
|
24 |
|
25 |
|
26 |
+
n_training_episodes = 200000 # Total training episodes <br>
|
27 |
+
learning_rate = 0.8 # Learning rate <br>
|
28 |
|
29 |
# Evaluation parameters
|
30 |
+
n_eval_episodes = 100 # Total number of test episodes <br>
|
31 |
|
32 |
+
# Environment parameters <br>
|
33 |
+
env_id = "FrozenLake-v1" # Name of the environment <br>
|
34 |
+
max_steps = 100 # Max steps per episode <br>
|
35 |
+
gamma = 0.99 # Discounting rate <br>
|
36 |
+
eval_seed = [] # The evaluation seed of the environment <br>
|
37 |
|
38 |
+
# Exploration parameters <br>
|
39 |
+
epsilon = 1.0 # Exploration rate <br>
|
40 |
+
max_epsilon = 1.0 # Exploration probability at start <br>
|
41 |
+
min_epsilon = 0.05 # Minimum exploration probability <br>
|
42 |
+
decay_rate = 0.00005 # Exponential decay rate for exploration prob <br>
|
43 |
|
44 |
```
|
45 |
|