Update README.md
Browse files
Add training hyperparameters
README.md
CHANGED
@@ -36,4 +36,26 @@ model-index:
|
|
36 |
desc=["SFFF", "FHHF", "FFHF", "HFFG"],
|
37 |
is_slippery=True)
|
38 |
```
|
39 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
36 |
desc=["SFFF", "FHHF", "FFHF", "HFFG"],
|
37 |
is_slippery=True)
|
38 |
```
|
39 |
+
|
40 |
+
## Training parameters
|
41 |
+
|
42 |
+
```python
|
43 |
+
# Training parameters
|
44 |
+
n_training_episodes = 105000 # Total training episodes
|
45 |
+
learning_rate = 0.8 # Learning rate
|
46 |
+
|
47 |
+
# Evaluation parameters
|
48 |
+
n_eval_episodes = 100 # Total number of test episodes
|
49 |
+
|
50 |
+
# Environment parameters
|
51 |
+
env_id = "FrozenLake-v1" # Name of the environment
|
52 |
+
max_steps = 99 # Max steps per episode
|
53 |
+
gamma = 0.98 # Discounting rate
|
54 |
+
eval_seed = [] # The evaluation seed of the environment
|
55 |
+
|
56 |
+
# Exploration parameters
|
57 |
+
max_epsilon = 0.99 # Exploration probability at start
|
58 |
+
min_epsilon = 0.02 # Minimum exploration probability
|
59 |
+
decay_rate = 0.009 # Exponential decay rate for exploration prob
|
60 |
+
|
61 |
+
```
|