biwako committed on
Commit
cf3f65d
1 Parent(s): d456738

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +29 -1
README.md CHANGED
@@ -20,35 +20,63 @@ model-index:
20
  verified: false
21
  ---
22
 
 
23
  # **Q-Learning** Agent playing **FrozenLake-v1**
24
  This is a trained model of a **Q-Learning** agent playing **FrozenLake-v1**.
25
 
26
  ## Usage
27
 
28
  {'env_id': 'FrozenLake-v1',
 
29
  'max_steps': 99,
 
30
  'n_training_episodes': 10000,
 
31
  'n_eval_episodes': 100,
 
32
  'eval_seed': [],
 
33
  'learning_rate': 0.7,
 
34
  'gamma': 0.95,
 
35
  'max_epsilon': 1.0,
 
36
  'min_epsilon': 0.05,
 
37
  'decay_rate': 0.0005,
38
- 'qtable': array([[0.73509189, 0.77378094, 0.77378094, 0.73509189],
 
 
 
 
39
  [0.73509189, 0. , 0.81450625, 0.77378094],
 
40
  [0.77378094, 0.857375 , 0.77378094, 0.81450625],
 
41
  [0.81450625, 0. , 0.77378094, 0.77378094],
 
42
  [0.77378094, 0.81450625, 0. , 0.73509189],
 
43
  [0. , 0. , 0. , 0. ],
 
44
  [0. , 0.9025 , 0. , 0.81450625],
 
45
  [0. , 0. , 0. , 0. ],
 
46
  [0.81450625, 0. , 0.857375 , 0.77378094],
 
47
  [0.81450625, 0.9025 , 0.9025 , 0. ],
 
48
  [0.857375 , 0.95 , 0. , 0.857375 ],
 
49
  [0. , 0. , 0. , 0. ],
 
50
  [0. , 0. , 0. , 0. ],
 
51
  [0. , 0.9025 , 0.95 , 0.857375 ],
 
52
  [0.9025 , 0.95 , 1. , 0.9025 ],
 
53
  [0. , 0. , 0. , 0. ]])}
54
 
 
20
  verified: false
21
  ---
22
 
23
+
24
  # **Q-Learning** Agent playing **FrozenLake-v1**
25
  This is a trained model of a **Q-Learning** agent playing **FrozenLake-v1**.
26
 
27
  ## Usage
28
 
29
  {'env_id': 'FrozenLake-v1',
30
+
31
  'max_steps': 99,
32
+
33
  'n_training_episodes': 10000,
34
+
35
  'n_eval_episodes': 100,
36
+
37
  'eval_seed': [],
38
+
39
  'learning_rate': 0.7,
40
+
41
  'gamma': 0.95,
42
+
43
  'max_epsilon': 1.0,
44
+
45
  'min_epsilon': 0.05,
46
+
47
  'decay_rate': 0.0005,
48
+
49
+ 'qtable': array([[
50
+
51
+ 0.73509189, 0.77378094, 0.77378094, 0.73509189],
52
+
53
  [0.73509189, 0. , 0.81450625, 0.77378094],
54
+
55
  [0.77378094, 0.857375 , 0.77378094, 0.81450625],
56
+
57
  [0.81450625, 0. , 0.77378094, 0.77378094],
58
+
59
  [0.77378094, 0.81450625, 0. , 0.73509189],
60
+
61
  [0. , 0. , 0. , 0. ],
62
+
63
  [0. , 0.9025 , 0. , 0.81450625],
64
+
65
  [0. , 0. , 0. , 0. ],
66
+
67
  [0.81450625, 0. , 0.857375 , 0.77378094],
68
+
69
  [0.81450625, 0.9025 , 0.9025 , 0. ],
70
+
71
  [0.857375 , 0.95 , 0. , 0.857375 ],
72
+
73
  [0. , 0. , 0. , 0. ],
74
+
75
  [0. , 0. , 0. , 0. ],
76
+
77
  [0. , 0.9025 , 0.95 , 0.857375 ],
78
+
79
  [0.9025 , 0.95 , 1. , 0.9025 ],
80
+
81
  [0. , 0. , 0. , 0. ]])}
82