From b2f954d06822a16a8c9b9ad3a46a45e97002cd13 Mon Sep 17 00:00:00 2001 From: rrbb014 Date: Wed, 28 Oct 2020 09:17:27 +0900 Subject: [PATCH] FIXED: epsilon for e-greedy selection --- 1-grid-world/5-q-learning/q_learning_agent.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/1-grid-world/5-q-learning/q_learning_agent.py b/1-grid-world/5-q-learning/q_learning_agent.py index 496aeaf..7e25cc2 100644 --- a/1-grid-world/5-q-learning/q_learning_agent.py +++ b/1-grid-world/5-q-learning/q_learning_agent.py @@ -9,7 +9,7 @@ def __init__(self, actions): self.actions = actions self.learning_rate = 0.01 self.discount_factor = 0.9 - self.epsilon = 0.9 + self.epsilon = 0.1 self.q_table = defaultdict(lambda: [0.0, 0.0, 0.0, 0.0]) # 샘플로부터 큐함수 업데이트