kevinwang676 committed on
Commit
15d57a8
·
verified ·
1 Parent(s): dbbff58

Update test2.py

Browse files
Files changed (1) hide show
  1. test2.py +1 -1
test2.py CHANGED
@@ -394,7 +394,7 @@ def train_pong():
394
 
395
  # Hyperparameters
396
  gamma = 0.99
397
- learning_rate = 0.01 # Lower learning rate for stability
398
  num_episodes = 1000 # Pong requires more episodes
399
 
400
  # Action mapping: policy outputs 0 or 1, map to RIGHT(2) or LEFT(3)
 
394
 
395
  # Hyperparameters
396
  gamma = 0.99
397
+ learning_rate = 0.001 # Lower learning rate for stability
398
  num_episodes = 1000 # Pong requires more episodes
399
 
400
  # Action mapping: policy outputs 0 or 1, map to RIGHT(2) or LEFT(3)