---
# ==================== DQN hyperparameter configuration ====================
# Flat mapping of scalar settings; every key lives at the top level.
# NOTE(review): the key names look like Stable-Baselines3 DQN constructor
# arguments - confirm against the code that loads this file.

# ===== Neural network parameters =====
# Keep the decimal point and the signed exponent: YAML 1.1 loaders such as
# PyYAML only recognise this form as a float (a bare `1e-4` loads as a string).
learning_rate: 1.0e-4

# ===== Experience replay parameters =====
buffer_size: 100000
learning_starts: 10000
batch_size: 32

# ===== Core reinforcement learning parameters =====
gamma: 0.95
train_freq: 4

# ===== Target network update parameters =====
# NOTE(review): an interval of 1 combined with a small tau presumably means a
# soft target update on every step - confirm with the training code.
target_update_interval: 1
tau: 0.005

# ===== Exploration strategy (epsilon-greedy) =====
exploration_initial_eps: 1.0
exploration_fraction: 0.3
exploration_final_eps: 0.02

# ===== Experiment identifier =====
remark: "default"