---
# Tags attached to this model.
tags:
  - Pixelcopter-PLE-v0
  - reinforce
  - reinforcement-learning
  - custom-implementation
  - deep-rl-class

# Evaluation results recorded for the model named below.
model-index:
  - name: Reinforce-PixelCopter-v2
    results:
      - task:
          type: reinforcement-learning
          name: reinforcement-learning
        dataset:
          name: Pixelcopter-PLE-v0
          type: Pixelcopter-PLE-v0
        metrics:
          - type: mean_reward
            # Quoted so the value is unambiguously a string, not a number.
            value: '18.50 +/- 21.02'
            name: mean_reward
            verified: false
---
## Hyperparameters

```python
pixelcopter_hyperparameters = {
    "h_size": 64,
    "n_training_episodes": 50000,
    "n_evaluation_episodes": 10,
    "max_t": 10000,
    "gamma": 0.99,
    "lr": 1e-4,
    "env_id": env_id,
    "state_space": s_size,
    "action_space": a_size,
}
```