Push agent to the Hub
Browse files
 - README.md +2 -2
 - logs/events.out.tfevents.1677769314.17b1e39a51ac.5257.0 +3 -0
 - model.pt +1 -1
 - replay.mp4 +0 -0
 - results.json +1 -1
 
    	
        README.md
    CHANGED
    
    | 
         @@ -17,7 +17,7 @@ model-index: 
     | 
|
| 17 | 
         
             
                  type: LunarLander-v2
         
     | 
| 18 | 
         
             
                metrics:
         
     | 
| 19 | 
         
             
                - type: mean_reward
         
     | 
| 20 | 
         
            -
                  value:  
     | 
| 21 | 
         
             
                  name: mean_reward
         
     | 
| 22 | 
         
             
                  verified: false
         
     | 
| 23 | 
         
             
            ---
         
     | 
| 
         @@ -37,7 +37,7 @@ model-index: 
     | 
|
| 37 | 
         
             
            'wandb_entity': None
         
     | 
| 38 | 
         
             
            'capture_video': False
         
     | 
| 39 | 
         
             
            'env_id': 'LunarLander-v2'
         
     | 
| 40 | 
         
            -
            'total_timesteps':  
     | 
| 41 | 
         
             
            'learning_rate': 0.00025
         
     | 
| 42 | 
         
             
            'num_envs': 4
         
     | 
| 43 | 
         
             
            'num_steps': 128
         
     | 
| 
         | 
|
| 17 | 
         
             
                  type: LunarLander-v2
         
     | 
| 18 | 
         
             
                metrics:
         
     | 
| 19 | 
         
             
                - type: mean_reward
         
     | 
| 20 | 
         
            +
                  value: 108.56 +/- 79.22
         
     | 
| 21 | 
         
             
                  name: mean_reward
         
     | 
| 22 | 
         
             
                  verified: false
         
     | 
| 23 | 
         
             
            ---
         
     | 
| 
         | 
|
| 37 | 
         
             
            'wandb_entity': None
         
     | 
| 38 | 
         
             
            'capture_video': False
         
     | 
| 39 | 
         
             
            'env_id': 'LunarLander-v2'
         
     | 
| 40 | 
         
            +
            'total_timesteps': 500000
         
     | 
| 41 | 
         
             
            'learning_rate': 0.00025
         
     | 
| 42 | 
         
             
            'num_envs': 4
         
     | 
| 43 | 
         
             
            'num_steps': 128
         
     | 
    	
        logs/events.out.tfevents.1677769314.17b1e39a51ac.5257.0
    ADDED
    
    | 
         @@ -0,0 +1,3 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:2abf722e1483c8d2ae46a76ea69fd47512b2cbc7d5b1692f104bbb89fa75a518
         
     | 
| 3 | 
         
            +
            size 659816
         
     | 
    	
        model.pt
    CHANGED
    
    | 
         @@ -1,3 +1,3 @@ 
     | 
|
| 1 | 
         
             
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            -
            oid sha256: 
     | 
| 3 | 
         
             
            size 42597
         
     | 
| 
         | 
|
| 1 | 
         
             
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:a9f46f0c7b70f362e72eed22c3293e3d84fecfb7f3a67337d95096ecff1763a0
         
     | 
| 3 | 
         
             
            size 42597
         
     | 
    	
        replay.mp4
    CHANGED
    
    | 
         Binary files a/replay.mp4 and b/replay.mp4 differ 
     | 
| 
         | 
    	
        results.json
    CHANGED
    
    | 
         @@ -1 +1 @@ 
     | 
|
| 1 | 
         
            -
            {"env_id": "LunarLander-v2", "mean_reward":  
     | 
| 
         | 
|
| 1 | 
         
            +
            {"env_id": "LunarLander-v2", "mean_reward": 108.55838286299323, "std_reward": 79.21764001927377, "n_evaluation_episodes": 10, "eval_datetime": "2023-03-02T15:16:51.786283"}
         
     |