nsanghi commited on
Commit
8a3e520
·
1 Parent(s): c44c918

Push to Hub

Browse files
args.yml CHANGED
@@ -54,13 +54,13 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 3520579075
58
  - - storage
59
  - null
60
  - - study_name
61
  - null
62
  - - tensorboard_log
63
- - runs/CartPole-v1__dqn__3520579075__1698322478
64
  - - track
65
  - true
66
  - - trained_agent
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2652168140
58
  - - storage
59
  - null
60
  - - study_name
61
  - null
62
  - - tensorboard_log
63
+ - runs/CartPole-v1__dqn__2652168140__1699149373
64
  - - track
65
  - true
66
  - - trained_agent
dqn-CartPole-v1.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e00d5567eb6d03ca577b3424af23b7f32da66df34531deb6b02084e911f7c1bf
3
- size 1109094
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff14dc16a0b6df20c08ad329c5b1a4ec4f4f069f9496f78b3a939829a11d1e77
3
+ size 1107483
dqn-CartPole-v1/_stable_baselines3_version CHANGED
@@ -1 +1 @@
1
- 2.2.0a8
 
1
+ 2.1.0
dqn-CartPole-v1/data CHANGED
@@ -5,15 +5,15 @@
5
  "__module__": "stable_baselines3.dqn.policies",
6
  "__annotations__": "{'q_net': <class 'stable_baselines3.dqn.policies.QNetwork'>, 'q_net_target': <class 'stable_baselines3.dqn.policies.QNetwork'>}",
7
  "__doc__": "\n Policy class with Q-Value Net and target net for DQN\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
8
- "__init__": "<function DQNPolicy.__init__ at 0x7f3cc89cc430>",
9
- "_build": "<function DQNPolicy._build at 0x7f3cc89cc4c0>",
10
- "make_q_net": "<function DQNPolicy.make_q_net at 0x7f3cc89cc550>",
11
- "forward": "<function DQNPolicy.forward at 0x7f3cc89cc5e0>",
12
- "_predict": "<function DQNPolicy._predict at 0x7f3cc89cc670>",
13
- "_get_constructor_parameters": "<function DQNPolicy._get_constructor_parameters at 0x7f3cc89cc700>",
14
- "set_training_mode": "<function DQNPolicy.set_training_mode at 0x7f3cc89cc790>",
15
  "__abstractmethods__": "frozenset()",
16
- "_abc_impl": "<_abc._abc_data object at 0x7f3cc89c9140>"
17
  },
18
  "verbose": 1,
19
  "policy_kwargs": {
@@ -22,17 +22,17 @@
22
  256
23
  ]
24
  },
25
- "num_timesteps": 50000,
26
  "_total_timesteps": 50000,
27
  "_num_timesteps_at_start": 0,
28
  "seed": 0,
29
  "action_noise": null,
30
- "start_time": 1698322479232068894,
31
  "learning_rate": {
32
  ":type:": "<class 'function'>",
33
- ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuDQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9i13MY/FBIhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
34
  },
35
- "tensorboard_log": "runs/CartPole-v1__dqn__3520579075__1698322478/CartPole-v1",
36
  "_last_obs": null,
37
  "_last_episode_starts": {
38
  ":type:": "<class 'numpy.ndarray'>",
@@ -40,22 +40,22 @@
40
  },
41
  "_last_original_obs": {
42
  ":type:": "<class 'numpy.ndarray'>",
43
- ":serialized:": "gAWVhQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAFHcDz8KnRA/xFG8vJs29D2UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwFLBIaUjAFDlHSUUpQu"
44
  },
45
- "_episode_num": 440,
46
  "use_sde": false,
47
  "sde_sample_freq": -1,
48
- "_current_progress_remaining": 2.0000000000020002e-05,
49
  "_stats_window_size": 100,
50
  "ep_info_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
- ":serialized:": "gAWVCgwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQDcAAAAAAACMAWyUSxeMAXSUR0BMPCoCMglodX2UKGgGR0BdQAAAAAAAaAdLdWgIR0BMRc2BJ7LMdX2UKGgGR0BbAAAAAAAAaAdLbGgIR0BMfDin5zo2dX2UKGgGR0BawAAAAAAAaAdLa2gIR0BMhX9BKL88dX2UKGgGR0BagAAAAAAAaAdLamgIR0BMutN8E3bVdX2UKGgGR0BfwAAAAAAAaAdLf2gIR0BMxP+4smOVdX2UKGgGR0BgQAAAAAAAaAdLgmgIR0BM/UornTy8dX2UKGgGR0BfwAAAAAAAaAdLf2gIR0BNB6ab4Ju3dX2UKGgGR0BfgAAAAAAAaAdLfmgIR0BNPopYs/Y8dX2UKGgGR0BgoAAAAAAAaAdLhWgIR0BNSeHBUJfIdX2UKGgGR0BgIAAAAAAAaAdLgWgIR0BNgRUedTYNdX2UKGgGR0BnYAAAAAAAaAdLu2gIR0BNj5r56+nJdX2UKGgGR0BkwAAAAAAAaAdLpmgIR0BN1GqYJE6UdX2UKGgGR0BlIAAAAAAAaAdLqWgIR0BOIcer+5vtdX2UKGgGR0BjYAAAAAAAaAdLm2gIR0BOMxgy/KyOdX2UKGgGR0BgQAAAAAAAaAdLgmgIR0BOfbdSEUTMdX2UKGgGR0BeQAAAAAAAaAdLeWgIR0BOiv99+gDidX2UKGgGR0BdgAAAAAAAaAdLdmgIR0BO1FK02LpBdX2UKGgGR0BcQAAAAAAAaAdLcWgIR0BO4dmpVCHAdX2UKGgGR0BdAAAAAAAAaAdLdGgIR0BPLAp8WsRydX2UKGgGR0BiIAAAAAAAaAdLkWgIR0BPPO6d1+y7dX2UKGgGR0Bo4AAAAAAAaAdLx2gIR0BPk9SuQp4KdX2UKGgGR0BsIAAAAAAAaAdL4WgIR0BP72pZOi35dX2UKGgGR0BaAAAAAAAAaAdLaGgIR0BP/N+b3Gn5dX2UKGgGR0BcgAAAAAAAaAdLcmgIR0BQKAiml67edX2UKGgGR0Bg4AAAAAAAaAdLh2gIR0BQMHFo+OfedX2UKGgGR0BsgAAAAAAAaAdL5GgIR0BQX6Zpi7TVdX2UKGgGR0B1UAAAAAAAaAdNVQFoCEdAUKann+yZ8nV9lChoBkdAa6AAAAAAAGgHS91oCEdAUK9Q3xWkrXV9lChoBkdAbgAAAAAAAGgHS/BoCEdAUM+9f1Hvt3V9lChoBkdAeRAAAAAAAGgHTZEBaAhHQFENhOP/7zl1fZQoaAZHQGfgAAAAAABoB0u/aAhHQFErZOzposZ1fZQoaAZHQH9AAAAAAABoB030AWgIR0BRa2attALRdX2UKGgGR0ByoAAAAAAAaAdNKgFoCEdAUf4VtXPqs3V9lChoBkdAaOAAAAAAAGgHS8doCEdAUhx/WlMyrXV9lChoBkdAbyAAAAAAAGgHS/loCEdAUju/O+qR2nV9lChoBkdAcEAAAAAAAGgHTQQBaAhHQFJbfuCwr2B1fZQoaAZHQG/AAAAAAABoB0v+aAhHQFJ7yxiXpnp1fZQoaAZHQHxgAAAAAABoB03GAWgIR0BSpi75Ec81dX2UKGgGR0ByoAAAAAAAaAdNKgFoCEdAUshEgGKQ73V9lChoBkdAcrAAAAAAAGgHTSsBaAhHQFL/vvjOs1d1fZQoaAZHQHLAAAAAAABoB00sAWgIR0BTK4PK+zt1dX2UKGgGR0B6UAAAAAAAaAdNpQFoCEdAU2G3Ytg8bXV9lChoBkdAc9AAAAAAAGgHTT0BaAhHQFOymqYJE6V1fZQoaAZHQHBQAAAAAABoB00FAWgIR0BT4cabWmP6dX2UKGgGR0B/QAAAAAAAaAdN9AFoCEdAVEDpSrHU+nV9lChoBkdAf0AAAAAAAGgHTfQBaAhHQFSj+n62v0R1fZQoaAZHQHEQAAAAAABoB00RAWgIR0BUyra/RE4OdX2UKGgGR0AsAAAAAAAAaAdLDmgIR0BUyzKPn0TUdX2UKGgGR0B9sAAAAAAAaAdN2wFoCEdAVQpBdD6WPnV9lChoBkdAfFAAAAAAAGgHTcUBaAhHQFUy5Zr56+p1fZQoaAZHQH9AAAAAAABoB030AWgIR0BVc5qREF4cdX2UKGgGR0B4oAAAAAAAaAdNigFoCEdAVa/dSEUTMHV9lChoBkdAcFAAAAAAAGgHTQUBaAhHQFXQPzWf9P11fZQoaAZHQHygAAAAAABoB03KAWgIR0BWDsqz7di2dX2UKGgGR0BswAAAAAAAaAdL5mgIR0BWLo86mwaBdX2UKGgGR0AoAAAAAAAAaAdLDGgIR0BWL0sBhhH9dX2UKGgGR0AzAAAAAAAAaAdLE2gIR0BWME8vEjxDdX2UKGgGR0AwAAAAAAAAaAdLEGgIR0BWMPqs2eg+dX2UKGgGR0AxAAAAAAAAaAdLEWgIR0BWMav3ai9JdX2UKGgGR0AyAAAAAAAAaAdLEmgIR0BWMuuq3mV8dX2UKGgGR0BgIAAAAAAAaAdLgWgIR0BWOGxt52QodX2UKGgGR0AoAAAAAAAAaAdLDGgIR0BWOSAc1fmcdX2UKGgGR0AuAAAAAAAAaAdLD2gIR0BWObjLjghsdX2UKGgGR0BeQAAAAAAAaAdLeWgIR0BWVPdqL0jDdX2UKGgGR0BewAAAAAAAaAdLe2gIR0BWWhJEpiI+dX2UKGgGR0Bg4AAAAAAAaAdLh2gIR0BWde6y0KJEdX2UKGgGR0BhIAAAAAAAaAdLiWgIR0BWkStq59VndX2UKGgGR0BfwAAAAAAAaAdLf2gIR0BWlhA4XGfgdX2UKGgGR0BfgAAAAAAAaAdLfmgIR0BWmyofjjrBdX2UKGgGR0B4UAAAAAAAaAdNhQFoCEdAVtZNpM6BAnV9lChoBkdAX4AAAAAAAGgHS35oCEdAVvFiZv1lG3V9lChoBkdAYuAAAAAAAGgHS5doCEdAVvicvugHvHV9lChoBkdAZGAAAAAAAGgHS6NoCEdAVxVZHNHH3nV9lChoBkdAXAAAAAAAAGgHS3BoCEdAVxmvStvGZXV9lChoBkdAW4AAAAAAAGgHS25oCEdAVzSy0KJEY3V9lChoBkdAWkAAAAAAAGgHS2loCEdAVzt/EwWWQnV9lChoBkdAPgAAAAAAAGgHSx5oCEdAVz1hfBvaUXV9lChoBkdAMQAAAAAAAGgHSxFoCEdAVz43ZPEbYXV9lChoBkdAWIAAAAAAAGgHS2JoCEdAV18GTs6aLHV9lChoBkdAf0AAAAAAAGgHTfQBaAhHQFiECV8kUsZ1fZQoaAZHQH9AAAAAAABoB030AWgIR0BYwkKArhBJdX2UKGgGR0B74AAAAAAAaAdNvgFoCEdAWQpR/EwWWXV9lChoBkdAf0AAAAAAAGgHTfQBaAhHQFlKwtrbg0l1fZQoaAZHQH9AAAAAAABoB030AWgIR0BZjK8xsVL0dX2UKGgGR0B/QAAAAAAAaAdN9AFoCEdAWcvSOR1YAHV9lChoBkdAf0AAAAAAAGgHTfQBaAhHQFoNeJpFkQR1fZQoaAZHQH9AAAAAAABoB030AWgIR0BaTjZDiOvMdX2UKGgGR0B/QAAAAAAAaAdN9AFoCEdAWo1P0qYqonV9lChoBkdAf0AAAAAAAGgHTfQBaAhHQFrPIn0Cih51fZQoaAZHQH9AAAAAAABoB030AWgIR0BbEkit7rs0dX2UKGgGR0B/QAAAAAAAaAdN9AFoCEdAW1RqtYB/7XV9lChoBkdAf0AAAAAAAGgHTfQBaAhHQFuknwob4rV1fZQoaAZHQH9AAAAAAABoB030AWgIR0Bb/MJ6Y3NtdX2UKGgGR0B/QAAAAAAAaAdN9AFoCEdAXFpiay8jA3V9lChoBkdAf0AAAAAAAGgHTfQBaAhHQFy3Y1YQrc11fZQoaAZHQH9AAAAAAABoB030AWgIR0BdFpmqYJE6dX2UKGgGR0B/QAAAAAAAaAdN9AFoCEdAXVdEnb7CSHV9lChoBkdAf0AAAAAAAGgHTfQBaAhHQF2CKMNtqHp1fZQoaAZHQH9AAAAAAABoB030AWgIR0BdwhfBvaUSdWUu"
53
  },
54
  "ep_success_buffer": {
55
  ":type:": "<class 'collections.deque'>",
56
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
57
  },
58
- "_n_updates": 24576,
59
  "observation_space": {
60
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
61
  ":serialized:": "gAWVFgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAJqZmcD//3//UHfWvv//f/+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAJqZmUD//39/UHfWPv//f3+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMPVstNC44MDAwMDAyZSswMCAtMy40MDI4MjM1ZSszOCAtNC4xODg3OTAzZS0wMSAtMy40MDI4MjM1ZSszOF2UjAloaWdoX3JlcHKUjDlbNC44MDAwMDAyZSswMCAzLjQwMjgyMzVlKzM4IDQuMTg4NzkwM2UtMDEgMy40MDI4MjM1ZSszOF2UjApfbnBfcmFuZG9tlE51Yi4=",
@@ -73,7 +73,7 @@
73
  },
74
  "action_space": {
75
  ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
76
- ":serialized:": "gAWVpQEAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIAgAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgLjAJpOJSJiIeUUpQoSwNoD05OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwQX19nZW5lcmF0b3JfY3RvcpSTlIwFUENHNjSUhZRSlH2UKIwNYml0X2dlbmVyYXRvcpSMBVBDRzY0lIwFc3RhdGWUfZQoaCiKEONhlaa3XlgJLUWWWTS1oRqMA2luY5SKEKlzeES8M4FYghr3OtvajUF1jApoYXNfdWludDMylEsAjAh1aW50ZWdlcpRLAHVidWIu",
77
  "n": "2",
78
  "start": "0",
79
  "_shape": [],
@@ -92,15 +92,14 @@
92
  ":type:": "<class 'abc.ABCMeta'>",
93
  ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
94
  "__module__": "stable_baselines3.common.buffers",
95
- "__annotations__": "{'observations': <class 'numpy.ndarray'>, 'next_observations': <class 'numpy.ndarray'>, 'actions': <class 'numpy.ndarray'>, 'rewards': <class 'numpy.ndarray'>, 'dones': <class 'numpy.ndarray'>, 'timeouts': <class 'numpy.ndarray'>}",
96
  "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
97
- "__init__": "<function ReplayBuffer.__init__ at 0x7f3cc89b49d0>",
98
- "add": "<function ReplayBuffer.add at 0x7f3cc89b4a60>",
99
- "sample": "<function ReplayBuffer.sample at 0x7f3cc89b4af0>",
100
- "_get_samples": "<function ReplayBuffer._get_samples at 0x7f3cc89b4b80>",
101
- "_maybe_cast_dtype": "<staticmethod(<function ReplayBuffer._maybe_cast_dtype at 0x7f3cc89b4c10>)>",
102
  "__abstractmethods__": "frozenset()",
103
- "_abc_impl": "<_abc._abc_data object at 0x7f3cc8944480>"
104
  },
105
  "replay_buffer_kwargs": {},
106
  "train_freq": {
@@ -112,17 +111,17 @@
112
  "exploration_final_eps": 0.04,
113
  "exploration_fraction": 0.16,
114
  "target_update_interval": 10,
115
- "_n_calls": 49999,
116
  "max_grad_norm": 10,
117
  "exploration_rate": 0.04,
118
  "lr_schedule": {
119
  ":type:": "<class 'function'>",
120
- ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuDQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9i13MY/FBIhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
121
  },
122
  "batch_norm_stats": [],
123
  "batch_norm_stats_target": [],
124
  "exploration_schedule": {
125
  ":type:": "<class 'function'>",
126
- ":serialized:": "gAWVZQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLBEsTQyhkAXwAGACIAWsEcgiIAFMAiAJkAXwAGACIAIgCGAAUAIgBGwAXAFMAlE5LAYaUKYwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLcUMGDAEEARgClIwDZW5klIwMZW5kX2ZyYWN0aW9ulIwFc3RhcnSUh5QpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxJL3Vzci9sb2NhbC9saWIvcHl0aG9uMy4xMC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlGgdKVKUaB0pUpSHlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoI32UfZQoaBhoDYwMX19xdWFsbmFtZV9flIwbZ2V0X2xpbmVhcl9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UKGgKjAhidWlsdGluc5SMBWZsb2F0lJOUjAZyZXR1cm6UaC91jA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/pHrhR64Ue4WUUpRoN0c/xHrhR64Ue4WUUpRoN0c/8AAAAAAAAIWUUpSHlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
127
  }
128
  }
 
5
  "__module__": "stable_baselines3.dqn.policies",
6
  "__annotations__": "{'q_net': <class 'stable_baselines3.dqn.policies.QNetwork'>, 'q_net_target': <class 'stable_baselines3.dqn.policies.QNetwork'>}",
7
  "__doc__": "\n Policy class with Q-Value Net and target net for DQN\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
8
+ "__init__": "<function DQNPolicy.__init__ at 0x7f4dcefc8790>",
9
+ "_build": "<function DQNPolicy._build at 0x7f4dcefc8820>",
10
+ "make_q_net": "<function DQNPolicy.make_q_net at 0x7f4dcefc88b0>",
11
+ "forward": "<function DQNPolicy.forward at 0x7f4dcefc8940>",
12
+ "_predict": "<function DQNPolicy._predict at 0x7f4dcefc89d0>",
13
+ "_get_constructor_parameters": "<function DQNPolicy._get_constructor_parameters at 0x7f4dcefc8a60>",
14
+ "set_training_mode": "<function DQNPolicy.set_training_mode at 0x7f4dcefc8af0>",
15
  "__abstractmethods__": "frozenset()",
16
+ "_abc_impl": "<_abc._abc_data object at 0x7f4dcefbb840>"
17
  },
18
  "verbose": 1,
19
  "policy_kwargs": {
 
22
  256
23
  ]
24
  },
25
+ "num_timesteps": 30000,
26
  "_total_timesteps": 50000,
27
  "_num_timesteps_at_start": 0,
28
  "seed": 0,
29
  "action_noise": null,
30
+ "start_time": 1699149376068469832,
31
  "learning_rate": {
32
  ":type:": "<class 'function'>",
33
+ ":serialized:": "gAWVAwMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMaC9ob21lL25zYW5naGkvc2FuZGJveC9hcHJlc3MvZHJsLTJlZC92ZW52L2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLg0MCBAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxoL2hvbWUvbnNhbmdoaS9zYW5kYm94L2FwcmVzcy9kcmwtMmVkL3ZlbnYvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP2LXcxj8UEiFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
34
  },
35
+ "tensorboard_log": "runs/CartPole-v1__dqn__2652168140__1699149373/CartPole-v1",
36
  "_last_obs": null,
37
  "_last_episode_starts": {
38
  ":type:": "<class 'numpy.ndarray'>",
 
40
  },
41
  "_last_original_obs": {
42
  ":type:": "<class 'numpy.ndarray'>",
43
+ ":serialized:": "gAWVhQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAACh7/z7bw5M8GP0HvMGnDz2UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwFLBIaUjAFDlHSUUpQu"
44
  },
45
+ "_episode_num": 388,
46
  "use_sde": false,
47
  "sde_sample_freq": -1,
48
+ "_current_progress_remaining": 0.40002000000000004,
49
  "_stats_window_size": 100,
50
  "ep_info_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
+ ":serialized:": "gAWV8AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQFgAAAAAAACMAWyUS2CMAXSUR0BPPxFqi48VdX2UKGgGR0BTwAAAAAAAaAdLT2gIR0BPRTDwYtQLdX2UKGgGR0BeQAAAAAAAaAdLeWgIR0BP41y3kPtldX2UKGgGR0BfwAAAAAAAaAdLf2gIR0BP8mnXNC7cdX2UKGgGR0BbwAAAAAAAaAdLb2gIR0BQSPu9eyAydX2UKGgGR0BbgAAAAAAAaAdLbmgIR0BQTV3Qla8pdX2UKGgGR0BaAAAAAAAAaAdLaGgIR0BQlVWbPQfIdX2UKGgGR0BcwAAAAAAAaAdLc2gIR0BQmb+98JD3dX2UKGgGR0BYwAAAAAAAaAdLY2gIR0BQ3RqbjLjhdX2UKGgGR0BtIAAAAAAAaAdL6WgIR0BQ5Ndu5z5odX2UKGgGR0BiAAAAAAAAaAdLkGgIR0BRNukpI+W4dX2UKGgGR0BiQAAAAAAAaAdLkmgIR0BRgBgAp8WsdX2UKGgGR0BsYAAAAAAAaAdL42gIR0BRy5bY9Pk8dX2UKGgGR0Bk4AAAAAAAaAdLp2gIR0BR1zwYtQKsdX2UKGgGR0BkgAAAAAAAaAdLpGgIR0BSNNRFZxJedX2UKGgGR0BbQAAAAAAAaAdLbWgIR0BSOSe/Yao/dX2UKGgGR0BcQAAAAAAAaAdLcWgIR0BSn28dxQzldX2UKGgGR0BbQAAAAAAAaAdLbWgIR0BSpPuPV/c4dX2UKGgGR0BcwAAAAAAAaAdLc2gIR0BTKWJ79hqkdX2UKGgGR0BTgAAAAAAAaAdLTmgIR0BTMGS2Yv38dX2UKGgGR0BUAAAAAAAAaAdLUGgIR0BTN8FINEw4dX2UKGgGR0BVgAAAAAAAaAdLVmgIR0BTO/NRm9QGdX2UKGgGR0BUAAAAAAAAaAdLUGgIR0BTwYHTqjagdX2UKGgGR0AyAAAAAAAAaAdLEmgIR0BTwg8OkLx7dX2UKGgGR0AyAAAAAAAAaAdLEmgIR0BTwqTKT0QLdX2UKGgGR0AyAAAAAAAAaAdLEmgIR0BTw3O8kD6ndX2UKGgGR0AmAAAAAAAAaAdLC2gIR0BTw8sg+yJLdX2UKGgGR0AxAAAAAAAAaAdLEWgIR0BTxEJSiudPdX2UKGgGR0AyAAAAAAAAaAdLEmgIR0BTxMvugHu7dX2UKGgGR0A3AAAAAAAAaAdLF2gIR0BTxYL9deIEdX2UKGgGR0A0AAAAAAAAaAdLFGgIR0BTxhPCVKPGdX2UKGgGR0BZwAAAAAAAaAdLZ2gIR0BUJxu0kWykdX2UKGgGR0BZwAAAAAAAaAdLZ2gIR0BULSteUpuudX2UKGgGR0BZwAAAAAAAaAdLZ2gIR0BUjqB7NSqEdX2UKGgGR0BhIAAAAAAAaAdLiWgIR0BUk4z3yqdZdX2UKGgGR0BhQAAAAAAAaAdLimgIR0BU6mfkFOfvdX2UKGgGR0B9IAAAAAAAaAdN0gFoCEdAVWZbUwztTnV9lChoBkdAZmAAAAAAAGgHS7NoCEdAVcmgpSaVlnV9lChoBkdAZqAAAAAAAGgHS7VoCEdAViEnfEXLvHV9lChoBkdAcYAAAAAAAGgHTRgBaAhHQFaM1DjR2KV1fZQoaAZHQDMAAAAAAABoB0sTaAhHQFaNl7dBSk11fZQoaAZHQFkAAAAAAABoB0tkaAhHQFaTNjbzshR1fZQoaAZHQH9AAAAAAABoB030AWgIR0BXVS0WuX/pdX2UKGgGR0BoIAAAAAAAaAdLwWgIR0BYJiwr1/UfdX2UKGgGR0BiYAAAAAAAaAdLk2gIR0BYnaSTyJ9BdX2UKGgGR0AwAAAAAAAAaAdLEGgIR0BYnjbnHNordX2UKGgGR0AxAAAAAAAAaAdLEWgIR0BYnrx3FDOUdX2UKGgGR0AuAAAAAAAAaAdLD2gIR0BYnzV6NVBEdX2UKGgGR0AsAAAAAAAAaAdLDmgIR0BYn6LCN0eVdX2UKGgGR0AqAAAAAAAAaAdLDWgIR0BYoPHtF8XvdX2UKGgGR0AwAAAAAAAAaAdLEGgIR0BYoX/95yEMdX2UKGgGR0AqAAAAAAAAaAdLDWgIR0BYorW/ag27dX2UKGgGR0AuAAAAAAAAaAdLD2gIR0BYoyXt0FKTdX2UKGgGR0AoAAAAAAAAaAdLDGgIR0BYo4/mknCwdX2UKGgGR0AzAAAAAAAAaAdLE2gIR0BYpC/O+qR2dX2UKGgGR0AwAAAAAAAAaAdLEGgIR0BYpM/2TPjXdX2UKGgGR0AqAAAAAAAAaAdLDWgIR0BYpTW07bL2dX2UKGgGR0AxAAAAAAAAaAdLEWgIR0BYpc/yGzrvdX2UKGgGR0BkAAAAAAAAaAdLoGgIR0BZA7fUF0PpdX2UKGgGR0BjAAAAAAAAaAdLmGgIR0BZdTmSyMUAdX2UKGgGR0BmwAAAAAAAaAdLtmgIR0BZf194NZvDdX2UKGgGR0BlQAAAAAAAaAdLqmgIR0BZ73Xyy2QXdX2UKGgGR0BlQAAAAAAAaAdLqmgIR0BaWWKIi1RcdX2UKGgGR0B/QAAAAAAAaAdN9AFoCEdAWx0Kx9oexXV9lChoBkdAZwAAAAAAAGgHS7hoCEdAWygDoyKvV3V9lChoBkdAfCAAAAAAAGgHTcIBaAhHQFvxAdn003x1fZQoaAZHQGPgAAAAAABoB0ufaAhHQFxBNVzZHut1fZQoaAZHQHbQAAAAAABoB01tAWgIR0BcrQdXDFZQdX2UKGgGR0BroAAAAAAAaAdL3WgIR0BdGo2OyVv/dX2UKGgGR0AoAAAAAAAAaAdLDGgIR0BdGw2VE/jbdX2UKGgGR0BwgAAAAAAAaAdNCAFoCEdAXYcaBI4EOnV9lChoBkdAZKAAAAAAAGgHS6VoCEdAXdgi3XqZ+nV9lChoBkdAXoAAAAAAAGgHS3poCEdAXd6HzpX6qXV9lChoBkdAYwAAAAAAAGgHS5hoCEdAXkPIxQBPsXV9lChoBkdAf0AAAAAAAGgHTfQBaAhHQF8XYjB2wFF1fZQoaAZHQDIAAAAAAABoB0sSaAhHQF8YNm16Vt51fZQoaAZHQFpAAAAAAABoB0tpaAhHQF8eTAnDziF1fZQoaAZHQEMAAAAAAABoB0smaAhHQF8f92X9itt1fZQoaAZHQFhAAAAAAABoB0thaAhHQF9mTbnHNot1fZQoaAZHQFmAAAAAAABoB0tmaAhHQF9qsasIVud1fZQoaAZHQFqAAAAAAABoB0tqaAhHQF++smv4dp91fZQoaAZHQH9AAAAAAABoB030AWgIR0BgUVoUSIxhdX2UKGgGR0BgQAAAAAAAaAdLgmgIR0BgVSGpMpPRdX2UKGgGR0BgAAAAAAAAaAdLgGgIR0Bgh4OUdJardX2UKGgGR0BpAAAAAAAAaAdLyGgIR0BgjYFPi1iOdX2UKGgGR0BmAAAAAAAAaAdLsGgIR0BgvkcCHRCydX2UKGgGR0BnQAAAAAAAaAdLumgIR0Bg7AsK9f1IdX2UKGgGR0ByMAAAAAAAaAdNIwFoCEdAYQ8CCBf8dnV9lChoBkdAW8AAAAAAAGgHS29oCEdAYREhIOH313V9lChoBkdAdoAAAAAAAGgHTWgBaAhHQGFcp3os7Mh1fZQoaAZHQH9AAAAAAABoB030AWgIR0BhoeIGhVU/dX2UKGgGR0B/QAAAAAAAaAdN9AFoCEdAYgCNR3u/lHV9lChoBkdAc/AAAAAAAGgHTT8BaAhHQGIov+OwPiF1fZQoaAZHQFsAAAAAAABoB0tsaAhHQGIqSNGViWp1fZQoaAZHQGVgAAAAAABoB0uraAhHQGJIC48U21l1fZQoaAZHQG0AAAAAAABoB0voaAhHQGJvnM+u/1x1fZQoaAZHQFzAAAAAAABoB0tzaAhHQGJx0GFBY3h1fZQoaAZHQGVAAAAAAABoB0uqaAhHQGKRxKpT/AF1fZQoaAZHQHcQAAAAAABoB01xAWgIR0BitGMXJo0zdX2UKGgGR0B7gAAAAAAAaAdNuAFoCEdAYwrlpXZGrnVlLg=="
53
  },
54
  "ep_success_buffer": {
55
  ":type:": "<class 'collections.deque'>",
56
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
57
  },
58
+ "_n_updates": 14592,
59
  "observation_space": {
60
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
61
  ":serialized:": "gAWVFgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAJqZmcD//3//UHfWvv//f/+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAJqZmUD//39/UHfWPv//f3+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMPVstNC44MDAwMDAyZSswMCAtMy40MDI4MjM1ZSszOCAtNC4xODg3OTAzZS0wMSAtMy40MDI4MjM1ZSszOF2UjAloaWdoX3JlcHKUjDlbNC44MDAwMDAyZSswMCAzLjQwMjgyMzVlKzM4IDQuMTg4NzkwM2UtMDEgMy40MDI4MjM1ZSszOF2UjApfbnBfcmFuZG9tlE51Yi4=",
 
73
  },
74
  "action_space": {
75
  ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
76
+ ":serialized:": "gAWVwAEAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIAgAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgLjAJpOJSJiIeUUpQoSwNoD05OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwQX19nZW5lcmF0b3JfY3RvcpSTlIwFUENHNjSUaB+MFF9fYml0X2dlbmVyYXRvcl9jdG9ylJOUhpRSlH2UKIwNYml0X2dlbmVyYXRvcpSMBVBDRzY0lIwFc3RhdGWUfZQoaCqKEONhlaa3XlgJLUWWWTS1oRqMA2luY5SKEKlzeES8M4FYghr3OtvajUF1jApoYXNfdWludDMylEsAjAh1aW50ZWdlcpRLAHVidWIu",
77
  "n": "2",
78
  "start": "0",
79
  "_shape": [],
 
92
  ":type:": "<class 'abc.ABCMeta'>",
93
  ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
94
  "__module__": "stable_baselines3.common.buffers",
 
95
  "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
96
+ "__init__": "<function ReplayBuffer.__init__ at 0x7f4dcefa8f70>",
97
+ "add": "<function ReplayBuffer.add at 0x7f4dcefa9000>",
98
+ "sample": "<function ReplayBuffer.sample at 0x7f4dcefa9090>",
99
+ "_get_samples": "<function ReplayBuffer._get_samples at 0x7f4dcefa9120>",
100
+ "_maybe_cast_dtype": "<staticmethod(<function ReplayBuffer._maybe_cast_dtype at 0x7f4dcefa91b0>)>",
101
  "__abstractmethods__": "frozenset()",
102
+ "_abc_impl": "<_abc._abc_data object at 0x7f4dcf3ca7c0>"
103
  },
104
  "replay_buffer_kwargs": {},
105
  "train_freq": {
 
111
  "exploration_final_eps": 0.04,
112
  "exploration_fraction": 0.16,
113
  "target_update_interval": 10,
114
+ "_n_calls": 29999,
115
  "max_grad_norm": 10,
116
  "exploration_rate": 0.04,
117
  "lr_schedule": {
118
  ":type:": "<class 'function'>",
119
+ ":serialized:": "gAWVAwMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMaC9ob21lL25zYW5naGkvc2FuZGJveC9hcHJlc3MvZHJsLTJlZC92ZW52L2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLg0MCBAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxoL2hvbWUvbnNhbmdoaS9zYW5kYm94L2FwcmVzcy9kcmwtMmVkL3ZlbnYvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP2LXcxj8UEiFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
120
  },
121
  "batch_norm_stats": [],
122
  "batch_norm_stats_target": [],
123
  "exploration_schedule": {
124
  ":type:": "<class 'function'>",
125
+ ":serialized:": "gAWVowMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLBEsTQyhkAXwAGACIAWsEcgiIAFMAiAJkAXwAGACIAIgCGAAUAIgBGwAXAFMAlE5LAYaUKYwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjGgvaG9tZS9uc2FuZ2hpL3NhbmRib3gvYXByZXNzL2RybC0yZWQvdmVudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS3FDBgwBBAEYApSMA2VuZJSMDGVuZF9mcmFjdGlvbpSMBXN0YXJ0lIeUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMaC9ob21lL25zYW5naGkvc2FuZGJveC9hcHJlc3MvZHJsLTJlZC92ZW52L2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUaB0pUpRoHSlSlIeUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgjfZR9lChoGGgNjAxfX3F1YWxuYW1lX1+UjBtnZXRfbGluZWFyX2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZQoaAqMCGJ1aWx0aW5zlIwFZmxvYXSUk5SMBnJldHVybpRoL3WMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgZjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz+keuFHrhR7hZRSlGg3Rz/EeuFHrhR7hZRSlGg3Rz/wAAAAAAAAhZRSlIeUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
126
  }
127
  }
dqn-CartPole-v1/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a18dc4edcb79ecccc026b5865cf90a4038d63d6b3bec99f9cf4ff0366a2e5c8
3
- size 546144
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0583cc5a3c614b0148d4f94d06e2b1f5d15f9805fe9f4efd91ef3109befb3d41
3
+ size 545519
dqn-CartPole-v1/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fceb029f5b0a441b1ea3950e911effc8eab5bec5db6e6ad6234fbc8d3a0b4ad2
3
- size 545202
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d0338306e5f82dc7f9488376dcf4065b971b6ad0504880550233d2c50975322
3
+ size 544641
dqn-CartPole-v1/pytorch_variables.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c35cea3b2e60fb5e7e162d3592df775cd400e575a31c72f359fb9e654ab00c5
3
- size 864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d030ad8db708280fcae77d87e973102039acd23a11bdecc3db8eb6c0ac940ee1
3
+ size 431
dqn-CartPole-v1/system_info.txt CHANGED
@@ -1,9 +1,9 @@
1
- - OS: Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023
2
- - Python: 3.10.12
3
- - Stable-Baselines3: 2.2.0a8
4
- - PyTorch: 2.1.0+cu118
5
- - GPU Enabled: True
6
- - Numpy: 1.23.5
7
  - Cloudpickle: 2.2.1
8
- - Gymnasium: 0.29.1
9
  - OpenAI Gym: 0.26.2
 
1
+ - OS: Linux-5.15.90.1-microsoft-standard-WSL2-x86_64-with-glibc2.35 # 1 SMP Fri Jan 27 02:56:13 UTC 2023
2
+ - Python: 3.10.6
3
+ - Stable-Baselines3: 2.1.0
4
+ - PyTorch: 2.0.1+cu117
5
+ - GPU Enabled: False
6
+ - Numpy: 1.25.1
7
  - Cloudpickle: 2.2.1
8
+ - Gymnasium: 0.28.1
9
  - OpenAI Gym: 0.26.2
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca307ee0168baafff11e4f56255a78d31ca9b6bb7216cb67a314ad490534c9ac
3
- size 70404
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4679ef83d04ba51e951bdb271cc9f118916235e1b10f315c0f637d8b9b05afba
3
+ size 51590
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 500.0, "std_reward": 0.0, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-10-26T12:18:09.847415"}
 
1
+ {"mean_reward": 500.0, "std_reward": 0.0, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-11-05T07:33:04.960059"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9cd0d932ae8bc0c012039cb79393bfc5469c4620d051eca0e3505fce850852e6
3
- size 10467
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a168ecc6eb2ff4596c35e8b2603c37faf2715d3bb849e5d4c629fa0106344053
3
+ size 10586