{ "battle_won_mean": [ 0.0, 0.0, 0.0, 0.0, 0.0 ], "battle_won_mean_T": [ 108, 10163, 20248, 30251, 40289 ], "dead_allies_mean": [ 5.0, 4.994949494949495, 4.997727272727273, 4.9978991596638656, 4.996 ], "dead_allies_mean_T": [ 108, 10163, 20248, 30251, 40289 ], "dead_enemies_mean": [ 0.0, 0.0, 0.0, 0.018907563025210083, 0.124 ], "dead_enemies_mean_T": [ 108, 10163, 20248, 30251, 40289 ], "ep_length_mean": [ 27.0, 25.391414141414142, 22.920454545454547, 21.014705882352942, 20.076 ], "ep_length_mean_T": [ 108, 10163, 20248, 30251, 40289 ], "episode": [ 396, 832, 1308, 1808 ], "episode_T": [ 10068, 20069, 30094, 40134 ], "episode_in_buffer": [ 396, 832, 1308, 1808 ], "episode_in_buffer_T": [ 10068, 20069, 30094, 40134 ], "epsilon": [ 1.0, 0.904354, 0.8084800000000001, 0.7133565000000001, 0.6179955 ], "epsilon_T": [ 108, 10163, 20248, 30251, 40289 ], "grad_norm": [ { "py/reduce": [ { "py/function": "torch._utils._rebuild_tensor_v2" }, { "py/tuple": [ { "py/reduce": [ { "py/function": "torch.storage._load_from_bytes" }, { "py/tuple": [ { "py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADI5Mzc2MjcxMTk2OTZxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyOTM3NjI3MTE5Njk2cQFhLgEAAAAAAAAAwgPxPg==" } ] } ] }, 0, { "py/tuple": [] }, { "py/tuple": [] }, false, { "py/reduce": [ { "py/type": "collections.OrderedDict" }, { "py/tuple": [] }, null, null, { "py/tuple": [] } ] } ] } ] }, { "py/reduce": [ { "py/function": "torch._utils._rebuild_tensor_v2" }, { "py/tuple": [ { "py/reduce": [ { "py/function": "torch.storage._load_from_bytes" }, { "py/tuple": [ { "py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADI5Mzc2MjcxNjc5ODRxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyOTM3NjI3MTY3OTg0cQFhLgEAAAAAAAAAjyhPPQ==" } ] } ] }, 0, { "py/tuple": [] }, { "py/tuple": [] }, false, { "py/reduce": [ { "py/type": "collections.OrderedDict" }, { "py/tuple": [] }, null, null, { "py/tuple": [] } ] } ] } ] }, { "py/reduce": [ { "py/function": "torch._utils._rebuild_tensor_v2" }, { "py/tuple": [ { "py/reduce": [ { "py/function": "torch.storage._load_from_bytes" }, { "py/tuple": [ { "py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADI5Mzc2MjcxNTQ1NDRxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyOTM3NjI3MTU0NTQ0cQFhLgEAAAAAAAAARv11PQ==" } ] } ] }, 0, { "py/tuple": [] }, { "py/tuple": [] }, false, { "py/reduce": [ { "py/type": "collections.OrderedDict" }, { "py/tuple": [] }, null, null, { "py/tuple": [] } ] } ] } ] }, { "py/reduce": [ { "py/function": "torch._utils._rebuild_tensor_v2" }, { "py/tuple": [ { "py/reduce": [ { "py/function": "torch.storage._load_from_bytes" }, { "py/tuple": [ { "py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADI5Mzc2MjcxMTQ2MDhxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyOTM3NjI3MTE0NjA4cQFhLgEAAAAAAAAAZGYAPg==" } ] } ] }, 0, { "py/tuple": [] }, { "py/tuple": [] }, false, { "py/reduce": [ { "py/type": "collections.OrderedDict" }, { "py/tuple": [] }, null, null, { "py/tuple": [] } ] } ] } ] } ], "grad_norm_T": [ 3390, 13498, 23565, 33599 ], "loss_td": [ 0.029275426641106606, 0.008867704309523106, 0.00828527007251978, 0.011645584367215633 ], "loss_td_T": [ 3390, 13498, 23565, 33599 ], "q_taken_mean": [ 0.010331014897619378, 0.13366268382352942, 0.20415240698298645, 0.26490462531228465 ], "q_taken_mean_T": [ 3390, 13498, 23565, 33599 ], "return_max": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 1.5849056603773584 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 3.3962264150943393 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 3.3962264150943393 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 4.30188679245283 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 5.245283018867924 } ], "return_max_T": [ 108, 10163, 20248, 30251, 40289 ], "return_mean": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 1.3018867924528301 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 1.5191538021726703 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 1.7969125214408233 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 2.1112256223244015 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 2.654641509433962 } ], "return_mean_T": [ 108, 10163, 20248, 30251, 40289 ], "return_min": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 0.9056603773584906 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.4528301886792453 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.679245283018868 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.9056603773584906 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 1.1320754716981132 } ], "return_min_T": [ 108, 10163, 20248, 30251, 40289 ], "return_std": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 0.29412183524754515 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.45845612324356316 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.5206001167133067 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.6097681028977217 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.765011763917395 } ], "return_std_T": [ 108, 10163, 20248, 30251, 40289 ], "target_mean": [ 0.046066559648091816, 0.13057054290381234, 0.20175707048026098, 0.2706919190967436 ], "target_mean_T": [ 3390, 13498, 23565, 33599 ], "td_error_abs": [ 0.029275427174075868, 0.008867704045132298, 0.008285269786077323, 0.011645584579667578 ], "td_error_abs_T": [ 3390, 13498, 23565, 33599 ], "test_battle_won_mean": [ 0.0, 0.0, 0.0, 0.0, 0.0 ], "test_battle_won_mean_T": [ 108, 10163, 20248, 30251, 40289 ], "test_dead_allies_mean": [ 2.59375, 5.0, 5.0, 5.0, 5.0 ], "test_dead_allies_mean_T": [ 108, 10163, 20248, 30251, 40289 ], "test_dead_enemies_mean": [ 0.0625, 2.125, 2.28125, 1.90625, 2.0625 ], "test_dead_enemies_mean_T": [ 108, 10163, 20248, 30251, 40289 ], "test_ep_length_mean": [ 60.59375, 18.9375, 19.96875, 18.53125, 18.96875 ], "test_ep_length_mean_T": [ 108, 10163, 20248, 30251, 40289 ], "test_return_max": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 4.113207547169811 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 8.943396226415096 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 9.433962264150944 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 7.811320754716981 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 8.49056603773585 } ], "test_return_max_T": [ 108, 10163, 20248, 30251, 40289 ], "test_return_mean": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 1.283018867924528 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 6.964622641509434 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 7.1120283018867925 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 6.475235849056602 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 6.799528301886792 } ], "test_return_mean_T": [ 108, 10163, 20248, 30251, 40289 ], "test_return_min": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 0.0 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 5.245283018867924 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 4.981132075471698 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 5.245283018867924 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 5.245283018867924 } ], "test_return_min_T": [ 108, 10163, 20248, 30251, 40289 ], "test_return_std": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 1.141821257893222 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.9287992177150309 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 1.0831398416674247 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.6995052016567793 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.8086527819915745 } ], "test_return_std_T": [ 108, 10163, 20248, 30251, 40289 ] }