{ "battle_won_mean": [ 0.0, 0.0 ], "battle_won_mean_T": [ 91, 10157 ], "dead_allies_mean": [ 5.0, 4.994897959183674 ], "dead_allies_mean_T": [ 91, 10157 ], "dead_enemies_mean": [ 0.0, 0.0 ], "dead_enemies_mean_T": [ 91, 10157 ], "ep_length_mean": [ 22.75, 25.678571428571427 ], "ep_length_mean_T": [ 91, 10157 ], "episode": [ 392 ], "episode_T": [ 10066 ], "episode_in_buffer": [ 392 ], "episode_in_buffer_T": [ 10066 ], "epsilon": [ 1.0, 0.904373 ], "epsilon_T": [ 91, 10157 ], "grad_norm": [ { "py/reduce": [ { "py/function": "torch._utils._rebuild_tensor_v2" }, { "py/tuple": [ { "py/reduce": [ { "py/function": "torch.storage._load_from_bytes" }, { "py/tuple": [ { "py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADI3NTczMjk5NzQ3MzZxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyNzU3MzI5OTc0NzM2cQFhLgEAAAAAAAAAxFokPw==" } ] } ] }, 0, { "py/tuple": [] }, { "py/tuple": [] }, false, { "py/reduce": [ { "py/type": "collections.OrderedDict" }, { "py/tuple": [] }, null, null, { "py/tuple": [] } ] } ] } ] }, { "py/reduce": [ { "py/function": "torch._utils._rebuild_tensor_v2" }, { "py/tuple": [ { "py/reduce": [ { "py/function": "torch.storage._load_from_bytes" }, { "py/tuple": [ { "py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADI3NTczMzAwMDc2NjRxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyNzU3MzMwMDA3NjY0cQFhLgEAAAAAAAAAMfg7PQ==" } ] } ] }, 0, { "py/tuple": [] }, { "py/tuple": [] }, false, { "py/reduce": [ { "py/type": "collections.OrderedDict" }, { "py/tuple": [] }, null, null, { "py/tuple": [] } ] } ] } ] } ], "grad_norm_T": [ 3449, 13477 ], "loss_td": [ 0.04804620519280434, 0.008500373922288418 ], "loss_td_T": [ 3449, 13477 ], "q_taken_mean": [ 0.029340348170438894, 0.13147327403257877 ], "q_taken_mean_T": [ 3449, 13477 ], "return_max": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 1.5849056603773584 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 3.3962264150943393 } ], "return_max_T": [ 91, 10157 ], "return_mean": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 1.1320754716981132 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 1.5294570658452062 } ], "return_mean_T": [ 91, 10157 ], "return_min": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 0.4528301886792453 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.679245283018868 } ], "return_min_T": [ 91, 10157 ], "return_std": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 0.4235838551064839 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.4868555532060793 } ], "return_std_T": [ 91, 10157 ], "target_mean": [ 0.0754477704701544, 0.13361987431649586 ], "target_mean_T": [ 3449, 13477 ], "td_error_abs": [ 0.04804620607309184, 0.008500374286099652 ], "td_error_abs_T": [ 3449, 13477 ], "test_battle_won_mean": [ 0.0, 0.0 ], "test_battle_won_mean_T": [ 91, 10157 ], "test_dead_allies_mean": [ 0.0, 5.0 ], "test_dead_allies_mean_T": [ 91, 10157 ], "test_dead_enemies_mean": [ 0.0, 2.0 ], "test_dead_enemies_mean_T": [ 91, 10157 ], "test_ep_length_mean": [ 70.0, 18.71875 ], "test_ep_length_mean_T": [ 91, 10157 ], "test_return_max": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 0.0 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 9.433962264150942 } ], "test_return_max_T": [ 91, 10157 ], "test_return_mean": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 0.0 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 6.662735849056603 } ], "test_return_mean_T": [ 91, 10157 ], "test_return_min": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 0.0 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 5.245283018867925 } ], "test_return_min_T": [ 91, 10157 ], "test_return_std": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 0.0 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.8664331680367857 } ], "test_return_std_T": [ 91, 10157 ] }