{ "battle_won_mean": [ 0.0, 0.0 ], "battle_won_mean_T": [ 211, 10252 ], "dead_allies_mean": [ 5.0, 5.0 ], "dead_allies_mean_T": [ 211, 10252 ], "dead_enemies_mean": [ 0.5, 0.3111111111111111 ], "dead_enemies_mean_T": [ 211, 10252 ], "ep_length_mean": [ 52.75, 55.78333333333333 ], "ep_length_mean_T": [ 211, 10252 ], "episode": [ 180 ], "episode_T": [ 10030 ], "episode_in_buffer": [ 180 ], "episode_in_buffer_T": [ 10030 ], "epsilon": [ 1.0, 0.904715 ], "epsilon_T": [ 211, 10252 ], "grad_norm_manager": [ { "py/reduce": [ { "py/function": "torch._utils._rebuild_tensor_v2" }, { "py/tuple": [ { "py/reduce": [ { "py/function": "torch.storage._load_from_bytes" }, { "py/tuple": [ { "py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADIxNDAzMDE2ODY1NjBxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyMTQwMzAxNjg2NTYwcQFhLgEAAAAAAAAAnTV0RA==" } ] } ] }, 0, { "py/tuple": [] }, { "py/tuple": [] }, false, { "py/reduce": [ { "py/type": "collections.OrderedDict" }, { "py/tuple": [] }, null, null, { "py/tuple": [] } ] } ] } ] } ], "grad_norm_manager_T": [ 7135 ], "grad_norm_worker": [ { "py/reduce": [ { "py/function": "torch._utils._rebuild_tensor_v2" }, { "py/tuple": [ { "py/reduce": [ { "py/function": "torch.storage._load_from_bytes" }, { "py/tuple": [ { "py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADIxNDAzMDE2NjI2NTZxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyMTQwMzAxNjYyNjU2cQFhLgEAAAAAAAAAHtgcRg==" } ] } ] }, 0, { "py/tuple": [] }, { "py/tuple": [] }, false, { "py/reduce": [ { "py/type": "collections.OrderedDict" }, { "py/tuple": [] }, null, null, { "py/tuple": [] } ] } ] } ] } ], "grad_norm_worker_T": [ 7135 ], "hit_prob": [ 0.4580238461494446 ], "hit_prob_T": [ 7135 ], "manager_advantage": [ 0.1406308114528656 ], "manager_advantage_T": [ 7135 ], "manager_cos_sim": [ -0.00032846396788954735 ], "manager_cos_sim_T": [ 7135 ], "manager_loss": [ 10.693564414978027 ], "manager_loss_T": [ 7135 ], "q_taken_mean": [ 0.06587212437587596 ], "q_taken_mean_T": [ 7135 ], "return_max": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 7.432926829268293 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 14.95343137254902 } ], "return_max_T": [ 211, 10252 ], "return_mean": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 4.3768681252989 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 4.579137772995377 } ], "return_mean_T": [ 211, 10252 ], "return_min": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 2.2794117647058827 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 1.4308943089430894 } ], "return_min_T": [ 211, 10252 ], "return_std": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 1.89094258138571 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 2.421259942116347 } ], "return_std_T": [ 211, 10252 ], "target_mean": [ 0.10347526224159075 ], "target_mean_T": [ 7135 ], "td_error_abs": [ 0.22424918631197444 ], "td_error_abs_T": [ 7135 ], "test_battle_won_mean": [ 0.0, 0.0 ], "test_battle_won_mean_T": [ 211, 10252 ], "test_dead_allies_mean": [ 5.0, 5.0 ], "test_dead_allies_mean_T": [ 211, 10252 ], "test_dead_enemies_mean": [ 0.34375, 1.0 ], "test_dead_enemies_mean_T": [ 211, 10252 ], "test_ep_length_mean": [ 52.21875, 57.5625 ], "test_ep_length_mean_T": [ 211, 10252 ], "test_return_max": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 6.959349593495936 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 19.607843137254893 } ], "test_return_max_T": [ 211, 10252 ], "test_return_mean": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 2.185841104734577 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 4.841020668938307 } ], "test_return_mean_T": [ 211, 10252 ], "test_return_min": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 0.0 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 0.0 } ], "test_return_min_T": [ 211, 10252 ], "test_return_std": [ { "dtype": "float64", "py/object": "numpy.float64", "value": 2.2407881654472965 }, { "dtype": "float64", "py/object": "numpy.float64", "value": 4.010960846314079 } ], "test_return_std_T": [ 211, 10252 ], "worker_loss": [ 714.7169189453125 ], "worker_loss_T": [ 7135 ] }