368 lines
No EOL
6.7 KiB
JSON
368 lines
No EOL
6.7 KiB
JSON
{
|
|
"battle_won_mean": [
|
|
0.0,
|
|
0.0
|
|
],
|
|
"battle_won_mean_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"dead_allies_mean": [
|
|
5.0,
|
|
5.0
|
|
],
|
|
"dead_allies_mean_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"dead_enemies_mean": [
|
|
0.5,
|
|
0.3111111111111111
|
|
],
|
|
"dead_enemies_mean_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"ep_length_mean": [
|
|
52.75,
|
|
55.78333333333333
|
|
],
|
|
"ep_length_mean_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"episode": [
|
|
180
|
|
],
|
|
"episode_T": [
|
|
10030
|
|
],
|
|
"episode_in_buffer": [
|
|
180
|
|
],
|
|
"episode_in_buffer_T": [
|
|
10030
|
|
],
|
|
"epsilon": [
|
|
1.0,
|
|
0.904715
|
|
],
|
|
"epsilon_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"grad_norm_manager": [
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch._utils._rebuild_tensor_v2"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch.storage._load_from_bytes"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADIxNDAzMDE2ODY1NjBxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyMTQwMzAxNjg2NTYwcQFhLgEAAAAAAAAAnTV0RA=="
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
0,
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
false,
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/type": "collections.OrderedDict"
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
null,
|
|
null,
|
|
{
|
|
"py/tuple": []
|
|
}
|
|
]
|
|
}
|
|
]
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"grad_norm_manager_T": [
|
|
7135
|
|
],
|
|
"grad_norm_worker": [
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch._utils._rebuild_tensor_v2"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch.storage._load_from_bytes"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADIxNDAzMDE2NjI2NTZxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyMTQwMzAxNjYyNjU2cQFhLgEAAAAAAAAAHtgcRg=="
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
0,
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
false,
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/type": "collections.OrderedDict"
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
null,
|
|
null,
|
|
{
|
|
"py/tuple": []
|
|
}
|
|
]
|
|
}
|
|
]
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"grad_norm_worker_T": [
|
|
7135
|
|
],
|
|
"hit_prob": [
|
|
0.4580238461494446
|
|
],
|
|
"hit_prob_T": [
|
|
7135
|
|
],
|
|
"manager_advantage": [
|
|
0.1406308114528656
|
|
],
|
|
"manager_advantage_T": [
|
|
7135
|
|
],
|
|
"manager_cos_sim": [
|
|
-0.00032846396788954735
|
|
],
|
|
"manager_cos_sim_T": [
|
|
7135
|
|
],
|
|
"manager_loss": [
|
|
10.693564414978027
|
|
],
|
|
"manager_loss_T": [
|
|
7135
|
|
],
|
|
"q_taken_mean": [
|
|
0.06587212437587596
|
|
],
|
|
"q_taken_mean_T": [
|
|
7135
|
|
],
|
|
"return_max": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 7.432926829268293
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 14.95343137254902
|
|
}
|
|
],
|
|
"return_max_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"return_mean": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 4.3768681252989
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 4.579137772995377
|
|
}
|
|
],
|
|
"return_mean_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"return_min": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 2.2794117647058827
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 1.4308943089430894
|
|
}
|
|
],
|
|
"return_min_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"return_std": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 1.89094258138571
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 2.421259942116347
|
|
}
|
|
],
|
|
"return_std_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"target_mean": [
|
|
0.10347526224159075
|
|
],
|
|
"target_mean_T": [
|
|
7135
|
|
],
|
|
"td_error_abs": [
|
|
0.22424918631197444
|
|
],
|
|
"td_error_abs_T": [
|
|
7135
|
|
],
|
|
"test_battle_won_mean": [
|
|
0.0,
|
|
0.0
|
|
],
|
|
"test_battle_won_mean_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"test_dead_allies_mean": [
|
|
5.0,
|
|
5.0
|
|
],
|
|
"test_dead_allies_mean_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"test_dead_enemies_mean": [
|
|
0.34375,
|
|
1.0
|
|
],
|
|
"test_dead_enemies_mean_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"test_ep_length_mean": [
|
|
52.21875,
|
|
57.5625
|
|
],
|
|
"test_ep_length_mean_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"test_return_max": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 6.959349593495936
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 19.607843137254893
|
|
}
|
|
],
|
|
"test_return_max_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"test_return_mean": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 2.185841104734577
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 4.841020668938307
|
|
}
|
|
],
|
|
"test_return_mean_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"test_return_min": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.0
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.0
|
|
}
|
|
],
|
|
"test_return_min_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"test_return_std": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 2.2407881654472965
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 4.010960846314079
|
|
}
|
|
],
|
|
"test_return_std_T": [
|
|
211,
|
|
10252
|
|
],
|
|
"worker_loss": [
|
|
714.7169189453125
|
|
],
|
|
"worker_loss_T": [
|
|
7135
|
|
]
|
|
} |