672 lines
No EOL
13 KiB
JSON
672 lines
No EOL
13 KiB
JSON
{
|
|
"battle_won_mean": [
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0
|
|
],
|
|
"battle_won_mean_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"dead_allies_mean": [
|
|
5.0,
|
|
4.994949494949495,
|
|
4.997727272727273,
|
|
4.9978991596638656,
|
|
4.996
|
|
],
|
|
"dead_allies_mean_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"dead_enemies_mean": [
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.018907563025210083,
|
|
0.124
|
|
],
|
|
"dead_enemies_mean_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"ep_length_mean": [
|
|
27.0,
|
|
25.391414141414142,
|
|
22.920454545454547,
|
|
21.014705882352942,
|
|
20.076
|
|
],
|
|
"ep_length_mean_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"episode": [
|
|
396,
|
|
832,
|
|
1308,
|
|
1808
|
|
],
|
|
"episode_T": [
|
|
10068,
|
|
20069,
|
|
30094,
|
|
40134
|
|
],
|
|
"episode_in_buffer": [
|
|
396,
|
|
832,
|
|
1308,
|
|
1808
|
|
],
|
|
"episode_in_buffer_T": [
|
|
10068,
|
|
20069,
|
|
30094,
|
|
40134
|
|
],
|
|
"epsilon": [
|
|
1.0,
|
|
0.904354,
|
|
0.8084800000000001,
|
|
0.7133565000000001,
|
|
0.6179955
|
|
],
|
|
"epsilon_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"grad_norm": [
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch._utils._rebuild_tensor_v2"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch.storage._load_from_bytes"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADI5Mzc2MjcxMTk2OTZxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyOTM3NjI3MTE5Njk2cQFhLgEAAAAAAAAAwgPxPg=="
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
0,
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
false,
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/type": "collections.OrderedDict"
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
null,
|
|
null,
|
|
{
|
|
"py/tuple": []
|
|
}
|
|
]
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch._utils._rebuild_tensor_v2"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch.storage._load_from_bytes"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADI5Mzc2MjcxNjc5ODRxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyOTM3NjI3MTY3OTg0cQFhLgEAAAAAAAAAjyhPPQ=="
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
0,
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
false,
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/type": "collections.OrderedDict"
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
null,
|
|
null,
|
|
{
|
|
"py/tuple": []
|
|
}
|
|
]
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch._utils._rebuild_tensor_v2"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch.storage._load_from_bytes"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADI5Mzc2MjcxNTQ1NDRxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyOTM3NjI3MTU0NTQ0cQFhLgEAAAAAAAAARv11PQ=="
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
0,
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
false,
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/type": "collections.OrderedDict"
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
null,
|
|
null,
|
|
{
|
|
"py/tuple": []
|
|
}
|
|
]
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch._utils._rebuild_tensor_v2"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/function": "torch.storage._load_from_bytes"
|
|
},
|
|
{
|
|
"py/tuple": [
|
|
{
|
|
"py/b64": "gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAAAGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAAaW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApGbG9hdFN0b3JhZ2UKcQFYDQAAADI5Mzc2MjcxMTQ2MDhxAlgGAAAAY3VkYTowcQNLAU50cQRRLoACXXEAWA0AAAAyOTM3NjI3MTE0NjA4cQFhLgEAAAAAAAAAZGYAPg=="
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
0,
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
false,
|
|
{
|
|
"py/reduce": [
|
|
{
|
|
"py/type": "collections.OrderedDict"
|
|
},
|
|
{
|
|
"py/tuple": []
|
|
},
|
|
null,
|
|
null,
|
|
{
|
|
"py/tuple": []
|
|
}
|
|
]
|
|
}
|
|
]
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"grad_norm_T": [
|
|
3390,
|
|
13498,
|
|
23565,
|
|
33599
|
|
],
|
|
"loss_td": [
|
|
0.029275426641106606,
|
|
0.008867704309523106,
|
|
0.00828527007251978,
|
|
0.011645584367215633
|
|
],
|
|
"loss_td_T": [
|
|
3390,
|
|
13498,
|
|
23565,
|
|
33599
|
|
],
|
|
"q_taken_mean": [
|
|
0.010331014897619378,
|
|
0.13366268382352942,
|
|
0.20415240698298645,
|
|
0.26490462531228465
|
|
],
|
|
"q_taken_mean_T": [
|
|
3390,
|
|
13498,
|
|
23565,
|
|
33599
|
|
],
|
|
"return_max": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 1.5849056603773584
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 3.3962264150943393
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 3.3962264150943393
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 4.30188679245283
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 5.245283018867924
|
|
}
|
|
],
|
|
"return_max_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"return_mean": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 1.3018867924528301
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 1.5191538021726703
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 1.7969125214408233
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 2.1112256223244015
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 2.654641509433962
|
|
}
|
|
],
|
|
"return_mean_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"return_min": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.9056603773584906
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.4528301886792453
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.679245283018868
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.9056603773584906
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 1.1320754716981132
|
|
}
|
|
],
|
|
"return_min_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"return_std": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.29412183524754515
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.45845612324356316
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.5206001167133067
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.6097681028977217
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.765011763917395
|
|
}
|
|
],
|
|
"return_std_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"target_mean": [
|
|
0.046066559648091816,
|
|
0.13057054290381234,
|
|
0.20175707048026098,
|
|
0.2706919190967436
|
|
],
|
|
"target_mean_T": [
|
|
3390,
|
|
13498,
|
|
23565,
|
|
33599
|
|
],
|
|
"td_error_abs": [
|
|
0.029275427174075868,
|
|
0.008867704045132298,
|
|
0.008285269786077323,
|
|
0.011645584579667578
|
|
],
|
|
"td_error_abs_T": [
|
|
3390,
|
|
13498,
|
|
23565,
|
|
33599
|
|
],
|
|
"test_battle_won_mean": [
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0
|
|
],
|
|
"test_battle_won_mean_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"test_dead_allies_mean": [
|
|
2.59375,
|
|
5.0,
|
|
5.0,
|
|
5.0,
|
|
5.0
|
|
],
|
|
"test_dead_allies_mean_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"test_dead_enemies_mean": [
|
|
0.0625,
|
|
2.125,
|
|
2.28125,
|
|
1.90625,
|
|
2.0625
|
|
],
|
|
"test_dead_enemies_mean_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"test_ep_length_mean": [
|
|
60.59375,
|
|
18.9375,
|
|
19.96875,
|
|
18.53125,
|
|
18.96875
|
|
],
|
|
"test_ep_length_mean_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"test_return_max": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 4.113207547169811
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 8.943396226415096
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 9.433962264150944
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 7.811320754716981
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 8.49056603773585
|
|
}
|
|
],
|
|
"test_return_max_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"test_return_mean": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 1.283018867924528
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 6.964622641509434
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 7.1120283018867925
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 6.475235849056602
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 6.799528301886792
|
|
}
|
|
],
|
|
"test_return_mean_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"test_return_min": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.0
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 5.245283018867924
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 4.981132075471698
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 5.245283018867924
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 5.245283018867924
|
|
}
|
|
],
|
|
"test_return_min_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
],
|
|
"test_return_std": [
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 1.141821257893222
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.9287992177150309
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 1.0831398416674247
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.6995052016567793
|
|
},
|
|
{
|
|
"dtype": "float64",
|
|
"py/object": "numpy.float64",
|
|
"value": 0.8086527819915745
|
|
}
|
|
],
|
|
"test_return_std_T": [
|
|
108,
|
|
10163,
|
|
20248,
|
|
30251,
|
|
40289
|
|
]
|
|
} |