|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 2.309561014175415, |
|
"min": 2.281111478805542, |
|
"max": 3.2957603931427, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 43974.04296875, |
|
"min": 18621.85546875, |
|
"max": 132478.5, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 50.45360824742268, |
|
"min": 44.34234234234234, |
|
"max": 999.0, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19576.0, |
|
"min": 14472.0, |
|
"max": 26132.0, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1355.5547328663977, |
|
"min": 1170.5394824436014, |
|
"max": 1377.3069070113052, |
|
"count": 380 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 262977.61817608116, |
|
"min": 2361.320079440623, |
|
"max": 298231.5035719138, |
|
"count": 380 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 3939974.0, |
|
"min": 9082.0, |
|
"max": 3939974.0, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 3939974.0, |
|
"min": 9082.0, |
|
"max": 3939974.0, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.041746560484170914, |
|
"min": -0.11274479329586029, |
|
"max": 0.1803084909915924, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -8.140579223632812, |
|
"min": -17.926422119140625, |
|
"max": 26.505348205566406, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.040217842906713486, |
|
"min": -0.10436349362134933, |
|
"max": 0.17117635905742645, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -7.842479705810547, |
|
"min": -17.932662963867188, |
|
"max": 24.61751937866211, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.0719497439188835, |
|
"min": -0.625, |
|
"max": 0.46092973206494303, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -14.030200064182281, |
|
"min": -33.70920014381409, |
|
"max": 45.10700011253357, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.0719497439188835, |
|
"min": -0.625, |
|
"max": 0.46092973206494303, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -14.030200064182281, |
|
"min": -33.70920014381409, |
|
"max": 45.10700011253357, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 394 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.014392319566104561, |
|
"min": 0.010217342836161455, |
|
"max": 0.025237433375635495, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.014392319566104561, |
|
"min": 0.010217342836161455, |
|
"max": 0.025237433375635495, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.09865847503145536, |
|
"min": 0.00013014958870674793, |
|
"max": 0.10634844924012819, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.09865847503145536, |
|
"min": 0.00013014958870674793, |
|
"max": 0.10634844924012819, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.10076268985867501, |
|
"min": 0.00012500778199561562, |
|
"max": 0.1087349534034729, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.10076268985867501, |
|
"min": 0.00012500778199561562, |
|
"max": 0.1087349534034729, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 187 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 187 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1679247432", |
|
"python_version": "3.9.16 (main, Mar 8 2023, 04:29:24) \n[Clang 14.0.6 ]", |
|
"command_line_arguments": "/Users/alessio/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1679262837" |
|
}, |
|
"total": 15331.936170459, |
|
"count": 1, |
|
"self": 0.1366623760004586, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.1844646249999995, |
|
"count": 1, |
|
"self": 0.1844646249999995 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 15331.615043458, |
|
"count": 1, |
|
"self": 3.0446913397772732, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.8925383340009363, |
|
"count": 20, |
|
"self": 2.8925383340009363 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 15325.58360245022, |
|
"count": 262919, |
|
"self": 3.028552508651046, |
|
"children": { |
|
"env_step": { |
|
"total": 12431.596222326261, |
|
"count": 262919, |
|
"self": 11982.406396551347, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 447.1306771715281, |
|
"count": 262919, |
|
"self": 12.720688878481383, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 434.4099882930467, |
|
"count": 503569, |
|
"self": 434.4099882930467 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 2.059148603387108, |
|
"count": 262918, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 15323.905628031922, |
|
"count": 262918, |
|
"is_parallel": true, |
|
"self": 3780.745046928694, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.030383457991041363, |
|
"count": 40, |
|
"is_parallel": true, |
|
"self": 0.0034091219993073185, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.026974335991734044, |
|
"count": 160, |
|
"is_parallel": true, |
|
"self": 0.026974335991734044 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 11543.130197645236, |
|
"count": 262918, |
|
"is_parallel": true, |
|
"self": 31.898869138076407, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 194.25133372881731, |
|
"count": 262918, |
|
"is_parallel": true, |
|
"self": 194.25133372881731 |
|
}, |
|
"communicator.exchange": { |
|
"total": 10895.712968361237, |
|
"count": 262918, |
|
"is_parallel": true, |
|
"self": 10895.712968361237 |
|
}, |
|
"steps_from_proto": { |
|
"total": 421.2670264171064, |
|
"count": 525836, |
|
"is_parallel": true, |
|
"self": 46.50732735628554, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 374.7596990608209, |
|
"count": 2103344, |
|
"is_parallel": true, |
|
"self": 374.7596990608209 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 2890.958827615309, |
|
"count": 262918, |
|
"self": 24.60439574676002, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 572.0797707045465, |
|
"count": 262918, |
|
"self": 571.4511638295482, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.6286068749982405, |
|
"count": 7, |
|
"self": 0.6286068749982405 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 2294.2746611640027, |
|
"count": 187, |
|
"self": 307.0505535550551, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 1987.2241076089476, |
|
"count": 5610, |
|
"self": 1987.2241076089476 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 5.420006345957518e-07, |
|
"count": 1, |
|
"self": 5.420006345957518e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.09421079200001259, |
|
"count": 1, |
|
"self": 0.0013693340006284416, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.09284145799938415, |
|
"count": 1, |
|
"self": 0.09284145799938415 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |