|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.28421467542648315, |
|
"min": 0.28421467542648315, |
|
"max": 1.4405357837677002, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 8503.703125, |
|
"min": 8503.703125, |
|
"max": 43700.09375, |
|
"count": 50 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 1499903.0, |
|
"min": 29952.0, |
|
"max": 1499903.0, |
|
"count": 50 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 1499903.0, |
|
"min": 29952.0, |
|
"max": 1499903.0, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.6422605514526367, |
|
"min": -0.12505429983139038, |
|
"max": 0.6437637209892273, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 178.54843139648438, |
|
"min": -30.013032913208008, |
|
"max": 180.89759826660156, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.00918685831129551, |
|
"min": -0.009508224204182625, |
|
"max": 0.5712061524391174, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 2.5539464950561523, |
|
"min": -2.6147615909576416, |
|
"max": 135.3758544921875, |
|
"count": 50 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.0669284677683858, |
|
"min": 0.06261540081544727, |
|
"max": 0.07318900337309796, |
|
"count": 50 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9369985487574013, |
|
"min": 0.5105135901503255, |
|
"max": 1.0654427599057432, |
|
"count": 50 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.015309359984322717, |
|
"min": 2.626431715347892e-05, |
|
"max": 0.017680035694779474, |
|
"count": 50 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.21433103978051804, |
|
"min": 0.00036770044014870486, |
|
"max": 0.24752049972691262, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 0.00015146664236827855, |
|
"min": 0.00015146664236827855, |
|
"max": 0.00029838354339596195, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.0021205329931558996, |
|
"min": 0.0020886848037717336, |
|
"max": 0.003801056332981266, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.15048886428571429, |
|
"min": 0.15048886428571429, |
|
"max": 0.19946118095238097, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 2.1068441, |
|
"min": 1.3962282666666668, |
|
"max": 2.667018733333334, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.005053837542142857, |
|
"min": 0.005053837542142857, |
|
"max": 0.009946171977142856, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.07075372559, |
|
"min": 0.06962320384, |
|
"max": 0.12671517146, |
|
"count": 50 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.008841591887176037, |
|
"min": 0.008407366462051868, |
|
"max": 0.5084035992622375, |
|
"count": 50 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.12378229200839996, |
|
"min": 0.11770313233137131, |
|
"max": 3.5588250160217285, |
|
"count": 50 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 291.1188118811881, |
|
"min": 289.969696969697, |
|
"max": 999.0, |
|
"count": 50 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 29403.0, |
|
"min": 15984.0, |
|
"max": 32467.0, |
|
"count": 50 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.6098455259262925, |
|
"min": -1.0000000521540642, |
|
"max": 1.6696141258333668, |
|
"count": 50 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 162.59439811855555, |
|
"min": -31.998801663517952, |
|
"max": 167.99539843201637, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.6098455259262925, |
|
"min": -1.0000000521540642, |
|
"max": 1.6696141258333668, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 162.59439811855555, |
|
"min": -31.998801663517952, |
|
"max": 167.99539843201637, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.026676239869972265, |
|
"min": 0.026482453851400866, |
|
"max": 10.544406680390239, |
|
"count": 50 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.694300226867199, |
|
"min": 2.6217629312886856, |
|
"max": 168.71050688624382, |
|
"count": 50 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 50 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 50 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1675262501", |
|
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1675267025" |
|
}, |
|
"total": 4523.411260270001, |
|
"count": 1, |
|
"self": 0.6396289430012985, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.18999339700008022, |
|
"count": 1, |
|
"self": 0.18999339700008022 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 4522.5816379299995, |
|
"count": 1, |
|
"self": 3.299644830998659, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 6.748880285999803, |
|
"count": 1, |
|
"self": 6.748880285999803 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 4512.358936176001, |
|
"count": 95942, |
|
"self": 3.0160458228401694, |
|
"children": { |
|
"env_step": { |
|
"total": 2856.0333407072317, |
|
"count": 95942, |
|
"self": 2654.137594056332, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 199.7660629909958, |
|
"count": 95942, |
|
"self": 9.029875897853572, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 190.73618709314223, |
|
"count": 94165, |
|
"self": 42.13363956603712, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 148.60254752710512, |
|
"count": 94165, |
|
"self": 148.60254752710512 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 2.129683659903776, |
|
"count": 95942, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 4513.928799117089, |
|
"count": 95942, |
|
"is_parallel": true, |
|
"self": 2090.086618842244, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.003678712999999334, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.001608643000054144, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.00207006999994519, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.00207006999994519 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.08292716899995867, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006813109998802247, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0006417800000235729, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006417800000235729 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.07926404499994533, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.07926404499994533 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0023400330001095426, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005988769999021315, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0017411560002074111, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0017411560002074111 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 2423.8421802748444, |
|
"count": 95941, |
|
"is_parallel": true, |
|
"self": 59.7987793307002, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 39.34728622500961, |
|
"count": 95941, |
|
"is_parallel": true, |
|
"self": 39.34728622500961 |
|
}, |
|
"communicator.exchange": { |
|
"total": 2113.0560614410897, |
|
"count": 95941, |
|
"is_parallel": true, |
|
"self": 2113.0560614410897 |
|
}, |
|
"steps_from_proto": { |
|
"total": 211.6400532780449, |
|
"count": 95941, |
|
"is_parallel": true, |
|
"self": 54.18102753587914, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 157.45902574216575, |
|
"count": 767528, |
|
"is_parallel": true, |
|
"self": 157.45902574216575 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 1653.3095496459293, |
|
"count": 95942, |
|
"self": 6.141486998865503, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 294.5213748260728, |
|
"count": 95942, |
|
"self": 294.0877338470734, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.43364097899939225, |
|
"count": 3, |
|
"self": 0.43364097899939225 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 1352.646687820991, |
|
"count": 680, |
|
"self": 363.6795565189875, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 988.9671313020035, |
|
"count": 34427, |
|
"self": 988.9671313020035 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.97000008483883e-06, |
|
"count": 1, |
|
"self": 1.97000008483883e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.17417466699953366, |
|
"count": 1, |
|
"self": 0.005935031999797502, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.16823963499973615, |
|
"count": 1, |
|
"self": 0.16823963499973615 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |