{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 2.309561014175415,
"min": 2.281111478805542,
"max": 3.2957603931427,
"count": 394
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 43974.04296875,
"min": 18621.85546875,
"max": 132478.5,
"count": 394
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 50.45360824742268,
"min": 44.34234234234234,
"max": 999.0,
"count": 394
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19576.0,
"min": 14472.0,
"max": 26132.0,
"count": 394
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1355.5547328663977,
"min": 1170.5394824436014,
"max": 1377.3069070113052,
"count": 380
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 262977.61817608116,
"min": 2361.320079440623,
"max": 298231.5035719138,
"count": 380
},
"SoccerTwos.Step.mean": {
"value": 3939974.0,
"min": 9082.0,
"max": 3939974.0,
"count": 394
},
"SoccerTwos.Step.sum": {
"value": 3939974.0,
"min": 9082.0,
"max": 3939974.0,
"count": 394
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.041746560484170914,
"min": -0.11274479329586029,
"max": 0.1803084909915924,
"count": 394
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -8.140579223632812,
"min": -17.926422119140625,
"max": 26.505348205566406,
"count": 394
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.040217842906713486,
"min": -0.10436349362134933,
"max": 0.17117635905742645,
"count": 394
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -7.842479705810547,
"min": -17.932662963867188,
"max": 24.61751937866211,
"count": 394
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 394
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 394
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.0719497439188835,
"min": -0.625,
"max": 0.46092973206494303,
"count": 394
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -14.030200064182281,
"min": -33.70920014381409,
"max": 45.10700011253357,
"count": 394
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.0719497439188835,
"min": -0.625,
"max": 0.46092973206494303,
"count": 394
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -14.030200064182281,
"min": -33.70920014381409,
"max": 45.10700011253357,
"count": 394
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 394
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 394
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.014392319566104561,
"min": 0.010217342836161455,
"max": 0.025237433375635495,
"count": 187
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.014392319566104561,
"min": 0.010217342836161455,
"max": 0.025237433375635495,
"count": 187
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.09865847503145536,
"min": 0.00013014958870674793,
"max": 0.10634844924012819,
"count": 187
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.09865847503145536,
"min": 0.00013014958870674793,
"max": 0.10634844924012819,
"count": 187
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.10076268985867501,
"min": 0.00012500778199561562,
"max": 0.1087349534034729,
"count": 187
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.10076268985867501,
"min": 0.00012500778199561562,
"max": 0.1087349534034729,
"count": 187
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 187
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 187
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 187
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 187
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 187
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 187
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1679247432",
"python_version": "3.9.16 (main, Mar 8 2023, 04:29:24) \n[Clang 14.0.6 ]",
"command_line_arguments": "/Users/alessio/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0",
"numpy_version": "1.21.2",
"end_time_seconds": "1679262837"
},
"total": 15331.936170459,
"count": 1,
"self": 0.1366623760004586,
"children": {
"run_training.setup": {
"total": 0.1844646249999995,
"count": 1,
"self": 0.1844646249999995
},
"TrainerController.start_learning": {
"total": 15331.615043458,
"count": 1,
"self": 3.0446913397772732,
"children": {
"TrainerController._reset_env": {
"total": 2.8925383340009363,
"count": 20,
"self": 2.8925383340009363
},
"TrainerController.advance": {
"total": 15325.58360245022,
"count": 262919,
"self": 3.028552508651046,
"children": {
"env_step": {
"total": 12431.596222326261,
"count": 262919,
"self": 11982.406396551347,
"children": {
"SubprocessEnvManager._take_step": {
"total": 447.1306771715281,
"count": 262919,
"self": 12.720688878481383,
"children": {
"TorchPolicy.evaluate": {
"total": 434.4099882930467,
"count": 503569,
"self": 434.4099882930467
}
}
},
"workers": {
"total": 2.059148603387108,
"count": 262918,
"self": 0.0,
"children": {
"worker_root": {
"total": 15323.905628031922,
"count": 262918,
"is_parallel": true,
"self": 3780.745046928694,
"children": {
"steps_from_proto": {
"total": 0.030383457991041363,
"count": 40,
"is_parallel": true,
"self": 0.0034091219993073185,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.026974335991734044,
"count": 160,
"is_parallel": true,
"self": 0.026974335991734044
}
}
},
"UnityEnvironment.step": {
"total": 11543.130197645236,
"count": 262918,
"is_parallel": true,
"self": 31.898869138076407,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 194.25133372881731,
"count": 262918,
"is_parallel": true,
"self": 194.25133372881731
},
"communicator.exchange": {
"total": 10895.712968361237,
"count": 262918,
"is_parallel": true,
"self": 10895.712968361237
},
"steps_from_proto": {
"total": 421.2670264171064,
"count": 525836,
"is_parallel": true,
"self": 46.50732735628554,
"children": {
"_process_rank_one_or_two_observation": {
"total": 374.7596990608209,
"count": 2103344,
"is_parallel": true,
"self": 374.7596990608209
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 2890.958827615309,
"count": 262918,
"self": 24.60439574676002,
"children": {
"process_trajectory": {
"total": 572.0797707045465,
"count": 262918,
"self": 571.4511638295482,
"children": {
"RLTrainer._checkpoint": {
"total": 0.6286068749982405,
"count": 7,
"self": 0.6286068749982405
}
}
},
"_update_policy": {
"total": 2294.2746611640027,
"count": 187,
"self": 307.0505535550551,
"children": {
"TorchPOCAOptimizer.update": {
"total": 1987.2241076089476,
"count": 5610,
"self": 1987.2241076089476
}
}
}
}
}
}
},
"trainer_threads": {
"total": 5.420006345957518e-07,
"count": 1,
"self": 5.420006345957518e-07
},
"TrainerController._save_models": {
"total": 0.09421079200001259,
"count": 1,
"self": 0.0013693340006284416,
"children": {
"RLTrainer._checkpoint": {
"total": 0.09284145799938415,
"count": 1,
"self": 0.09284145799938415
}
}
}
}
}
}
}