Second Push

d026e96 verified 2 months ago

15.6 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.9366713762283325,
	"min": 1.921223759651184,
	"max": 2.7980246543884277,
	"count": 303
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 41150.39453125,
	"min": 37370.90625,
	"max": 70047.9765625,
	"count": 303
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 50.63157894736842,
	"min": 44.56363636363636,
	"max": 113.30232558139535,
	"count": 303
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19240.0,
	"min": 12676.0,
	"max": 20980.0,
	"count": 303
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1539.5732252586963,
	"min": 1314.574975317422,
	"max": 1546.7909758691726,
	"count": 303
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 292518.9127991523,
	"min": 105256.0186730712,
	"max": 330571.684406115,
	"count": 303
	},
	"SoccerTwos.Step.mean": {
	"value": 4999926.0,
	"min": 1979962.0,
	"max": 4999926.0,
	"count": 303
	},
	"SoccerTwos.Step.sum": {
	"value": 4999926.0,
	"min": 1979962.0,
	"max": 4999926.0,
	"count": 303
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.014108068309724331,
	"min": -0.12224282324314117,
	"max": 0.1356886327266693,
	"count": 303
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 2.680532932281494,
	"min": -22.737165451049805,
	"max": 22.769405364990234,
	"count": 303
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.012007688172161579,
	"min": -0.12296264618635178,
	"max": 0.15052008628845215,
	"count": 303
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 2.281460762023926,
	"min": -22.871051788330078,
	"max": 23.143291473388672,
	"count": 303
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 303
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 303
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.02655789287466752,
	"min": -0.3654246926307678,
	"max": 0.33317027059761256,
	"count": 303
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 5.045999646186829,
	"min": -61.52800005674362,
	"max": 49.309200048446655,
	"count": 303
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.02655789287466752,
	"min": -0.3654246926307678,
	"max": 0.33317027059761256,
	"count": 303
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 5.045999646186829,
	"min": -61.52800005674362,
	"max": 49.309200048446655,
	"count": 303
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 303
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 303
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.01171204614705251,
	"min": 0.011686608046875335,
	"max": 0.02374286432750523,
	"count": 147
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.01171204614705251,
	"min": 0.011686608046875335,
	"max": 0.02374286432750523,
	"count": 147
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.10385078514615695,
	"min": 0.06091271998981635,
	"max": 0.11298494984706244,
	"count": 147
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.10385078514615695,
	"min": 0.06091271998981635,
	"max": 0.11298494984706244,
	"count": 147
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.10561498229702314,
	"min": 0.06363024786114693,
	"max": 0.11561396370331446,
	"count": 147
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.10561498229702314,
	"min": 0.06363024786114693,
	"max": 0.11561396370331446,
	"count": 147
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 147
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 147
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 147
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 147
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 147
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 147
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1739662040",
	"python_version": "3.10.12 (main, Jul 5 2023, 15:34:07) [Clang 14.0.6 ]",
	"command_line_arguments": "/Users/asafsmac/miniconda3/envs/rl/bin/mlagents-learn config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics --resume",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.2",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1739708635"
	},
	"total": 46596.602719252,
	"count": 1,
	"self": 0.8277513469802216,
	"children": {
	"run_training.setup": {
	"total": 0.0526851590257138,
	"count": 1,
	"self": 0.0526851590257138
	},
	"TrainerController.start_learning": {
	"total": 46595.72228274599,
	"count": 1,
	"self": 12.153964645927772,
	"children": {
	"TrainerController._reset_env": {
	"total": 8.442461882834323,
	"count": 20,
	"self": 8.442461882834323
	},
	"TrainerController.advance": {
	"total": 46574.71806539234,
	"count": 209434,
	"self": 14.309848440927453,
	"children": {
	"env_step": {
	"total": 35972.25376434636,
	"count": 209434,
	"self": 34347.69145393954,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1617.3485647756606,
	"count": 209434,
	"self": 86.76540581020527,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1530.5831589654554,
	"count": 380058,
	"self": 1530.5831589654554
	}
	}
	},
	"workers": {
	"total": 7.213745631161146,
	"count": 209434,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 46568.56154363707,
	"count": 209434,
	"is_parallel": true,
	"self": 13358.061990369693,
	"children": {
	"steps_from_proto": {
	"total": 0.11668114690110087,
	"count": 40,
	"is_parallel": true,
	"self": 0.020781399682164192,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.09589974721893668,
	"count": 160,
	"is_parallel": true,
	"self": 0.09589974721893668
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 33210.38287212048,
	"count": 209434,
	"is_parallel": true,
	"self": 155.9417895032093,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 672.769520398113,
	"count": 209434,
	"is_parallel": true,
	"self": 672.769520398113
	},
	"communicator.exchange": {
	"total": 31152.906478734687,
	"count": 209434,
	"is_parallel": true,
	"self": 31152.906478734687
	},
	"steps_from_proto": {
	"total": 1228.765083484468,
	"count": 418868,
	"is_parallel": true,
	"self": 219.4591452423483,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 1009.3059382421197,
	"count": 1675472,
	"is_parallel": true,
	"self": 1009.3059382421197
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 10588.154452605057,
	"count": 209434,
	"self": 78.7347104542423,
	"children": {
	"process_trajectory": {
	"total": 1864.6498735909117,
	"count": 209434,
	"self": 1861.6086807028623,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 3.041192888049409,
	"count": 7,
	"self": 3.041192888049409
	}
	}
	},
	"_update_policy": {
	"total": 8644.769868559903,
	"count": 147,
	"self": 719.2591106550535,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 7925.510757904849,
	"count": 4410,
	"self": 7925.510757904849
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 2.058921381831169e-06,
	"count": 1,
	"self": 2.058921381831169e-06
	},
	"TrainerController._save_models": {
	"total": 0.4077887659659609,
	"count": 1,
	"self": 0.0035792149137705564,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.40420955105219036,
	"count": 1,
	"self": 0.40420955105219036
	}
	}
	}
	}
	}
	}
	}