Initial Commit

a6f0ed7 about 2 years ago

20.1 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 3.18869686126709,
	"min": 3.1670570373535156,
	"max": 3.2957441806793213,
	"count": 117
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 38570.4765625,
	"min": 12105.599609375,
	"max": 152054.90625,
	"count": 117
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 695.3333333333334,
	"min": 433.4166666666667,
	"max": 999.0,
	"count": 117
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 16688.0,
	"min": 4452.0,
	"max": 28136.0,
	"count": 117
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1193.2650606209672,
	"min": 1190.7322727579492,
	"max": 1201.5572309876034,
	"count": 108
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 9546.120484967738,
	"min": 2381.635987580858,
	"max": 16755.748691303368,
	"count": 108
	},
	"SoccerTwos.Step.mean": {
	"value": 1169334.0,
	"min": 9084.0,
	"max": 1169334.0,
	"count": 117
	},
	"SoccerTwos.Step.sum": {
	"value": 1169334.0,
	"min": 9084.0,
	"max": 1169334.0,
	"count": 117
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.027071211487054825,
	"min": -0.06372575461864471,
	"max": 0.027482615783810616,
	"count": 117
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 0.3519257605075836,
	"min": -0.8284347653388977,
	"max": 0.3535115420818329,
	"count": 117
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.026384852826595306,
	"min": -0.06369052082300186,
	"max": 0.028071589767932892,
	"count": 117
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 0.3430030941963196,
	"min": -0.827970564365387,
	"max": 0.364930659532547,
	"count": 117
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 117
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 117
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.14698461844370916,
	"min": -0.5714285714285714,
	"max": 0.27497142979076933,
	"count": 117
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -1.910800039768219,
	"min": -8.0,
	"max": 3.8496000170707703,
	"count": 117
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.14698461844370916,
	"min": -0.5714285714285714,
	"max": 0.27497142979076933,
	"count": 117
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -1.910800039768219,
	"min": -8.0,
	"max": 3.8496000170707703,
	"count": 117
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 117
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 117
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.015360206284094602,
	"min": 0.012117091874824838,
	"max": 0.024097679225572696,
	"count": 54
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.015360206284094602,
	"min": 0.012117091874824838,
	"max": 0.024097679225572696,
	"count": 54
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.0034538612274142605,
	"min": 0.00034969555053976364,
	"max": 0.005978238047100603,
	"count": 54
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.0034538612274142605,
	"min": 0.00034969555053976364,
	"max": 0.005978238047100603,
	"count": 54
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.003469962584010015,
	"min": 0.0003521892847250759,
	"max": 0.006564258489136895,
	"count": 54
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.003469962584010015,
	"min": 0.0003521892847250759,
	"max": 0.006564258489136895,
	"count": 54
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 54
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 54
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.2,
	"max": 0.20000000000000007,
	"count": 54
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.2,
	"max": 0.20000000000000007,
	"count": 54
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 54
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 54
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1679736271",
	"python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/linux/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1679738620"
	},
	"total": 2348.638205398,
	"count": 1,
	"self": 0.04307650400005514,
	"children": {
	"run_training.setup": {
	"total": 0.11162882000002128,
	"count": 1,
	"self": 0.11162882000002128
	},
	"TrainerController.start_learning": {
	"total": 2348.483500074,
	"count": 1,
	"self": 1.5388987449687193,
	"children": {
	"TrainerController._reset_env": {
	"total": 9.502020643000037,
	"count": 6,
	"self": 9.502020643000037
	},
	"TrainerController.advance": {
	"total": 2337.0845989350314,
	"count": 76629,
	"self": 1.8646640759989168,
	"children": {
	"env_step": {
	"total": 1861.4849851179915,
	"count": 76629,
	"self": 1458.597810473985,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 401.9372201870403,
	"count": 76629,
	"self": 12.484379305042978,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 389.4528408819973,
	"count": 152102,
	"self": 389.4528408819973
	}
	}
	},
	"workers": {
	"total": 0.9499544569662248,
	"count": 76628,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2343.819020711023,
	"count": 76628,
	"is_parallel": true,
	"self": 1112.460945891066,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0057090290000019195,
	"count": 2,
	"is_parallel": true,
	"self": 0.0035821259999124777,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0021269030000894418,
	"count": 8,
	"is_parallel": true,
	"self": 0.0021269030000894418
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.07212128599996959,
	"count": 1,
	"is_parallel": true,
	"self": 0.0010296769999627031,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0008685379999633369,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008685379999633369
	},
	"communicator.exchange": {
	"total": 0.06713946100001067,
	"count": 1,
	"is_parallel": true,
	"self": 0.06713946100001067
	},
	"steps_from_proto": {
	"total": 0.003083610000032877,
	"count": 2,
	"is_parallel": true,
	"self": 0.0005916340001022036,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0024919759999306734,
	"count": 8,
	"is_parallel": true,
	"self": 0.0024919759999306734
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1231.3458499279573,
	"count": 76627,
	"is_parallel": true,
	"self": 73.28550675604083,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 51.22505309598006,
	"count": 76627,
	"is_parallel": true,
	"self": 51.22505309598006
	},
	"communicator.exchange": {
	"total": 881.2321504529953,
	"count": 76627,
	"is_parallel": true,
	"self": 881.2321504529953
	},
	"steps_from_proto": {
	"total": 225.60313962294117,
	"count": 153254,
	"is_parallel": true,
	"self": 41.6531555650144,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 183.94998405792677,
	"count": 613016,
	"is_parallel": true,
	"self": 183.94998405792677
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.012224891999494503,
	"count": 10,
	"is_parallel": true,
	"self": 0.0024052009999877555,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.009819690999506747,
	"count": 40,
	"is_parallel": true,
	"self": 0.009819690999506747
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 473.73494974104085,
	"count": 76628,
	"self": 15.233939597034862,
	"children": {
	"process_trajectory": {
	"total": 120.74160695800657,
	"count": 76628,
	"self": 120.02034359700639,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.7212633610001831,
	"count": 2,
	"self": 0.7212633610001831
	}
	}
	},
	"_update_policy": {
	"total": 337.7594031859994,
	"count": 54,
	"self": 210.69964387899927,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 127.05975930700015,
	"count": 1632,
	"self": 127.05975930700015
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.3730000318901148e-06,
	"count": 1,
	"self": 1.3730000318901148e-06
	},
	"TrainerController._save_models": {
	"total": 0.3579803779998656,
	"count": 1,
	"self": 0.0023122190000322007,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.3556681589998334,
	"count": 1,
	"self": 0.3556681589998334
	}
	}
	}
	}
	}
	}
	}