First Push

1d7d992 verified 25 days ago

20.2 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.5232912302017212,
	"min": 1.4524929523468018,
	"max": 3.295693874359131,
	"count": 2726
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 32074.419921875,
	"min": 24522.302734375,
	"max": 105462.203125,
	"count": 2726
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 74.84848484848484,
	"min": 42.902654867256636,
	"max": 999.0,
	"count": 2726
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19760.0,
	"min": 928.0,
	"max": 31000.0,
	"count": 2726
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1665.4253460478635,
	"min": 1199.496323851656,
	"max": 1732.2596207475895,
	"count": 2719
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 219836.145678318,
	"min": 2399.988520266327,
	"max": 354722.7644571557,
	"count": 2719
	},
	"SoccerTwos.Step.mean": {
	"value": 27259922.0,
	"min": 9140.0,
	"max": 27259922.0,
	"count": 2726
	},
	"SoccerTwos.Step.sum": {
	"value": 27259922.0,
	"min": 9140.0,
	"max": 27259922.0,
	"count": 2726
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.003984358161687851,
	"min": -0.13387973606586456,
	"max": 0.23543542623519897,
	"count": 2726
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 0.5259352922439575,
	"min": -21.22277069091797,
	"max": 24.327011108398438,
	"count": 2726
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.0031756118405610323,
	"min": -0.12983833253383636,
	"max": 0.23879003524780273,
	"count": 2726
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 0.4191807508468628,
	"min": -21.19337272644043,
	"max": 24.70865821838379,
	"count": 2726
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 2726
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 2726
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.019033331762660633,
	"min": -0.6666666666666666,
	"max": 0.47401355989908767,
	"count": 2726
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 2.5123997926712036,
	"min": -55.39319986104965,
	"max": 64.57020002603531,
	"count": 2726
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.019033331762660633,
	"min": -0.6666666666666666,
	"max": 0.47401355989908767,
	"count": 2726
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 2.5123997926712036,
	"min": -55.39319986104965,
	"max": 64.57020002603531,
	"count": 2726
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 2726
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 2726
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.01947002433395634,
	"min": 0.009203283006111935,
	"max": 0.0286280690090886,
	"count": 1321
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.01947002433395634,
	"min": 0.009203283006111935,
	"max": 0.0286280690090886,
	"count": 1321
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.08533640603224436,
	"min": 0.0005722908213404783,
	"max": 0.11490969508886337,
	"count": 1321
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.08533640603224436,
	"min": 0.0005722908213404783,
	"max": 0.11490969508886337,
	"count": 1321
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.08664804895718893,
	"min": 0.0005702611568267457,
	"max": 0.11693569918473562,
	"count": 1321
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.08664804895718893,
	"min": 0.0005702611568267457,
	"max": 0.11693569918473562,
	"count": 1321
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 1321
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 1321
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.19999999999999996,
	"max": 0.20000000000000007,
	"count": 1321
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.19999999999999996,
	"max": 0.20000000000000007,
	"count": 1321
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 1321
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 1321
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1743065613",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/home/samrito/anaconda3/envs/drl_hf/bin/mlagents-learn ./SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.6.0+cu124",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1743087033"
	},
	"total": 21419.806948977057,
	"count": 1,
	"self": 0.06077698618173599,
	"children": {
	"run_training.setup": {
	"total": 0.010219641961157322,
	"count": 1,
	"self": 0.010219641961157322
	},
	"TrainerController.start_learning": {
	"total": 21419.735952348914,
	"count": 1,
	"self": 19.17918024607934,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.262196201365441,
	"count": 110,
	"self": 2.262196201365441
	},
	"TrainerController.advance": {
	"total": 21398.188616118394,
	"count": 1865510,
	"self": 20.750042891595513,
	"children": {
	"env_step": {
	"total": 16269.669052127749,
	"count": 1865510,
	"self": 11917.53296902799,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 4339.913956762059,
	"count": 1865510,
	"self": 126.54519875603728,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 4213.368758006021,
	"count": 3422492,
	"self": 4213.368758006021
	}
	}
	},
	"workers": {
	"total": 12.222126337699592,
	"count": 1865510,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 21396.307301682886,
	"count": 1865510,
	"is_parallel": true,
	"self": 11680.562945507467,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0012204230297356844,
	"count": 2,
	"is_parallel": true,
	"self": 0.0002994914539158344,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.00092093157581985,
	"count": 8,
	"is_parallel": true,
	"self": 0.00092093157581985
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.015100114047527313,
	"count": 1,
	"is_parallel": true,
	"self": 0.00042400602251291275,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00021301698870956898,
	"count": 1,
	"is_parallel": true,
	"self": 0.00021301698870956898
	},
	"communicator.exchange": {
	"total": 0.013068980071693659,
	"count": 1,
	"is_parallel": true,
	"self": 0.013068980071693659
	},
	"steps_from_proto": {
	"total": 0.0013941109646111727,
	"count": 2,
	"is_parallel": true,
	"self": 0.00030786730349063873,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001086243661120534,
	"count": 8,
	"is_parallel": true,
	"self": 0.001086243661120534
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 9715.656926060328,
	"count": 1865509,
	"is_parallel": true,
	"self": 522.2820660541765,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 297.37677720864303,
	"count": 1865509,
	"is_parallel": true,
	"self": 297.37677720864303
	},
	"communicator.exchange": {
	"total": 7506.160344524076,
	"count": 1865509,
	"is_parallel": true,
	"self": 7506.160344524076
	},
	"steps_from_proto": {
	"total": 1389.8377382734325,
	"count": 3731018,
	"is_parallel": true,
	"self": 265.6407350411173,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 1124.1970032323152,
	"count": 14924072,
	"is_parallel": true,
	"self": 1124.1970032323152
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.0874301150906831,
	"count": 218,
	"is_parallel": true,
	"self": 0.017242368310689926,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.07018774677999318,
	"count": 872,
	"is_parallel": true,
	"self": 0.07018774677999318
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 5107.76952109905,
	"count": 1865509,
	"self": 148.80738690984435,
	"children": {
	"process_trajectory": {
	"total": 2398.339024409419,
	"count": 1865509,
	"self": 2392.7619246596005,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 5.577099749818444,
	"count": 54,
	"self": 5.577099749818444
	}
	}
	},
	"_update_policy": {
	"total": 2560.6231097797863,
	"count": 1321,
	"self": 1509.3422473517712,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 1051.280862428015,
	"count": 39642,
	"self": 1051.280862428015
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 5.029141902923584e-07,
	"count": 1,
	"self": 5.029141902923584e-07
	},
	"TrainerController._save_models": {
	"total": 0.10595928016118705,
	"count": 1,
	"self": 0.0008077402599155903,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.10515153990127146,
	"count": 1,
	"self": 0.10515153990127146
	}
	}
	}
	}
	}
	}
	}