basic-ppo-PyramidsRND / run_logs /timers.json

First push

c3fc964 about 2 years ago

19.1 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.29529279470443726,
	"min": 0.29529279470443726,
	"max": 1.466744065284729,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 8887.1318359375,
	"min": 8887.1318359375,
	"max": 44495.1484375,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989997.0,
	"min": 29977.0,
	"max": 989997.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989997.0,
	"min": 29977.0,
	"max": 989997.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.4516216814517975,
	"min": -0.1709778755903244,
	"max": 0.5972024202346802,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 119.67974853515625,
	"min": -40.69273376464844,
	"max": 167.2166748046875,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.016898194327950478,
	"min": -0.007352360058575869,
	"max": 0.268647700548172,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 4.478021621704102,
	"min": -1.9777848720550537,
	"max": 64.47544860839844,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07017654815198122,
	"min": 0.06635188308497338,
	"max": 0.07264778440141872,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9824716741277371,
	"min": 0.49177602286371613,
	"max": 1.0787795265884295,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.015065880895625532,
	"min": 7.816436311350838e-05,
	"max": 0.016984816687532142,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.21092233253875745,
	"min": 0.001016136720475609,
	"max": 0.23778743362545,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 2.57350974265e-05,
	"min": 2.57350974265e-05,
	"max": 0.0009838354301878855,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.000360291363971,
	"min": 0.000360291363971,
	"max": 0.0116911982308802,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.1025735,
	"min": 0.1025735,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.436029,
	"min": 1.3886848,
	"max": 2.5691197999999997,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00026709265,
	"min": 0.00026709265,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0037392970999999995,
	"min": 0.0037392970999999995,
	"max": 0.11693506802,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.010832207277417183,
	"min": 0.010832207277417183,
	"max": 0.46387335658073425,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.15165090560913086,
	"min": 0.15165090560913086,
	"max": 3.2471134662628174,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 403.46666666666664,
	"min": 323.53333333333336,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30260.0,
	"min": 16776.0,
	"max": 32338.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.3297599745790163,
	"min": -0.9999125520698726,
	"max": 1.6057687299326062,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 99.73199809342623,
	"min": -31.997201666235924,
	"max": 154.1537980735302,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.3297599745790163,
	"min": -0.9999125520698726,
	"max": 1.6057687299326062,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 99.73199809342623,
	"min": -31.997201666235924,
	"max": 154.1537980735302,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.04582851284377587,
	"min": 0.03869405331958357,
	"max": 8.313625031534363,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 3.4371384632831905,
	"min": 3.370638190288446,
	"max": 141.33162553608418,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1675370177",
	"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.29.0.dev0",
	"mlagents_envs_version": "0.29.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.8.1+cu102",
	"numpy_version": "1.21.6",
	"end_time_seconds": "1675372328"
	},
	"total": 2150.2418567649997,
	"count": 1,
	"self": 0.4461873319996812,
	"children": {
	"run_training.setup": {
	"total": 0.11946402600005968,
	"count": 1,
	"self": 0.11946402600005968
	},
	"TrainerController.start_learning": {
	"total": 2149.676205407,
	"count": 1,
	"self": 1.311774699059697,
	"children": {
	"TrainerController._reset_env": {
	"total": 6.333074667000119,
	"count": 1,
	"self": 6.333074667000119
	},
	"TrainerController.advance": {
	"total": 2141.94625741594,
	"count": 63817,
	"self": 1.2845332158763085,
	"children": {
	"env_step": {
	"total": 1472.1067148750255,
	"count": 63817,
	"self": 1363.079992458991,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 108.21339087602178,
	"count": 63817,
	"self": 4.50583641393996,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 103.70755446208182,
	"count": 62569,
	"self": 34.994190919168204,
	"children": {
	"TorchPolicy.sample_actions": {
	"total": 68.71336354291361,
	"count": 62569,
	"self": 68.71336354291361
	}
	}
	}
	}
	},
	"workers": {
	"total": 0.8133315400127685,
	"count": 63817,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2144.9950893770038,
	"count": 63817,
	"is_parallel": true,
	"self": 885.1563557240329,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0019605700001648074,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007492490001368424,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001211321000027965,
	"count": 8,
	"is_parallel": true,
	"self": 0.001211321000027965
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04794792900020184,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004986509998161637,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.000439649000099962,
	"count": 1,
	"is_parallel": true,
	"self": 0.000439649000099962
	},
	"communicator.exchange": {
	"total": 0.045325726000100985,
	"count": 1,
	"is_parallel": true,
	"self": 0.045325726000100985
	},
	"steps_from_proto": {
	"total": 0.0016839030001847277,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004394269999465905,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012444760002381372,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012444760002381372
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1259.8387336529709,
	"count": 63816,
	"is_parallel": true,
	"self": 28.344905088870746,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 24.318936694005515,
	"count": 63816,
	"is_parallel": true,
	"self": 24.318936694005515
	},
	"communicator.exchange": {
	"total": 1100.6825599350593,
	"count": 63816,
	"is_parallel": true,
	"self": 1100.6825599350593
	},
	"steps_from_proto": {
	"total": 106.49233193503528,
	"count": 63816,
	"is_parallel": true,
	"self": 23.69820164102316,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 82.79413029401212,
	"count": 510528,
	"is_parallel": true,
	"self": 82.79413029401212
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 668.5550093250381,
	"count": 63817,
	"self": 2.372657367022839,
	"children": {
	"process_trajectory": {
	"total": 153.53406783401306,
	"count": 63817,
	"self": 153.3383845640128,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.1956832700002451,
	"count": 2,
	"self": 0.1956832700002451
	}
	}
	},
	"_update_policy": {
	"total": 512.6482841240022,
	"count": 453,
	"self": 196.62581849998423,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 316.02246562401797,
	"count": 22812,
	"self": 316.02246562401797
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 9.599998520570807e-07,
	"count": 1,
	"self": 9.599998520570807e-07
	},
	"TrainerController._save_models": {
	"total": 0.08509766499992111,
	"count": 1,
	"self": 0.001420862000031775,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08367680299988933,
	"count": 1,
	"self": 0.08367680299988933
	}
	}
	}
	}
	}
	}
	}