|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.4383755624294281, |
|
"min": 0.4383755624294281, |
|
"max": 1.5862054824829102, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 12996.958984375, |
|
"min": 12996.958984375, |
|
"max": 65935.390625, |
|
"count": 67 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 2009877.0, |
|
"min": 29952.0, |
|
"max": 2009877.0, |
|
"count": 67 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 2009877.0, |
|
"min": 29952.0, |
|
"max": 2009877.0, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.8164554834365845, |
|
"min": -0.09642726927995682, |
|
"max": 0.8519212603569031, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 240.0379180908203, |
|
"min": -24.01038932800293, |
|
"max": 261.5398254394531, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 0.010017666034400463, |
|
"min": -0.009136217646300793, |
|
"max": 0.3027942478656769, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 2.9451937675476074, |
|
"min": -2.5215959548950195, |
|
"max": 70.85385131835938, |
|
"count": 67 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.07075320851397394, |
|
"min": 0.06568519165940508, |
|
"max": 0.07565438236626529, |
|
"count": 67 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 0.9905449191956353, |
|
"min": 0.4734425738764306, |
|
"max": 1.050996414263741, |
|
"count": 67 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 0.013001791703104204, |
|
"min": 0.0003456554292742117, |
|
"max": 0.01566592345678793, |
|
"count": 67 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 0.18202508384345886, |
|
"min": 0.0027652434341936937, |
|
"max": 0.21932292839503098, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 0.00010061087360592142, |
|
"min": 0.00010061087360592142, |
|
"max": 0.00029836160054613336, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 0.0014085522304828999, |
|
"min": 0.0014085522304828999, |
|
"max": 0.003464173045275733, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.13353693571428574, |
|
"min": 0.13353693571428574, |
|
"max": 0.1994538666666667, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.8695171000000004, |
|
"min": 1.3827968, |
|
"max": 2.5547242666666667, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 0.0033603398778571437, |
|
"min": 0.0033603398778571437, |
|
"max": 0.00994544128, |
|
"count": 67 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.04704475829000001, |
|
"min": 0.04704475829000001, |
|
"max": 0.11549695423999998, |
|
"count": 67 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.00899757631123066, |
|
"min": 0.00899757631123066, |
|
"max": 0.3189292848110199, |
|
"count": 67 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.12596607208251953, |
|
"min": 0.12251792103052139, |
|
"max": 2.2325050830841064, |
|
"count": 67 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 67 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 67 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 230.68376068376068, |
|
"min": 220.4724409448819, |
|
"max": 997.1625, |
|
"count": 64 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 26990.0, |
|
"min": 926.0, |
|
"max": 79773.0, |
|
"count": 64 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.735117936427267, |
|
"min": -0.9731500518508256, |
|
"max": 1.779565872956616, |
|
"count": 64 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 203.00879856199026, |
|
"min": -77.85200414806604, |
|
"max": 248.7059983983636, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.735117936427267, |
|
"min": -0.9731500518508256, |
|
"max": 1.779565872956616, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 203.00879856199026, |
|
"min": -77.85200414806604, |
|
"max": 248.7059983983636, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.021515196687780704, |
|
"min": 0.021181808893123006, |
|
"max": 3.3438625559210777, |
|
"count": 64 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 2.517278012470342, |
|
"min": 2.517278012470342, |
|
"max": 156.16331193596125, |
|
"count": 64 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1674138899", |
|
"python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --num-envs=10 --run-id=Pyramids Training --no-graphics --force", |
|
"mlagents_version": "0.29.0.dev0", |
|
"mlagents_envs_version": "0.29.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.6", |
|
"end_time_seconds": "1674142245" |
|
}, |
|
"total": 3346.5197448459994, |
|
"count": 1, |
|
"self": 1.5104933649990926, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.22388053600002422, |
|
"count": 1, |
|
"self": 0.22388053600002422 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 3344.785370945, |
|
"count": 1, |
|
"self": 2.191321581034117, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 11.036381419999998, |
|
"count": 1, |
|
"self": 11.036381419999998 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 3330.519638434966, |
|
"count": 23321, |
|
"self": 2.14965534799785, |
|
"children": { |
|
"env_step": { |
|
"total": 1781.5993759870178, |
|
"count": 23321, |
|
"self": 963.0564049740243, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 814.5518747129988, |
|
"count": 130766, |
|
"self": 29.430823052086566, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 785.1210516609123, |
|
"count": 126498, |
|
"self": 224.14092069291928, |
|
"children": { |
|
"TorchPolicy.sample_actions": { |
|
"total": 560.980130967993, |
|
"count": 126498, |
|
"self": 560.980130967993 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 3.9910962999946378, |
|
"count": 23321, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 33402.44909967305, |
|
"count": 130759, |
|
"is_parallel": true, |
|
"self": 25763.64540756009, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.046783416000039324, |
|
"count": 10, |
|
"is_parallel": true, |
|
"self": 0.008720006000885405, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.03806340999915392, |
|
"count": 80, |
|
"is_parallel": true, |
|
"self": 0.03806340999915392 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 2.3285360760000913, |
|
"count": 10, |
|
"is_parallel": true, |
|
"self": 0.004722976000380186, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0036794169999438964, |
|
"count": 10, |
|
"is_parallel": true, |
|
"self": 0.0036794169999438964 |
|
}, |
|
"communicator.exchange": { |
|
"total": 2.297539016999849, |
|
"count": 10, |
|
"is_parallel": true, |
|
"self": 2.297539016999849 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.022594665999918107, |
|
"count": 10, |
|
"is_parallel": true, |
|
"self": 0.010956463999946209, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.011638201999971898, |
|
"count": 80, |
|
"is_parallel": true, |
|
"self": 0.011638201999971898 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 7638.803692112964, |
|
"count": 130749, |
|
"is_parallel": true, |
|
"self": 72.15934311896217, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 45.65303698401249, |
|
"count": 130749, |
|
"is_parallel": true, |
|
"self": 45.65303698401249 |
|
}, |
|
"communicator.exchange": { |
|
"total": 7282.672770433042, |
|
"count": 130749, |
|
"is_parallel": true, |
|
"self": 7282.672770433042 |
|
}, |
|
"steps_from_proto": { |
|
"total": 238.3185415769467, |
|
"count": 130749, |
|
"is_parallel": true, |
|
"self": 65.68012743502061, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 172.6384141419261, |
|
"count": 1045992, |
|
"is_parallel": true, |
|
"self": 172.6384141419261 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 1546.7706070999502, |
|
"count": 23320, |
|
"self": 4.446033568937764, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 463.3108352430115, |
|
"count": 23320, |
|
"self": 462.8958884420117, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.4149468009998145, |
|
"count": 4, |
|
"self": 0.4149468009998145 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 1079.013738288001, |
|
"count": 869, |
|
"self": 400.01942840705453, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 678.9943098809464, |
|
"count": 46083, |
|
"self": 678.9943098809464 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.7120000848080963e-06, |
|
"count": 1, |
|
"self": 1.7120000848080963e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 1.0380277969998133, |
|
"count": 1, |
|
"self": 0.003971679999267508, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 1.0340561170005458, |
|
"count": 1, |
|
"self": 1.0340561170005458 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |