| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.1812715381383896, |
| "min": 0.1697080135345459, |
| "max": 1.6065279245376587, |
| "count": 200 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 1864.9215087890625, |
| "min": 1685.9420166015625, |
| "max": 16450.845703125, |
| "count": 200 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 1999988.0, |
| "min": 9984.0, |
| "max": 1999988.0, |
| "count": 200 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 1999988.0, |
| "min": 9984.0, |
| "max": 1999988.0, |
| "count": 200 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.7763552069664001, |
| "min": -0.08807287365198135, |
| "max": 0.8628113269805908, |
| "count": 200 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 77.6355209350586, |
| "min": -7.045829772949219, |
| "max": 89.73237609863281, |
| "count": 200 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.12793628871440887, |
| "min": 0.1241626963019371, |
| "max": 3.223942279815674, |
| "count": 200 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 12.793628692626953, |
| "min": 11.833174705505371, |
| "max": 256.96441650390625, |
| "count": 200 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.07152327620079396, |
| "min": 0.05934585555951344, |
| "max": 0.08020872884755215, |
| "count": 200 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.14304655240158792, |
| "min": 0.05934585555951344, |
| "max": 0.1604174576951043, |
| "count": 200 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.016820931834262358, |
| "min": 0.0004981905462955183, |
| "max": 1.2856630093107622, |
| "count": 200 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.033641863668524716, |
| "min": 0.0004981905462955183, |
| "max": 1.2856630093107622, |
| "count": 200 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 8.469997176999891e-07, |
| "min": 8.469997176999891e-07, |
| "max": 0.0002987712004096, |
| "count": 200 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 1.6939994353999782e-06, |
| "min": 1.6939994353999782e-06, |
| "max": 0.0005687616104127999, |
| "count": 200 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10028230000000002, |
| "min": 0.10028230000000002, |
| "max": 0.19959039999999997, |
| "count": 200 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 0.20056460000000004, |
| "min": 0.10089415000000002, |
| "max": 0.3895872, |
| "count": 200 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 3.820176999999964e-05, |
| "min": 3.820176999999964e-05, |
| "max": 0.009959080960000002, |
| "count": 200 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 7.640353999999929e-05, |
| "min": 7.640353999999929e-05, |
| "max": 0.01895976128, |
| "count": 200 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.01132755633443594, |
| "min": 0.010952742770314217, |
| "max": 0.7967495918273926, |
| "count": 200 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.02265511266887188, |
| "min": 0.011068697087466717, |
| "max": 0.7967495918273926, |
| "count": 200 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 200 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 200 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 226.30434782608697, |
| "min": 210.06521739130434, |
| "max": 999.0, |
| "count": 196 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 10410.0, |
| "min": 406.0, |
| "max": 15984.0, |
| "count": 196 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.7759361599988126, |
| "min": -1.0000000521540642, |
| "max": 1.7878297776617902, |
| "count": 197 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 83.46899951994419, |
| "min": -16.000000834465027, |
| "max": 88.86559921503067, |
| "count": 197 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.7759361599988126, |
| "min": -1.0000000521540642, |
| "max": 1.7878297776617902, |
| "count": 197 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 83.46899951994419, |
| "min": -16.000000834465027, |
| "max": 88.86559921503067, |
| "count": 197 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.2671700805930936, |
| "min": 0.24556314122552672, |
| "max": 115.93597248196602, |
| "count": 197 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 12.556993787875399, |
| "min": 3.919705420732498, |
| "max": 1854.9755597114563, |
| "count": 197 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1728489636", |
| "python_version": "3.10.12 (main, Sep 11 2024, 15:47:36) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training_4 --no-graphics", |
| "mlagents_version": "1.2.0.dev0", |
| "mlagents_envs_version": "1.2.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.4.1+cu121", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1728495200" |
| }, |
| "total": 5563.281154713, |
| "count": 1, |
| "self": 0.578380326000115, |
| "children": { |
| "run_training.setup": { |
| "total": 0.06315506800001458, |
| "count": 1, |
| "self": 0.06315506800001458 |
| }, |
| "TrainerController.start_learning": { |
| "total": 5562.639619319, |
| "count": 1, |
| "self": 3.658621601048253, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 2.3372126550002577, |
| "count": 1, |
| "self": 2.3372126550002577 |
| }, |
| "TrainerController.advance": { |
| "total": 5556.585015841953, |
| "count": 129381, |
| "self": 3.7074042090926014, |
| "children": { |
| "env_step": { |
| "total": 3966.0238739530296, |
| "count": 129381, |
| "self": 3736.5980412040853, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 227.22686251303276, |
| "count": 129381, |
| "self": 10.69970989295598, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 216.52715262007678, |
| "count": 125067, |
| "self": 216.52715262007678 |
| } |
| } |
| }, |
| "workers": { |
| "total": 2.1989702359114744, |
| "count": 129381, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 5551.047635885227, |
| "count": 129381, |
| "is_parallel": true, |
| "self": 2103.7738006034288, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0028710380001939484, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0008379179998883046, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0020331200003056438, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0020331200003056438 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.08737620700048865, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0008961279991126503, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0005002860007152776, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005002860007152776 |
| }, |
| "communicator.exchange": { |
| "total": 0.08327173799989396, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.08327173799989396 |
| }, |
| "steps_from_proto": { |
| "total": 0.0027080550007667625, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00039993899918044917, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0023081160015863134, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0023081160015863134 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 3447.273835281798, |
| "count": 129380, |
| "is_parallel": true, |
| "self": 81.91633728868419, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 53.13809518709877, |
| "count": 129380, |
| "is_parallel": true, |
| "self": 53.13809518709877 |
| }, |
| "communicator.exchange": { |
| "total": 3082.081615678245, |
| "count": 129380, |
| "is_parallel": true, |
| "self": 3082.081615678245 |
| }, |
| "steps_from_proto": { |
| "total": 230.13778712777003, |
| "count": 129380, |
| "is_parallel": true, |
| "self": 49.45365916853552, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 180.6841279592345, |
| "count": 1035040, |
| "is_parallel": true, |
| "self": 180.6841279592345 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 1586.8537376798304, |
| "count": 129381, |
| "self": 6.444372039120935, |
| "children": { |
| "process_trajectory": { |
| "total": 284.3386811197315, |
| "count": 129381, |
| "self": 284.0804185877314, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.25826253200011706, |
| "count": 4, |
| "self": 0.25826253200011706 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 1296.070684520978, |
| "count": 242, |
| "self": 663.0619838800121, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 633.0087006409658, |
| "count": 46473, |
| "self": 633.0087006409658 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.0690000635804608e-06, |
| "count": 1, |
| "self": 1.0690000635804608e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.058768151999174734, |
| "count": 1, |
| "self": 0.0011314740004308987, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.057636677998743835, |
| "count": 1, |
| "self": 0.057636677998743835 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |