First Push

f177508 verified over 1 year ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.1812715381383896,
	"min": 0.1697080135345459,
	"max": 1.6065279245376587,
	"count": 200
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 1864.9215087890625,
	"min": 1685.9420166015625,
	"max": 16450.845703125,
	"count": 200
	},
	"Pyramids.Step.mean": {
	"value": 1999988.0,
	"min": 9984.0,
	"max": 1999988.0,
	"count": 200
	},
	"Pyramids.Step.sum": {
	"value": 1999988.0,
	"min": 9984.0,
	"max": 1999988.0,
	"count": 200
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.7763552069664001,
	"min": -0.08807287365198135,
	"max": 0.8628113269805908,
	"count": 200
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 77.6355209350586,
	"min": -7.045829772949219,
	"max": 89.73237609863281,
	"count": 200
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.12793628871440887,
	"min": 0.1241626963019371,
	"max": 3.223942279815674,
	"count": 200
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 12.793628692626953,
	"min": 11.833174705505371,
	"max": 256.96441650390625,
	"count": 200
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07152327620079396,
	"min": 0.05934585555951344,
	"max": 0.08020872884755215,
	"count": 200
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.14304655240158792,
	"min": 0.05934585555951344,
	"max": 0.1604174576951043,
	"count": 200
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.016820931834262358,
	"min": 0.0004981905462955183,
	"max": 1.2856630093107622,
	"count": 200
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.033641863668524716,
	"min": 0.0004981905462955183,
	"max": 1.2856630093107622,
	"count": 200
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 8.469997176999891e-07,
	"min": 8.469997176999891e-07,
	"max": 0.0002987712004096,
	"count": 200
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 1.6939994353999782e-06,
	"min": 1.6939994353999782e-06,
	"max": 0.0005687616104127999,
	"count": 200
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10028230000000002,
	"min": 0.10028230000000002,
	"max": 0.19959039999999997,
	"count": 200
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 0.20056460000000004,
	"min": 0.10089415000000002,
	"max": 0.3895872,
	"count": 200
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 3.820176999999964e-05,
	"min": 3.820176999999964e-05,
	"max": 0.009959080960000002,
	"count": 200
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 7.640353999999929e-05,
	"min": 7.640353999999929e-05,
	"max": 0.01895976128,
	"count": 200
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.01132755633443594,
	"min": 0.010952742770314217,
	"max": 0.7967495918273926,
	"count": 200
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.02265511266887188,
	"min": 0.011068697087466717,
	"max": 0.7967495918273926,
	"count": 200
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 200
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 200
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 226.30434782608697,
	"min": 210.06521739130434,
	"max": 999.0,
	"count": 196
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 10410.0,
	"min": 406.0,
	"max": 15984.0,
	"count": 196
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.7759361599988126,
	"min": -1.0000000521540642,
	"max": 1.7878297776617902,
	"count": 197
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 83.46899951994419,
	"min": -16.000000834465027,
	"max": 88.86559921503067,
	"count": 197
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.7759361599988126,
	"min": -1.0000000521540642,
	"max": 1.7878297776617902,
	"count": 197
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 83.46899951994419,
	"min": -16.000000834465027,
	"max": 88.86559921503067,
	"count": 197
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.2671700805930936,
	"min": 0.24556314122552672,
	"max": 115.93597248196602,
	"count": 197
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 12.556993787875399,
	"min": 3.919705420732498,
	"max": 1854.9755597114563,
	"count": 197
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1728489636",
	"python_version": "3.10.12 (main, Sep 11 2024, 15:47:36) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training_4 --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.4.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1728495200"
	},
	"total": 5563.281154713,
	"count": 1,
	"self": 0.578380326000115,
	"children": {
	"run_training.setup": {
	"total": 0.06315506800001458,
	"count": 1,
	"self": 0.06315506800001458
	},
	"TrainerController.start_learning": {
	"total": 5562.639619319,
	"count": 1,
	"self": 3.658621601048253,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.3372126550002577,
	"count": 1,
	"self": 2.3372126550002577
	},
	"TrainerController.advance": {
	"total": 5556.585015841953,
	"count": 129381,
	"self": 3.7074042090926014,
	"children": {
	"env_step": {
	"total": 3966.0238739530296,
	"count": 129381,
	"self": 3736.5980412040853,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 227.22686251303276,
	"count": 129381,
	"self": 10.69970989295598,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 216.52715262007678,
	"count": 125067,
	"self": 216.52715262007678
	}
	}
	},
	"workers": {
	"total": 2.1989702359114744,
	"count": 129381,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 5551.047635885227,
	"count": 129381,
	"is_parallel": true,
	"self": 2103.7738006034288,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0028710380001939484,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008379179998883046,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0020331200003056438,
	"count": 8,
	"is_parallel": true,
	"self": 0.0020331200003056438
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.08737620700048865,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008961279991126503,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005002860007152776,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005002860007152776
	},
	"communicator.exchange": {
	"total": 0.08327173799989396,
	"count": 1,
	"is_parallel": true,
	"self": 0.08327173799989396
	},
	"steps_from_proto": {
	"total": 0.0027080550007667625,
	"count": 1,
	"is_parallel": true,
	"self": 0.00039993899918044917,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0023081160015863134,
	"count": 8,
	"is_parallel": true,
	"self": 0.0023081160015863134
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 3447.273835281798,
	"count": 129380,
	"is_parallel": true,
	"self": 81.91633728868419,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 53.13809518709877,
	"count": 129380,
	"is_parallel": true,
	"self": 53.13809518709877
	},
	"communicator.exchange": {
	"total": 3082.081615678245,
	"count": 129380,
	"is_parallel": true,
	"self": 3082.081615678245
	},
	"steps_from_proto": {
	"total": 230.13778712777003,
	"count": 129380,
	"is_parallel": true,
	"self": 49.45365916853552,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 180.6841279592345,
	"count": 1035040,
	"is_parallel": true,
	"self": 180.6841279592345
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1586.8537376798304,
	"count": 129381,
	"self": 6.444372039120935,
	"children": {
	"process_trajectory": {
	"total": 284.3386811197315,
	"count": 129381,
	"self": 284.0804185877314,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.25826253200011706,
	"count": 4,
	"self": 0.25826253200011706
	}
	}
	},
	"_update_policy": {
	"total": 1296.070684520978,
	"count": 242,
	"self": 663.0619838800121,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 633.0087006409658,
	"count": 46473,
	"self": 633.0087006409658
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0690000635804608e-06,
	"count": 1,
	"self": 1.0690000635804608e-06
	},
	"TrainerController._save_models": {
	"total": 0.058768151999174734,
	"count": 1,
	"self": 0.0011314740004308987,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.057636677998743835,
	"count": 1,
	"self": 0.057636677998743835
	}
	}
	}
	}
	}
	}
	}