Upload 8 files

a17813c verified 7 months ago

19.6 kB

	{
	"name": "root",
	"gauges": {
	"Agent.Policy.Entropy.mean": {
	"value": 3.9790024757385254,
	"min": 3.9426229000091553,
	"max": 4.384097576141357,
	"count": 100
	},
	"Agent.Policy.Entropy.sum": {
	"value": 19588.62890625,
	"min": 3697.3173828125,
	"max": 31503.28515625,
	"count": 100
	},
	"Agent.WildfireResourceManagement.IndividualResourceCount.mean": {
	"value": 0.8833332272867361,
	"min": 0.5555555903249316,
	"max": 0.8999998913043075,
	"count": 100
	},
	"Agent.WildfireResourceManagement.IndividualResourceCount.sum": {
	"value": 15.899998091161251,
	"min": 7.000000223517418,
	"max": 31.999995470046997,
	"count": 100
	},
	"Agent.WildfireResourceManagement.RewardforMovingResourcestoNeighbours.mean": {
	"value": 80.60973479681545,
	"min": 0.10768404721360032,
	"max": 248.34259457058377,
	"count": 100
	},
	"Agent.WildfireResourceManagement.RewardforMovingResourcestoNeighbours.sum": {
	"value": 1450.975226342678,
	"min": 0.969156424922403,
	"max": 2945.7017974853516,
	"count": 100
	},
	"Agent.WildfireResourceManagement.RewardforMovingResourcestoSelf.mean": {
	"value": 0.3801335415078534,
	"min": 0.01641160911983914,
	"max": 9.644429033001265,
	"count": 100
	},
	"Agent.WildfireResourceManagement.RewardforMovingResourcestoSelf.sum": {
	"value": 6.842403747141361,
	"min": 0.14770448207855225,
	"max": 219.80404091626406,
	"count": 100
	},
	"Agent.WildfireResourceManagement.CollectivePerformance.mean": {
	"value": 67.59286774529352,
	"min": 0.2759494384129842,
	"max": 155.0876719156901,
	"count": 100
	},
	"Agent.WildfireResourceManagement.CollectivePerformance.sum": {
	"value": 1216.6716194152832,
	"min": 2.483544945716858,
	"max": 2201.0021057128906,
	"count": 100
	},
	"Agent.WildfireResourceManagement.IndividualPerformance.mean": {
	"value": 34.56691179010603,
	"min": 0.0947068203240633,
	"max": 77.07207973798116,
	"count": 100
	},
	"Agent.WildfireResourceManagement.IndividualPerformance.sum": {
	"value": 622.2044122219086,
	"min": 0.8523613829165697,
	"max": 1007.8357060849667,
	"count": 100
	},
	"Agent.Environment.LessonNumber.difficulty.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 100
	},
	"Agent.Environment.LessonNumber.difficulty.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 100
	},
	"Agent.Environment.LessonNumber.task.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 100
	},
	"Agent.Environment.LessonNumber.task.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 100
	},
	"Agent.Environment.EpisodeLength.mean": {
	"value": 273.0,
	"min": 16.0,
	"max": 455.0,
	"count": 100
	},
	"Agent.Environment.EpisodeLength.sum": {
	"value": 4914.0,
	"min": 144.0,
	"max": 7695.0,
	"count": 100
	},
	"Agent.Step.mean": {
	"value": 449877.0,
	"min": 4381.0,
	"max": 449877.0,
	"count": 100
	},
	"Agent.Step.sum": {
	"value": 449877.0,
	"min": 4381.0,
	"max": 449877.0,
	"count": 100
	},
	"Agent.Policy.CuriosityValueEstimate.mean": {
	"value": 0.006750881671905518,
	"min": -0.012739883735775948,
	"max": 0.11897391825914383,
	"count": 100
	},
	"Agent.Policy.CuriosityValueEstimate.sum": {
	"value": 0.10801410675048828,
	"min": -0.20383813977241516,
	"max": 3.0933218002319336,
	"count": 100
	},
	"Agent.Policy.ExtrinsicValueEstimate.mean": {
	"value": 35.70020294189453,
	"min": 1.470633864402771,
	"max": 50.8341064453125,
	"count": 100
	},
	"Agent.Policy.ExtrinsicValueEstimate.sum": {
	"value": 571.2032470703125,
	"min": 38.236480712890625,
	"max": 1677.5255126953125,
	"count": 100
	},
	"Agent.Environment.CumulativeReward.mean": {
	"value": 131.3084635734558,
	"min": 37.73844643739554,
	"max": 282.3111138343811,
	"count": 100
	},
	"Agent.Environment.CumulativeReward.sum": {
	"value": 2100.935417175293,
	"min": 1036.8795852661133,
	"max": 4516.977821350098,
	"count": 100
	},
	"Agent.Policy.CuriosityReward.mean": {
	"value": 0.020240316458512098,
	"min": 0.011927072860060199,
	"max": 0.22122024615796712,
	"count": 100
	},
	"Agent.Policy.CuriosityReward.sum": {
	"value": 0.32384506333619356,
	"min": 0.256887782830745,
	"max": 5.751726400107145,
	"count": 100
	},
	"Agent.Policy.ExtrinsicReward.mean": {
	"value": 131.3084635734558,
	"min": 37.73844643739554,
	"max": 282.3111138343811,
	"count": 100
	},
	"Agent.Policy.ExtrinsicReward.sum": {
	"value": 2100.935417175293,
	"min": 1036.8795852661133,
	"max": 4516.977821350098,
	"count": 100
	},
	"Agent.Losses.PolicyLoss.mean": {
	"value": 0.06362482790065016,
	"min": 0.056942009002618164,
	"max": 0.08438466520563356,
	"count": 99
	},
	"Agent.Losses.PolicyLoss.sum": {
	"value": 0.12724965580130032,
	"min": 0.056942009002618164,
	"max": 0.16876933041126713,
	"count": 99
	},
	"Agent.Losses.ValueLoss.mean": {
	"value": 63.23698472603792,
	"min": 5.822606236139933,
	"max": 156.46512782007738,
	"count": 99
	},
	"Agent.Losses.ValueLoss.sum": {
	"value": 126.47396945207583,
	"min": 5.822606236139933,
	"max": 312.93025564015477,
	"count": 99
	},
	"Agent.Policy.LearningRate.mean": {
	"value": 1.8030993989999881e-06,
	"min": 1.8030993989999881e-06,
	"max": 0.00029819400060199984,
	"count": 99
	},
	"Agent.Policy.LearningRate.sum": {
	"value": 3.6061987979999762e-06,
	"min": 3.6061987979999762e-06,
	"max": 0.0005861940046020002,
	"count": 99
	},
	"Agent.Policy.Epsilon.mean": {
	"value": 0.10060100000000004,
	"min": 0.10060100000000004,
	"max": 0.19939800000000005,
	"count": 99
	},
	"Agent.Policy.Epsilon.sum": {
	"value": 0.20120200000000008,
	"min": 0.10181000000000004,
	"max": 0.3953980000000001,
	"count": 99
	},
	"Agent.Policy.Beta.mean": {
	"value": 7.003989999999961e-05,
	"min": 7.003989999999961e-05,
	"max": 0.009939860200000004,
	"count": 99
	},
	"Agent.Policy.Beta.sum": {
	"value": 0.00014007979999999923,
	"min": 0.00014007979999999923,
	"max": 0.019540260200000006,
	"count": 99
	},
	"Agent.Losses.CuriosityForwardLoss.mean": {
	"value": 0.0028334709095681233,
	"min": 0.002552407628103493,
	"max": 0.38484019738814185,
	"count": 99
	},
	"Agent.Losses.CuriosityForwardLoss.sum": {
	"value": 0.005666941819136247,
	"min": 0.002716009190086933,
	"max": 0.38484019738814185,
	"count": 99
	},
	"Agent.Losses.CuriosityInverseLoss.mean": {
	"value": 3.954002788223013,
	"min": 3.93007966429715,
	"max": 4.389180887313116,
	"count": 99
	},
	"Agent.Losses.CuriosityInverseLoss.sum": {
	"value": 7.908005576446026,
	"min": 3.9468957362351595,
	"max": 8.731818569084954,
	"count": 99
	},
	"Agent.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	},
	"Agent.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1716654493",
	"python_version": "3.9.18 (main, Sep 11 2023, 14:09:26) [MSC v.1916 64 bit (AMD64)]",
	"command_line_arguments": "C:\\Users\\pdsie\\anaconda3\\envs\\mlagents20\\Scripts\\mlagents-learn c:/users/pdsie/documents/hivex/src/hivex/training/baseline/ml_agents/configs/mlagents/tmp/train/WildfireResourceManagement_difficulty_5_task_0_run_id_0_train.yaml --run-id=WildfireResourceManagement/train/WildfireResourceManagement_difficulty_5_task_0_run_id_0_train --base-port 5006",
	"mlagents_version": "0.30.0",
	"mlagents_envs_version": "0.30.0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.7.1+cu110",
	"numpy_version": "1.21.0",
	"end_time_seconds": "1716656322"
	},
	"total": 1829.2482914,
	"count": 1,
	"self": 0.19380449999994198,
	"children": {
	"run_training.setup": {
	"total": 0.06638769999999994,
	"count": 1,
	"self": 0.06638769999999994
	},
	"TrainerController.start_learning": {
	"total": 1828.9880992,
	"count": 1,
	"self": 1.1153832999816586,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.1201426,
	"count": 1,
	"self": 2.1201426
	},
	"TrainerController.advance": {
	"total": 1825.6590711000185,
	"count": 50091,
	"self": 1.064749900024708,
	"children": {
	"env_step": {
	"total": 1824.5943211999938,
	"count": 50091,
	"self": 1548.5461036000024,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 275.5569933000056,
	"count": 50091,
	"self": 1.7498843000246325,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 273.807108999981,
	"count": 50091,
	"self": 273.807108999981
	}
	}
	},
	"workers": {
	"total": 0.4912242999856691,
	"count": 50091,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 1826.4210882000307,
	"count": 50091,
	"is_parallel": true,
	"self": 336.4644268000425,
	"children": {
	"steps_from_proto": {
	"total": 0.00036009999999997433,
	"count": 1,
	"is_parallel": true,
	"self": 0.00016790000000010963,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0001921999999998647,
	"count": 2,
	"is_parallel": true,
	"self": 0.0001921999999998647
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1489.9563012999881,
	"count": 50091,
	"is_parallel": true,
	"self": 3.4311641999943276,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 4.08801820000469,
	"count": 50091,
	"is_parallel": true,
	"self": 4.08801820000469
	},
	"communicator.exchange": {
	"total": 1472.8431573999874,
	"count": 50091,
	"is_parallel": true,
	"self": 1472.8431573999874
	},
	"steps_from_proto": {
	"total": 9.593961500001807,
	"count": 50091,
	"is_parallel": true,
	"self": 4.881630800029496,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 4.712330699972311,
	"count": 100182,
	"is_parallel": true,
	"self": 4.712330699972311
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 2.1599999854515772e-05,
	"count": 1,
	"self": 2.1599999854515772e-05,
	"children": {
	"thread_root": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"trainer_advance": {
	"total": 1825.5939962999946,
	"count": 92098,
	"is_parallel": true,
	"self": 3.1223809999869445,
	"children": {
	"process_trajectory": {
	"total": 1460.9177770000076,
	"count": 92098,
	"is_parallel": true,
	"self": 1460.9177770000076
	},
	"_update_policy": {
	"total": 361.55383830000005,
	"count": 143,
	"is_parallel": true,
	"self": 177.03219429999865,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 184.5216440000014,
	"count": 10296,
	"is_parallel": true,
	"self": 184.5216440000014
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"TrainerController._save_models": {
	"total": 0.09348060000002079,
	"count": 1,
	"self": 0.005317500000046493,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08816309999997429,
	"count": 1,
	"self": 0.08816309999997429
	}
	}
	}
	}
	}
	}
	}