First Push

8eeb81a verified 5 months ago

15.6 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 2.3299667835235596,
	"min": 2.299405336380005,
	"max": 3.295668363571167,
	"count": 332
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 47121.25,
	"min": 15642.83203125,
	"max": 114542.3359375,
	"count": 332
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 50.76288659793814,
	"min": 42.76521739130435,
	"max": 999.0,
	"count": 332
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19696.0,
	"min": 15884.0,
	"max": 27488.0,
	"count": 332
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1478.026642524961,
	"min": 1179.7788040428786,
	"max": 1478.026642524961,
	"count": 325
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 286737.16864984244,
	"min": 2364.1918829443184,
	"max": 321863.026105703,
	"count": 325
	},
	"SoccerTwos.Step.mean": {
	"value": 3319968.0,
	"min": 9760.0,
	"max": 3319968.0,
	"count": 332
	},
	"SoccerTwos.Step.sum": {
	"value": 3319968.0,
	"min": 9760.0,
	"max": 3319968.0,
	"count": 332
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.13224956393241882,
	"min": -0.07247133553028107,
	"max": 0.17099936306476593,
	"count": 332
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 25.656415939331055,
	"min": -13.824865341186523,
	"max": 29.924888610839844,
	"count": 332
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.13362355530261993,
	"min": -0.06882161647081375,
	"max": 0.17515622079372406,
	"count": 332
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 25.922969818115234,
	"min": -13.692461013793945,
	"max": 30.6523380279541,
	"count": 332
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 332
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 332
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.08665361109468125,
	"min": -0.6923076923076923,
	"max": 0.5811499978105227,
	"count": 332
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 16.810800552368164,
	"min": -45.21120023727417,
	"max": 59.629999458789825,
	"count": 332
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.08665361109468125,
	"min": -0.6923076923076923,
	"max": 0.5811499978105227,
	"count": 332
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 16.810800552368164,
	"min": -45.21120023727417,
	"max": 59.629999458789825,
	"count": 332
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 332
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 332
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.01647280962206423,
	"min": 0.010384321962677252,
	"max": 0.025824726539819192,
	"count": 157
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.01647280962206423,
	"min": 0.010384321962677252,
	"max": 0.025824726539819192,
	"count": 157
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.10077739705642065,
	"min": 0.0006277227638444553,
	"max": 0.11096864019831022,
	"count": 157
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.10077739705642065,
	"min": 0.0006277227638444553,
	"max": 0.11096864019831022,
	"count": 157
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.10252556800842286,
	"min": 0.0006187290273373947,
	"max": 0.11352627476056416,
	"count": 157
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.10252556800842286,
	"min": 0.0006187290273373947,
	"max": 0.11352627476056416,
	"count": 157
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 157
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 157
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 157
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 157
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 157
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 157
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1724983919",
	"python_version": "3.10.12 (main, Jul 5 2023, 15:34:07) [Clang 14.0.6 ]",
	"command_line_arguments": "/Users/caio.campos/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.2",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1725010048"
	},
	"total": 26128.401052199,
	"count": 1,
	"self": 0.33014127099886537,
	"children": {
	"run_training.setup": {
	"total": 0.038303445999190444,
	"count": 1,
	"self": 0.038303445999190444
	},
	"TrainerController.start_learning": {
	"total": 26128.032607482,
	"count": 1,
	"self": 4.815222942630498,
	"children": {
	"TrainerController._reset_env": {
	"total": 8.892866306008727,
	"count": 17,
	"self": 8.892866306008727
	},
	"TrainerController.advance": {
	"total": 26114.05709432836,
	"count": 220564,
	"self": 4.818681626267789,
	"children": {
	"env_step": {
	"total": 20777.331596008145,
	"count": 220564,
	"self": 20038.60178467525,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 735.6629285974359,
	"count": 220564,
	"self": 28.332394672645023,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 707.3305339247909,
	"count": 423602,
	"self": 707.3305339247909
	}
	}
	},
	"workers": {
	"total": 3.06688273546024,
	"count": 220563,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 26112.673646069434,
	"count": 220563,
	"is_parallel": true,
	"self": 6650.5135924498245,
	"children": {
	"steps_from_proto": {
	"total": 0.05718903701563249,
	"count": 34,
	"is_parallel": true,
	"self": 0.008453278995148139,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.048735758020484354,
	"count": 136,
	"is_parallel": true,
	"self": 0.048735758020484354
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 19462.102864582594,
	"count": 220563,
	"is_parallel": true,
	"self": 59.292598800391715,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 371.8948498334321,
	"count": 220563,
	"is_parallel": true,
	"self": 371.8948498334321
	},
	"communicator.exchange": {
	"total": 18326.88937894188,
	"count": 220563,
	"is_parallel": true,
	"self": 18326.88937894188
	},
	"steps_from_proto": {
	"total": 704.02603700689,
	"count": 441126,
	"is_parallel": true,
	"self": 94.92409573729674,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 609.1019412695932,
	"count": 1764504,
	"is_parallel": true,
	"self": 609.1019412695932
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 5331.906816693945,
	"count": 220563,
	"self": 39.04413141792611,
	"children": {
	"process_trajectory": {
	"total": 676.097296054013,
	"count": 220563,
	"self": 674.3273022760113,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 1.7699937780016626,
	"count": 6,
	"self": 1.7699937780016626
	}
	}
	},
	"_update_policy": {
	"total": 4616.765389222006,
	"count": 158,
	"self": 473.07072151311513,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 4143.694667708891,
	"count": 4740,
	"self": 4143.694667708891
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.1279989848844707e-06,
	"count": 1,
	"self": 1.1279989848844707e-06
	},
	"TrainerController._save_models": {
	"total": 0.2674227770039579,
	"count": 1,
	"self": 0.0017639980069361627,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2656587789970217,
	"count": 1,
	"self": 0.2656587789970217
	}
	}
	}
	}
	}
	}
	}