{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.7540055513381958,
"min": 1.7540055513381958,
"max": 2.859694480895996,
"count": 287
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 34350.4453125,
"min": 25404.435546875,
"max": 68697.859375,
"count": 287
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 59.951219512195124,
"min": 45.43119266055046,
"max": 134.75675675675674,
"count": 287
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19664.0,
"min": 6264.0,
"max": 22528.0,
"count": 287
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1547.7343081913593,
"min": 1280.498417173598,
"max": 1573.583713813668,
"count": 287
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 253828.42654338293,
"min": 57443.42553063212,
"max": 334909.4936858504,
"count": 287
},
"SoccerTwos.Step.mean": {
"value": 4999964.0,
"min": 2139961.0,
"max": 4999964.0,
"count": 287
},
"SoccerTwos.Step.sum": {
"value": 4999964.0,
"min": 2139961.0,
"max": 4999964.0,
"count": 287
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.05619893968105316,
"min": -0.09217312932014465,
"max": 0.2106694132089615,
"count": 287
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 9.216626167297363,
"min": -14.655527114868164,
"max": 26.543701171875,
"count": 287
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.05358322709798813,
"min": -0.09259972721338272,
"max": 0.20666013658046722,
"count": 287
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 8.787649154663086,
"min": -14.723356246948242,
"max": 27.162918090820312,
"count": 287
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 287
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 287
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.029275610316090467,
"min": -0.3304608697476594,
"max": 0.3157929830383836,
"count": 287
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 4.801200091838837,
"min": -40.803199887275696,
"max": 54.64700049161911,
"count": 287
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.029275610316090467,
"min": -0.3304608697476594,
"max": 0.3157929830383836,
"count": 287
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 4.801200091838837,
"min": -40.803199887275696,
"max": 54.64700049161911,
"count": 287
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 287
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 287
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.017620729313542447,
"min": 0.011048298924288246,
"max": 0.02409756457200274,
"count": 138
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.017620729313542447,
"min": 0.011048298924288246,
"max": 0.02409756457200274,
"count": 138
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.1136249082783858,
"min": 0.04968581423163414,
"max": 0.1136249082783858,
"count": 138
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.1136249082783858,
"min": 0.04968581423163414,
"max": 0.1136249082783858,
"count": 138
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.11541301185886065,
"min": 0.050460034608840944,
"max": 0.11541301185886065,
"count": 138
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.11541301185886065,
"min": 0.050460034608840944,
"max": 0.11541301185886065,
"count": 138
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 138
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 138
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 138
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 138
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 138
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 138
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1688065979",
"python_version": "3.9.16 (main, May 15 2023, 23:46:34) \n[GCC 11.2.0]",
"command_line_arguments": "/root/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1688072947"
},
"total": 6967.477507870994,
"count": 1,
"self": 0.4749574410961941,
"children": {
"run_training.setup": {
"total": 0.018960394896566868,
"count": 1,
"self": 0.018960394896566868
},
"TrainerController.start_learning": {
"total": 6966.983590035001,
"count": 1,
"self": 7.383688202360645,
"children": {
"TrainerController._reset_env": {
"total": 8.599591638776474,
"count": 16,
"self": 8.599591638776474
},
"TrainerController.advance": {
"total": 6950.742673392873,
"count": 197041,
"self": 7.936746210791171,
"children": {
"env_step": {
"total": 5466.461122430745,
"count": 197041,
"self": 4434.788273636135,
"children": {
"SubprocessEnvManager._take_step": {
"total": 1027.343017456471,
"count": 197041,
"self": 40.67520230030641,
"children": {
"TorchPolicy.evaluate": {
"total": 986.6678151561646,
"count": 359170,
"self": 986.6678151561646
}
}
},
"workers": {
"total": 4.3298313381383196,
"count": 197041,
"self": 0.0,
"children": {
"worker_root": {
"total": 6951.302592928172,
"count": 197041,
"is_parallel": true,
"self": 3226.155462664552,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0031961901113390923,
"count": 2,
"is_parallel": true,
"self": 0.000803773058578372,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0023924170527607203,
"count": 8,
"is_parallel": true,
"self": 0.0023924170527607203
}
}
},
"UnityEnvironment.step": {
"total": 0.040917290025390685,
"count": 1,
"is_parallel": true,
"self": 0.001090687932446599,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0007754210382699966,
"count": 1,
"is_parallel": true,
"self": 0.0007754210382699966
},
"communicator.exchange": {
"total": 0.03585985500831157,
"count": 1,
"is_parallel": true,
"self": 0.03585985500831157
},
"steps_from_proto": {
"total": 0.0031913260463625193,
"count": 2,
"is_parallel": true,
"self": 0.0006325679132714868,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0025587581330910325,
"count": 8,
"is_parallel": true,
"self": 0.0025587581330910325
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.038901473162695765,
"count": 30,
"is_parallel": true,
"self": 0.007620085380040109,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.031281387782655656,
"count": 120,
"is_parallel": true,
"self": 0.031281387782655656
}
}
},
"UnityEnvironment.step": {
"total": 3725.1082287904574,
"count": 197040,
"is_parallel": true,
"self": 165.97430429654196,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 103.95889578491915,
"count": 197040,
"is_parallel": true,
"self": 103.95889578491915
},
"communicator.exchange": {
"total": 2985.190188732813,
"count": 197040,
"is_parallel": true,
"self": 2985.190188732813
},
"steps_from_proto": {
"total": 469.98483997618314,
"count": 394080,
"is_parallel": true,
"self": 93.58895315986592,
"children": {
"_process_rank_one_or_two_observation": {
"total": 376.3958868163172,
"count": 1576320,
"is_parallel": true,
"self": 376.3958868163172
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1476.3448047513375,
"count": 197041,
"self": 52.264346172101796,
"children": {
"process_trajectory": {
"total": 592.9353361455724,
"count": 197041,
"self": 591.4335409004707,
"children": {
"RLTrainer._checkpoint": {
"total": 1.5017952451016754,
"count": 6,
"self": 1.5017952451016754
}
}
},
"_update_policy": {
"total": 831.1451224336633,
"count": 138,
"self": 504.2810504854424,
"children": {
"TorchPOCAOptimizer.update": {
"total": 326.86407194822095,
"count": 4140,
"self": 326.86407194822095
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.869979314506054e-06,
"count": 1,
"self": 1.869979314506054e-06
},
"TrainerController._save_models": {
"total": 0.25763493101112545,
"count": 1,
"self": 0.0034043260384351015,
"children": {
"RLTrainer._checkpoint": {
"total": 0.25423060497269034,
"count": 1,
"self": 0.25423060497269034
}
}
}
}
}
}
}