| { | |
| "name": "root", | |
| "gauges": { | |
| "SoccerTwos.Policy.Entropy.mean": { | |
| "value": 1.7540055513381958, | |
| "min": 1.7540055513381958, | |
| "max": 2.859694480895996, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Policy.Entropy.sum": { | |
| "value": 34350.4453125, | |
| "min": 25404.435546875, | |
| "max": 68697.859375, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Environment.EpisodeLength.mean": { | |
| "value": 59.951219512195124, | |
| "min": 45.43119266055046, | |
| "max": 134.75675675675674, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Environment.EpisodeLength.sum": { | |
| "value": 19664.0, | |
| "min": 6264.0, | |
| "max": 22528.0, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Self-play.ELO.mean": { | |
| "value": 1547.7343081913593, | |
| "min": 1280.498417173598, | |
| "max": 1573.583713813668, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Self-play.ELO.sum": { | |
| "value": 253828.42654338293, | |
| "min": 57443.42553063212, | |
| "max": 334909.4936858504, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Step.mean": { | |
| "value": 4999964.0, | |
| "min": 2139961.0, | |
| "max": 4999964.0, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Step.sum": { | |
| "value": 4999964.0, | |
| "min": 2139961.0, | |
| "max": 4999964.0, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { | |
| "value": 0.05619893968105316, | |
| "min": -0.09217312932014465, | |
| "max": 0.2106694132089615, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { | |
| "value": 9.216626167297363, | |
| "min": -14.655527114868164, | |
| "max": 26.543701171875, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.05358322709798813, | |
| "min": -0.09259972721338272, | |
| "max": 0.20666013658046722, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 8.787649154663086, | |
| "min": -14.723356246948242, | |
| "max": 27.162918090820312, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Environment.CumulativeReward.mean": { | |
| "value": 0.0, | |
| "min": 0.0, | |
| "max": 0.0, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Environment.CumulativeReward.sum": { | |
| "value": 0.0, | |
| "min": 0.0, | |
| "max": 0.0, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicReward.mean": { | |
| "value": 0.029275610316090467, | |
| "min": -0.3304608697476594, | |
| "max": 0.3157929830383836, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Policy.ExtrinsicReward.sum": { | |
| "value": 4.801200091838837, | |
| "min": -40.803199887275696, | |
| "max": 54.64700049161911, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Environment.GroupCumulativeReward.mean": { | |
| "value": 0.029275610316090467, | |
| "min": -0.3304608697476594, | |
| "max": 0.3157929830383836, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Environment.GroupCumulativeReward.sum": { | |
| "value": 4.801200091838837, | |
| "min": -40.803199887275696, | |
| "max": 54.64700049161911, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 287 | |
| }, | |
| "SoccerTwos.Losses.PolicyLoss.mean": { | |
| "value": 0.017620729313542447, | |
| "min": 0.011048298924288246, | |
| "max": 0.02409756457200274, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Losses.PolicyLoss.sum": { | |
| "value": 0.017620729313542447, | |
| "min": 0.011048298924288246, | |
| "max": 0.02409756457200274, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Losses.ValueLoss.mean": { | |
| "value": 0.1136249082783858, | |
| "min": 0.04968581423163414, | |
| "max": 0.1136249082783858, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Losses.ValueLoss.sum": { | |
| "value": 0.1136249082783858, | |
| "min": 0.04968581423163414, | |
| "max": 0.1136249082783858, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Losses.BaselineLoss.mean": { | |
| "value": 0.11541301185886065, | |
| "min": 0.050460034608840944, | |
| "max": 0.11541301185886065, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Losses.BaselineLoss.sum": { | |
| "value": 0.11541301185886065, | |
| "min": 0.050460034608840944, | |
| "max": 0.11541301185886065, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Policy.LearningRate.mean": { | |
| "value": 0.0003, | |
| "min": 0.0003, | |
| "max": 0.0003, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Policy.LearningRate.sum": { | |
| "value": 0.0003, | |
| "min": 0.0003, | |
| "max": 0.0003, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Policy.Epsilon.mean": { | |
| "value": 0.20000000000000007, | |
| "min": 0.20000000000000007, | |
| "max": 0.20000000000000007, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Policy.Epsilon.sum": { | |
| "value": 0.20000000000000007, | |
| "min": 0.20000000000000007, | |
| "max": 0.20000000000000007, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Policy.Beta.mean": { | |
| "value": 0.005000000000000001, | |
| "min": 0.005000000000000001, | |
| "max": 0.005000000000000001, | |
| "count": 138 | |
| }, | |
| "SoccerTwos.Policy.Beta.sum": { | |
| "value": 0.005000000000000001, | |
| "min": 0.005000000000000001, | |
| "max": 0.005000000000000001, | |
| "count": 138 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1688065979", | |
| "python_version": "3.9.16 (main, May 15 2023, 23:46:34) \n[GCC 11.2.0]", | |
| "command_line_arguments": "/root/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume", | |
| "mlagents_version": "0.31.0.dev0", | |
| "mlagents_envs_version": "0.31.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "1.11.0+cu102", | |
| "numpy_version": "1.21.2", | |
| "end_time_seconds": "1688072947" | |
| }, | |
| "total": 6967.477507870994, | |
| "count": 1, | |
| "self": 0.4749574410961941, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.018960394896566868, | |
| "count": 1, | |
| "self": 0.018960394896566868 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 6966.983590035001, | |
| "count": 1, | |
| "self": 7.383688202360645, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 8.599591638776474, | |
| "count": 16, | |
| "self": 8.599591638776474 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 6950.742673392873, | |
| "count": 197041, | |
| "self": 7.936746210791171, | |
| "children": { | |
| "env_step": { | |
| "total": 5466.461122430745, | |
| "count": 197041, | |
| "self": 4434.788273636135, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 1027.343017456471, | |
| "count": 197041, | |
| "self": 40.67520230030641, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 986.6678151561646, | |
| "count": 359170, | |
| "self": 986.6678151561646 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 4.3298313381383196, | |
| "count": 197041, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 6951.302592928172, | |
| "count": 197041, | |
| "is_parallel": true, | |
| "self": 3226.155462664552, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0031961901113390923, | |
| "count": 2, | |
| "is_parallel": true, | |
| "self": 0.000803773058578372, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0023924170527607203, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0023924170527607203 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.040917290025390685, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.001090687932446599, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0007754210382699966, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0007754210382699966 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.03585985500831157, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.03585985500831157 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0031913260463625193, | |
| "count": 2, | |
| "is_parallel": true, | |
| "self": 0.0006325679132714868, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0025587581330910325, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0025587581330910325 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.038901473162695765, | |
| "count": 30, | |
| "is_parallel": true, | |
| "self": 0.007620085380040109, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.031281387782655656, | |
| "count": 120, | |
| "is_parallel": true, | |
| "self": 0.031281387782655656 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 3725.1082287904574, | |
| "count": 197040, | |
| "is_parallel": true, | |
| "self": 165.97430429654196, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 103.95889578491915, | |
| "count": 197040, | |
| "is_parallel": true, | |
| "self": 103.95889578491915 | |
| }, | |
| "communicator.exchange": { | |
| "total": 2985.190188732813, | |
| "count": 197040, | |
| "is_parallel": true, | |
| "self": 2985.190188732813 | |
| }, | |
| "steps_from_proto": { | |
| "total": 469.98483997618314, | |
| "count": 394080, | |
| "is_parallel": true, | |
| "self": 93.58895315986592, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 376.3958868163172, | |
| "count": 1576320, | |
| "is_parallel": true, | |
| "self": 376.3958868163172 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 1476.3448047513375, | |
| "count": 197041, | |
| "self": 52.264346172101796, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 592.9353361455724, | |
| "count": 197041, | |
| "self": 591.4335409004707, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 1.5017952451016754, | |
| "count": 6, | |
| "self": 1.5017952451016754 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 831.1451224336633, | |
| "count": 138, | |
| "self": 504.2810504854424, | |
| "children": { | |
| "TorchPOCAOptimizer.update": { | |
| "total": 326.86407194822095, | |
| "count": 4140, | |
| "self": 326.86407194822095 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.869979314506054e-06, | |
| "count": 1, | |
| "self": 1.869979314506054e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.25763493101112545, | |
| "count": 1, | |
| "self": 0.0034043260384351015, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.25423060497269034, | |
| "count": 1, | |
| "self": 0.25423060497269034 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |