First Push

187b59a about 1 year ago

20.2 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.4289458990097046,
	"min": 1.3331218957901,
	"max": 3.295753002166748,
	"count": 2909
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 28441.740234375,
	"min": 14116.41015625,
	"max": 134564.359375,
	"count": 2909
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 72.63636363636364,
	"min": 38.728,
	"max": 999.0,
	"count": 2909
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19176.0,
	"min": 1368.0,
	"max": 33472.0,
	"count": 2909
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1633.2024141553666,
	"min": 1197.4528454987494,
	"max": 1700.748415074803,
	"count": 2894
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 215582.71866850837,
	"min": 2395.855516605603,
	"max": 399412.78237338376,
	"count": 2894
	},
	"SoccerTwos.Step.mean": {
	"value": 29089880.0,
	"min": 9034.0,
	"max": 29089880.0,
	"count": 2909
	},
	"SoccerTwos.Step.sum": {
	"value": 29089880.0,
	"min": 9034.0,
	"max": 29089880.0,
	"count": 2909
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.016269130632281303,
	"min": -0.14047899842262268,
	"max": 0.18399012088775635,
	"count": 2909
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -2.1475253105163574,
	"min": -23.84164047241211,
	"max": 26.68563461303711,
	"count": 2909
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.01794874481856823,
	"min": -0.1390056312084198,
	"max": 0.18372780084609985,
	"count": 2909
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -2.369234323501587,
	"min": -24.460636138916016,
	"max": 26.59808349609375,
	"count": 2909
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 2909
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 2909
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.04186969814878522,
	"min": -0.5260500013828278,
	"max": 0.5829966128882715,
	"count": 2909
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -5.526800155639648,
	"min": -81.90319991111755,
	"max": 53.70960021018982,
	"count": 2909
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.04186969814878522,
	"min": -0.5260500013828278,
	"max": 0.5829966128882715,
	"count": 2909
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -5.526800155639648,
	"min": -81.90319991111755,
	"max": 53.70960021018982,
	"count": 2909
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 2909
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 2909
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.017092395084910096,
	"min": 0.010334619101680194,
	"max": 0.02452780718158465,
	"count": 1409
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.017092395084910096,
	"min": 0.010334619101680194,
	"max": 0.02452780718158465,
	"count": 1409
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.08425002073248228,
	"min": 4.625412599731741e-05,
	"max": 0.132067218174537,
	"count": 1409
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.08425002073248228,
	"min": 4.625412599731741e-05,
	"max": 0.132067218174537,
	"count": 1409
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.0861614927649498,
	"min": 4.70900532794379e-05,
	"max": 0.13552140071988106,
	"count": 1409
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.0861614927649498,
	"min": 4.70900532794379e-05,
	"max": 0.13552140071988106,
	"count": 1409
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 1409
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 1409
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.19999999999999996,
	"max": 0.20000000000000007,
	"count": 1409
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.19999999999999996,
	"max": 0.20000000000000007,
	"count": 1409
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 1409
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 1409
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1691727176",
	"python_version": "3.9.17 (main, Jul 5 2023, 21:05:34) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/renatostrianese/anaconda3/envs/RenatoTF/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwo/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1691805708"
	},
	"total": 78532.367960672,
	"count": 1,
	"self": 0.06609775401011575,
	"children": {
	"run_training.setup": {
	"total": 0.03313046699622646,
	"count": 1,
	"self": 0.03313046699622646
	},
	"TrainerController.start_learning": {
	"total": 78532.26873245099,
	"count": 1,
	"self": 47.53482574840018,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.610130590015615,
	"count": 146,
	"self": 4.610130590015615
	},
	"TrainerController.advance": {
	"total": 78479.86887295157,
	"count": 2012113,
	"self": 46.898810708808014,
	"children": {
	"env_step": {
	"total": 35817.85841291145,
	"count": 2012113,
	"self": 30057.72681538717,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 5729.997554799687,
	"count": 2012113,
	"self": 223.7001909118626,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 5506.297363887825,
	"count": 3654072,
	"self": 5506.297363887825
	}
	}
	},
	"workers": {
	"total": 30.13404272459593,
	"count": 2012112,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 78466.91669943526,
	"count": 2012112,
	"is_parallel": true,
	"self": 53690.49747905135,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0031258160015568137,
	"count": 2,
	"is_parallel": true,
	"self": 0.0009946089994627982,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0021312070020940155,
	"count": 8,
	"is_parallel": true,
	"self": 0.0021312070020940155
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.028206431001308374,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005391929953475483,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0004178079980192706,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004178079980192706
	},
	"communicator.exchange": {
	"total": 0.025404737003555056,
	"count": 1,
	"is_parallel": true,
	"self": 0.025404737003555056
	},
	"steps_from_proto": {
	"total": 0.0018446930043864995,
	"count": 2,
	"is_parallel": true,
	"self": 0.0004180240066489205,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001426668997737579,
	"count": 8,
	"is_parallel": true,
	"self": 0.001426668997737579
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 24776.102041746977,
	"count": 2012111,
	"is_parallel": true,
	"self": 1435.6359346336321,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 1037.9718928028597,
	"count": 2012111,
	"is_parallel": true,
	"self": 1037.9718928028597
	},
	"communicator.exchange": {
	"total": 17808.430640130806,
	"count": 2012111,
	"is_parallel": true,
	"self": 17808.430640130806
	},
	"steps_from_proto": {
	"total": 4494.06357417968,
	"count": 4024222,
	"is_parallel": true,
	"self": 863.1041507397385,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 3630.959423439941,
	"count": 16096888,
	"is_parallel": true,
	"self": 3630.959423439941
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.3171786369275651,
	"count": 290,
	"is_parallel": true,
	"self": 0.06221032103348989,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.2549683158940752,
	"count": 1160,
	"is_parallel": true,
	"self": 0.2549683158940752
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 42615.11164933131,
	"count": 2012112,
	"self": 298.4929725266047,
	"children": {
	"process_trajectory": {
	"total": 6410.776937356939,
	"count": 2012112,
	"self": 6396.632048044943,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 14.14488931199594,
	"count": 58,
	"self": 14.14488931199594
	}
	}
	},
	"_update_policy": {
	"total": 35905.841739447766,
	"count": 1409,
	"self": 4567.986399615293,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 31337.855339832473,
	"count": 42285,
	"self": 31337.855339832473
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.69100530911237e-06,
	"count": 1,
	"self": 1.69100530911237e-06
	},
	"TrainerController._save_models": {
	"total": 0.2549014700052794,
	"count": 1,
	"self": 0.002151414009858854,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.25275005599542055,
	"count": 1,
	"self": 0.25275005599542055
	}
	}
	}
	}
	}
	}
	}