# Module-level hyperparameter table, keyed by setting name.
# NOTE(review): the key names suggest a PPO-style training setup, but the
# consumer of this dict is not visible here -- confirm against the code that
# reads it before relying on the per-key notes below.
HPARAMS = {
    # Sizing / iteration counts (presumably rollout length, optimisation
    # passes per rollout, and minibatch size -- TODO confirm).
    "horizon": 2048,
    "num_epochs": 15,
    "batch_size": 128,
    # Presumably the clipping range for the policy ratio -- TODO confirm.
    "policy_clip": 0.1,
    # Presumably return/advantage estimation settings -- TODO confirm.
    "discount_factor": 0.99,
    "GAE_lambda": 0.95,
    # Presumably weights of the entropy and value terms in the loss --
    # TODO confirm.
    "entropy_coeff": 0.01,
    "value_coeff": 0.5,
    # Presumably the optimiser step size -- TODO confirm.
    "learning_rate": 0.0003,
}