{
  "env_config": {
    "env_id": "CartPole-v1",
    "env_kwargs": {},
    "max_steps": null,
    "use_image": false,
    "vector_env_num": 6,
    "use_multi_processing": true,
    "image_shape": null,
    "frame_stack": 1,
    "frame_skip": 1,
    "training_render_mode": null
  },
  "device": "mps",
  "learning_rate": 0.0001,
  "gamma": 0.99,
  "checkpoint_pathname": "",
  "eval_episodes": 50,
  "eval_random_seed": 42,
  "eval_video_num": 10,
  "total_steps": 150000,
  "rollout_len": 32,
  "gae_lambda_or_n_step": 0.97,
  "entropy_coef": {
    "_type": "LinearSchedule",
    "_module": "practice.utils_for_coding.scheduler_utils",
    "start_e": 0.2,
    "end_e": 0.1,
    "duration": 200
  },
  "value_loss_coef": 0.02,
  "grad_acc": 1,
  "max_grad_norm": 0.5,
  "critic_lr": 5e-05,
  "critic_lr_gamma": 0.995,
  "env_wrappers": [
    "CartPoleEnv",
    "PassiveEnvChecker",
    "OrderEnforcing",
    "TimeLimit",
    "CastObsFloat32Wrapper",
    "RecordEpisodeStatistics",
    "Autoreset"
  ]
}