{ "type": "sac", "n_obs_steps": 1, "normalization_mapping": { "VISUAL": "MEAN_STD", "ACTION": "IDENTITY" }, "input_features": { "observation.image": { "type": "VISUAL", "shape": [ 3, 128, 128 ] } }, "output_features": { "action": { "type": "ACTION", "shape": [ 2 ] } }, "device": "cuda", "use_amp": false, "push_to_hub": true, "repo_id": "spirosperos/grid-position-policy", "private": null, "tags": null, "license": null, "dataset_stats": { "observation.image": { "mean": [ 0.485, 0.456, 0.406 ], "std": [ 0.229, 0.224, 0.225 ] }, "action": { "min": [ 0.0, 0.0 ], "max": [ 7.0, 7.0 ] } }, "storage_device": "cpu", "vision_encoder_name": "helper2424/resnet10", "freeze_vision_encoder": false, "image_encoder_hidden_dim": 32, "shared_encoder": true, "num_discrete_actions": null, "image_embedding_pooling_dim": 8, "online_steps": 1000000, "online_env_seed": 10000, "online_buffer_capacity": 10000, "offline_buffer_capacity": 1000, "async_prefetch": false, "online_step_before_learning": 100, "policy_update_freq": 1, "discount": 0.97, "temperature_init": 0.01, "num_critics": 2, "num_subsample_critics": null, "critic_lr": 0.0003, "actor_lr": 0.0003, "temperature_lr": 0.0003, "critic_target_update_weight": 0.005, "utd_ratio": 2, "state_encoder_hidden_dim": 256, "latent_dim": 64, "target_entropy": null, "use_backup_entropy": true, "grad_clip_norm": 10.0, "critic_network_kwargs": { "hidden_dims": [ 256, 256 ], "activate_final": true, "final_activation": null }, "actor_network_kwargs": { "hidden_dims": [ 256, 256 ], "activate_final": true }, "policy_kwargs": { "use_tanh_squash": false, "std_min": 1e-05, "std_max": 5.0, "init_final": 0.05 }, "discrete_critic_network_kwargs": { "hidden_dims": [ 256, 256 ], "activate_final": true, "final_activation": null }, "actor_learner_config": { "learner_host": "127.0.0.1", "learner_port": 50053, "policy_parameters_push_frequency": 0, "queue_get_timeout": 2.0 }, "concurrency": { "actor": "threads", "learner": "threads" }, "use_torch_compile": false }