{
    "type": "sac",
    "n_obs_steps": 1,
    "normalization_mapping": {
        "VISUAL": "MEAN_STD",
        "ACTION": "IDENTITY"
    },
    "input_features": {
        "observation.image": {
            "type": "VISUAL",
            "shape": [
                3,
                128,
                128
            ]
        }
    },
    "output_features": {
        "action": {
            "type": "ACTION",
            "shape": [
                2
            ]
        }
    },
    "device": "cuda",
    "use_amp": false,
    "push_to_hub": true,
    "repo_id": "spirosperos/grid-position-policy",
    "private": null,
    "tags": null,
    "license": null,
    "dataset_stats": {
        "observation.image": {
            "mean": [
                0.485,
                0.456,
                0.406
            ],
            "std": [
                0.229,
                0.224,
                0.225
            ]
        },
        "action": {
            "min": [
                0.0,
                0.0
            ],
            "max": [
                7.0,
                7.0
            ]
        }
    },
    "storage_device": "cpu",
    "vision_encoder_name": "helper2424/resnet10",
    "freeze_vision_encoder": false,
    "image_encoder_hidden_dim": 32,
    "shared_encoder": true,
    "num_discrete_actions": null,
    "image_embedding_pooling_dim": 8,
    "online_steps": 1000000,
    "online_env_seed": 10000,
    "online_buffer_capacity": 10000,
    "offline_buffer_capacity": 1000,
    "async_prefetch": false,
    "online_step_before_learning": 100,
    "policy_update_freq": 1,
    "discount": 0.97,
    "temperature_init": 0.01,
    "num_critics": 2,
    "num_subsample_critics": null,
    "critic_lr": 0.0003,
    "actor_lr": 0.0003,
    "temperature_lr": 0.0003,
    "critic_target_update_weight": 0.005,
    "utd_ratio": 2,
    "state_encoder_hidden_dim": 256,
    "latent_dim": 64,
    "target_entropy": null,
    "use_backup_entropy": true,
    "grad_clip_norm": 10.0,
    "critic_network_kwargs": {
        "hidden_dims": [
            256,
            256
        ],
        "activate_final": true,
        "final_activation": null
    },
    "actor_network_kwargs": {
        "hidden_dims": [
            256,
            256
        ],
        "activate_final": true
    },
    "policy_kwargs": {
        "use_tanh_squash": false,
        "std_min": 1e-05,
        "std_max": 5.0,
        "init_final": 0.05
    },
    "discrete_critic_network_kwargs": {
        "hidden_dims": [
            256,
            256
        ],
        "activate_final": true,
        "final_activation": null
    },
    "actor_learner_config": {
        "learner_host": "127.0.0.1",
        "learner_port": 50053,
        "policy_parameters_push_frequency": 0,
        "queue_get_timeout": 2.0
    },
    "concurrency": {
        "actor": "threads",
        "learner": "threads"
    },
    "use_torch_compile": false
}