{ "action_space": null, "policy_kwargs": { "active_reward_monitors": { "env_reward": 1 }, "attention_heads": 8, "attention_mask_style": "clipped_causal", "attention_memory_size": 256, "diff_mlp_embedding": false, "hidsize": 1024, "img_shape": [ 128, 128, 3 ], "impala_chans": [ 16, 32, 32 ], "impala_kwargs": { "post_pool_groups": 1 }, "impala_width": 4, "init_norm_kwargs": { "batch_norm": false, "group_norm_groups": 1 }, "n_recurrence_layers": 4, "only_img_input": true, "pointwise_ratio": 4, "pointwise_use_activation": false, "recurrence_is_residual": true, "recurrence_type": "transformer", "timesteps": 128, "use_pointwise_layer": true, "use_pre_lstm_ln": false }, "temperature": 1 }