{ "encoder": "vitl", "guide_type": "mask+observation", "loss_stategy": "entire_target_object", "pretrained": true }