{
  "act_layer": null,
  "attn_drop_rate": 0.0,
  "backbone": "hybrid",
  "c_head_num": null,
  "channel_dims": null,
  "channels": 256,
  "cls_attn_layers": 2,
  "decoder_dropout": 0.1,
  "decoder_hidden_size": 768,
  "decoder_params": {
    "embed_dim": 768
  },
  "depth": 22,
  "depths": [
    3,
    5
  ],
  "dims": [
    128,
    256,
    512,
    1024
  ],
  "drop_path_rate": 0.0,
  "drop_rate": 0.0,
  "dropout_ratio": 0.1,
  "embed_dim": 480,
  "eta": 1.0,
  "feat_downsample": false,
  "feature_strides": [
    4,
    8,
    16,
    32
  ],
  "hybrid_patch_size": 2,
  "img_size": [
    224,
    224
  ],
  "in_channels": [
    128,
    256,
    480,
    480
  ],
  "in_chans": 3,
  "in_index": [
    0,
    1,
    2,
    3
  ],
  "initializer_range": 1.0,
  "mlp_ratio": 4.0,
  "model_type": "fan",
  "norm_layer": null,
  "num_attention_heads": 8,
  "num_classes": 1000,
  "num_heads": 10,
  "num_hidden_layers": 12,
  "out_index": 18,
  "patch_size": 16,
  "qkv_bias": true,
  "reshape_last_stage": false,
  "rounding_mode": "floor",
  "se_mlp": false,
  "semantic_loss_ignore_index": -100,
  "sharpen_attn": false,
  "sr_ratio": [
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    1
  ],
  "tokens_norm": true,
  "transformers_version": "4.24.0.dev0",
  "type": "SegFormerHead",
  "use_checkpoint": false,
  "use_head": false,
  "use_pos_embed": true
}