{ "_num_labels": 2, "architectures": [ "Swinv2ForImageClassification" ], "depths": [2, 2, 18, 2], "drop_path_rate": 0.1, "embed_dim": 192, "encoder_stride": 32, "hidden_size": 1536, "id2label": { "0": "artificial", "1": "real" }, "image_size": 256, "label2id": { "artificial": 0, "real": 1 }, "mlp_ratio": 4.0, "model_type": "swinv2", "num_channels": 3, "num_heads": [6, 12, 24, 48], "out_features": ["stage4"], "patch_size": 4, "path_norm": true, "pretrained_window_sizes": [12, 12, 12, 6], "window_size": 16 }