machuofan committed on
Commit
992f71f
1 Parent(s): 4e9f90c
config.json ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "CustomDDETRModel"
4
+ ],
5
+ "ddetr_cfg": {
6
+ "activation_dropout": 0.0,
7
+ "activation_function": "relu",
8
+ "attention_dropout": 0.0,
9
+ "auxiliary_loss": true,
10
+ "backbone": "resnet50",
11
+ "backbone_config": null,
12
+ "bbox_cost": 5,
13
+ "bbox_loss_coefficient": 5,
14
+ "class_cost": 2,
15
+ "cls_loss_coefficient": 2,
16
+ "d_model": 256,
17
+ "decoder_attention_heads": 8,
18
+ "decoder_ffn_dim": 1024,
19
+ "decoder_layers": 6,
20
+ "decoder_n_points": 4,
21
+ "dice_loss_coefficient": 1,
22
+ "dilation": false,
23
+ "disable_custom_kernels": false,
24
+ "dropout": 0.1,
25
+ "encoder_attention_heads": 8,
26
+ "encoder_ffn_dim": 1024,
27
+ "encoder_layerdrop": 0.0,
28
+ "encoder_layers": 6,
29
+ "encoder_n_points": 4,
30
+ "eos_coefficient": 0.1,
31
+ "focal_alpha": 0.25,
32
+ "giou_cost": 2,
33
+ "giou_loss_coefficient": 2,
34
+ "id2label": {
35
+ "0": "LABEL_0"
36
+ },
37
+ "init_std": 0.02,
38
+ "init_xavier_std": 1.0,
39
+ "is_encoder_decoder": true,
40
+ "label2id": {
41
+ "LABEL_0": 0
42
+ },
43
+ "mask_loss_coefficient": 1,
44
+ "max_position_embeddings": 1024,
45
+ "model_type": "deformable_detr",
46
+ "num_channels": 3,
47
+ "num_feature_levels": 1,
48
+ "num_queries": 300,
49
+ "position_embedding_type": "sine",
50
+ "transformers_version": "4.32.0",
51
+ "two_stage": true,
52
+ "two_stage_num_proposals": 300,
53
+ "use_pretrained_backbone": true,
54
+ "use_timm_backbone": true,
55
+ "with_box_refine": true
56
+ },
57
+ "model_type": "ddetr",
58
+ "torch_dtype": "float32",
59
+ "transformers_version": "4.32.0",
60
+ "vis_encoder_cfg": {
61
+ "architectures": [
62
+ "Dinov2Model"
63
+ ],
64
+ "attention_probs_dropout_prob": 0.0,
65
+ "drop_path_rate": 0.0,
66
+ "hidden_act": "gelu",
67
+ "hidden_dropout_prob": 0.0,
68
+ "hidden_size": 1024,
69
+ "image_size": 518,
70
+ "initializer_range": 0.02,
71
+ "layer_norm_eps": 1e-06,
72
+ "layerscale_value": 1.0,
73
+ "mlp_ratio": 4,
74
+ "model_type": "dinov2",
75
+ "num_attention_heads": 16,
76
+ "num_channels": 3,
77
+ "num_hidden_layers": 24,
78
+ "patch_size": 14,
79
+ "qkv_bias": true,
80
+ "torch_dtype": "float32",
81
+ "transformers_version": "4.32.0",
82
+ "use_swiglu_ffn": false
83
+ },
84
+ "vis_encoder_path": "checkpoints/dinov2-large",
85
+ "vis_output_layer": -2,
86
+ "zs_weight_path": null
87
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": false,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": false,
11
+ "image_mean": [
12
+ 0.485,
13
+ 0.456,
14
+ 0.406
15
+ ],
16
+ "image_processor_type": "BitImageProcessor",
17
+ "image_std": [
18
+ 0.229,
19
+ 0.224,
20
+ 0.225
21
+ ],
22
+ "resample": 3,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "shortest_edge": 256
26
+ }
27
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:107801584fe1cc9eeddbd208fc444b32de7e0a8cc8433c3308edf1bc6916d5a1
3
+ size 1266992689
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f606279103b477c3345aa6f1a6167242ce730521ea5b45b81cde8d05df346ea3
3
+ size 4283