aaa12963337 committed on
Commit
93302a5
1 Parent(s): 90244d3

End of training

Browse files
Files changed (4) hide show
  1. README.md +11 -11
  2. config.json +17 -55
  3. model.safetensors +2 -2
  4. training_args.bin +1 -1
README.md CHANGED
@@ -1,6 +1,6 @@
1
  ---
2
- license: mit
3
- base_model: shi-labs/dinat-mini-in1k-224
4
  tags:
5
  - generated_from_trainer
6
  datasets:
@@ -15,15 +15,15 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # msi-resnet-18-pretrain
17
 
18
- This model is a fine-tuned version of [shi-labs/dinat-mini-in1k-224](https://huggingface.co/shi-labs/dinat-mini-in1k-224) on the imagefolder dataset.
19
  It achieves the following results on the evaluation set:
20
- - eval_loss: 0.3170
21
- - eval_accuracy: 0.9277
22
- - eval_runtime: 34.2706
23
- - eval_samples_per_second: 209.509
24
- - eval_steps_per_second: 13.102
25
- - epoch: 1.0
26
- - step: 1562
27
 
28
  ## Model description
29
 
@@ -51,7 +51,7 @@ The following hyperparameters were used during training:
51
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
52
  - lr_scheduler_type: linear
53
  - lr_scheduler_warmup_ratio: 0.1
54
- - num_epochs: 3
55
 
56
  ### Framework versions
57
 
 
1
  ---
2
+ license: apache-2.0
3
+ base_model: microsoft/resnet-18
4
  tags:
5
  - generated_from_trainer
6
  datasets:
 
15
 
16
  # msi-resnet-18-pretrain
17
 
18
+ This model is a fine-tuned version of [microsoft/resnet-18](https://huggingface.co/microsoft/resnet-18) on the imagefolder dataset.
19
  It achieves the following results on the evaluation set:
20
+ - eval_loss: 0.4090
21
+ - eval_accuracy: 0.8648
22
+ - eval_runtime: 45.6695
23
+ - eval_samples_per_second: 157.216
24
+ - eval_steps_per_second: 9.831
25
+ - epoch: 2.0
26
+ - step: 3125
27
 
28
  ## Model description
29
 
 
51
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
52
  - lr_scheduler_type: linear
53
  - lr_scheduler_warmup_ratio: 0.1
54
+ - num_epochs: 10
55
 
56
  ### Framework versions
57
 
config.json CHANGED
@@ -1,48 +1,24 @@
1
  {
2
- "_name_or_path": "shi-labs/dinat-mini-in1k-224",
3
  "architectures": [
4
- "DinatForImageClassification"
5
  ],
6
- "attention_probs_dropout_prob": 0.0,
7
  "depths": [
8
- 3,
9
- 4,
10
- 6,
11
- 5
12
  ],
13
- "dilations": [
14
- [
15
- 1,
16
- 8,
17
- 1
18
- ],
19
- [
20
- 1,
21
- 4,
22
- 1,
23
- 4
24
- ],
25
- [
26
- 1,
27
- 2,
28
- 1,
29
- 2,
30
- 1,
31
- 2
32
- ],
33
- [
34
- 1,
35
- 1,
36
- 1,
37
- 1,
38
- 1
39
- ]
40
  ],
41
- "drop_path_rate": 0.2,
42
- "embed_dim": 64,
43
- "hidden_act": "gelu",
44
- "hidden_dropout_prob": 0.0,
45
- "hidden_size": 512,
46
  "id2label": {
47
  "0": "ADI",
48
  "1": "BACK",
@@ -54,8 +30,6 @@
54
  "7": "STR",
55
  "8": "TUM"
56
  },
57
- "initializer_range": 0.02,
58
- "kernel_size": 7,
59
  "label2id": {
60
  "ADI": "0",
61
  "BACK": "1",
@@ -67,28 +41,16 @@
67
  "STR": "7",
68
  "TUM": "8"
69
  },
70
- "layer_norm_eps": 1e-05,
71
- "layer_scale_init_value": 0.0,
72
- "mlp_ratio": 3.0,
73
- "model_type": "dinat",
74
  "num_channels": 3,
75
- "num_heads": [
76
- 2,
77
- 4,
78
- 8,
79
- 16
80
- ],
81
- "num_layers": 4,
82
  "out_features": [
83
  "stage4"
84
  ],
85
  "out_indices": [
86
  4
87
  ],
88
- "patch_size": 4,
89
- "path_norm": true,
90
  "problem_type": "single_label_classification",
91
- "qkv_bias": true,
92
  "stage_names": [
93
  "stem",
94
  "stage1",
 
1
  {
2
+ "_name_or_path": "microsoft/resnet-18",
3
  "architectures": [
4
+ "ResNetForImageClassification"
5
  ],
 
6
  "depths": [
7
+ 2,
8
+ 2,
9
+ 2,
10
+ 2
11
  ],
12
+ "downsample_in_bottleneck": false,
13
+ "downsample_in_first_stage": false,
14
+ "embedding_size": 64,
15
+ "hidden_act": "relu",
16
+ "hidden_sizes": [
17
+ 64,
18
+ 128,
19
+ 256,
20
+ 512
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
  ],
 
 
 
 
 
22
  "id2label": {
23
  "0": "ADI",
24
  "1": "BACK",
 
30
  "7": "STR",
31
  "8": "TUM"
32
  },
 
 
33
  "label2id": {
34
  "ADI": "0",
35
  "BACK": "1",
 
41
  "STR": "7",
42
  "TUM": "8"
43
  },
44
+ "layer_type": "basic",
45
+ "model_type": "resnet",
 
 
46
  "num_channels": 3,
 
 
 
 
 
 
 
47
  "out_features": [
48
  "stage4"
49
  ],
50
  "out_indices": [
51
  4
52
  ],
 
 
53
  "problem_type": "single_label_classification",
 
54
  "stage_names": [
55
  "stem",
56
  "stage1",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11cabcabf9bb525aaf32f09a868289b1bd7007a357e1adf14fb1c2b929632a9b
3
- size 78484420
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:276864846bd3ab62f97d961bebc713f1fc785860e19d234c2da36a16a6d3414b
3
+ size 44778700
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9cf2012c40cb0f2098b97033ed0b66799e3830b062d2368116dbf13a7f6ee20
3
  size 4155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b683f5cafdd8c46dbf8e02b3384ab46bb498457d942d9cc206529119c27ef1eb
3
  size 4155