vija0 SmilingWolf committed on
Commit
b49f937
·
verified ·
0 Parent(s):

Duplicate from SmilingWolf/wd-swinv2-tagger-v3

Browse files

Co-authored-by: Smiling Wolf <SmilingWolf@users.noreply.huggingface.co>

Files changed (8) hide show
  1. .gitattributes +35 -0
  2. README.md +49 -0
  3. config.json +37 -0
  4. model.msgpack +3 -0
  5. model.onnx +3 -0
  6. model.safetensors +3 -0
  7. selected_tags.csv +0 -0
  8. sw_jax_cv_config.json +19 -0
.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ library_name: timm
4
+ ---
5
+ # WD SwinV2 Tagger v3
6
+
7
+ Supports ratings, characters and general tags.
8
+
9
+ Trained using https://github.com/SmilingWolf/JAX-CV.
10
+ TPUs used for training kindly provided by the [TRC program](https://sites.research.google/trc/about/).
11
+
12
+ ## Dataset
13
+ Last image id: 7220105
14
+ Trained on Danbooru images with IDs modulo 0000-0899.
15
+ Validated on images with IDs modulo 0950-0999.
16
+ Images with fewer than 10 general tags were filtered out.
17
+ Tags with fewer than 600 images were filtered out.
18
+
19
+ ## Validation results
20
+ `v2.0: P=R: threshold = 0.2653, F1 = 0.4541`
21
+ `v1.0: P=R: threshold = 0.2521, F1 = 0.4411`
22
+
23
+ ## What's new
24
+ Model v2.0/Dataset v3:
25
+ Trained for a few more epochs.
26
+ Used tag frequency-based loss scaling to combat class imbalance.
27
+
28
+ Model v1.1/Dataset v3:
29
+ Amended the JAX model config file: added image size.
30
+ No change to the trained weights.
31
+
32
+ Model v1.0/Dataset v3:
33
+ More training images, more and up-to-date tags (up to 2024-02-28).
34
+ Now `timm` compatible! Load it up and give it a spin using the canonical one-liner!
35
+ ONNX model is compatible with code developed for the v2 series of models.
36
+ The batch dimension of the ONNX model is not fixed to 1 anymore. Now you can go crazy with batch inference.
37
+ Switched to Macro-F1 to measure model performance since it gives me a better gauge of overall training progress.
38
+
39
+ # Runtime deps
40
+ ONNX model requires `onnxruntime >= 1.17.0`
41
+
42
+ # Inference code examples
43
+ For timm: https://github.com/neggles/wdv3-timm
44
+ For ONNX: https://huggingface.co/spaces/SmilingWolf/wd-tagger
45
+ For JAX: https://github.com/SmilingWolf/wdv3-jax
46
+
47
+ ## Final words
48
+ Subject to change and updates.
49
+ Downstream users are encouraged to use tagged releases rather than relying on the head of the repo.
config.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architecture": "swinv2_base_window8_256",
3
+ "num_classes": 10861,
4
+ "num_features": 1024,
5
+ "global_pool": "avg",
6
+ "model_args": {
7
+ "act_layer": "gelu_tanh",
8
+ "img_size": 448,
9
+ "window_size": 14
10
+ },
11
+ "pretrained_cfg": {
12
+ "custom_load": false,
13
+ "input_size": [
14
+ 3,
15
+ 448,
16
+ 448
17
+ ],
18
+ "fixed_input_size": false,
19
+ "interpolation": "bicubic",
20
+ "crop_pct": 1.0,
21
+ "crop_mode": "center",
22
+ "mean": [
23
+ 0.5,
24
+ 0.5,
25
+ 0.5
26
+ ],
27
+ "std": [
28
+ 0.5,
29
+ 0.5,
30
+ 0.5
31
+ ],
32
+ "num_classes": 10861,
33
+ "pool_size": null,
34
+ "first_conv": null,
35
+ "classifier": null
36
+ }
37
+ }
model.msgpack ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a26ae4edbe45fa155ede34257153642b3bf476044a13e0ae6a0c4c131198f444
3
+ size 413777297
model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6774bff34d43bd49f75a47db4ef217dce701c9847b546523eb85ff6dbba1db1
3
+ size 467460978
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39fe04000d5907a0a7616df54af744d43fbd70b5fba7abc3135d3675734c03ef
3
+ size 392149220
selected_tags.csv ADDED
The diff for this file is too large to render. See raw diff
 
sw_jax_cv_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "image_size": 448,
3
+ "model_name": "swinv2_base",
4
+ "model_args": {
5
+ "image_size": 448,
6
+ "patch_size": 4,
7
+ "in_chans": 3,
8
+ "num_classes": 10861,
9
+ "embed_dim": 128,
10
+ "window_size": 14,
11
+ "mlp_ratio": 4.0,
12
+ "qkv_bias": true,
13
+ "drop_rate": 0.0,
14
+ "attn_drop_rate": 0.0,
15
+ "drop_path_rate": 0.1,
16
+ "patch_norm": true,
17
+ "layer_norm_eps": 1e-05
18
+ }
19
+ }