patrickvonplaten YiYiXu committed on
Commit
6fd50d3
0 Parent(s):

Duplicate from YiYiXu/shap-e-img2img

Browse files

Co-authored-by: YiYi Xu <YiYiXu@users.noreply.huggingface.co>

.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ ---
2
+ duplicated_from: YiYiXu/shap-e-img2img
3
+ ---
image_encoder/config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "openai/clip-vit-large-patch14",
3
+ "architectures": [
4
+ "CLIPVisionModel"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "dropout": 0.0,
8
+ "hidden_act": "quick_gelu",
9
+ "hidden_size": 1024,
10
+ "image_size": 224,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 4096,
14
+ "layer_norm_eps": 1e-05,
15
+ "model_type": "clip_vision_model",
16
+ "num_attention_heads": 16,
17
+ "num_channels": 3,
18
+ "num_hidden_layers": 24,
19
+ "patch_size": 14,
20
+ "projection_dim": 768,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.29.2"
23
+ }
image_encoder/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49767fbe1b9ea4688056a86db9404053b9a34c3f6a95776cb85622e7ea8a35ae
3
+ size 1212850925
image_processor/preprocessor_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": 224,
3
+ "do_center_crop": true,
4
+ "do_normalize": true,
5
+ "do_resize": true,
6
+ "feature_extractor_type": "CLIPFeatureExtractor",
7
+ "image_mean": [
8
+ 0.48145466,
9
+ 0.4578275,
10
+ 0.40821073
11
+ ],
12
+ "image_std": [
13
+ 0.26862954,
14
+ 0.26130258,
15
+ 0.27577711
16
+ ],
17
+ "resample": 3,
18
+ "size": 224
19
+ }
model_index.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "ShapEPriorPipeline",
3
+ "_diffusers_version": "0.17.0.dev0",
4
+ "scheduler": [
5
+ "diffusers",
6
+ "HeunDiscreteScheduler"
7
+ ],
8
+ "image_encoder": [
9
+ "transformers",
10
+ "CLIPVisionModel"
11
+ ],
12
+ "image_processor": [
13
+ "transformers",
14
+ "CLIPImageProcessor"
15
+ ],
16
+ "prior": [
17
+ "diffusers",
18
+ "PriorTransformer"
19
+ ],
20
+ "renderer": [
21
+ "shap_e",
22
+ "ShapERenderer"
23
+ ]
24
+ }
prior/config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "PriorTransformer",
3
+ "_diffusers_version": "0.18.0.dev0",
4
+ "added_emb_type": null,
5
+ "additional_embeddings": 0,
6
+ "attention_head_dim": 128,
7
+ "clip_embed_dim": 2048,
8
+ "dropout": 0.0,
9
+ "embedding_dim": 1024,
10
+ "embedding_proj_dim": 1024,
11
+ "embedding_proj_norm_type": "layer",
12
+ "encoder_hid_proj_type": null,
13
+ "norm_in_type": "layer",
14
+ "num_attention_heads": 8,
15
+ "num_embeddings": 1024,
16
+ "num_layers": 24,
17
+ "time_embed_act_fn": "gelu",
18
+ "time_embed_dim": 4096
19
+ }
prior/diffusion_pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d293731644d9c6de6e7bd22bb1db5a52cb7b0f35ca452cbdbb8cf1bc727316e
3
+ size 1263994731
renderer/config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "ShapERenderer",
3
+ "_diffusers_version": "0.18.0.dev0",
4
+ "act_fn": "swish",
5
+ "d_hidden": 256,
6
+ "d_latent": 1024,
7
+ "insert_direction_at": 4,
8
+ "n_hidden_layers": 6,
9
+ "n_output": 12,
10
+ "param_names": [
11
+ "nerstf.mlp.0.weight",
12
+ "nerstf.mlp.1.weight",
13
+ "nerstf.mlp.2.weight",
14
+ "nerstf.mlp.3.weight"
15
+ ],
16
+ "param_shapes": [
17
+ [
18
+ 256,
19
+ 93
20
+ ],
21
+ [
22
+ 256,
23
+ 256
24
+ ],
25
+ [
26
+ 256,
27
+ 256
28
+ ],
29
+ [
30
+ 256,
31
+ 256
32
+ ]
33
+ ]
34
+ }
renderer/diffusion_pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b50111f786c3dfca1d14cb1536a761cbc6826923a1f0021a19e156df5e171ee
3
+ size 905200536
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "HeunDiscreteScheduler",
3
+ "_diffusers_version": "0.17.0.dev0",
4
+ "beta_schedule": "exp",
5
+ "trained_betas": null,
6
+ "num_train_timesteps": 1024,
7
+ "clip_sample": true,
8
+ "clip_sample_range": 1.0,
9
+ "prediction_type": "sample",
10
+ "use_karras_sigmas": true,
11
+ }