Upload 13 files
Browse files
This model was designed as a general-purpose fine-tune of SD1.5 on high-quality photographs and traditional artworks, upscaled and denoised before training to get the sharpest, cleanest results possible.
It's trained at 576 resolution using the offset noise fix, so generations are sharp and detailed with vibrant colors, deep blacks, and well-balanced contrast.
This model was not trained with A.I.-generated images or merged with any other models, which means your images won't have that green/aqua color cast seen in so many models today.
The largest portion of the dataset consists of photographs of women, men, gorgeous landscapes, and luxurious home/cabin/hotel interiors, some abandoned buildings and cityscapes, followed by a few unique art styles that can most easily be discovered by prompting with the commonly used words below.
Some tips for realistic images:
Don't use the word "realistic"
Part of the dataset contains "realistic porcelain dolls", and the model will likely reference those dolls to a degree when prompted with that word. I tend to avoid the word anyway, because "realistic" is usually used to describe high-quality paintings, CGI, or other classically non-realistic art forms, and when I want realism I'm trying to reference photographs. But do whatever works for you; there's plenty of latent space to explore and I'm no expert. It shouldn't be an issue, but if your faces look a bit smoother than you like, try throwing the word "doll" in the negative prompt.
This model is great at both highly detailed realism and stylized images, so keep these two words in mind when generating.
A few common words found in the training dataset include:
Papercut
Liquid Splash
Realistic Porcelain Doll
Interior
Landscape
...and a few others for you to discover.
If you're so inclined to leave a tip, I'm happy to accept Monero at this address:
82s3fk8bQB2DHJ3r9idZUsST1Dvf5cKKC6Fu87rYgV9dAFbCbAcXMPXaP59yDwWzRXfYfTBszHZno6xGwDb17xUzEkCsAah
Thanks for checking out my work and enjoy!
- FeverDream_VAE-BakedIn.safetensors +3 -0
- INPAINT-FeverDream_VAE-BakedIn.inpainting.safetensors +3 -0
- model_index.json +33 -0
- scheduler/scheduler_config.json +16 -0
- text_encoder/config.json +25 -0
- text_encoder/pytorch_model.bin +3 -0
- tokenizer/merges.txt +0 -0
- tokenizer/special_tokens_map.json +24 -0
- tokenizer/tokenizer_config.json +35 -0
- tokenizer/vocab.json +0 -0
- unet/config.json +51 -0
- vae/config.json +31 -0
- vae/diffusion_pytorch_model.bin +3 -0
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:830772ed8e335f8a00633362a32279c03683d90099cfeaed3ca063b884a9c1d3
|
3 |
+
size 2132625468
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2216b8cf6d4a308ffe85d88fd3a6977a60c2dffb60447b51a6268d338ccc91c4
|
3 |
+
size 2132703886
|
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "StableDiffusionPipeline",
|
3 |
+
"_diffusers_version": "0.13.0",
|
4 |
+
"feature_extractor": [
|
5 |
+
null,
|
6 |
+
null
|
7 |
+
],
|
8 |
+
"requires_safety_checker": null,
|
9 |
+
"safety_checker": [
|
10 |
+
null,
|
11 |
+
null
|
12 |
+
],
|
13 |
+
"scheduler": [
|
14 |
+
"diffusers",
|
15 |
+
"DDPMScheduler"
|
16 |
+
],
|
17 |
+
"text_encoder": [
|
18 |
+
"transformers",
|
19 |
+
"CLIPTextModel"
|
20 |
+
],
|
21 |
+
"tokenizer": [
|
22 |
+
"transformers",
|
23 |
+
"CLIPTokenizer"
|
24 |
+
],
|
25 |
+
"unet": [
|
26 |
+
"diffusers",
|
27 |
+
"UNet2DConditionModel"
|
28 |
+
],
|
29 |
+
"vae": [
|
30 |
+
"diffusers",
|
31 |
+
"AutoencoderKL"
|
32 |
+
]
|
33 |
+
}
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "DDPMScheduler",
|
3 |
+
"_diffusers_version": "0.13.0",
|
4 |
+
"beta_end": 0.012,
|
5 |
+
"beta_schedule": "scaled_linear",
|
6 |
+
"beta_start": 0.00085,
|
7 |
+
"clip_sample": false,
|
8 |
+
"clip_sample_range": 1.0,
|
9 |
+
"num_train_timesteps": 1000,
|
10 |
+
"prediction_type": "epsilon",
|
11 |
+
"set_alpha_to_one": false,
|
12 |
+
"skip_prk_steps": true,
|
13 |
+
"steps_offset": 1,
|
14 |
+
"trained_betas": null,
|
15 |
+
"variance_type": "fixed_small"
|
16 |
+
}
|
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/root/.cache/huggingface/diffusers/models--panopstor--EveryDream/snapshots/0feeaee608654bc71a572dfefa9b83f3b74b204d/text_encoder",
|
3 |
+
"architectures": [
|
4 |
+
"CLIPTextModel"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 0,
|
8 |
+
"dropout": 0.0,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "quick_gelu",
|
11 |
+
"hidden_size": 768,
|
12 |
+
"initializer_factor": 1.0,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 3072,
|
15 |
+
"layer_norm_eps": 1e-05,
|
16 |
+
"max_position_embeddings": 77,
|
17 |
+
"model_type": "clip_text_model",
|
18 |
+
"num_attention_heads": 12,
|
19 |
+
"num_hidden_layers": 12,
|
20 |
+
"pad_token_id": 1,
|
21 |
+
"projection_dim": 768,
|
22 |
+
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.25.1",
|
24 |
+
"vocab_size": 49408
|
25 |
+
}
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4bd3110d527d57076a7a914f0d84ed873b389223f359965616247243d04f06d
|
3 |
+
size 492309793
|
The diff for this file is too large to render.
See raw diff
|
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<|startoftext|>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": true,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "<|endoftext|>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"pad_token": "<|endoftext|>",
|
17 |
+
"unk_token": {
|
18 |
+
"content": "<|endoftext|>",
|
19 |
+
"lstrip": false,
|
20 |
+
"normalized": true,
|
21 |
+
"rstrip": false,
|
22 |
+
"single_word": false
|
23 |
+
}
|
24 |
+
}
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_prefix_space": false,
|
3 |
+
"bos_token": {
|
4 |
+
"__type": "AddedToken",
|
5 |
+
"content": "<|startoftext|>",
|
6 |
+
"lstrip": false,
|
7 |
+
"normalized": true,
|
8 |
+
"rstrip": false,
|
9 |
+
"single_word": false
|
10 |
+
},
|
11 |
+
"do_lower_case": true,
|
12 |
+
"eos_token": {
|
13 |
+
"__type": "AddedToken",
|
14 |
+
"content": "<|endoftext|>",
|
15 |
+
"lstrip": false,
|
16 |
+
"normalized": true,
|
17 |
+
"rstrip": false,
|
18 |
+
"single_word": false
|
19 |
+
},
|
20 |
+
"errors": "replace",
|
21 |
+
"model_max_length": 77,
|
22 |
+
"name_or_path": "/root/.cache/huggingface/diffusers/models--panopstor--EveryDream/snapshots/0feeaee608654bc71a572dfefa9b83f3b74b204d",
|
23 |
+
"pad_token": "<|endoftext|>",
|
24 |
+
"special_tokens_map_file": "./special_tokens_map.json",
|
25 |
+
"tokenizer_class": "CLIPTokenizer",
|
26 |
+
"unk_token": {
|
27 |
+
"__type": "AddedToken",
|
28 |
+
"content": "<|endoftext|>",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": true,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false
|
33 |
+
},
|
34 |
+
"use_fast": false
|
35 |
+
}
|
The diff for this file is too large to render.
See raw diff
|
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.13.0",
|
4 |
+
"_name_or_path": "/root/.cache/huggingface/diffusers/models--panopstor--EveryDream/snapshots/0feeaee608654bc71a572dfefa9b83f3b74b204d/unet",
|
5 |
+
"act_fn": "silu",
|
6 |
+
"attention_head_dim": 8,
|
7 |
+
"block_out_channels": [
|
8 |
+
320,
|
9 |
+
640,
|
10 |
+
1280,
|
11 |
+
1280
|
12 |
+
],
|
13 |
+
"center_input_sample": false,
|
14 |
+
"class_embed_type": null,
|
15 |
+
"conv_in_kernel": 3,
|
16 |
+
"conv_out_kernel": 3,
|
17 |
+
"cross_attention_dim": 768,
|
18 |
+
"down_block_types": [
|
19 |
+
"CrossAttnDownBlock2D",
|
20 |
+
"CrossAttnDownBlock2D",
|
21 |
+
"CrossAttnDownBlock2D",
|
22 |
+
"DownBlock2D"
|
23 |
+
],
|
24 |
+
"downsample_padding": 1,
|
25 |
+
"dual_cross_attention": false,
|
26 |
+
"flip_sin_to_cos": true,
|
27 |
+
"freq_shift": 0,
|
28 |
+
"in_channels": 4,
|
29 |
+
"layers_per_block": 2,
|
30 |
+
"mid_block_scale_factor": 1,
|
31 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
32 |
+
"norm_eps": 1e-05,
|
33 |
+
"norm_num_groups": 32,
|
34 |
+
"num_class_embeds": null,
|
35 |
+
"only_cross_attention": false,
|
36 |
+
"out_channels": 4,
|
37 |
+
"projection_class_embeddings_input_dim": null,
|
38 |
+
"resnet_time_scale_shift": "default",
|
39 |
+
"sample_size": 64,
|
40 |
+
"time_cond_proj_dim": null,
|
41 |
+
"time_embedding_type": "positional",
|
42 |
+
"timestep_post_act": null,
|
43 |
+
"up_block_types": [
|
44 |
+
"UpBlock2D",
|
45 |
+
"CrossAttnUpBlock2D",
|
46 |
+
"CrossAttnUpBlock2D",
|
47 |
+
"CrossAttnUpBlock2D"
|
48 |
+
],
|
49 |
+
"upcast_attention": false,
|
50 |
+
"use_linear_projection": false
|
51 |
+
}
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "AutoencoderKL",
|
3 |
+
"_diffusers_version": "0.13.0",
|
4 |
+
"_name_or_path": "/root/.cache/huggingface/diffusers/models--panopstor--EveryDream/snapshots/0feeaee608654bc71a572dfefa9b83f3b74b204d/vae",
|
5 |
+
"act_fn": "silu",
|
6 |
+
"block_out_channels": [
|
7 |
+
128,
|
8 |
+
256,
|
9 |
+
512,
|
10 |
+
512
|
11 |
+
],
|
12 |
+
"down_block_types": [
|
13 |
+
"DownEncoderBlock2D",
|
14 |
+
"DownEncoderBlock2D",
|
15 |
+
"DownEncoderBlock2D",
|
16 |
+
"DownEncoderBlock2D"
|
17 |
+
],
|
18 |
+
"in_channels": 3,
|
19 |
+
"latent_channels": 4,
|
20 |
+
"layers_per_block": 2,
|
21 |
+
"norm_num_groups": 32,
|
22 |
+
"out_channels": 3,
|
23 |
+
"sample_size": 512,
|
24 |
+
"scaling_factor": 0.18215,
|
25 |
+
"up_block_types": [
|
26 |
+
"UpDecoderBlock2D",
|
27 |
+
"UpDecoderBlock2D",
|
28 |
+
"UpDecoderBlock2D",
|
29 |
+
"UpDecoderBlock2D"
|
30 |
+
]
|
31 |
+
}
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11bc15ceb385823b4adb68bd5bdd7568d0c706c3de5ea9ebcb0b807092fc9030
|
3 |
+
size 167407601
|