Cvespaz commited on
Commit
20ae2bd
·
verified ·
1 Parent(s): d902f1b

Upload 18 files

Browse files
README.md ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ license: cc-by-nc-nd-4.0
5
+ library_name: diffusers
6
+ tags:
7
+ - art
8
+ - people
9
+ - diffusion
10
+ - Cinematic
11
+ - Photography
12
+ - Landscape
13
+ - Interior
14
+ - Food
15
+ - Car
16
+ - Wildlife
17
+ - Architecture
18
+ thumbnail: >-
19
+ https://storage.googleapis.com/run-diffusion-public-assets/juggernaut-xi/juggernaut-collage-256.webp
20
+ base_model: stabilityai/stable-diffusion-xl-base-1.0
21
+ pipeline_tag: text-to-image
22
+ ---
23
+
24
+ # Juggernaut XI v11 by RunDiffusion (Official)
25
+
26
+ 🎉 Juggernaut XI is Coming! 🌍
27
+ The next version of Juggernaut is on the horizon. Follow our social media accounts to be notified when we launch.
28
+
29
+ Juggernaut XI is available now on [RunDiffusion.com](http://rundiffusion.com/?utm_source=huggingface&utm_medium=referral&utm_campaign=juggernautv11) and through an API on Octo.AI
30
+
31
+ https://x.com/RunDiffusion & https://x.com/Juggernaut_AI
32
+
33
+ **Terms and Conditions:**
34
+ By providing your name and email, you consent to not use this model behind APIs or generative services or on a competing platform or service to RunDiffusion.com.
35
+ Commercial licences can be obtained by emailing juggernaut@rundiffusion.com. You also agree to receive communications from RunDiffusion, including information on model releases, platform updates, and news from RunDiffusion.
36
+ RunDiffusion values your privacy and will not misuse your information. We are committed to avoiding irrelevant or unsolicited messages.
37
+
38
+ ![juggernaut XI photo previews](https://storage.googleapis.com/run-diffusion-public-assets/juggernaut-xi/juggernaut-collage-832.webp)
39
+ ![RunDiffusion Logo](https://imagedelivery.net/siANnpeNAc_S2q1M3-eDrA/ca2b388d-a835-490c-dec0-e764bee8d000/micro)
40
+ This model is not permitted to be used behind API services. Please contact [juggernaut@rundiffusion.com](mailto:juggernaut@rundiffusion.com) for business inquiries, commercial licensing, custom models, and consultation.
41
+
42
+ Over two months have passed and we are thrilled to announce the next version of Juggernaut!
43
+
44
+ - Amazing prompt adherence ✅
45
+ - Massively improved aesthetics
46
+ - Better hands, eyes, faces, and composition
47
+ - Fully trained from the ground up using the GPT4 Vision Captioning tool by LEOSAM 🛠️
48
+ - Expanded and cleaner dataset with higher quality images 🖼️
49
+ - Improved classifications of shots (Full Body, Midshots, Portraits, etc) 📸
50
+ - Enhanced text generation capability 📝
51
+ - Two different prompting techniques, Natural and Tagging style 🏷️
52
+ - Enhanced by RunDiffusion Photo for refinement of details 🧐
53
+
54
+ Read more about this version here https://rundiffusion.com/juggernaut-xi
55
+
56
+ Use this now exclusively through Fooocus on RunDiffusion.com
57
+ - Launch Fooocus on RunDiffusion
58
+ - Find Juggernaut_XI_byRunDiffusion.safetensors and start generating!
59
+
60
+ Prompting Guide 📘
61
+ Because everything has been trained from the ground up, prompting is a bit different. (Simpler, don't worry) @Kandoo has created a guide to help you seamlessly integrate this powerful model into your workflow, enabling you to leverage its advanced capabilities without feeling overwhelmed. Download it here: https://rundiffusion.com/juggernaut-xl#nav
62
+
63
+ As always, we love our community and feel so lucky to be in this position to bring these awesome tools and models to you amazing diffusers. Thanks for supporting us since our first day back in 2022. Going on TWO YEARS since we first started using generative AI. Time flies when you're having fun. Wow!
64
+
65
+ Don't forget to follow us on Twitter where we have way more updates on big things we're working on. The future is bright.
66
+
67
+ https://x.com/RunDiffusion
68
+
69
+ -RunDiffusion Team
70
+
71
+ ![https://rundiffusion.com?utm_source=huggingface&utm_medium=referral&utm_campaign=juggernautv11](https://i.imgur.com/fKPEqSu.jpg)
model_index.json CHANGED
@@ -1,42 +1,41 @@
1
- {
2
- "_class_name": "StableDiffusionXLPipeline",
3
- "_diffusers_version": "0.32.2",
4
- "_name_or_path": "RunDiffusion/Juggernaut-XI-v11",
5
- "feature_extractor": [
6
- null,
7
- null
8
- ],
9
- "force_zeros_for_empty_prompt": true,
10
- "image_encoder": [
11
- null,
12
- null
13
- ],
14
- "scheduler": [
15
- "diffusers",
16
- "EulerDiscreteScheduler"
17
- ],
18
- "text_encoder": [
19
- "transformers",
20
- "CLIPTextModel"
21
- ],
22
- "text_encoder_2": [
23
- "transformers",
24
- "CLIPTextModelWithProjection"
25
- ],
26
- "tokenizer": [
27
- "transformers",
28
- "CLIPTokenizer"
29
- ],
30
- "tokenizer_2": [
31
- "transformers",
32
- "CLIPTokenizer"
33
- ],
34
- "unet": [
35
- "diffusers",
36
- "UNet2DConditionModel"
37
- ],
38
- "vae": [
39
- "diffusers",
40
- "AutoencoderKL"
41
- ]
42
- }
 
1
+ {
2
+ "_class_name": "StableDiffusionXLPipeline",
3
+ "_diffusers_version": "0.26.3",
4
+ "feature_extractor": [
5
+ null,
6
+ null
7
+ ],
8
+ "force_zeros_for_empty_prompt": true,
9
+ "image_encoder": [
10
+ null,
11
+ null
12
+ ],
13
+ "scheduler": [
14
+ "diffusers",
15
+ "EulerDiscreteScheduler"
16
+ ],
17
+ "text_encoder": [
18
+ "transformers",
19
+ "CLIPTextModel"
20
+ ],
21
+ "text_encoder_2": [
22
+ "transformers",
23
+ "CLIPTextModelWithProjection"
24
+ ],
25
+ "tokenizer": [
26
+ "transformers",
27
+ "CLIPTokenizer"
28
+ ],
29
+ "tokenizer_2": [
30
+ "transformers",
31
+ "CLIPTokenizer"
32
+ ],
33
+ "unet": [
34
+ "diffusers",
35
+ "UNet2DConditionModel"
36
+ ],
37
+ "vae": [
38
+ "diffusers",
39
+ "AutoencoderKL"
40
+ ]
41
+ }
 
scheduler/scheduler_config.json CHANGED
@@ -1,24 +1,21 @@
1
- {
2
- "_class_name": "EulerDiscreteScheduler",
3
- "_diffusers_version": "0.32.2",
4
- "beta_end": 0.012,
5
- "beta_schedule": "scaled_linear",
6
- "beta_start": 0.00085,
7
- "final_sigmas_type": "zero",
8
- "interpolation_type": "linear",
9
- "num_train_timesteps": 1000,
10
- "prediction_type": "epsilon",
11
- "rescale_betas_zero_snr": false,
12
- "sample_max_value": 1.0,
13
- "set_alpha_to_one": false,
14
- "sigma_max": null,
15
- "sigma_min": null,
16
- "skip_prk_steps": true,
17
- "steps_offset": 1,
18
- "timestep_spacing": "leading",
19
- "timestep_type": "discrete",
20
- "trained_betas": null,
21
- "use_beta_sigmas": false,
22
- "use_exponential_sigmas": false,
23
- "use_karras_sigmas": false
24
- }
 
1
+ {
2
+ "_class_name": "EulerDiscreteScheduler",
3
+ "_diffusers_version": "0.26.3",
4
+ "beta_end": 0.012,
5
+ "beta_schedule": "scaled_linear",
6
+ "beta_start": 0.00085,
7
+ "interpolation_type": "linear",
8
+ "num_train_timesteps": 1000,
9
+ "prediction_type": "epsilon",
10
+ "rescale_betas_zero_snr": false,
11
+ "sample_max_value": 1.0,
12
+ "set_alpha_to_one": false,
13
+ "sigma_max": null,
14
+ "sigma_min": null,
15
+ "skip_prk_steps": true,
16
+ "steps_offset": 1,
17
+ "timestep_spacing": "leading",
18
+ "timestep_type": "discrete",
19
+ "trained_betas": null,
20
+ "use_karras_sigmas": false
21
+ }
 
 
 
text_encoder/config.json CHANGED
@@ -1,25 +1,24 @@
1
- {
2
- "_name_or_path": "/root/.cache/huggingface/hub/models--RunDiffusion--Juggernaut-XI-v11/snapshots/17a87abb089586ab38591a2309da18e44e2c8917/text_encoder",
3
- "architectures": [
4
- "CLIPTextModel"
5
- ],
6
- "attention_dropout": 0.0,
7
- "bos_token_id": 0,
8
- "dropout": 0.0,
9
- "eos_token_id": 2,
10
- "hidden_act": "quick_gelu",
11
- "hidden_size": 768,
12
- "initializer_factor": 1.0,
13
- "initializer_range": 0.02,
14
- "intermediate_size": 3072,
15
- "layer_norm_eps": 1e-05,
16
- "max_position_embeddings": 77,
17
- "model_type": "clip_text_model",
18
- "num_attention_heads": 12,
19
- "num_hidden_layers": 12,
20
- "pad_token_id": 1,
21
- "projection_dim": 768,
22
- "torch_dtype": "float16",
23
- "transformers_version": "4.48.2",
24
- "vocab_size": 49408
25
- }
 
1
+ {
2
+ "architectures": [
3
+ "CLIPTextModel"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 0,
7
+ "dropout": 0.0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "quick_gelu",
10
+ "hidden_size": 768,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 77,
16
+ "model_type": "clip_text_model",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 1,
20
+ "projection_dim": 768,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.30.2",
23
+ "vocab_size": 49408
24
+ }
 
text_encoder/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d1126c5a4cfdced7ed962724ab0b72601aea66808cd55e12689e3185629f1ce
3
- size 246144152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:205903ff704616a765d9c5f7ad43d94fa5f76a1979c3e07370cbbb31b4e2d119
3
+ size 492307041
text_encoder_2/config.json CHANGED
@@ -1,25 +1,24 @@
1
- {
2
- "_name_or_path": "/root/.cache/huggingface/hub/models--RunDiffusion--Juggernaut-XI-v11/snapshots/17a87abb089586ab38591a2309da18e44e2c8917/text_encoder_2",
3
- "architectures": [
4
- "CLIPTextModelWithProjection"
5
- ],
6
- "attention_dropout": 0.0,
7
- "bos_token_id": 0,
8
- "dropout": 0.0,
9
- "eos_token_id": 2,
10
- "hidden_act": "gelu",
11
- "hidden_size": 1280,
12
- "initializer_factor": 1.0,
13
- "initializer_range": 0.02,
14
- "intermediate_size": 5120,
15
- "layer_norm_eps": 1e-05,
16
- "max_position_embeddings": 77,
17
- "model_type": "clip_text_model",
18
- "num_attention_heads": 20,
19
- "num_hidden_layers": 32,
20
- "pad_token_id": 1,
21
- "projection_dim": 1280,
22
- "torch_dtype": "float16",
23
- "transformers_version": "4.48.2",
24
- "vocab_size": 49408
25
- }
 
1
+ {
2
+ "architectures": [
3
+ "CLIPTextModelWithProjection"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 0,
7
+ "dropout": 0.0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "gelu",
10
+ "hidden_size": 1280,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 5120,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 77,
16
+ "model_type": "clip_text_model",
17
+ "num_attention_heads": 20,
18
+ "num_hidden_layers": 32,
19
+ "pad_token_id": 1,
20
+ "projection_dim": 1280,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.30.2",
23
+ "vocab_size": 49408
24
+ }
 
text_encoder_2/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6fc294c5c672fad7391c20cf8bebf6900cd4687776879723e634da28c6cf7b06
3
- size 1389382176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8789c738d9b7fb569baf95add70c6b7269cdeee67bd0c1056875c0ed43d69355
3
+ size 2778810597
tokenizer/merges.txt CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer/special_tokens_map.json CHANGED
@@ -1,24 +1,24 @@
1
- {
2
- "bos_token": {
3
- "content": "<|startoftext|>",
4
- "lstrip": false,
5
- "normalized": true,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "eos_token": {
10
- "content": "<|endoftext|>",
11
- "lstrip": false,
12
- "normalized": true,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": "<|endoftext|>",
17
- "unk_token": {
18
- "content": "<|endoftext|>",
19
- "lstrip": false,
20
- "normalized": true,
21
- "rstrip": false,
22
- "single_word": false
23
- }
24
- }
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<|endoftext|>",
17
+ "unk_token": {
18
+ "content": "<|endoftext|>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
tokenizer/tokenizer_config.json CHANGED
@@ -1,31 +1,33 @@
1
- {
2
- "add_prefix_space": false,
3
- "added_tokens_decoder": {
4
- "49406": {
5
- "content": "<|startoftext|>",
6
- "lstrip": false,
7
- "normalized": true,
8
- "rstrip": false,
9
- "single_word": false,
10
- "special": true
11
- },
12
- "49407": {
13
- "content": "<|endoftext|>",
14
- "lstrip": false,
15
- "normalized": true,
16
- "rstrip": false,
17
- "single_word": false,
18
- "special": true
19
- }
20
- },
21
- "bos_token": "<|startoftext|>",
22
- "clean_up_tokenization_spaces": true,
23
- "do_lower_case": true,
24
- "eos_token": "<|endoftext|>",
25
- "errors": "replace",
26
- "extra_special_tokens": {},
27
- "model_max_length": 77,
28
- "pad_token": "<|endoftext|>",
29
- "tokenizer_class": "CLIPTokenizer",
30
- "unk_token": "<|endoftext|>"
31
- }
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "bos_token": {
4
+ "__type": "AddedToken",
5
+ "content": "<|startoftext|>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false
10
+ },
11
+ "clean_up_tokenization_spaces": true,
12
+ "do_lower_case": true,
13
+ "eos_token": {
14
+ "__type": "AddedToken",
15
+ "content": "<|endoftext|>",
16
+ "lstrip": false,
17
+ "normalized": true,
18
+ "rstrip": false,
19
+ "single_word": false
20
+ },
21
+ "errors": "replace",
22
+ "model_max_length": 77,
23
+ "pad_token": "<|endoftext|>",
24
+ "tokenizer_class": "CLIPTokenizer",
25
+ "unk_token": {
26
+ "__type": "AddedToken",
27
+ "content": "<|endoftext|>",
28
+ "lstrip": false,
29
+ "normalized": true,
30
+ "rstrip": false,
31
+ "single_word": false
32
+ }
33
+ }
tokenizer/vocab.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_2/merges.txt CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_2/special_tokens_map.json CHANGED
@@ -1,24 +1,24 @@
1
- {
2
- "bos_token": {
3
- "content": "<|startoftext|>",
4
- "lstrip": false,
5
- "normalized": true,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "eos_token": {
10
- "content": "<|endoftext|>",
11
- "lstrip": false,
12
- "normalized": true,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": "!",
17
- "unk_token": {
18
- "content": "<|endoftext|>",
19
- "lstrip": false,
20
- "normalized": true,
21
- "rstrip": false,
22
- "single_word": false
23
- }
24
- }
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "!",
17
+ "unk_token": {
18
+ "content": "<|endoftext|>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
tokenizer_2/tokenizer_config.json CHANGED
@@ -1,39 +1,33 @@
1
- {
2
- "add_prefix_space": false,
3
- "added_tokens_decoder": {
4
- "0": {
5
- "content": "!",
6
- "lstrip": false,
7
- "normalized": false,
8
- "rstrip": false,
9
- "single_word": false,
10
- "special": true
11
- },
12
- "49406": {
13
- "content": "<|startoftext|>",
14
- "lstrip": false,
15
- "normalized": true,
16
- "rstrip": false,
17
- "single_word": false,
18
- "special": true
19
- },
20
- "49407": {
21
- "content": "<|endoftext|>",
22
- "lstrip": false,
23
- "normalized": true,
24
- "rstrip": false,
25
- "single_word": false,
26
- "special": true
27
- }
28
- },
29
- "bos_token": "<|startoftext|>",
30
- "clean_up_tokenization_spaces": true,
31
- "do_lower_case": true,
32
- "eos_token": "<|endoftext|>",
33
- "errors": "replace",
34
- "extra_special_tokens": {},
35
- "model_max_length": 77,
36
- "pad_token": "!",
37
- "tokenizer_class": "CLIPTokenizer",
38
- "unk_token": "<|endoftext|>"
39
- }
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "bos_token": {
4
+ "__type": "AddedToken",
5
+ "content": "<|startoftext|>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false
10
+ },
11
+ "clean_up_tokenization_spaces": true,
12
+ "do_lower_case": true,
13
+ "eos_token": {
14
+ "__type": "AddedToken",
15
+ "content": "<|endoftext|>",
16
+ "lstrip": false,
17
+ "normalized": true,
18
+ "rstrip": false,
19
+ "single_word": false
20
+ },
21
+ "errors": "replace",
22
+ "model_max_length": 77,
23
+ "pad_token": "!",
24
+ "tokenizer_class": "CLIPTokenizer",
25
+ "unk_token": {
26
+ "__type": "AddedToken",
27
+ "content": "<|endoftext|>",
28
+ "lstrip": false,
29
+ "normalized": true,
30
+ "rstrip": false,
31
+ "single_word": false
32
+ }
33
+ }
 
 
 
 
 
 
tokenizer_2/vocab.json CHANGED
The diff for this file is too large to render. See raw diff
 
unet/config.json CHANGED
@@ -1,73 +1,72 @@
1
- {
2
- "_class_name": "UNet2DConditionModel",
3
- "_diffusers_version": "0.32.2",
4
- "_name_or_path": "/root/.cache/huggingface/hub/models--RunDiffusion--Juggernaut-XI-v11/snapshots/17a87abb089586ab38591a2309da18e44e2c8917/unet",
5
- "act_fn": "silu",
6
- "addition_embed_type": "text_time",
7
- "addition_embed_type_num_heads": 64,
8
- "addition_time_embed_dim": 256,
9
- "attention_head_dim": [
10
- 5,
11
- 10,
12
- 20
13
- ],
14
- "attention_type": "default",
15
- "block_out_channels": [
16
- 320,
17
- 640,
18
- 1280
19
- ],
20
- "center_input_sample": false,
21
- "class_embed_type": null,
22
- "class_embeddings_concat": false,
23
- "conv_in_kernel": 3,
24
- "conv_out_kernel": 3,
25
- "cross_attention_dim": 2048,
26
- "cross_attention_norm": null,
27
- "down_block_types": [
28
- "DownBlock2D",
29
- "CrossAttnDownBlock2D",
30
- "CrossAttnDownBlock2D"
31
- ],
32
- "downsample_padding": 1,
33
- "dropout": 0.0,
34
- "dual_cross_attention": false,
35
- "encoder_hid_dim": null,
36
- "encoder_hid_dim_type": null,
37
- "flip_sin_to_cos": true,
38
- "freq_shift": 0,
39
- "in_channels": 4,
40
- "layers_per_block": 2,
41
- "mid_block_only_cross_attention": null,
42
- "mid_block_scale_factor": 1,
43
- "mid_block_type": "UNetMidBlock2DCrossAttn",
44
- "norm_eps": 1e-05,
45
- "norm_num_groups": 32,
46
- "num_attention_heads": null,
47
- "num_class_embeds": null,
48
- "only_cross_attention": false,
49
- "out_channels": 4,
50
- "projection_class_embeddings_input_dim": 2816,
51
- "resnet_out_scale_factor": 1.0,
52
- "resnet_skip_time_act": false,
53
- "resnet_time_scale_shift": "default",
54
- "reverse_transformer_layers_per_block": null,
55
- "sample_size": 128,
56
- "time_cond_proj_dim": null,
57
- "time_embedding_act_fn": null,
58
- "time_embedding_dim": null,
59
- "time_embedding_type": "positional",
60
- "timestep_post_act": null,
61
- "transformer_layers_per_block": [
62
- 1,
63
- 2,
64
- 10
65
- ],
66
- "up_block_types": [
67
- "CrossAttnUpBlock2D",
68
- "CrossAttnUpBlock2D",
69
- "UpBlock2D"
70
- ],
71
- "upcast_attention": false,
72
- "use_linear_projection": true
73
- }
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.26.3",
4
+ "act_fn": "silu",
5
+ "addition_embed_type": "text_time",
6
+ "addition_embed_type_num_heads": 64,
7
+ "addition_time_embed_dim": 256,
8
+ "attention_head_dim": [
9
+ 5,
10
+ 10,
11
+ 20
12
+ ],
13
+ "attention_type": "default",
14
+ "block_out_channels": [
15
+ 320,
16
+ 640,
17
+ 1280
18
+ ],
19
+ "center_input_sample": false,
20
+ "class_embed_type": null,
21
+ "class_embeddings_concat": false,
22
+ "conv_in_kernel": 3,
23
+ "conv_out_kernel": 3,
24
+ "cross_attention_dim": 2048,
25
+ "cross_attention_norm": null,
26
+ "down_block_types": [
27
+ "DownBlock2D",
28
+ "CrossAttnDownBlock2D",
29
+ "CrossAttnDownBlock2D"
30
+ ],
31
+ "downsample_padding": 1,
32
+ "dropout": 0.0,
33
+ "dual_cross_attention": false,
34
+ "encoder_hid_dim": null,
35
+ "encoder_hid_dim_type": null,
36
+ "flip_sin_to_cos": true,
37
+ "freq_shift": 0,
38
+ "in_channels": 4,
39
+ "layers_per_block": 2,
40
+ "mid_block_only_cross_attention": null,
41
+ "mid_block_scale_factor": 1,
42
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
43
+ "norm_eps": 1e-05,
44
+ "norm_num_groups": 32,
45
+ "num_attention_heads": null,
46
+ "num_class_embeds": null,
47
+ "only_cross_attention": false,
48
+ "out_channels": 4,
49
+ "projection_class_embeddings_input_dim": 2816,
50
+ "resnet_out_scale_factor": 1.0,
51
+ "resnet_skip_time_act": false,
52
+ "resnet_time_scale_shift": "default",
53
+ "reverse_transformer_layers_per_block": null,
54
+ "sample_size": 128,
55
+ "time_cond_proj_dim": null,
56
+ "time_embedding_act_fn": null,
57
+ "time_embedding_dim": null,
58
+ "time_embedding_type": "positional",
59
+ "timestep_post_act": null,
60
+ "transformer_layers_per_block": [
61
+ 1,
62
+ 2,
63
+ 10
64
+ ],
65
+ "up_block_types": [
66
+ "CrossAttnUpBlock2D",
67
+ "CrossAttnUpBlock2D",
68
+ "UpBlock2D"
69
+ ],
70
+ "upcast_attention": false,
71
+ "use_linear_projection": true
72
+ }
 
vae/config.json CHANGED
@@ -1,38 +1,31 @@
1
- {
2
- "_class_name": "AutoencoderKL",
3
- "_diffusers_version": "0.32.2",
4
- "_name_or_path": "/root/.cache/huggingface/hub/models--RunDiffusion--Juggernaut-XI-v11/snapshots/17a87abb089586ab38591a2309da18e44e2c8917/vae",
5
- "act_fn": "silu",
6
- "block_out_channels": [
7
- 128,
8
- 256,
9
- 512,
10
- 512
11
- ],
12
- "down_block_types": [
13
- "DownEncoderBlock2D",
14
- "DownEncoderBlock2D",
15
- "DownEncoderBlock2D",
16
- "DownEncoderBlock2D"
17
- ],
18
- "force_upcast": true,
19
- "in_channels": 3,
20
- "latent_channels": 4,
21
- "latents_mean": null,
22
- "latents_std": null,
23
- "layers_per_block": 2,
24
- "mid_block_add_attention": true,
25
- "norm_num_groups": 32,
26
- "out_channels": 3,
27
- "sample_size": 1024,
28
- "scaling_factor": 0.13025,
29
- "shift_factor": null,
30
- "up_block_types": [
31
- "UpDecoderBlock2D",
32
- "UpDecoderBlock2D",
33
- "UpDecoderBlock2D",
34
- "UpDecoderBlock2D"
35
- ],
36
- "use_post_quant_conv": true,
37
- "use_quant_conv": true
38
- }
 
1
+ {
2
+ "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.26.3",
4
+ "act_fn": "silu",
5
+ "block_out_channels": [
6
+ 128,
7
+ 256,
8
+ 512,
9
+ 512
10
+ ],
11
+ "down_block_types": [
12
+ "DownEncoderBlock2D",
13
+ "DownEncoderBlock2D",
14
+ "DownEncoderBlock2D",
15
+ "DownEncoderBlock2D"
16
+ ],
17
+ "force_upcast": true,
18
+ "in_channels": 3,
19
+ "latent_channels": 4,
20
+ "layers_per_block": 2,
21
+ "norm_num_groups": 32,
22
+ "out_channels": 3,
23
+ "sample_size": 1024,
24
+ "scaling_factor": 0.13025,
25
+ "up_block_types": [
26
+ "UpDecoderBlock2D",
27
+ "UpDecoderBlock2D",
28
+ "UpDecoderBlock2D",
29
+ "UpDecoderBlock2D"
30
+ ]
31
+ }
 
 
 
 
 
 
 
vae/diffusion_pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37eb3e09ae1ce3d6891ddf809ca927b618e501091142cf07fdd9cd170e3a046f
3
+ size 334712113