Text-to-Image
Diffusers
Safetensors
Pruna AI
StableDiffusionXLPipeline
johnrachwanpruna committed on
Commit
474ca95
·
verified ·
1 Parent(s): 6fc90f0

Add files using upload-large-folder tool

Browse files
README.md CHANGED
@@ -39,24 +39,25 @@ The compression configuration of the model is stored in the `smash_config.json`
39
  "batcher": null,
40
  "cacher": null,
41
  "compiler": null,
42
- "factorizer": "qkv_diffusers",
43
  "pruner": null,
44
- "quantizer": "torchao",
45
- "torchao_excluded_modules": "none",
46
- "torchao_quant_type": "int4dq",
 
47
  "batch_size": 1,
48
- "device": "mps",
 
49
  "save_fns": [
50
- "save_before_apply",
51
- "save_before_apply"
52
  ],
53
  "load_fns": [
54
- "diffusers"
55
  ],
56
  "reapply_after_load": {
57
- "factorizer": "qkv_diffusers",
58
  "pruner": null,
59
- "quantizer": "torchao",
60
  "cacher": null,
61
  "compiler": null,
62
  "batcher": null
@@ -70,4 +71,4 @@ The compression configuration of the model is stored in the `smash_config.json`
70
  [![GitHub](https://img.shields.io/github/followers/PrunaAI?label=Follow%20%40PrunaAI&style=social)](https://github.com/PrunaAI)
71
  [![LinkedIn](https://img.shields.io/badge/LinkedIn-Connect-blue)](https://www.linkedin.com/company/93832878/admin/feed/posts/?feedType=following)
72
  [![Discord](https://img.shields.io/badge/Discord-Join%20Us-blue?style=social&logo=discord)](https://discord.com/invite/rskEr4BZJx)
73
- [![Reddit](https://img.shields.io/reddit/subreddit-subscribers/PrunaAI?style=social)](https://www.reddit.com/r/PrunaAI/)
 
39
  "batcher": null,
40
  "cacher": null,
41
  "compiler": null,
42
+ "factorizer": null,
43
  "pruner": null,
44
+ "quantizer": "hqq_diffusers",
45
+ "hqq_diffusers_backend": "torchao_int4",
46
+ "hqq_diffusers_group_size": 64,
47
+ "hqq_diffusers_weight_bits": 8,
48
  "batch_size": 1,
49
+ "device": "cuda",
50
+ "device_map": null,
51
  "save_fns": [
52
+ "hqq_diffusers"
 
53
  ],
54
  "load_fns": [
55
+ "hqq_diffusers"
56
  ],
57
  "reapply_after_load": {
58
+ "factorizer": null,
59
  "pruner": null,
60
+ "quantizer": null,
61
  "cacher": null,
62
  "compiler": null,
63
  "batcher": null
 
71
  [![GitHub](https://img.shields.io/github/followers/PrunaAI?label=Follow%20%40PrunaAI&style=social)](https://github.com/PrunaAI)
72
  [![LinkedIn](https://img.shields.io/badge/LinkedIn-Connect-blue)](https://www.linkedin.com/company/93832878/admin/feed/posts/?feedType=following)
73
  [![Discord](https://img.shields.io/badge/Discord-Join%20Us-blue?style=social&logo=discord)](https://discord.com/invite/rskEr4BZJx)
74
+ [![Reddit](https://img.shields.io/reddit/subreddit-subscribers/PrunaAI?style=social)](https://www.reddit.com/r/PrunaAI/)
backbone_quantized/config.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.34.0",
4
+ "_name_or_path": "/root/.cache/huggingface/hub/models--segmind--Segmind-Vega/snapshots/7714c4363e5856ff974a4f4b068e8691f26d0b40/unet",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": "text_time",
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": 256,
9
+ "attention_head_dim": [
10
+ 5,
11
+ 10,
12
+ 20
13
+ ],
14
+ "attention_type": "default",
15
+ "block_out_channels": [
16
+ 320,
17
+ 640,
18
+ 1280
19
+ ],
20
+ "center_input_sample": false,
21
+ "class_embed_type": null,
22
+ "class_embeddings_concat": false,
23
+ "conv_in_kernel": 3,
24
+ "conv_out_kernel": 3,
25
+ "cross_attention_dim": 2048,
26
+ "cross_attention_norm": null,
27
+ "down_block_types": [
28
+ "DownBlock2D",
29
+ "CrossAttnDownBlock2D",
30
+ "CrossAttnDownBlock2D"
31
+ ],
32
+ "downsample_padding": 1,
33
+ "dropout": 0.0,
34
+ "dual_cross_attention": false,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
+ "flip_sin_to_cos": true,
38
+ "freq_shift": 0,
39
+ "in_channels": 4,
40
+ "layers_per_block": 2,
41
+ "mid_block_only_cross_attention": null,
42
+ "mid_block_scale_factor": 1,
43
+ "mid_block_type": "UNetMidBlock2D",
44
+ "norm_eps": 1e-05,
45
+ "norm_num_groups": 32,
46
+ "num_attention_heads": null,
47
+ "num_class_embeds": null,
48
+ "only_cross_attention": false,
49
+ "out_channels": 4,
50
+ "projection_class_embeddings_input_dim": 2816,
51
+ "resnet_out_scale_factor": 1.0,
52
+ "resnet_skip_time_act": false,
53
+ "resnet_time_scale_shift": "default",
54
+ "reverse_transformer_layers_per_block": null,
55
+ "sample_size": 128,
56
+ "time_cond_proj_dim": null,
57
+ "time_embedding_act_fn": null,
58
+ "time_embedding_dim": null,
59
+ "time_embedding_type": "positional",
60
+ "timestep_post_act": null,
61
+ "transformer_layers_per_block": [
62
+ 1,
63
+ 1,
64
+ 2
65
+ ],
66
+ "up_block_types": [
67
+ "CrossAttnUpBlock2D",
68
+ "CrossAttnUpBlock2D",
69
+ "UpBlock2D"
70
+ ],
71
+ "upcast_attention": null,
72
+ "use_linear_projection": true
73
+ }
backbone_quantized/qmodel.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b8dff1b6202099d663a8f660d89655fdf2df7d3d724bc0e4bbbd2cab1a6291b
3
+ size 1713166505
model_index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_class_name": "StableDiffusionXLPipeline",
3
- "_diffusers_version": "0.33.1",
4
  "_name_or_path": "segmind/Segmind-Vega",
5
  "feature_extractor": [
6
  null,
@@ -32,8 +32,8 @@
32
  "CLIPTokenizer"
33
  ],
34
  "unet": [
35
- "diffusers",
36
- "UNet2DConditionModel"
37
  ],
38
  "vae": [
39
  "diffusers",
 
1
  {
2
  "_class_name": "StableDiffusionXLPipeline",
3
+ "_diffusers_version": "0.34.0",
4
  "_name_or_path": "segmind/Segmind-Vega",
5
  "feature_extractor": [
6
  null,
 
32
  "CLIPTokenizer"
33
  ],
34
  "unet": [
35
+ null,
36
+ null
37
  ],
38
  "vae": [
39
  "diffusers",
scheduler/scheduler_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_class_name": "EulerDiscreteScheduler",
3
- "_diffusers_version": "0.33.1",
4
  "beta_end": 0.012,
5
  "beta_schedule": "scaled_linear",
6
  "beta_start": 0.00085,
 
1
  {
2
  "_class_name": "EulerDiscreteScheduler",
3
+ "_diffusers_version": "0.34.0",
4
  "beta_end": 0.012,
5
  "beta_schedule": "scaled_linear",
6
  "beta_start": 0.00085,
smash_config.json CHANGED
@@ -2,24 +2,25 @@
2
  "batcher": null,
3
  "cacher": null,
4
  "compiler": null,
5
- "factorizer": "qkv_diffusers",
6
  "pruner": null,
7
- "quantizer": "torchao",
8
- "torchao_excluded_modules": "none",
9
- "torchao_quant_type": "int4dq",
 
10
  "batch_size": 1,
11
- "device": "mps",
 
12
  "save_fns": [
13
- "save_before_apply",
14
- "save_before_apply"
15
  ],
16
  "load_fns": [
17
- "diffusers"
18
  ],
19
  "reapply_after_load": {
20
- "factorizer": "qkv_diffusers",
21
  "pruner": null,
22
- "quantizer": "torchao",
23
  "cacher": null,
24
  "compiler": null,
25
  "batcher": null
 
2
  "batcher": null,
3
  "cacher": null,
4
  "compiler": null,
5
+ "factorizer": null,
6
  "pruner": null,
7
+ "quantizer": "hqq_diffusers",
8
+ "hqq_diffusers_backend": "torchao_int4",
9
+ "hqq_diffusers_group_size": 64,
10
+ "hqq_diffusers_weight_bits": 8,
11
  "batch_size": 1,
12
+ "device": "cuda",
13
+ "device_map": null,
14
  "save_fns": [
15
+ "hqq_diffusers"
 
16
  ],
17
  "load_fns": [
18
+ "hqq_diffusers"
19
  ],
20
  "reapply_after_load": {
21
+ "factorizer": null,
22
  "pruner": null,
23
+ "quantizer": null,
24
  "cacher": null,
25
  "compiler": null,
26
  "batcher": null
text_encoder/config.json CHANGED
@@ -18,7 +18,7 @@
18
  "num_hidden_layers": 12,
19
  "pad_token_id": 1,
20
  "projection_dim": 768,
21
- "torch_dtype": "bfloat16",
22
- "transformers_version": "4.52.4",
23
  "vocab_size": 49408
24
  }
 
18
  "num_hidden_layers": 12,
19
  "pad_token_id": 1,
20
  "projection_dim": 768,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.53.2",
23
  "vocab_size": 49408
24
  }
text_encoder/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4921a685a94dc5c57f74a4bf157481bfb18d375e16ada3ca93cac8c5b5a1402d
3
- size 246144352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92b998a9a64549bfa05c019bde114be6681549a0c79caee903fe30c9444d08b9
3
+ size 492265168
text_encoder_2/config.json CHANGED
@@ -18,7 +18,7 @@
18
  "num_hidden_layers": 32,
19
  "pad_token_id": 1,
20
  "projection_dim": 1280,
21
- "torch_dtype": "bfloat16",
22
- "transformers_version": "4.52.4",
23
  "vocab_size": 49408
24
  }
 
18
  "num_hidden_layers": 32,
19
  "pad_token_id": 1,
20
  "projection_dim": 1280,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.53.2",
23
  "vocab_size": 49408
24
  }
text_encoder_2/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64224adda1a700e7327fd781bd28e888604fd63bfff71fe70e46da89efe34702
3
- size 1389382688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:943a2924ee888295a156dd47089d67181d633b782337890af11ef4b15af17ec5
3
+ size 2778702264
vae/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "AutoencoderKL",
3
- "_diffusers_version": "0.33.1",
4
- "_name_or_path": "/Users/davidberenstein/.cache/huggingface/hub/models--segmind--Segmind-Vega/snapshots/7714c4363e5856ff974a4f4b068e8691f26d0b40/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
 
1
  {
2
  "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.34.0",
4
+ "_name_or_path": "/root/.cache/huggingface/hub/models--segmind--Segmind-Vega/snapshots/7714c4363e5856ff974a4f4b068e8691f26d0b40/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
vae/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2741af7e84fe3b0a7aee02f89fa34c0858ed55f5782aab5931b94938983652da
3
- size 167335590
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1598f3d24932bcfe6634e8b618ea1e30ab1d57f5aad13a6d2de446d2199f2341
3
+ size 334643268