codeShare committed on
Commit
41c7b55
·
verified ·
1 Parent(s): e545bd6

Upload SDNQ Flux2 Klein fine-tuned transformer

Browse files
model_index.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "Flux2KleinPipeline",
3
  "_diffusers_version": "0.38.0.dev0",
4
- "_name_or_path": "black-forest-labs/FLUX.2-klein-4B",
5
  "is_distilled": true,
6
  "scheduler": [
7
  "diffusers",
 
1
  {
2
  "_class_name": "Flux2KleinPipeline",
3
  "_diffusers_version": "0.38.0.dev0",
4
+ "_name_or_path": "codeShare/FLUX.2-klein-AIO-SDNQ-4bit-dynamic",
5
  "is_distilled": true,
6
  "scheduler": [
7
  "diffusers",
text_encoder/config.json CHANGED
@@ -58,7 +58,7 @@
58
  "num_key_value_heads": 8,
59
  "pad_token_id": null,
60
  "quantization_config": {
61
- "add_skip_keys": true,
62
  "dequantize_fp32": true,
63
  "dynamic_loss_threshold": 0.01,
64
  "group_size": 0,
@@ -463,9 +463,9 @@
463
  "quant_conv": false,
464
  "quant_embedding": false,
465
  "quant_method": "sdnq",
466
- "quantization_device": "cuda",
467
  "quantized_matmul_dtype": null,
468
- "return_device": "cuda",
469
  "sdnq_version": "0.1.7",
470
  "svd_rank": 32,
471
  "svd_steps": 8,
@@ -485,7 +485,7 @@
485
  },
486
  "sliding_window": null,
487
  "tie_word_embeddings": true,
488
- "transformers_version": "5.0.0",
489
  "use_cache": true,
490
  "use_sliding_window": false,
491
  "vocab_size": 151936
 
58
  "num_key_value_heads": 8,
59
  "pad_token_id": null,
60
  "quantization_config": {
61
+ "add_skip_keys": false,
62
  "dequantize_fp32": true,
63
  "dynamic_loss_threshold": 0.01,
64
  "group_size": 0,
 
463
  "quant_conv": false,
464
  "quant_embedding": false,
465
  "quant_method": "sdnq",
466
+ "quantization_device": null,
467
  "quantized_matmul_dtype": null,
468
+ "return_device": null,
469
  "sdnq_version": "0.1.7",
470
  "svd_rank": 32,
471
  "svd_steps": 8,
 
485
  },
486
  "sliding_window": null,
487
  "tie_word_embeddings": true,
488
+ "transformers_version": "5.6.0",
489
  "use_cache": true,
490
  "use_sliding_window": false,
491
  "vocab_size": 151936
text_encoder/generation_config.json CHANGED
@@ -1,13 +1,7 @@
1
  {
 
2
  "bos_token_id": 151643,
3
- "do_sample": true,
4
- "eos_token_id": [
5
- 151645,
6
- 151643
7
- ],
8
- "pad_token_id": 151643,
9
- "temperature": 0.6,
10
- "top_k": 20,
11
- "top_p": 0.95,
12
- "transformers_version": "5.0.0"
13
  }
 
1
  {
2
+ "_from_model_config": true,
3
  "bos_token_id": 151643,
4
+ "eos_token_id": 151645,
5
+ "transformers_version": "5.6.0",
6
+ "use_cache": true
 
 
 
 
 
 
 
7
  }
tokenizer/tokenizer_config.json CHANGED
@@ -21,6 +21,7 @@
21
  "<|video_pad|>"
22
  ],
23
  "is_local": true,
 
24
  "model_max_length": 131072,
25
  "model_specific_special_tokens": {},
26
  "pad_token": "<|endoftext|>",
 
21
  "<|video_pad|>"
22
  ],
23
  "is_local": true,
24
+ "local_files_only": false,
25
  "model_max_length": 131072,
26
  "model_specific_special_tokens": {},
27
  "pad_token": "<|endoftext|>",
transformer/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "Flux2Transformer2DModel",
3
  "_diffusers_version": "0.38.0.dev0",
4
- "_name_or_path": "black-forest-labs/FLUX.2-klein-4B",
5
  "attention_head_dim": 128,
6
  "axes_dims_rope": [
7
  32,
@@ -28,400 +28,120 @@
28
  "is_training": false,
29
  "modules_dtype_dict": {
30
  "int5": [
31
- "transformer_blocks.0.attn.to_k.weight",
32
  "single_transformer_blocks.19.attn.to_qkv_mlp_proj.weight",
33
- "model.layers.2.mlp.down_proj.weight"
34
  ],
35
  "uint4": [
36
- "transformer_blocks.1.attn.add_k_proj.weight",
37
- "single_transformer_blocks.15.attn.to_out.weight",
 
 
 
 
 
 
 
 
 
38
  "single_transformer_blocks.13.attn.to_qkv_mlp_proj.weight",
 
 
 
 
 
39
  "single_transformer_blocks.16.attn.to_qkv_mlp_proj.weight",
40
- "transformer_blocks.4.attn.to_v.weight",
41
- "transformer_blocks.3.attn.to_v.weight",
42
- "single_transformer_blocks.3.attn.to_out.weight",
43
- "transformer_blocks.0.ff_context.linear_out.weight",
44
- "transformer_blocks.1.attn.to_k.weight",
45
- "single_transformer_blocks.9.attn.to_out.weight",
46
- "transformer_blocks.3.attn.to_add_out.weight",
47
- "transformer_blocks.3.ff_context.linear_in.weight",
48
- "transformer_blocks.3.attn.to_out.0.weight",
49
- "transformer_blocks.0.attn.to_out.0.weight",
50
- "transformer_blocks.4.ff.linear_in.weight",
51
- "transformer_blocks.2.ff.linear_out.weight",
52
- "transformer_blocks.1.ff.linear_in.weight",
53
- "transformer_blocks.4.attn.to_q.weight",
54
- "transformer_blocks.3.attn.add_v_proj.weight",
55
- "transformer_blocks.1.ff.linear_out.weight",
56
  "single_transformer_blocks.17.attn.to_qkv_mlp_proj.weight",
57
- "transformer_blocks.4.attn.add_k_proj.weight",
 
 
58
  "single_transformer_blocks.2.attn.to_out.weight",
59
- "transformer_blocks.0.attn.to_v.weight",
60
- "transformer_blocks.4.attn.add_q_proj.weight",
61
- "transformer_blocks.0.attn.add_q_proj.weight",
62
- "transformer_blocks.0.attn.add_v_proj.weight",
63
- "single_transformer_blocks.7.attn.to_out.weight",
64
- "transformer_blocks.1.attn.to_v.weight",
65
- "transformer_blocks.4.ff.linear_out.weight",
66
- "transformer_blocks.2.attn.to_q.weight",
67
  "single_transformer_blocks.5.attn.to_qkv_mlp_proj.weight",
68
- "transformer_blocks.2.attn.add_q_proj.weight",
69
- "single_transformer_blocks.0.attn.to_out.weight",
70
- "single_transformer_blocks.19.attn.to_out.weight",
71
- "transformer_blocks.4.ff_context.linear_out.weight",
72
- "transformer_blocks.1.ff_context.linear_out.weight",
73
- "transformer_blocks.2.attn.add_v_proj.weight",
74
- "single_transformer_blocks.10.attn.to_qkv_mlp_proj.weight",
75
  "single_transformer_blocks.6.attn.to_qkv_mlp_proj.weight",
76
- "transformer_blocks.4.attn.to_k.weight",
77
- "transformer_blocks.0.ff.linear_out.weight",
78
- "single_transformer_blocks.14.attn.to_qkv_mlp_proj.weight",
79
- "single_transformer_blocks.14.attn.to_out.weight",
80
- "single_transformer_blocks.11.attn.to_qkv_mlp_proj.weight",
81
- "single_transformer_blocks.0.attn.to_qkv_mlp_proj.weight",
82
  "single_transformer_blocks.8.attn.to_qkv_mlp_proj.weight",
 
 
 
 
 
 
 
 
 
 
 
83
  "transformer_blocks.0.ff_context.linear_in.weight",
84
- "single_transformer_blocks.12.attn.to_out.weight",
85
- "transformer_blocks.3.attn.add_q_proj.weight",
86
- "single_transformer_blocks.16.attn.to_out.weight",
87
- "transformer_blocks.3.ff.linear_in.weight",
88
  "transformer_blocks.1.attn.to_add_out.weight",
89
- "transformer_blocks.3.attn.add_k_proj.weight",
90
- "transformer_blocks.0.attn.to_add_out.weight",
91
- "single_transformer_blocks.12.attn.to_qkv_mlp_proj.weight",
92
- "transformer_blocks.2.ff_context.linear_out.weight",
93
- "transformer_blocks.4.attn.to_add_out.weight",
94
- "transformer_blocks.3.ff_context.linear_out.weight",
95
- "transformer_blocks.4.attn.to_out.0.weight",
96
- "single_transformer_blocks.17.attn.to_out.weight",
97
- "single_transformer_blocks.4.attn.to_out.weight",
98
  "transformer_blocks.1.attn.to_out.0.weight",
99
- "single_transformer_blocks.18.attn.to_qkv_mlp_proj.weight",
100
- "transformer_blocks.1.ff_context.linear_in.weight",
101
  "transformer_blocks.1.attn.to_q.weight",
102
- "single_transformer_blocks.9.attn.to_qkv_mlp_proj.weight",
103
- "single_transformer_blocks.1.attn.to_qkv_mlp_proj.weight",
104
- "single_transformer_blocks.7.attn.to_qkv_mlp_proj.weight",
105
- "single_transformer_blocks.18.attn.to_out.weight",
106
- "transformer_blocks.4.attn.add_v_proj.weight",
107
- "single_transformer_blocks.1.attn.to_out.weight",
108
- "transformer_blocks.1.attn.add_q_proj.weight",
109
- "transformer_blocks.2.ff.linear_in.weight",
110
- "transformer_blocks.2.ff_context.linear_in.weight",
111
- "transformer_blocks.3.ff.linear_out.weight",
112
- "single_transformer_blocks.5.attn.to_out.weight",
113
- "single_transformer_blocks.3.attn.to_qkv_mlp_proj.weight",
114
- "transformer_blocks.2.attn.to_v.weight",
115
- "transformer_blocks.0.attn.to_q.weight",
116
- "single_transformer_blocks.4.attn.to_qkv_mlp_proj.weight",
117
- "transformer_blocks.1.attn.add_v_proj.weight",
118
- "single_transformer_blocks.11.attn.to_out.weight",
119
- "transformer_blocks.0.ff.linear_in.weight",
120
- "transformer_blocks.0.attn.add_k_proj.weight",
121
  "transformer_blocks.2.attn.to_k.weight",
122
  "transformer_blocks.2.attn.to_out.0.weight",
123
- "transformer_blocks.2.attn.to_add_out.weight",
 
 
 
 
 
 
 
 
 
124
  "transformer_blocks.3.attn.to_k.weight",
125
- "transformer_blocks.2.attn.add_k_proj.weight",
126
- "single_transformer_blocks.15.attn.to_qkv_mlp_proj.weight",
127
- "single_transformer_blocks.13.attn.to_out.weight",
128
- "single_transformer_blocks.8.attn.to_out.weight",
129
- "single_transformer_blocks.6.attn.to_out.weight",
130
- "transformer_blocks.4.ff_context.linear_in.weight",
131
- "single_transformer_blocks.10.attn.to_out.weight",
132
- "single_transformer_blocks.2.attn.to_qkv_mlp_proj.weight",
133
  "transformer_blocks.3.attn.to_q.weight",
134
- "model.layers.0.mlp.down_proj.weight",
135
- "model.layers.0.mlp.gate_proj.weight",
136
- "model.layers.0.mlp.up_proj.weight",
137
- "model.layers.0.self_attn.k_proj.weight",
138
- "model.layers.0.self_attn.o_proj.weight",
139
- "model.layers.0.self_attn.q_proj.weight",
140
- "model.layers.0.self_attn.v_proj.weight",
141
- "model.layers.1.mlp.down_proj.weight",
142
- "model.layers.1.mlp.gate_proj.weight",
143
- "model.layers.1.mlp.up_proj.weight",
144
- "model.layers.1.self_attn.k_proj.weight",
145
- "model.layers.1.self_attn.o_proj.weight",
146
- "model.layers.1.self_attn.q_proj.weight",
147
- "model.layers.1.self_attn.v_proj.weight",
148
- "model.layers.2.mlp.gate_proj.weight",
149
- "model.layers.2.mlp.up_proj.weight",
150
- "model.layers.2.self_attn.k_proj.weight",
151
- "model.layers.2.self_attn.o_proj.weight",
152
- "model.layers.2.self_attn.q_proj.weight",
153
- "model.layers.2.self_attn.v_proj.weight",
154
- "model.layers.3.mlp.down_proj.weight",
155
- "model.layers.3.mlp.gate_proj.weight",
156
- "model.layers.3.mlp.up_proj.weight",
157
- "model.layers.3.self_attn.k_proj.weight",
158
- "model.layers.3.self_attn.o_proj.weight",
159
- "model.layers.3.self_attn.q_proj.weight",
160
- "model.layers.3.self_attn.v_proj.weight",
161
- "model.layers.4.mlp.down_proj.weight",
162
- "model.layers.4.mlp.gate_proj.weight",
163
- "model.layers.4.mlp.up_proj.weight",
164
- "model.layers.4.self_attn.k_proj.weight",
165
- "model.layers.4.self_attn.o_proj.weight",
166
- "model.layers.4.self_attn.q_proj.weight",
167
- "model.layers.4.self_attn.v_proj.weight",
168
- "model.layers.5.mlp.down_proj.weight",
169
- "model.layers.5.mlp.gate_proj.weight",
170
- "model.layers.5.mlp.up_proj.weight",
171
- "model.layers.5.self_attn.k_proj.weight",
172
- "model.layers.5.self_attn.o_proj.weight",
173
- "model.layers.5.self_attn.q_proj.weight",
174
- "model.layers.5.self_attn.v_proj.weight",
175
- "model.layers.6.mlp.down_proj.weight",
176
- "model.layers.6.mlp.gate_proj.weight",
177
- "model.layers.6.mlp.up_proj.weight",
178
- "model.layers.6.self_attn.k_proj.weight",
179
- "model.layers.6.self_attn.o_proj.weight",
180
- "model.layers.6.self_attn.q_proj.weight",
181
- "model.layers.6.self_attn.v_proj.weight",
182
- "model.layers.7.mlp.down_proj.weight",
183
- "model.layers.7.mlp.gate_proj.weight",
184
- "model.layers.7.mlp.up_proj.weight",
185
- "model.layers.7.self_attn.k_proj.weight",
186
- "model.layers.7.self_attn.o_proj.weight",
187
- "model.layers.7.self_attn.q_proj.weight",
188
- "model.layers.7.self_attn.v_proj.weight",
189
- "model.layers.8.mlp.down_proj.weight",
190
- "model.layers.8.mlp.gate_proj.weight",
191
- "model.layers.8.mlp.up_proj.weight",
192
- "model.layers.8.self_attn.k_proj.weight",
193
- "model.layers.8.self_attn.o_proj.weight",
194
- "model.layers.8.self_attn.q_proj.weight",
195
- "model.layers.8.self_attn.v_proj.weight",
196
- "model.layers.9.mlp.down_proj.weight",
197
- "model.layers.9.mlp.gate_proj.weight",
198
- "model.layers.9.mlp.up_proj.weight",
199
- "model.layers.9.self_attn.k_proj.weight",
200
- "model.layers.9.self_attn.o_proj.weight",
201
- "model.layers.9.self_attn.q_proj.weight",
202
- "model.layers.9.self_attn.v_proj.weight",
203
- "model.layers.10.mlp.down_proj.weight",
204
- "model.layers.10.mlp.gate_proj.weight",
205
- "model.layers.10.mlp.up_proj.weight",
206
- "model.layers.10.self_attn.k_proj.weight",
207
- "model.layers.10.self_attn.o_proj.weight",
208
- "model.layers.10.self_attn.q_proj.weight",
209
- "model.layers.10.self_attn.v_proj.weight",
210
- "model.layers.11.mlp.down_proj.weight",
211
- "model.layers.11.mlp.gate_proj.weight",
212
- "model.layers.11.mlp.up_proj.weight",
213
- "model.layers.11.self_attn.k_proj.weight",
214
- "model.layers.11.self_attn.o_proj.weight",
215
- "model.layers.11.self_attn.q_proj.weight",
216
- "model.layers.11.self_attn.v_proj.weight",
217
- "model.layers.12.mlp.down_proj.weight",
218
- "model.layers.12.mlp.gate_proj.weight",
219
- "model.layers.12.mlp.up_proj.weight",
220
- "model.layers.12.self_attn.k_proj.weight",
221
- "model.layers.12.self_attn.o_proj.weight",
222
- "model.layers.12.self_attn.q_proj.weight",
223
- "model.layers.12.self_attn.v_proj.weight",
224
- "model.layers.13.mlp.down_proj.weight",
225
- "model.layers.13.mlp.gate_proj.weight",
226
- "model.layers.13.mlp.up_proj.weight",
227
- "model.layers.13.self_attn.k_proj.weight",
228
- "model.layers.13.self_attn.o_proj.weight",
229
- "model.layers.13.self_attn.q_proj.weight",
230
- "model.layers.13.self_attn.v_proj.weight",
231
- "model.layers.14.mlp.down_proj.weight",
232
- "model.layers.14.mlp.gate_proj.weight",
233
- "model.layers.14.mlp.up_proj.weight",
234
- "model.layers.14.self_attn.k_proj.weight",
235
- "model.layers.14.self_attn.o_proj.weight",
236
- "model.layers.14.self_attn.q_proj.weight",
237
- "model.layers.14.self_attn.v_proj.weight",
238
- "model.layers.15.mlp.down_proj.weight",
239
- "model.layers.15.mlp.gate_proj.weight",
240
- "model.layers.15.mlp.up_proj.weight",
241
- "model.layers.15.self_attn.k_proj.weight",
242
- "model.layers.15.self_attn.o_proj.weight",
243
- "model.layers.15.self_attn.q_proj.weight",
244
- "model.layers.15.self_attn.v_proj.weight",
245
- "model.layers.16.mlp.down_proj.weight",
246
- "model.layers.16.mlp.gate_proj.weight",
247
- "model.layers.16.mlp.up_proj.weight",
248
- "model.layers.16.self_attn.k_proj.weight",
249
- "model.layers.16.self_attn.o_proj.weight",
250
- "model.layers.16.self_attn.q_proj.weight",
251
- "model.layers.16.self_attn.v_proj.weight",
252
- "model.layers.17.mlp.down_proj.weight",
253
- "model.layers.17.mlp.gate_proj.weight",
254
- "model.layers.17.mlp.up_proj.weight",
255
- "model.layers.17.self_attn.k_proj.weight",
256
- "model.layers.17.self_attn.o_proj.weight",
257
- "model.layers.17.self_attn.q_proj.weight",
258
- "model.layers.17.self_attn.v_proj.weight",
259
- "model.layers.18.mlp.down_proj.weight",
260
- "model.layers.18.mlp.gate_proj.weight",
261
- "model.layers.18.mlp.up_proj.weight",
262
- "model.layers.18.self_attn.k_proj.weight",
263
- "model.layers.18.self_attn.o_proj.weight",
264
- "model.layers.18.self_attn.q_proj.weight",
265
- "model.layers.18.self_attn.v_proj.weight",
266
- "model.layers.19.mlp.down_proj.weight",
267
- "model.layers.19.mlp.gate_proj.weight",
268
- "model.layers.19.mlp.up_proj.weight",
269
- "model.layers.19.self_attn.k_proj.weight",
270
- "model.layers.19.self_attn.o_proj.weight",
271
- "model.layers.19.self_attn.q_proj.weight",
272
- "model.layers.19.self_attn.v_proj.weight",
273
- "model.layers.20.mlp.down_proj.weight",
274
- "model.layers.20.mlp.gate_proj.weight",
275
- "model.layers.20.mlp.up_proj.weight",
276
- "model.layers.20.self_attn.k_proj.weight",
277
- "model.layers.20.self_attn.o_proj.weight",
278
- "model.layers.20.self_attn.q_proj.weight",
279
- "model.layers.20.self_attn.v_proj.weight",
280
- "model.layers.21.mlp.down_proj.weight",
281
- "model.layers.21.mlp.gate_proj.weight",
282
- "model.layers.21.mlp.up_proj.weight",
283
- "model.layers.21.self_attn.k_proj.weight",
284
- "model.layers.21.self_attn.o_proj.weight",
285
- "model.layers.21.self_attn.q_proj.weight",
286
- "model.layers.21.self_attn.v_proj.weight",
287
- "model.layers.22.mlp.down_proj.weight",
288
- "model.layers.22.mlp.gate_proj.weight",
289
- "model.layers.22.mlp.up_proj.weight",
290
- "model.layers.22.self_attn.k_proj.weight",
291
- "model.layers.22.self_attn.o_proj.weight",
292
- "model.layers.22.self_attn.q_proj.weight",
293
- "model.layers.22.self_attn.v_proj.weight",
294
- "model.layers.23.mlp.down_proj.weight",
295
- "model.layers.23.mlp.gate_proj.weight",
296
- "model.layers.23.mlp.up_proj.weight",
297
- "model.layers.23.self_attn.k_proj.weight",
298
- "model.layers.23.self_attn.o_proj.weight",
299
- "model.layers.23.self_attn.q_proj.weight",
300
- "model.layers.23.self_attn.v_proj.weight",
301
- "model.layers.24.mlp.down_proj.weight",
302
- "model.layers.24.mlp.gate_proj.weight",
303
- "model.layers.24.mlp.up_proj.weight",
304
- "model.layers.24.self_attn.k_proj.weight",
305
- "model.layers.24.self_attn.o_proj.weight",
306
- "model.layers.24.self_attn.q_proj.weight",
307
- "model.layers.24.self_attn.v_proj.weight",
308
- "model.layers.25.mlp.down_proj.weight",
309
- "model.layers.25.mlp.gate_proj.weight",
310
- "model.layers.25.mlp.up_proj.weight",
311
- "model.layers.25.self_attn.k_proj.weight",
312
- "model.layers.25.self_attn.o_proj.weight",
313
- "model.layers.25.self_attn.q_proj.weight",
314
- "model.layers.25.self_attn.v_proj.weight",
315
- "model.layers.26.mlp.down_proj.weight",
316
- "model.layers.26.mlp.gate_proj.weight",
317
- "model.layers.26.mlp.up_proj.weight",
318
- "model.layers.26.self_attn.k_proj.weight",
319
- "model.layers.26.self_attn.o_proj.weight",
320
- "model.layers.26.self_attn.q_proj.weight",
321
- "model.layers.26.self_attn.v_proj.weight",
322
- "model.layers.27.mlp.down_proj.weight",
323
- "model.layers.27.mlp.gate_proj.weight",
324
- "model.layers.27.mlp.up_proj.weight",
325
- "model.layers.27.self_attn.k_proj.weight",
326
- "model.layers.27.self_attn.o_proj.weight",
327
- "model.layers.27.self_attn.q_proj.weight",
328
- "model.layers.27.self_attn.v_proj.weight",
329
- "model.layers.28.mlp.down_proj.weight",
330
- "model.layers.28.mlp.gate_proj.weight",
331
- "model.layers.28.mlp.up_proj.weight",
332
- "model.layers.28.self_attn.k_proj.weight",
333
- "model.layers.28.self_attn.o_proj.weight",
334
- "model.layers.28.self_attn.q_proj.weight",
335
- "model.layers.28.self_attn.v_proj.weight",
336
- "model.layers.29.mlp.down_proj.weight",
337
- "model.layers.29.mlp.gate_proj.weight",
338
- "model.layers.29.mlp.up_proj.weight",
339
- "model.layers.29.self_attn.k_proj.weight",
340
- "model.layers.29.self_attn.o_proj.weight",
341
- "model.layers.29.self_attn.q_proj.weight",
342
- "model.layers.29.self_attn.v_proj.weight",
343
- "model.layers.30.mlp.down_proj.weight",
344
- "model.layers.30.mlp.gate_proj.weight",
345
- "model.layers.30.mlp.up_proj.weight",
346
- "model.layers.30.self_attn.k_proj.weight",
347
- "model.layers.30.self_attn.o_proj.weight",
348
- "model.layers.30.self_attn.q_proj.weight",
349
- "model.layers.30.self_attn.v_proj.weight",
350
- "model.layers.31.mlp.down_proj.weight",
351
- "model.layers.31.mlp.gate_proj.weight",
352
- "model.layers.31.mlp.up_proj.weight",
353
- "model.layers.31.self_attn.k_proj.weight",
354
- "model.layers.31.self_attn.o_proj.weight",
355
- "model.layers.31.self_attn.q_proj.weight",
356
- "model.layers.31.self_attn.v_proj.weight",
357
- "model.layers.32.mlp.down_proj.weight",
358
- "model.layers.32.mlp.gate_proj.weight",
359
- "model.layers.32.mlp.up_proj.weight",
360
- "model.layers.32.self_attn.k_proj.weight",
361
- "model.layers.32.self_attn.o_proj.weight",
362
- "model.layers.32.self_attn.q_proj.weight",
363
- "model.layers.32.self_attn.v_proj.weight",
364
- "model.layers.33.mlp.down_proj.weight",
365
- "model.layers.33.mlp.gate_proj.weight",
366
- "model.layers.33.mlp.up_proj.weight",
367
- "model.layers.33.self_attn.k_proj.weight",
368
- "model.layers.33.self_attn.o_proj.weight",
369
- "model.layers.33.self_attn.q_proj.weight",
370
- "model.layers.33.self_attn.v_proj.weight",
371
- "model.layers.34.mlp.down_proj.weight",
372
- "model.layers.34.mlp.gate_proj.weight",
373
- "model.layers.34.mlp.up_proj.weight",
374
- "model.layers.34.self_attn.k_proj.weight",
375
- "model.layers.34.self_attn.o_proj.weight",
376
- "model.layers.34.self_attn.q_proj.weight",
377
- "model.layers.34.self_attn.v_proj.weight",
378
- "model.layers.35.mlp.down_proj.weight",
379
- "model.layers.35.mlp.gate_proj.weight",
380
- "model.layers.35.mlp.up_proj.weight",
381
- "model.layers.35.self_attn.k_proj.weight",
382
- "model.layers.35.self_attn.o_proj.weight",
383
- "model.layers.35.self_attn.q_proj.weight",
384
- "model.layers.35.self_attn.v_proj.weight"
385
  ]
386
  },
387
  "modules_quant_config": {},
388
  "modules_to_not_convert": [
389
- ".proj_out",
390
- "double_stream_modulation_txt",
391
  "time_guidance_embed",
 
392
  "context_embedder",
 
393
  "x_embedder",
394
  "double_stream_modulation_img",
395
- "single_stream_modulation",
396
- "norm_out",
397
- "lm_head",
398
- "model.embed_tokens",
399
- "lm_head.weight",
400
- "model.embed_tokens.weight",
401
- ".time_embed",
402
- ".context_embedder",
403
- ".condition_embedder",
404
- ".x_embedder",
405
- ".t_embedder",
406
- ".y_embedder",
407
- ".emb_in",
408
- ".txt_in",
409
- ".img_in",
410
- ".vid_in",
411
  ".proj_out",
412
- ".norm_out",
413
- ".emb_out",
414
- ".txt_out",
415
- ".img_out",
416
- ".vid_out",
417
- ".final_layer",
418
- "multi_modal_projector",
419
- "time_text_embed",
420
- "patch_embedding",
421
- "patch_embed",
422
- "patch_emb",
423
- "lm_head",
424
- "wte"
425
  ],
426
  "non_blocking": false,
427
  "quant_conv": false,
 
1
  {
2
  "_class_name": "Flux2Transformer2DModel",
3
  "_diffusers_version": "0.38.0.dev0",
4
+ "_name_or_path": "/content/flux_aio_full/transformer",
5
  "attention_head_dim": 128,
6
  "axes_dims_rope": [
7
  32,
 
28
  "is_training": false,
29
  "modules_dtype_dict": {
30
  "int5": [
 
31
  "single_transformer_blocks.19.attn.to_qkv_mlp_proj.weight",
32
+ "transformer_blocks.0.attn.to_k.weight"
33
  ],
34
  "uint4": [
35
+ "single_transformer_blocks.0.attn.to_out.weight",
36
+ "single_transformer_blocks.0.attn.to_qkv_mlp_proj.weight",
37
+ "single_transformer_blocks.1.attn.to_out.weight",
38
+ "single_transformer_blocks.1.attn.to_qkv_mlp_proj.weight",
39
+ "single_transformer_blocks.10.attn.to_out.weight",
40
+ "single_transformer_blocks.10.attn.to_qkv_mlp_proj.weight",
41
+ "single_transformer_blocks.11.attn.to_out.weight",
42
+ "single_transformer_blocks.11.attn.to_qkv_mlp_proj.weight",
43
+ "single_transformer_blocks.12.attn.to_out.weight",
44
+ "single_transformer_blocks.12.attn.to_qkv_mlp_proj.weight",
45
+ "single_transformer_blocks.13.attn.to_out.weight",
46
  "single_transformer_blocks.13.attn.to_qkv_mlp_proj.weight",
47
+ "single_transformer_blocks.14.attn.to_out.weight",
48
+ "single_transformer_blocks.14.attn.to_qkv_mlp_proj.weight",
49
+ "single_transformer_blocks.15.attn.to_out.weight",
50
+ "single_transformer_blocks.15.attn.to_qkv_mlp_proj.weight",
51
+ "single_transformer_blocks.16.attn.to_out.weight",
52
  "single_transformer_blocks.16.attn.to_qkv_mlp_proj.weight",
53
+ "single_transformer_blocks.17.attn.to_out.weight",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
54
  "single_transformer_blocks.17.attn.to_qkv_mlp_proj.weight",
55
+ "single_transformer_blocks.18.attn.to_out.weight",
56
+ "single_transformer_blocks.18.attn.to_qkv_mlp_proj.weight",
57
+ "single_transformer_blocks.19.attn.to_out.weight",
58
  "single_transformer_blocks.2.attn.to_out.weight",
59
+ "single_transformer_blocks.2.attn.to_qkv_mlp_proj.weight",
60
+ "single_transformer_blocks.3.attn.to_out.weight",
61
+ "single_transformer_blocks.3.attn.to_qkv_mlp_proj.weight",
62
+ "single_transformer_blocks.4.attn.to_out.weight",
63
+ "single_transformer_blocks.4.attn.to_qkv_mlp_proj.weight",
64
+ "single_transformer_blocks.5.attn.to_out.weight",
 
 
65
  "single_transformer_blocks.5.attn.to_qkv_mlp_proj.weight",
66
+ "single_transformer_blocks.6.attn.to_out.weight",
 
 
 
 
 
 
67
  "single_transformer_blocks.6.attn.to_qkv_mlp_proj.weight",
68
+ "single_transformer_blocks.7.attn.to_out.weight",
69
+ "single_transformer_blocks.7.attn.to_qkv_mlp_proj.weight",
70
+ "single_transformer_blocks.8.attn.to_out.weight",
 
 
 
71
  "single_transformer_blocks.8.attn.to_qkv_mlp_proj.weight",
72
+ "single_transformer_blocks.9.attn.to_out.weight",
73
+ "single_transformer_blocks.9.attn.to_qkv_mlp_proj.weight",
74
+ "transformer_blocks.0.attn.add_k_proj.weight",
75
+ "transformer_blocks.0.attn.add_q_proj.weight",
76
+ "transformer_blocks.0.attn.add_v_proj.weight",
77
+ "transformer_blocks.0.attn.to_add_out.weight",
78
+ "transformer_blocks.0.attn.to_out.0.weight",
79
+ "transformer_blocks.0.attn.to_q.weight",
80
+ "transformer_blocks.0.attn.to_v.weight",
81
+ "transformer_blocks.0.ff.linear_in.weight",
82
+ "transformer_blocks.0.ff.linear_out.weight",
83
  "transformer_blocks.0.ff_context.linear_in.weight",
84
+ "transformer_blocks.0.ff_context.linear_out.weight",
85
+ "transformer_blocks.1.attn.add_k_proj.weight",
86
+ "transformer_blocks.1.attn.add_q_proj.weight",
87
+ "transformer_blocks.1.attn.add_v_proj.weight",
88
  "transformer_blocks.1.attn.to_add_out.weight",
89
+ "transformer_blocks.1.attn.to_k.weight",
 
 
 
 
 
 
 
 
90
  "transformer_blocks.1.attn.to_out.0.weight",
 
 
91
  "transformer_blocks.1.attn.to_q.weight",
92
+ "transformer_blocks.1.attn.to_v.weight",
93
+ "transformer_blocks.1.ff.linear_in.weight",
94
+ "transformer_blocks.1.ff.linear_out.weight",
95
+ "transformer_blocks.1.ff_context.linear_in.weight",
96
+ "transformer_blocks.1.ff_context.linear_out.weight",
97
+ "transformer_blocks.2.attn.add_k_proj.weight",
98
+ "transformer_blocks.2.attn.add_q_proj.weight",
99
+ "transformer_blocks.2.attn.add_v_proj.weight",
100
+ "transformer_blocks.2.attn.to_add_out.weight",
 
 
 
 
 
 
 
 
 
 
101
  "transformer_blocks.2.attn.to_k.weight",
102
  "transformer_blocks.2.attn.to_out.0.weight",
103
+ "transformer_blocks.2.attn.to_q.weight",
104
+ "transformer_blocks.2.attn.to_v.weight",
105
+ "transformer_blocks.2.ff.linear_in.weight",
106
+ "transformer_blocks.2.ff.linear_out.weight",
107
+ "transformer_blocks.2.ff_context.linear_in.weight",
108
+ "transformer_blocks.2.ff_context.linear_out.weight",
109
+ "transformer_blocks.3.attn.add_k_proj.weight",
110
+ "transformer_blocks.3.attn.add_q_proj.weight",
111
+ "transformer_blocks.3.attn.add_v_proj.weight",
112
+ "transformer_blocks.3.attn.to_add_out.weight",
113
  "transformer_blocks.3.attn.to_k.weight",
114
+ "transformer_blocks.3.attn.to_out.0.weight",
 
 
 
 
 
 
 
115
  "transformer_blocks.3.attn.to_q.weight",
116
+ "transformer_blocks.3.attn.to_v.weight",
117
+ "transformer_blocks.3.ff.linear_in.weight",
118
+ "transformer_blocks.3.ff.linear_out.weight",
119
+ "transformer_blocks.3.ff_context.linear_in.weight",
120
+ "transformer_blocks.3.ff_context.linear_out.weight",
121
+ "transformer_blocks.4.attn.add_k_proj.weight",
122
+ "transformer_blocks.4.attn.add_q_proj.weight",
123
+ "transformer_blocks.4.attn.add_v_proj.weight",
124
+ "transformer_blocks.4.attn.to_add_out.weight",
125
+ "transformer_blocks.4.attn.to_k.weight",
126
+ "transformer_blocks.4.attn.to_out.0.weight",
127
+ "transformer_blocks.4.attn.to_q.weight",
128
+ "transformer_blocks.4.attn.to_v.weight",
129
+ "transformer_blocks.4.ff.linear_in.weight",
130
+ "transformer_blocks.4.ff.linear_out.weight",
131
+ "transformer_blocks.4.ff_context.linear_in.weight",
132
+ "transformer_blocks.4.ff_context.linear_out.weight"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
133
  ]
134
  },
135
  "modules_quant_config": {},
136
  "modules_to_not_convert": [
 
 
137
  "time_guidance_embed",
138
+ "norm_out",
139
  "context_embedder",
140
+ "double_stream_modulation_txt",
141
  "x_embedder",
142
  "double_stream_modulation_img",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
143
  ".proj_out",
144
+ "single_stream_modulation"
 
 
 
 
 
 
 
 
 
 
 
 
145
  ],
146
  "non_blocking": false,
147
  "quant_conv": false,
vae/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "AutoencoderKLFlux2",
3
  "_diffusers_version": "0.38.0.dev0",
4
- "_name_or_path": "/root/.cache/huggingface/hub/models--black-forest-labs--FLUX.2-klein-4B/snapshots/e7b7dc27f91deacad38e78976d1f2b499d76a294/vae",
5
  "act_fn": "silu",
6
  "batch_norm_eps": 0.0001,
7
  "batch_norm_momentum": 0.1,
 
1
  {
2
  "_class_name": "AutoencoderKLFlux2",
3
  "_diffusers_version": "0.38.0.dev0",
4
+ "_name_or_path": "/root/.cache/huggingface/hub/models--codeShare--FLUX.2-klein-AIO-SDNQ-4bit-dynamic/snapshots/e545bd6edd331387b952ad7bb0546784d91daeca/vae",
5
  "act_fn": "silu",
6
  "batch_norm_eps": 0.0001,
7
  "batch_norm_momentum": 0.1,