-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathmerge_PermSpec_SDXL.py
1860 lines (1856 loc) · 207 KB
/
merge_PermSpec_SDXL.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
from .merge_rebasin import PermutationSpec, permutation_spec_from_axes_to_perm
def sdxl_permutation_spec() -> PermutationSpec:
def conv(name, p_in, p_out):
    """Build the spec entries for the ``.weight`` and ``.bias`` keys of ``name``.

    Args:
        name: Key prefix of the layer in the state dict.
        p_in: Permutation label placed second in the weight tuple.
        p_out: Permutation label placed first in the weight tuple and
            alone in the bias tuple.

    Returns:
        A two-entry dict: ``"<name>.weight" -> (p_out, p_in)`` and
        ``"<name>.bias" -> (p_out,)``, in that insertion order.
    """
    weight_axes = (p_out, p_in)
    bias_axes = (p_out,)
    return {f"{name}.weight": weight_axes, f"{name}.bias": bias_axes}
def norm(name, p):
    """Build the spec entries for the ``.weight`` and ``.bias`` keys of ``name``.

    Both keys receive the same one-element tuple ``(p,)``.

    Args:
        name: Key prefix of the layer in the state dict.
        p: Permutation label shared by weight and bias.

    Returns:
        ``{"<name>.weight": (p,), "<name>.bias": (p,)}``.
    """
    return {f"{name}.{suffix}": (p,) for suffix in ("weight", "bias")}
def dense(name, p_in, p_out, bias=True):
    """Build the spec entries for ``name``, with an optional bias entry.

    Args:
        name: Key prefix of the layer in the state dict.
        p_in: Permutation label placed second in the weight tuple.
        p_out: Permutation label placed first in the weight tuple and
            alone in the bias tuple.
        bias: When truthy, a ``"<name>.bias"`` entry is included.

    Returns:
        ``{"<name>.weight": (p_out, p_in)}`` plus, when ``bias`` is truthy,
        ``"<name>.bias": (p_out,)``.
    """
    entries = {f"{name}.weight": (p_out, p_in)}
    if bias:
        # The bias key is only emitted for layers that actually carry one.
        entries[f"{name}.bias"] = (p_out,)
    return entries
def skip(name, p_in, p_out):
    """Build a single spec entry for the exact key ``name``.

    Unlike the other helpers, no ``.weight``/``.bias`` suffix is appended.

    Args:
        name: Full state-dict key.
        p_in: Label placed second in the tuple.
        p_out: Label placed first in the tuple.

    Returns:
        ``{name: (p_out, p_in, None, None)}``.
    """
    axes = (p_out, p_in, None, None)
    return {f"{name}": axes}
# Unet Res blocks
def easyblock(name, p_in, p_out):
    """Build the combined spec entries for one block rooted at ``name``.

    Merges, in order, the entries produced by ``norm``/``conv``/``dense`` for
    ``in_layers.0``, ``in_layers.2``, ``emb_layers.1``, ``out_layers.0`` and
    ``out_layers.3``. Intermediate permutation labels are derived from
    ``name`` (``P_<name>_inner``, ``..._inner2``, ``..._inner3``,
    ``..._inner4``).

    Args:
        name: Key prefix of the block in the state dict.
        p_in: Permutation label used for the ``in_layers`` inputs.
        p_out: Permutation label used as the output of ``out_layers.3``.

    Returns:
        One dict holding every entry; later entries win on key collision.
    """
    entries = {}
    entries.update(norm(f"{name}.in_layers.0", p_in))
    entries.update(conv(f"{name}.in_layers.2", p_in, f"P_{name}_inner"))
    entries.update(
        dense(f"{name}.emb_layers.1", f"P_{name}_inner2", f"P_{name}_inner3", bias=True)
    )
    entries.update(norm(f"{name}.out_layers.0", f"P_{name}_inner4"))
    entries.update(conv(f"{name}.out_layers.3", f"P_{name}_inner4", p_out))
    return entries
return permutation_spec_from_axes_to_perm(
{
# Skipped Layers
**skip("betas", None, None),
**skip("alphas_cumprod", None, None),
**skip("alphas_cumprod_prev", None, None),
**skip("sqrt_alphas_cumprod", None, None),
**skip("sqrt_one_minus_alphas_cumprod", None, None),
**skip("log_one_minus_alphas_cumprods", None, None),
**skip("sqrt_recip_alphas_cumprod", None, None),
**skip("sqrt_recipm1_alphas_cumprod", None, None),
**skip("posterior_variance", None, None),
**skip("posterior_log_variance_clipped", None, None),
**skip("posterior_mean_coef1", None, None),
**skip("posterior_mean_coef2", None, None),
**skip("log_one_minus_alphas_cumprod", None, None),
**skip("model_ema.decay", None, None),
**skip("model_ema.num_updates", None, None),
**skip("conditioner.embedders.0.transformer.text_model.embeddings.position_ids", None, None),
**skip("conditioner.embedders.1.model.logit_scale", None, None),
**skip("conditioner.embedders.1.model.positional_embedding", None, None),
**skip("conditioner.embedders.1.model.text_projection", None, None),
**conv("model.diffusion_model.input_blocks.0.0", "P_bg0", "P_bg1"),
**easyblock("model.diffusion_model.input_blocks.1.0", "P_bg2", "P_bg3"),
**easyblock("model.diffusion_model.input_blocks.2.0", "P_bg4", "P_bg5"),
**conv("model.diffusion_model.input_blocks.3.0.op", "P_bg6", "P_bg7"),
**easyblock("model.diffusion_model.input_blocks.4.0", "P_bg8", "P_bg9"),
**conv("model.diffusion_model.input_blocks.4.0.skip_connection", "P_bg10", "P_bg11"),
**norm("model.diffusion_model.input_blocks.4.1.norm", "P_bg12"),
**conv("model.diffusion_model.input_blocks.4.1.proj_in", "P_bg12", "P_bg13"),
**conv("model.diffusion_model.input_blocks.4.1.proj_out", "P_bg14", "P_bg15"),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn1.to_k", "P_bg16", "P_bg17", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn1.to_out.0", "P_bg16", "P_bg17", bias=True),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn1.to_q", "P_bg16", "P_bg17", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn1.to_v", "P_bg16", "P_bg17", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn2.to_k", "P_bg18", "P_bg19", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn2.to_out.0", "P_bg20", "P_bg21", bias=True),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn2.to_q", "P_bg20", "P_bg21", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn2.to_v", "P_bg18", "P_bg19", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.ff.net.0.proj", "P_bg22", "P_bg23", bias=True),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.ff.net.2", "P_bg24", "P_bg25", bias=True),
**norm("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.norm1", "P_bg26"),
**norm("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.norm2", "P_bg26"),
**norm("model.diffusion_model.input_blocks.4.1.transformer_blocks.0.norm3", "P_bg26"),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.attn1.to_k", "P_bg27", "P_bg28", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.attn1.to_out.0", "P_bg27", "P_bg28", bias=True),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.attn1.to_q", "P_bg27", "P_bg28", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.attn1.to_v", "P_bg27", "P_bg28", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.attn2.to_k", "P_bg29", "P_bg30", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.attn2.to_out.0", "P_bg31", "P_bg32", bias=True),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.attn2.to_q", "P_bg31", "P_bg32", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.attn2.to_v", "P_bg33", "P_bg34", bias=False),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.ff.net.0.proj", "P_bg35", "P_bg36", bias=True),
**dense("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.ff.net.2", "P_bg37", "P_bg38", bias=True),
**norm("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.norm1", "P_bg39"),
**norm("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.norm2", "P_bg39"),
**norm("model.diffusion_model.input_blocks.4.1.transformer_blocks.1.norm3", "P_bg39"),
**easyblock("model.diffusion_model.input_blocks.5.0", "P_bg40", "P_bg41"),
**norm("model.diffusion_model.input_blocks.5.1.norm", "P_bg42"),
**conv("model.diffusion_model.input_blocks.5.1.proj_in", "P_bg43", "P_bg44"),
**conv("model.diffusion_model.input_blocks.5.1.proj_out", "P_bg45", "P_bg46"),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn1.to_k", "P_bg47", "P_bg48", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn1.to_out.0", "P_bg47", "P_bg48", bias=True),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn1.to_q", "P_bg47", "P_bg48", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn1.to_v", "P_bg47", "P_bg48", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn2.to_k", "P_bg49", "P_bg50", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn2.to_out.0", "P_bg51", "P_bg52", bias=True),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn2.to_q", "P_bg53", "P_bg54", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn2.to_v", "P_bg55", "P_bg56", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.ff.net.0.proj", "P_bg57", "P_bg58", bias=True),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.ff.net.2", "P_bg59", "P_bg60", bias=True),
**norm("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.norm1", "P_bg61"),
**norm("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.norm2", "P_bg61"),
**norm("model.diffusion_model.input_blocks.5.1.transformer_blocks.0.norm3", "P_bg61"),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.attn1.to_k", "P_bg62", "P_bg63", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.attn1.to_out.0", "P_bg62", "P_bg63", bias=True),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.attn1.to_q", "P_bg62", "P_bg63", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.attn1.to_v", "P_bg62", "P_bg63", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.attn2.to_k", "P_bg64", "P_bg65", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.attn2.to_out.0", "P_bg66", "P_bg67", bias=True),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.attn2.to_q", "P_bg68", "P_bg69", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.attn2.to_v", "P_bg70", "P_bg71", bias=False),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.ff.net.0.proj", "P_bg72", "P_bg73", bias=True),
**dense("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.ff.net.2", "P_bg74", "P_bg75", bias=True),
**norm("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.norm1", "P_bg76"),
**norm("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.norm2", "P_bg76"),
**norm("model.diffusion_model.input_blocks.5.1.transformer_blocks.1.norm3", "P_bg76"),
**conv("model.diffusion_model.input_blocks.6.0.op", "P_bg77", "P_bg78"),
**easyblock("model.diffusion_model.input_blocks.7.0", "P_bg78", "P_bg79"),
**conv("model.diffusion_model.input_blocks.7.0.skip_connection", "P_bg80", "P_bg81"),
**norm("model.diffusion_model.input_blocks.7.1.norm", "P_bg82"),
**conv("model.diffusion_model.input_blocks.7.1.proj_in", "P_bg82", "P_bg83"),
**conv("model.diffusion_model.input_blocks.7.1.proj_out", "P_bg84", "P_bg85"),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn1.to_k", "P_bg86", "P_bg87", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn1.to_out.0", "P_bg86", "P_bg87", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn1.to_q", "P_bg86", "P_bg87", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn1.to_v", "P_bg86", "P_bg87", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn2.to_k", "P_bg88", "P_bg89", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn2.to_out.0", "P_bg90", "P_bg91", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn2.to_q", "P_bg92", "P_bg93", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn2.to_v", "P_bg94", "P_bg95", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.ff.net.0.proj", "P_bg96", "P_bg97", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.ff.net.2", "P_bg98", "P_bg99", bias=True),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.norm1", "P_bg100"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.norm2", "P_bg100"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.0.norm3", "P_bg100"),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.attn1.to_k", "P_bg101", "P_bg102", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.attn1.to_out.0", "P_bg101", "P_bg102", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.attn1.to_q", "P_bg101", "P_bg102", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.attn1.to_v", "P_bg101", "P_bg102", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.attn2.to_k", "P_bg103", "P_bg104", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.attn2.to_out.0", "P_bg105", "P_bg106", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.attn2.to_q", "P_bg107", "P_bg108", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.attn2.to_v", "P_bg109", "P_bg110", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.ff.net.0.proj", "P_bg111", "P_bg112", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.ff.net.2", "P_bg113", "P_bg114", bias=True),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.norm1", "P_bg115"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.norm2", "P_bg115"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.1.norm3", "P_bg115"),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.attn1.to_k", "P_bg116", "P_bg117", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.attn1.to_out.0", "P_bg116", "P_bg117", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.attn1.to_q", "P_bg116", "P_bg117", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.attn1.to_v", "P_bg116", "P_bg117", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.attn2.to_k", "P_bg118", "P_bg119", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.attn2.to_out.0", "P_bg120", "P_bg121", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.attn2.to_q", "P_bg122", "P_bg123", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.attn2.to_v", "P_bg124", "P_bg125", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.ff.net.0.proj", "P_bg126", "P_bg127", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.ff.net.2", "P_bg128", "P_bg129", bias=True),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.norm1", "P_bg130"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.norm2", "P_bg130"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.2.norm3", "P_bg130"),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.attn1.to_k", "P_bg110", "P_bg111", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.attn1.to_out.0", "P_bg131", "P_bg132", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.attn1.to_q", "P_bg131", "P_bg132", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.attn1.to_v", "P_bg131", "P_bg132", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.attn2.to_k", "P_bg133", "P_bg134", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.attn2.to_out.0", "P_bg135", "P_bg136", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.attn2.to_q", "P_bg137", "P_bg138", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.attn2.to_v", "P_bg139", "P_bg140", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.ff.net.0.proj", "P_bg141", "P_bg142", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.ff.net.2", "P_bg143", "P_bg144", bias=True),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.norm1", "P_bg145"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.norm2", "P_bg145"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.3.norm3", "P_bg145"),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.attn1.to_k", "P_bg146", "P_bg147", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.attn1.to_out.0", "P_bg146", "P_bg147", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.attn1.to_q", "P_bg146", "P_bg147", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.attn1.to_v", "P_bg146", "P_bg147", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.attn2.to_k", "P_bg148", "P_bg149", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.attn2.to_out.0", "P_bg150", "P_bg151", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.attn2.to_q", "P_bg152", "P_bg153", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.attn2.to_v", "P_bg154", "P_bg155", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.ff.net.0.proj", "P_bg156", "P_bg157", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.ff.net.2", "P_bg158", "P_bg159", bias=True),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.norm1", "P_bg160"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.norm2", "P_bg160"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.4.norm3", "P_bg160"),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.attn1.to_k", "P_bg161", "P_bg162", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.attn1.to_out.0", "P_bg161", "P_bg162", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.attn1.to_q", "P_bg161", "P_bg162", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.attn1.to_v", "P_bg161", "P_bg162", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.attn2.to_k", "P_bg163", "P_bg164", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.attn2.to_out.0", "P_bg165", "P_bg166", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.attn2.to_q", "P_bg167", "P_bg168", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.attn2.to_v", "P_bg169", "P_bg170", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.ff.net.0.proj", "P_bg171", "P_bg172", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.ff.net.2", "P_bg173", "P_bg174", bias=True),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.norm1", "P_bg175"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.norm2", "P_bg175"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.5.norm3", "P_bg175"),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.attn1.to_k", "P_bg176", "P_bg177", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.attn1.to_out.0", "P_bg176", "P_bg177", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.attn1.to_q", "P_bg176", "P_bg177", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.attn1.to_v", "P_bg176", "P_bg177", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.attn2.to_k", "P_bg178", "P_bg179", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.attn2.to_out.0", "P_bg180", "P_bg181", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.attn2.to_q", "P_bg182", "P_bg183", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.attn2.to_v", "P_bg184", "P_bg185", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.ff.net.0.proj", "P_bg186", "P_bg187", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.ff.net.2", "P_bg188", "P_bg189", bias=True),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.norm1", "P_bg190"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.norm2", "P_bg190"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.6.norm3", "P_bg190"),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.attn1.to_k", "P_bg191", "P_bg192", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.attn1.to_out.0", "P_bg193", "P_bg194", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.attn1.to_q", "P_bg195", "P_bg196", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.attn1.to_v", "P_bg197", "P_bg198", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.attn2.to_k", "P_bg199", "P_bg200", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.attn2.to_out.0", "P_bg201", "P_bg202", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.attn2.to_q", "P_bg203", "P_bg204", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.attn2.to_v", "P_bg205", "P_bg206", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.ff.net.0.proj", "P_bg207", "P_bg208", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.ff.net.2", "P_bg209", "P_bg210", bias=True),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.norm1", "P_bg211"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.norm2", "P_bg211"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.7.norm3", "P_bg211"),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.attn1.to_k", "P_bg212", "P_bg213", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.attn1.to_out.0", "P_bg212", "P_bg213", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.attn1.to_q", "P_bg212", "P_bg213", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.attn1.to_v", "P_bg212", "P_bg213", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.attn2.to_k", "P_bg214", "P_bg215", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.attn2.to_out.0", "P_bg216", "P_bg217", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.attn2.to_q", "P_bg218", "P_bg219", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.attn2.to_v", "P_bg220", "P_bg221", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.ff.net.0.proj", "P_bg222", "P_bg223", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.ff.net.2", "P_bg224", "P_bg225", bias=True),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.norm1", "P_bg226"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.norm2", "P_bg226"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.8.norm3", "P_bg226"),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.attn1.to_k", "P_bg227", "P_bg228", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.attn1.to_out.0", "P_bg227", "P_bg228", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.attn1.to_q", "P_bg227", "P_bg228", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.attn1.to_v", "P_bg227", "P_bg228", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.attn2.to_k", "P_bg229", "P_bg230", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.attn2.to_out.0", "P_bg231", "P_bg232", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.attn2.to_q", "P_bg233", "P_bg234", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.attn2.to_v", "P_bg235", "P_bg236", bias=False),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.ff.net.0.proj", "P_bg237", "P_bg238", bias=True),
**dense("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.ff.net.2", "P_bg239", "P_bg240", bias=True),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.norm1", "P_bg241"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.norm2", "P_bg241"),
**norm("model.diffusion_model.input_blocks.7.1.transformer_blocks.9.norm3", "P_bg241"),
**easyblock("model.diffusion_model.input_blocks.8.0", "P_bg242", "P_bg243"),
**norm("model.diffusion_model.input_blocks.8.1.norm", "P_bg244"),
**conv("model.diffusion_model.input_blocks.8.1.proj_in", "P_bg244", "P_bg245"),
**conv("model.diffusion_model.input_blocks.8.1.proj_out", "P_bg246", "P_bg247"),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn1.to_k", "P_bg248", "P_bg249", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn1.to_out.0", "P_bg248", "P_bg249", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn1.to_q", "P_bg248", "P_bg249", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn1.to_v", "P_bg248", "P_bg249", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn2.to_k", "P_bg250", "P_bg251", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn2.to_out.0", "P_bg252", "P_bg253", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn2.to_q", "P_bg254", "P_bg255", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn2.to_v", "P_bg256", "P_bg257", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.ff.net.0.proj", "P_bg258", "P_bg259", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.ff.net.2", "P_bg260", "P_bg261", bias=True),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.norm1", "P_bg262"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.norm2", "P_bg262"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.0.norm3", "P_bg262"),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.attn1.to_k", "P_bg263", "P_bg264", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.attn1.to_out.0", "P_bg263", "P_bg264", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.attn1.to_q", "P_bg263", "P_bg264", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.attn1.to_v", "P_bg263", "P_bg264", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.attn2.to_k", "P_bg265", "P_bg266", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.attn2.to_out.0", "P_bg267", "P_bg268", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.attn2.to_q", "P_bg269", "P_bg270", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.attn2.to_v", "P_bg271", "P_bg272", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.ff.net.0.proj", "P_bg273", "P_bg274", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.ff.net.2", "P_bg275", "P_bg276", bias=True),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.norm1", "P_bg277"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.norm2", "P_bg277"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.1.norm3", "P_bg277"),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.attn1.to_k", "P_bg278", "P_bg279", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.attn1.to_out.0", "P_bg278", "P_bg279", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.attn1.to_q", "P_bg278", "P_bg279", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.attn1.to_v", "P_bg278", "P_bg279", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.attn2.to_k", "P_bg280", "P_bg281", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.attn2.to_out.0", "P_bg282", "P_bg283", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.attn2.to_q", "P_bg284", "P_bg285", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.attn2.to_v", "P_bg286", "P_bg287", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.ff.net.0.proj", "P_bg288", "P_bg289", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.ff.net.2", "P_bg290", "P_bg291", bias=True),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.norm1", "P_bg292"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.norm2", "P_bg292"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.2.norm3", "P_bg292"),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.attn1.to_k", "P_bg293", "P_bg294", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.attn1.to_out.0", "P_bg293", "P_bg294", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.attn1.to_q", "P_bg293", "P_bg294", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.attn1.to_v", "P_bg293", "P_bg294", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.attn2.to_k", "P_bg295", "P_bg296", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.attn2.to_out.0", "P_bg297", "P_bg298", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.attn2.to_q", "P_bg299", "P_bg300", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.attn2.to_v", "P_bg301", "P_bg302", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.ff.net.0.proj", "P_bg303", "P_bg304", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.ff.net.2", "P_bg305", "P_bg306", bias=True),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.norm1", "P_bg307"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.norm2", "P_bg307"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.3.norm3", "P_bg307"),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.attn1.to_k", "P_bg308", "P_bg309", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.attn1.to_out.0", "P_bg308", "P_bg309", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.attn1.to_q", "P_bg308", "P_bg309", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.attn1.to_v", "P_bg308", "P_bg309", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.attn2.to_k", "P_bg310", "P_bg311", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.attn2.to_out.0", "P_bg312", "P_bg313", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.attn2.to_q", "P_bg314", "P_bg315", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.attn2.to_v", "P_bg316", "P_bg317", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.ff.net.0.proj", "P_bg318", "P_bg319", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.ff.net.2", "P_bg320", "P_bg321", bias=True),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.norm1", "P_bg322"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.norm2", "P_bg322"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.4.norm3", "P_bg322"),
# NOTE(review): "P_bg322" is also the permutation name passed to the three
# transformer_blocks.4 norm entries immediately above. Every other transformer
# block visible in this part of the table starts its attn1 entries with a name
# the preceding block did not use, so this reuse looks like a numbering slip in
# the generated table -- TODO confirm against the generator before renaming.
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.attn1.to_k", "P_bg322", "P_bg323", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.attn1.to_out.0", "P_bg322", "P_bg323", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.attn1.to_q", "P_bg322", "P_bg323", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.attn1.to_v", "P_bg322", "P_bg323", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.attn2.to_k", "P_bg324", "P_bg325", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.attn2.to_out.0", "P_bg326", "P_bg327", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.attn2.to_q", "P_bg328", "P_bg329", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.attn2.to_v", "P_bg330", "P_bg331", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.ff.net.0.proj", "P_bg332", "P_bg333", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.ff.net.2", "P_bg334", "P_bg335", bias=True),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.norm1", "P_bg336"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.norm2", "P_bg336"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.5.norm3", "P_bg336"),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.attn1.to_k", "P_bg337", "P_bg338", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.attn1.to_out.0", "P_bg337", "P_bg338", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.attn1.to_q", "P_bg337", "P_bg338", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.attn1.to_v", "P_bg337", "P_bg338", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.attn2.to_k", "P_bg339", "P_bg340", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.attn2.to_out.0", "P_bg341", "P_bg342", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.attn2.to_q", "P_bg343", "P_bg344", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.attn2.to_v", "P_bg345", "P_bg346", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.ff.net.0.proj", "P_bg347", "P_bg348", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.ff.net.2", "P_bg349", "P_bg350", bias=True),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.norm1", "P_bg351"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.norm2", "P_bg351"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.6.norm3", "P_bg351"),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.attn1.to_k", "P_bg352", "P_bg353", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.attn1.to_out.0", "P_bg352", "P_bg353", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.attn1.to_q", "P_bg352", "P_bg353", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.attn1.to_v", "P_bg352", "P_bg353", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.attn2.to_k", "P_bg354", "P_bg355", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.attn2.to_out.0", "P_bg356", "P_bg357", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.attn2.to_q", "P_bg358", "P_bg359", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.attn2.to_v", "P_bg360", "P_bg361", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.ff.net.0.proj", "P_bg362", "P_bg363", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.ff.net.2", "P_bg364", "P_bg365", bias=True),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.norm1", "P_bg366"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.norm2", "P_bg366"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.7.norm3", "P_bg366"),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.attn1.to_k", "P_bg367", "P_bg368", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.attn1.to_out.0", "P_bg367", "P_bg368", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.attn1.to_q", "P_bg367", "P_bg368", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.attn1.to_v", "P_bg367", "P_bg368", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.attn2.to_k", "P_bg369", "P_bg370", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.attn2.to_out.0", "P_bg371", "P_bg372", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.attn2.to_q", "P_bg373", "P_bg374", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.attn2.to_v", "P_bg375", "P_bg376", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.ff.net.0.proj", "P_bg377", "P_bg378", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.ff.net.2", "P_bg379", "P_bg380", bias=True),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.norm1", "P_bg381"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.norm2", "P_bg381"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.8.norm3", "P_bg381"),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.attn1.to_k", "P_bg382", "P_bg383", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.attn1.to_out.0", "P_bg382", "P_bg383", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.attn1.to_q", "P_bg382", "P_bg383", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.attn1.to_v", "P_bg382", "P_bg383", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.attn2.to_k", "P_bg384", "P_bg385", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.attn2.to_out.0", "P_bg386", "P_bg387", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.attn2.to_q", "P_bg388", "P_bg389", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.attn2.to_v", "P_bg390", "P_bg391", bias=False),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.ff.net.0.proj", "P_bg392", "P_bg393", bias=True),
**dense("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.ff.net.2", "P_bg394", "P_bg395", bias=True),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.norm1", "P_bg396"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.norm2", "P_bg396"),
**norm("model.diffusion_model.input_blocks.8.1.transformer_blocks.9.norm3", "P_bg396"),
**dense("model.diffusion_model.label_emb.0.0", "P_bg397", "P_bg398", bias=True),
**dense("model.diffusion_model.label_emb.0.2", "P_bg399", "P_bg400", bias=True),
**easyblock("model.diffusion_model.middle_block.0", "P_bg401", "P_bg402"),
**norm("model.diffusion_model.middle_block.1.norm", "P_bg403"),
**conv("model.diffusion_model.middle_block.1.proj_in", "P_bg403", "P_bg404"),
**conv("model.diffusion_model.middle_block.1.proj_out", "P_bg405", "P_bg406"),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.0.attn1.to_k", "P_bg407", "P_bg408", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.0.attn1.to_out.0", "P_bg407", "P_bg408", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.0.attn1.to_q", "P_bg407", "P_bg408", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.0.attn1.to_v", "P_bg407", "P_bg408", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.0.attn2.to_k", "P_bg409", "P_bg410", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.0.attn2.to_out.0", "P_bg411", "P_bg412", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.0.attn2.to_q", "P_bg413", "P_bg414", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.0.attn2.to_v", "P_bg415", "P_bg416", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.0.ff.net.0.proj", "P_bg417", "P_bg418", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.0.ff.net.2", "P_bg419", "P_bg420", bias=True),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.0.norm1", "P_bg421"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.0.norm2", "P_bg421"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.0.norm3", "P_bg421"),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.1.attn1.to_k", "P_bg422", "P_bg423", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.1.attn1.to_out.0", "P_bg422", "P_bg423", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.1.attn1.to_q", "P_bg422", "P_bg423", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.1.attn1.to_v", "P_bg422", "P_bg423", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.1.attn2.to_k", "P_bg424", "P_bg425", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.1.attn2.to_out.0", "P_bg426", "P_bg427", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.1.attn2.to_q", "P_bg428", "P_bg429", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.1.attn2.to_v", "P_bg430", "P_bg431", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.1.ff.net.0.proj", "P_bg432", "P_bg433", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.1.ff.net.2", "P_bg434", "P_bg435", bias=True),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.1.norm1", "P_bg436"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.1.norm2", "P_bg436"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.1.norm3", "P_bg436"),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.2.attn1.to_k", "P_bg437", "P_bg438", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.2.attn1.to_out.0", "P_bg437", "P_bg438", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.2.attn1.to_q", "P_bg437", "P_bg438", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.2.attn1.to_v", "P_bg437", "P_bg438", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.2.attn2.to_k", "P_bg439", "P_bg440", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.2.attn2.to_out.0", "P_bg441", "P_bg442", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.2.attn2.to_q", "P_bg443", "P_bg444", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.2.attn2.to_v", "P_bg445", "P_bg446", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.2.ff.net.0.proj", "P_bg447", "P_bg448", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.2.ff.net.2", "P_bg449", "P_bg450", bias=True),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.2.norm1", "P_bg451"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.2.norm2", "P_bg451"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.2.norm3", "P_bg451"),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.3.attn1.to_k", "P_bg452", "P_bg453", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.3.attn1.to_out.0", "P_bg452", "P_bg453", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.3.attn1.to_q", "P_bg452", "P_bg453", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.3.attn1.to_v", "P_bg452", "P_bg453", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.3.attn2.to_k", "P_bg454", "P_bg455", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.3.attn2.to_out.0", "P_bg456", "P_bg457", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.3.attn2.to_q", "P_bg458", "P_bg459", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.3.attn2.to_v", "P_bg460", "P_bg461", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.3.ff.net.0.proj", "P_bg462", "P_bg463", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.3.ff.net.2", "P_bg464", "P_bg465", bias=True),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.3.norm1", "P_bg466"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.3.norm2", "P_bg466"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.3.norm3", "P_bg466"),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.4.attn1.to_k", "P_bg467", "P_bg468", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.4.attn1.to_out.0", "P_bg467", "P_bg468", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.4.attn1.to_q", "P_bg467", "P_bg468", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.4.attn1.to_v", "P_bg467", "P_bg468", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.4.attn2.to_k", "P_bg469", "P_bg470", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.4.attn2.to_out.0", "P_bg471", "P_bg472", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.4.attn2.to_q", "P_bg473", "P_bg474", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.4.attn2.to_v", "P_bg475", "P_bg476", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.4.ff.net.0.proj", "P_bg477", "P_bg478", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.4.ff.net.2", "P_bg479", "P_bg480", bias=True),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.4.norm1", "P_bg481"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.4.norm2", "P_bg481"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.4.norm3", "P_bg481"),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.5.attn1.to_k", "P_bg482", "P_bg483", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.5.attn1.to_out.0", "P_bg482", "P_bg483", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.5.attn1.to_q", "P_bg482", "P_bg483", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.5.attn1.to_v", "P_bg482", "P_bg483", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.5.attn2.to_k", "P_bg484", "P_bg485", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.5.attn2.to_out.0", "P_bg486", "P_bg487", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.5.attn2.to_q", "P_bg488", "P_bg489", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.5.attn2.to_v", "P_bg490", "P_bg491", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.5.ff.net.0.proj", "P_bg492", "P_bg493", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.5.ff.net.2", "P_bg494", "P_bg495", bias=True),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.5.norm1", "P_bg496"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.5.norm2", "P_bg496"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.5.norm3", "P_bg496"),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.6.attn1.to_k", "P_bg497", "P_bg498", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.6.attn1.to_out.0", "P_bg497", "P_bg498", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.6.attn1.to_q", "P_bg497", "P_bg498", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.6.attn1.to_v", "P_bg497", "P_bg498", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.6.attn2.to_k", "P_bg499", "P_bg500", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.6.attn2.to_out.0", "P_bg501", "P_bg502", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.6.attn2.to_q", "P_bg503", "P_bg504", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.6.attn2.to_v", "P_bg505", "P_bg506", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.6.ff.net.0.proj", "P_bg507", "P_bg508", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.6.ff.net.2", "P_bg509", "P_bg510", bias=True),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.6.norm1", "P_bg511"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.6.norm2", "P_bg511"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.6.norm3", "P_bg511"),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.7.attn1.to_k", "P_bg512", "P_bg513", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.7.attn1.to_out.0", "P_bg512", "P_bg513", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.7.attn1.to_q", "P_bg512", "P_bg513", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.7.attn1.to_v", "P_bg512", "P_bg513", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.7.attn2.to_k", "P_bg514", "P_bg515", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.7.attn2.to_out.0", "P_bg516", "P_bg517", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.7.attn2.to_q", "P_bg518", "P_bg519", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.7.attn2.to_v", "P_bg520", "P_bg521", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.7.ff.net.0.proj", "P_bg522", "P_bg523", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.7.ff.net.2", "P_bg524", "P_bg525", bias=True),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.7.norm1", "P_bg526"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.7.norm2", "P_bg526"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.7.norm3", "P_bg526"),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.8.attn1.to_k", "P_bg527", "P_bg528", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.8.attn1.to_out.0", "P_bg527", "P_bg528", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.8.attn1.to_q", "P_bg527", "P_bg528", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.8.attn1.to_v", "P_bg527", "P_bg528", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.8.attn2.to_k", "P_bg529", "P_bg530", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.8.attn2.to_out.0", "P_bg531", "P_bg532", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.8.attn2.to_q", "P_bg533", "P_bg534", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.8.attn2.to_v", "P_bg535", "P_bg536", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.8.ff.net.0.proj", "P_bg537", "P_bg538", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.8.ff.net.2", "P_bg539", "P_bg540", bias=True),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.8.norm1", "P_bg541"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.8.norm2", "P_bg541"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.8.norm3", "P_bg541"),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.9.attn1.to_k", "P_bg542", "P_bg543", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.9.attn1.to_out.0", "P_bg542", "P_bg543", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.9.attn1.to_q", "P_bg542", "P_bg543", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.9.attn1.to_v", "P_bg542", "P_bg543", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.9.attn2.to_k", "P_bg544", "P_bg545", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.9.attn2.to_out.0", "P_bg546", "P_bg547", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.9.attn2.to_q", "P_bg548", "P_bg549", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.9.attn2.to_v", "P_bg550", "P_bg551", bias=False),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.9.ff.net.0.proj", "P_bg552", "P_bg553", bias=True),
**dense("model.diffusion_model.middle_block.1.transformer_blocks.9.ff.net.2", "P_bg554", "P_bg555", bias=True),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.9.norm1", "P_bg556"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.9.norm2", "P_bg556"),
**norm("model.diffusion_model.middle_block.1.transformer_blocks.9.norm3", "P_bg556"),
**easyblock("model.diffusion_model.middle_block.2", "P_bg557", "P_bg558"),
**norm("model.diffusion_model.out.0", "P_bg559"),
**conv("model.diffusion_model.out.2", "P_bg560", "P_bg561"),
**easyblock("model.diffusion_model.output_blocks.0.0", "P_bg562", "P_bg563"),
**conv("model.diffusion_model.output_blocks.0.0.skip_connection", "P_bg564", "P_bg565"),
**norm("model.diffusion_model.output_blocks.0.1.norm", "P_bg566"),
**conv("model.diffusion_model.output_blocks.0.1.proj_in", "P_bg566", "P_bg567"),
**conv("model.diffusion_model.output_blocks.0.1.proj_out", "P_bg568", "P_bg569"),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.attn1.to_k", "P_bg570", "P_bg571", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.attn1.to_out.0", "P_bg570", "P_bg571", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.attn1.to_q", "P_bg570", "P_bg571", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.attn1.to_v", "P_bg570", "P_bg571", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.attn2.to_k", "P_bg572", "P_bg573", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.attn2.to_out.0", "P_bg574", "P_bg575", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.attn2.to_q", "P_bg576", "P_bg577", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.attn2.to_v", "P_bg578", "P_bg579", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.ff.net.0.proj", "P_bg580", "P_bg581", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.ff.net.2", "P_bg582", "P_bg583", bias=True),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.norm1", "P_bg584"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.norm2", "P_bg584"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.0.norm3", "P_bg584"),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.attn1.to_k", "P_bg585", "P_bg586", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.attn1.to_out.0", "P_bg585", "P_bg586", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.attn1.to_q", "P_bg585", "P_bg586", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.attn1.to_v", "P_bg585", "P_bg586", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.attn2.to_k", "P_bg587", "P_bg588", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.attn2.to_out.0", "P_bg589", "P_bg590", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.attn2.to_q", "P_bg591", "P_bg592", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.attn2.to_v", "P_bg593", "P_bg594", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.ff.net.0.proj", "P_bg595", "P_bg596", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.ff.net.2", "P_bg597", "P_bg598", bias=True),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.norm1", "P_bg599"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.norm2", "P_bg599"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.1.norm3", "P_bg599"),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.attn1.to_k", "P_bg600", "P_bg601", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.attn1.to_out.0", "P_bg600", "P_bg601", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.attn1.to_q", "P_bg600", "P_bg601", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.attn1.to_v", "P_bg600", "P_bg601", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.attn2.to_k", "P_bg602", "P_bg603", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.attn2.to_out.0", "P_bg604", "P_bg605", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.attn2.to_q", "P_bg606", "P_bg607", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.attn2.to_v", "P_bg608", "P_bg609", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.ff.net.0.proj", "P_bg610", "P_bg611", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.ff.net.2", "P_bg612", "P_bg613", bias=True),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.norm1", "P_bg614"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.norm2", "P_bg614"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.2.norm3", "P_bg614"),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.attn1.to_k", "P_bg615", "P_bg616", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.attn1.to_out.0", "P_bg615", "P_bg616", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.attn1.to_q", "P_bg615", "P_bg616", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.attn1.to_v", "P_bg615", "P_bg616", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.attn2.to_k", "P_bg617", "P_bg618", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.attn2.to_out.0", "P_bg619", "P_bg620", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.attn2.to_q", "P_bg621", "P_bg622", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.attn2.to_v", "P_bg623", "P_bg624", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.ff.net.0.proj", "P_bg625", "P_bg626", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.ff.net.2", "P_bg627", "P_bg628", bias=True),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.norm1", "P_bg629"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.norm2", "P_bg629"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.3.norm3", "P_bg629"),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.attn1.to_k", "P_bg630", "P_bg631", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.attn1.to_out.0", "P_bg630", "P_bg631", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.attn1.to_q", "P_bg630", "P_bg631", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.attn1.to_v", "P_bg630", "P_bg631", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.attn2.to_k", "P_bg632", "P_bg633", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.attn2.to_out.0", "P_bg634", "P_bg635", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.attn2.to_q", "P_bg636", "P_bg637", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.attn2.to_v", "P_bg638", "P_bg639", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.ff.net.0.proj", "P_bg640", "P_bg641", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.ff.net.2", "P_bg642", "P_bg643", bias=True),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.norm1", "P_bg644"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.norm2", "P_bg644"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.4.norm3", "P_bg644"),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.attn1.to_k", "P_bg645", "P_bg646", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.attn1.to_out.0", "P_bg645", "P_bg646", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.attn1.to_q", "P_bg645", "P_bg646", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.attn1.to_v", "P_bg645", "P_bg646", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.attn2.to_k", "P_bg647", "P_bg648", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.attn2.to_out.0", "P_bg649", "P_bg650", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.attn2.to_q", "P_bg651", "P_bg652", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.attn2.to_v", "P_bg653", "P_bg654", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.ff.net.0.proj", "P_bg655", "P_bg656", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.ff.net.2", "P_bg657", "P_bg658", bias=True),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.norm1", "P_bg659"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.norm2", "P_bg659"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.5.norm3", "P_bg659"),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.attn1.to_k", "P_bg660", "P_bg661", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.attn1.to_out.0", "P_bg660", "P_bg661", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.attn1.to_q", "P_bg660", "P_bg661", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.attn1.to_v", "P_bg660", "P_bg661", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.attn2.to_k", "P_bg662", "P_bg663", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.attn2.to_out.0", "P_bg664", "P_bg665", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.attn2.to_q", "P_bg666", "P_bg667", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.attn2.to_v", "P_bg668", "P_bg669", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.ff.net.0.proj", "P_bg670", "P_bg671", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.ff.net.2", "P_bg672", "P_bg673", bias=True),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.norm1", "P_bg674"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.norm2", "P_bg674"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.6.norm3", "P_bg674"),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.attn1.to_k", "P_bg675", "P_bg676", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.attn1.to_out.0", "P_bg675", "P_bg676", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.attn1.to_q", "P_bg675", "P_bg676", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.attn1.to_v", "P_bg675", "P_bg676", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.attn2.to_k", "P_bg677", "P_bg678", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.attn2.to_out.0", "P_bg679", "P_bg680", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.attn2.to_q", "P_bg681", "P_bg682", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.attn2.to_v", "P_bg683", "P_bg684", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.ff.net.0.proj", "P_bg685", "P_bg686", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.ff.net.2", "P_bg687", "P_bg688", bias=True),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.norm1", "P_bg689"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.norm2", "P_bg689"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.7.norm3", "P_bg689"),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.attn1.to_k", "P_bg690", "P_bg691", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.attn1.to_out.0", "P_bg690", "P_bg691", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.attn1.to_q", "P_bg690", "P_bg691", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.attn1.to_v", "P_bg690", "P_bg691", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.attn2.to_k", "P_bg692", "P_bg693", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.attn2.to_out.0", "P_bg694", "P_bg695", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.attn2.to_q", "P_bg696", "P_bg697", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.attn2.to_v", "P_bg698", "P_bg699", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.ff.net.0.proj", "P_bg700", "P_bg701", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.ff.net.2", "P_bg702", "P_bg703", bias=True),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.norm1", "P_bg704"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.norm2", "P_bg704"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.8.norm3", "P_bg704"),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.attn1.to_k", "P_bg705", "P_bg706", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.attn1.to_out.0", "P_bg705", "P_bg706", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.attn1.to_q", "P_bg705", "P_bg706", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.attn1.to_v", "P_bg705", "P_bg706", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.attn2.to_k", "P_bg707", "P_bg708", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.attn2.to_out.0", "P_bg709", "P_bg710", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.attn2.to_q", "P_bg711", "P_bg712", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.attn2.to_v", "P_bg713", "P_bg714", bias=False),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.ff.net.0.proj", "P_bg715", "P_bg716", bias=True),
**dense("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.ff.net.2", "P_bg717", "P_bg718", bias=True),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.norm1", "P_bg719"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.norm2", "P_bg719"),
**norm("model.diffusion_model.output_blocks.0.1.transformer_blocks.9.norm3", "P_bg719"),
**easyblock("model.diffusion_model.output_blocks.1.0", "P_bg720", "P_bg721"),
**conv("model.diffusion_model.output_blocks.1.0.skip_connection", "P_bg722", "P_bg723"),
**norm("model.diffusion_model.output_blocks.1.1.norm", "P_bg724"),
**conv("model.diffusion_model.output_blocks.1.1.proj_in", "P_bg724", "P_bg725"),
**conv("model.diffusion_model.output_blocks.1.1.proj_out", "P_bg726", "P_bg727"),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.attn1.to_k", "P_bg728", "P_bg729", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.attn1.to_out.0", "P_bg728", "P_bg729", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.attn1.to_q", "P_bg728", "P_bg729", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.attn1.to_v", "P_bg728", "P_bg729", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.attn2.to_k", "P_bg730", "P_bg731", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.attn2.to_out.0", "P_bg732", "P_bg733", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.attn2.to_q", "P_bg734", "P_bg735", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.attn2.to_v", "P_bg736", "P_bg737", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.ff.net.0.proj", "P_bg738", "P_bg739", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.ff.net.2", "P_bg740", "P_bg741", bias=True),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.norm1", "P_bg742"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.norm2", "P_bg742"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.0.norm3", "P_bg742"),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.attn1.to_k", "P_bg743", "P_bg744", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.attn1.to_out.0", "P_bg743", "P_bg744", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.attn1.to_q", "P_bg743", "P_bg744", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.attn1.to_v", "P_bg743", "P_bg744", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.attn2.to_k", "P_bg745", "P_bg746", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.attn2.to_out.0", "P_bg747", "P_bg748", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.attn2.to_q", "P_bg749", "P_bg750", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.attn2.to_v", "P_bg751", "P_bg752", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.ff.net.0.proj", "P_bg753", "P_bg754", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.ff.net.2", "P_bg755", "P_bg756", bias=True),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.norm1", "P_bg757"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.norm2", "P_bg757"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.1.norm3", "P_bg757"),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.attn1.to_k", "P_bg758", "P_bg759", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.attn1.to_out.0", "P_bg758", "P_bg759", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.attn1.to_q", "P_bg758", "P_bg759", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.attn1.to_v", "P_bg758", "P_bg759", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.attn2.to_k", "P_bg760", "P_bg761", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.attn2.to_out.0", "P_bg762", "P_bg763", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.attn2.to_q", "P_bg764", "P_bg765", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.attn2.to_v", "P_bg766", "P_bg767", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.ff.net.0.proj", "P_bg768", "P_bg769", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.ff.net.2", "P_bg770", "P_bg771", bias=True),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.norm1", "P_bg772"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.norm2", "P_bg772"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.2.norm3", "P_bg772"),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.attn1.to_k", "P_bg773", "P_bg774", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.attn1.to_out.0", "P_bg773", "P_bg774", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.attn1.to_q", "P_bg773", "P_bg774", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.attn1.to_v", "P_bg773", "P_bg774", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.attn2.to_k", "P_bg775", "P_bg776", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.attn2.to_out.0", "P_bg777", "P_bg778", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.attn2.to_q", "P_bg779", "P_bg780", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.attn2.to_v", "P_bg781", "P_bg782", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.ff.net.0.proj", "P_bg783", "P_bg784", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.ff.net.2", "P_bg785", "P_bg786", bias=True),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.norm1", "P_bg787"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.norm2", "P_bg787"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.3.norm3", "P_bg787"),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.attn1.to_k", "P_bg788", "P_bg789", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.attn1.to_out.0", "P_bg788", "P_bg789", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.attn1.to_q", "P_bg788", "P_bg789", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.attn1.to_v", "P_bg788", "P_bg789", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.attn2.to_k", "P_bg790", "P_bg791", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.attn2.to_out.0", "P_bg792", "P_bg793", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.attn2.to_q", "P_bg794", "P_bg795", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.attn2.to_v", "P_bg796", "P_bg797", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.ff.net.0.proj", "P_bg798", "P_bg799", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.ff.net.2", "P_bg800", "P_bg801", bias=True),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.norm1", "P_bg802"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.norm2", "P_bg802"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.4.norm3", "P_bg802"),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.attn1.to_k", "P_bg803", "P_bg804", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.attn1.to_out.0", "P_bg803", "P_bg804", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.attn1.to_q", "P_bg803", "P_bg804", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.attn1.to_v", "P_bg803", "P_bg804", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.attn2.to_k", "P_bg805", "P_bg806", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.attn2.to_out.0", "P_bg807", "P_bg808", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.attn2.to_q", "P_bg809", "P_bg810", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.attn2.to_v", "P_bg811", "P_bg812", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.ff.net.0.proj", "P_bg813", "P_bg814", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.ff.net.2", "P_bg815", "P_bg816", bias=True),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.norm1", "P_bg817"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.norm2", "P_bg817"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.5.norm3", "P_bg817"),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.attn1.to_k", "P_bg818", "P_bg819", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.attn1.to_out.0", "P_bg818", "P_bg819", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.attn1.to_q", "P_bg818", "P_bg819", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.attn1.to_v", "P_bg818", "P_bg819", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.attn2.to_k", "P_bg820", "P_bg821", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.attn2.to_out.0", "P_bg822", "P_bg823", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.attn2.to_q", "P_bg824", "P_bg825", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.attn2.to_v", "P_bg826", "P_bg827", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.ff.net.0.proj", "P_bg828", "P_bg829", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.ff.net.2", "P_bg830", "P_bg831", bias=True),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.norm1", "P_bg832"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.norm2", "P_bg832"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.6.norm3", "P_bg832"),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.attn1.to_k", "P_bg833", "P_bg834", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.attn1.to_out.0", "P_bg833", "P_bg834", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.attn1.to_q", "P_bg833", "P_bg834", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.attn1.to_v", "P_bg833", "P_bg834", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.attn2.to_k", "P_bg835", "P_bg836", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.attn2.to_out.0", "P_bg837", "P_bg838", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.attn2.to_q", "P_bg839", "P_bg840", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.attn2.to_v", "P_bg841", "P_bg842", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.ff.net.0.proj", "P_bg843", "P_bg844", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.ff.net.2", "P_bg845", "P_bg846", bias=True),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.norm1", "P_bg847"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.norm2", "P_bg847"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.7.norm3", "P_bg847"),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.attn1.to_k", "P_bg848", "P_bg849", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.attn1.to_out.0", "P_bg848", "P_bg849", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.attn1.to_q", "P_bg848", "P_bg849", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.attn1.to_v", "P_bg848", "P_bg849", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.attn2.to_k", "P_bg850", "P_bg851", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.attn2.to_out.0", "P_bg852", "P_bg853", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.attn2.to_q", "P_bg854", "P_bg855", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.attn2.to_v", "P_bg856", "P_bg857", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.ff.net.0.proj", "P_bg858", "P_bg859", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.ff.net.2", "P_bg860", "P_bg861", bias=True),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.norm1", "P_bg862"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.norm2", "P_bg862"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.8.norm3", "P_bg862"),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.attn1.to_k", "P_bg863", "P_bg864", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.attn1.to_out.0", "P_bg863", "P_bg864", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.attn1.to_q", "P_bg863", "P_bg864", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.attn1.to_v", "P_bg863", "P_bg864", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.attn2.to_k", "P_bg865", "P_bg866", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.attn2.to_out.0", "P_bg867", "P_bg868", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.attn2.to_q", "P_bg869", "P_bg870", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.attn2.to_v", "P_bg871", "P_bg872", bias=False),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.ff.net.0.proj", "P_bg873", "P_bg874", bias=True),
**dense("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.ff.net.2", "P_bg875", "P_bg876", bias=True),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.norm1", "P_bg877"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.norm2", "P_bg877"),
**norm("model.diffusion_model.output_blocks.1.1.transformer_blocks.9.norm3", "P_bg877"),
**easyblock("model.diffusion_model.output_blocks.2.0", "P_bg878", "P_bg879"),
**conv("model.diffusion_model.output_blocks.2.0.skip_connection", "P_bg880", "P_bg881"),
**norm("model.diffusion_model.output_blocks.2.1.norm", "P_bg882"),
**conv("model.diffusion_model.output_blocks.2.1.proj_in", "P_bg882", "P_bg883"),
**conv("model.diffusion_model.output_blocks.2.1.proj_out", "P_bg884", "P_bg885"),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.attn1.to_k", "P_bg886", "P_bg887", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.attn1.to_out.0", "P_bg886", "P_bg887", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.attn1.to_q", "P_bg886", "P_bg887", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.attn1.to_v", "P_bg886", "P_bg887", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.attn2.to_k", "P_bg888", "P_bg889", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.attn2.to_out.0", "P_bg890", "P_bg891", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.attn2.to_q", "P_bg892", "P_bg893", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.attn2.to_v", "P_bg894", "P_bg895", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.ff.net.0.proj", "P_bg896", "P_bg897", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.ff.net.2", "P_bg898", "P_bg899", bias=True),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.norm1", "P_bg900"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.norm2", "P_bg900"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.0.norm3", "P_bg900"),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.attn1.to_k", "P_bg901", "P_bg902", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.attn1.to_out.0", "P_bg901", "P_bg902", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.attn1.to_q", "P_bg901", "P_bg902", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.attn1.to_v", "P_bg901", "P_bg902", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.attn2.to_k", "P_bg903", "P_bg904", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.attn2.to_out.0", "P_bg905", "P_bg906", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.attn2.to_q", "P_bg907", "P_bg908", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.attn2.to_v", "P_bg909", "P_bg910", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.ff.net.0.proj", "P_bg911", "P_bg912", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.ff.net.2", "P_bg913", "P_bg914", bias=True),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.norm1", "P_bg915"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.norm2", "P_bg915"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.1.norm3", "P_bg915"),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.attn1.to_k", "P_bg916", "P_bg917", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.attn1.to_out.0", "P_bg916", "P_bg917", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.attn1.to_q", "P_bg916", "P_bg917", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.attn1.to_v", "P_bg916", "P_bg917", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.attn2.to_k", "P_bg918", "P_bg919", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.attn2.to_out.0", "P_bg920", "P_bg921", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.attn2.to_q", "P_bg922", "P_bg923", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.attn2.to_v", "P_bg924", "P_bg925", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.ff.net.0.proj", "P_bg926", "P_bg927", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.ff.net.2", "P_bg928", "P_bg929", bias=True),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.norm1", "P_bg930"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.norm2", "P_bg930"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.2.norm3", "P_bg930"),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.attn1.to_k", "P_bg931", "P_bg932", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.attn1.to_out.0", "P_bg931", "P_bg932", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.attn1.to_q", "P_bg931", "P_bg932", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.attn1.to_v", "P_bg931", "P_bg932", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.attn2.to_k", "P_bg933", "P_bg934", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.attn2.to_out.0", "P_bg935", "P_bg936", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.attn2.to_q", "P_bg937", "P_bg938", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.attn2.to_v", "P_bg939", "P_bg940", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.ff.net.0.proj", "P_bg941", "P_bg942", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.ff.net.2", "P_bg943", "P_bg944", bias=True),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.norm1", "P_bg945"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.norm2", "P_bg945"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.3.norm3", "P_bg945"),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.attn1.to_k", "P_bg946", "P_bg947", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.attn1.to_out.0", "P_bg946", "P_bg947", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.attn1.to_q", "P_bg946", "P_bg947", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.attn1.to_v", "P_bg946", "P_bg947", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.attn2.to_k", "P_bg948", "P_bg949", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.attn2.to_out.0", "P_bg950", "P_bg951", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.attn2.to_q", "P_bg952", "P_bg953", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.attn2.to_v", "P_bg954", "P_bg955", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.ff.net.0.proj", "P_bg956", "P_bg957", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.ff.net.2", "P_bg958", "P_bg959", bias=True),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.norm1", "P_bg960"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.norm2", "P_bg960"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.4.norm3", "P_bg960"),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.attn1.to_k", "P_bg961", "P_bg962", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.attn1.to_out.0", "P_bg961", "P_bg962", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.attn1.to_q", "P_bg961", "P_bg962", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.attn1.to_v", "P_bg961", "P_bg962", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.attn2.to_k", "P_bg963", "P_bg964", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.attn2.to_out.0", "P_bg965", "P_bg966", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.attn2.to_q", "P_bg967", "P_bg968", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.attn2.to_v", "P_bg969", "P_bg970", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.ff.net.0.proj", "P_bg971", "P_bg972", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.ff.net.2", "P_bg973", "P_bg974", bias=True),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.norm1", "P_bg975"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.norm2", "P_bg975"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.5.norm3", "P_bg975"),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.attn1.to_k", "P_bg976", "P_bg977", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.attn1.to_out.0", "P_bg976", "P_bg977", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.attn1.to_q", "P_bg976", "P_bg977", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.attn1.to_v", "P_bg976", "P_bg977", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.attn2.to_k", "P_bg978", "P_bg979", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.attn2.to_out.0", "P_bg980", "P_bg981", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.attn2.to_q", "P_bg982", "P_bg983", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.attn2.to_v", "P_bg984", "P_bg985", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.ff.net.0.proj", "P_bg986", "P_bg987", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.ff.net.2", "P_bg988", "P_bg989", bias=True),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.norm1", "P_bg990"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.norm2", "P_bg990"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.6.norm3", "P_bg990"),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.attn1.to_k", "P_bg991", "P_bg992", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.attn1.to_out.0", "P_bg991", "P_bg992", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.attn1.to_q", "P_bg991", "P_bg992", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.attn1.to_v", "P_bg991", "P_bg992", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.attn2.to_k", "P_bg993", "P_bg994", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.attn2.to_out.0", "P_bg995", "P_bg996", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.attn2.to_q", "P_bg997", "P_bg998", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.attn2.to_v", "P_bg999", "P_bg1000", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.ff.net.0.proj", "P_bg1001", "P_bg1002", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.ff.net.2", "P_bg1003", "P_bg1004", bias=True),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.norm1", "P_bg1005"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.norm2", "P_bg1005"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.7.norm3", "P_bg1005"),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.attn1.to_k", "P_bg1006", "P_bg1007", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.attn1.to_out.0", "P_bg1006", "P_bg1007", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.attn1.to_q", "P_bg1006", "P_bg1007", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.attn1.to_v", "P_bg1006", "P_bg1007", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.attn2.to_k", "P_bg1008", "P_bg1009", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.attn2.to_out.0", "P_bg1010", "P_bg1011", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.attn2.to_q", "P_bg1012", "P_bg1013", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.attn2.to_v", "P_bg1014", "P_bg1015", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.ff.net.0.proj", "P_bg1016", "P_bg1017", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.ff.net.2", "P_bg1018", "P_bg1019", bias=True),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.norm1", "P_bg1020"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.norm2", "P_bg1020"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.8.norm3", "P_bg1020"),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.attn1.to_k", "P_bg1021", "P_bg1022", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.attn1.to_out.0", "P_bg1021", "P_bg1022", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.attn1.to_q", "P_bg1021", "P_bg1022", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.attn1.to_v", "P_bg1021", "P_bg1022", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.attn2.to_k", "P_bg1023", "P_bg1024", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.attn2.to_out.0", "P_bg1025", "P_bg1026", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.attn2.to_q", "P_bg1027", "P_bg1028", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.attn2.to_v", "P_bg1029", "P_bg1030", bias=False),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.ff.net.0.proj", "P_bg1031", "P_bg1032", bias=True),
**dense("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.ff.net.2", "P_bg1033", "P_bg1034", bias=True),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.norm1", "P_bg1035"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.norm2", "P_bg1035"),
**norm("model.diffusion_model.output_blocks.2.1.transformer_blocks.9.norm3", "P_bg1035"),
**conv("model.diffusion_model.output_blocks.2.2.conv", "P_bg1036", "P_bg1037"),
**easyblock("model.diffusion_model.output_blocks.3.0", "P_bg1038", "P_bg1039"),
**conv("model.diffusion_model.output_blocks.3.0.skip_connection", "P_bg1040", "P_bg1041"),
**norm("model.diffusion_model.output_blocks.3.1.norm", "P_bg1042"),
**conv("model.diffusion_model.output_blocks.3.1.proj_in", "P_bg1042", "P_bg1043"),
**conv("model.diffusion_model.output_blocks.3.1.proj_out", "P_bg1044", "P_bg1045"),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn1.to_k", "P_bg1046", "P_bg1047", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn1.to_out.0", "P_bg1046", "P_bg1047", bias=True),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn1.to_q", "P_bg1046", "P_bg1047", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn1.to_v", "P_bg1046", "P_bg1047", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn2.to_k", "P_bg1048", "P_bg1049", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn2.to_out.0", "P_bg1050", "P_bg1051", bias=True),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn2.to_q", "P_bg1052", "P_bg1053", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn2.to_v", "P_bg1054", "P_bg1055", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.ff.net.0.proj", "P_bg1056", "P_bg1057", bias=True),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.ff.net.2", "P_bg1058", "P_bg1059", bias=True),
**norm("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.norm1", "P_bg1060"),
**norm("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.norm2", "P_bg1060"),
**norm("model.diffusion_model.output_blocks.3.1.transformer_blocks.0.norm3", "P_bg1060"),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.attn1.to_k", "P_bg1061", "P_bg1062", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.attn1.to_out.0", "P_bg1061", "P_bg1062", bias=True),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.attn1.to_q", "P_bg1061", "P_bg1062", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.attn1.to_v", "P_bg1061", "P_bg1062", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.attn2.to_k", "P_bg1063", "P_bg1064", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.attn2.to_out.0", "P_bg1065", "P_bg1066", bias=True),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.attn2.to_q", "P_bg1067", "P_bg1068", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.attn2.to_v", "P_bg1069", "P_bg1070", bias=False),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.ff.net.0.proj", "P_bg1071", "P_bg1072", bias=True),
**dense("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.ff.net.2", "P_bg1073", "P_bg1074", bias=True),
**norm("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.norm1", "P_bg1075"),
**norm("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.norm2", "P_bg1075"),
**norm("model.diffusion_model.output_blocks.3.1.transformer_blocks.1.norm3", "P_bg1075"),
**easyblock("model.diffusion_model.output_blocks.4.0", "P_bg1076", "P_bg1077"),
**conv("model.diffusion_model.output_blocks.4.0.skip_connection", "P_bg1078", "P_bg1079"),
**norm("model.diffusion_model.output_blocks.4.1.norm", "P_bg1080"),
**conv("model.diffusion_model.output_blocks.4.1.proj_in", "P_bg1080", "P_bg1081"),
**conv("model.diffusion_model.output_blocks.4.1.proj_out", "P_bg1082", "P_bg1083"),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn1.to_k", "P_bg1084", "P_bg1085", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn1.to_out.0", "P_bg1084", "P_bg1085", bias=True),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn1.to_q", "P_bg1084", "P_bg1085", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn1.to_v", "P_bg1084", "P_bg1085", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn2.to_k", "P_bg1086", "P_bg1087", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn2.to_out.0", "P_bg1088", "P_bg1089", bias=True),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn2.to_q", "P_bg1090", "P_bg1091", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn2.to_v", "P_bg1092", "P_bg1093", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.ff.net.0.proj", "P_bg1094", "P_bg1095", bias=True),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.ff.net.2", "P_bg1096", "P_bg1097", bias=True),
**norm("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.norm1", "P_bg1098"),
**norm("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.norm2", "P_bg1098"),
**norm("model.diffusion_model.output_blocks.4.1.transformer_blocks.0.norm3", "P_bg1098"),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.1.attn1.to_k", "P_bg1099", "P_bg1100", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.1.attn1.to_out.0", "P_bg1099", "P_bg1100", bias=True),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.1.attn1.to_q", "P_bg1099", "P_bg1100", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.1.attn1.to_v", "P_bg1099", "P_bg1100", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.1.attn2.to_k", "P_bg1101", "P_bg1102", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.1.attn2.to_out.0", "P_bg1103", "P_bg1104", bias=True),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.1.attn2.to_q", "P_bg1105", "P_bg1106", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.1.attn2.to_v", "P_bg1107", "P_bg1108", bias=False),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.1.ff.net.0.proj", "P_bg1109", "P_bg1110", bias=True),
**dense("model.diffusion_model.output_blocks.4.1.transformer_blocks.1.ff.net.2", "P_bg1111", "P_bg1112", bias=True),