-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathaux_xl.py
180 lines (178 loc) · 10.6 KB
/
aux_xl.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
# T_references for training size (512), keyed by attention-processor name.
# Layout rows are (block prefix, number of attention indices, attn1 value).
# Every key uses transformer_blocks.0; each attn1 key maps to a one-element
# set holding the row's value and each attn2 key maps to {77}. The set
# displays are evaluated per entry, so no two keys share a set object.
# NOTE(review): the block names here (down_blocks.0, up_blocks.2/3) only
# partly overlap with those in list_layers -- confirm both tables are meant
# for the same model.
Tref = {
    f"{block}.attentions.{attn_idx}.transformer_blocks.0.{attn}.processor": {t_ref}
    for block, attn_count, attn1_ref in (
        ("down_blocks.0", 2, 4096),
        ("down_blocks.1", 2, 1024),
        ("down_blocks.2", 2, 256),
        ("mid_block", 1, 64),
        ("up_blocks.1", 3, 256),
        ("up_blocks.2", 3, 1024),
        ("up_blocks.3", 3, 4096),
    )
    for attn_idx in range(attn_count)
    for attn, t_ref in (("attn1", attn1_ref), ("attn2", 77))
}
# Names of the attention processors, in a fixed order: for each layout row
# (block prefix, number of attention indices, number of transformer blocks),
# every attention index, then every transformer block, then attn1 followed
# by attn2. Each name ends with the ".processor" suffix.
list_layers = [
    f"{block}.attentions.{attn_idx}.transformer_blocks.{tb_idx}.{attn}.processor"
    for block, attn_count, tb_count in (
        ("down_blocks.1", 2, 2),
        ("down_blocks.2", 2, 10),
        ("up_blocks.0", 3, 10),
        ("up_blocks.1", 3, 2),
        ("mid_block", 1, 10),
    )
    for attn_idx in range(attn_count)
    for tb_idx in range(tb_count)
    for attn in ("attn1", "attn2")
]