-
Notifications
You must be signed in to change notification settings - Fork 960
Expand file tree
/
Copy pathspv.tensorARM.all_accesses.comp.out
More file actions
453 lines (452 loc) · 22.4 KB
/
spv.tensorARM.all_accesses.comp.out
File metadata and controls
453 lines (452 loc) · 22.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
spv.tensorARM.all_accesses.comp
// Module Version 10000
// Generated by (magic number): 8000b
// Id's are bound by 276
Capability Shader
Capability Float16
Capability Float64
Capability Int64
Capability Int16
Capability Int8
Capability TensorsARM
Capability Float8EXT
Capability BFloat16TypeKHR
Extension "SPV_ARM_tensors"
Extension "SPV_EXT_float8"
Extension "SPV_KHR_bfloat16"
1: ExtInstImport "GLSL.std.450"
MemoryModel Logical GLSL450
EntryPoint GLCompute 4 "main"
ExecutionMode 4 LocalSize 1 1 1
Source GLSL 460
SourceExtension "GL_ARM_tensors"
SourceExtension "GL_ARM_tensors_bfloat16"
SourceExtension "GL_ARM_tensors_float_e4m3"
SourceExtension "GL_ARM_tensors_float_e5m2"
SourceExtension "GL_EXT_bfloat16"
SourceExtension "GL_EXT_float_e4m3"
SourceExtension "GL_EXT_float_e5m2"
SourceExtension "GL_EXT_shader_explicit_arithmetic_types"
Name 4 "main"
Name 10 "coords"
Name 15 "iw8"
Name 19 "iw16"
Name 23 "iw"
Name 27 "iw64"
Name 31 "it8"
Name 37 "it16"
Name 43 "it32"
Name 49 "it64"
Name 56 "iwv"
Name 63 "ir8"
Name 67 "ir16"
Name 71 "ir"
Name 75 "ir64"
Name 79 "irv"
Name 83 "uw8"
Name 87 "uw16"
Name 90 "uw"
Name 93 "uw64"
Name 97 "ut8"
Name 103 "ut16"
Name 109 "ut32"
Name 115 "ut64"
Name 121 "uwv"
Name 128 "ur8"
Name 132 "ur16"
Name 136 "ur"
Name 140 "ur64"
Name 144 "urv"
Name 148 "fw"
Name 152 "fw16"
Name 156 "fw64"
Name 160 "ft16"
Name 166 "ft32"
Name 172 "ft64"
Name 178 "fwv"
Name 185 "fr16"
Name 189 "fr"
Name 193 "fr64"
Name 197 "frv"
Name 201 "bf16w"
Name 205 "fe5m2w"
Name 209 "fe4m3w"
Name 213 "bft16"
Name 219 "fte5m2"
Name 225 "fte4m3"
Name 231 "bf16wv"
Name 238 "fe5m2wv"
Name 243 "fe4m3one"
Name 246 "fe4m3wv"
Name 254 "bf16r"
Name 258 "fe5m2r"
Name 262 "fe4m3r"
Name 266 "bf16rv"
Name 270 "fe5m2rv"
Name 274 "fe4m3rv"
Decorate 31(it8) Binding 0
Decorate 31(it8) DescriptorSet 0
Decorate 37(it16) Binding 1
Decorate 37(it16) DescriptorSet 0
Decorate 43(it32) Binding 2
Decorate 43(it32) DescriptorSet 0
Decorate 49(it64) Binding 3
Decorate 49(it64) DescriptorSet 0
Decorate 97(ut8) Binding 4
Decorate 97(ut8) DescriptorSet 0
Decorate 103(ut16) Binding 5
Decorate 103(ut16) DescriptorSet 0
Decorate 109(ut32) Binding 6
Decorate 109(ut32) DescriptorSet 0
Decorate 115(ut64) Binding 7
Decorate 115(ut64) DescriptorSet 0
Decorate 160(ft16) Binding 8
Decorate 160(ft16) DescriptorSet 0
Decorate 166(ft32) Binding 9
Decorate 166(ft32) DescriptorSet 0
Decorate 172(ft64) Binding 10
Decorate 172(ft64) DescriptorSet 0
Decorate 213(bft16) Binding 11
Decorate 213(bft16) DescriptorSet 0
Decorate 219(fte5m2) Binding 12
Decorate 219(fte5m2) DescriptorSet 0
Decorate 225(fte4m3) Binding 13
Decorate 225(fte4m3) DescriptorSet 0
2: TypeVoid
3: TypeFunction 2
6: TypeInt 32 0
7: 6(int) Constant 1
8: TypeArray 6(int) 7
9: TypePointer Function 8
11: 6(int) Constant 0
12: 8 ConstantComposite 11
13: TypeInt 8 1
14: TypePointer Function 13(int8_t)
16: 13(int8_t) Constant 1
17: TypeInt 16 1
18: TypePointer Function 17(int16_t)
20: 17(int16_t) Constant 1
21: TypeInt 32 1
22: TypePointer Function 21(int)
24: 21(int) Constant 1
25: TypeInt 64 1
26: TypePointer Function 25(int64_t)
28: 25(int64_t) Constant 1 0
29: TypeTensorARM 13(int8_t) 7
30: TypePointer UniformConstant 29
31(it8): 30(ptr) Variable UniformConstant
35: TypeTensorARM 17(int16_t) 7
36: TypePointer UniformConstant 35
37(it16): 36(ptr) Variable UniformConstant
41: TypeTensorARM 21(int) 7
42: TypePointer UniformConstant 41
43(it32): 42(ptr) Variable UniformConstant
47: TypeTensorARM 25(int64_t) 7
48: TypePointer UniformConstant 47
49(it64): 48(ptr) Variable UniformConstant
53: 6(int) Constant 4
54: TypeArray 21(int) 53
55: TypePointer Function 54
57: 54 ConstantComposite 24 24 24 24
81: TypeInt 8 0
82: TypePointer Function 81(int8_t)
84: 81(int8_t) Constant 1
85: TypeInt 16 0
86: TypePointer Function 85(int16_t)
88: 85(int16_t) Constant 1
89: TypePointer Function 6(int)
91: TypeInt 64 0
92: TypePointer Function 91(int64_t)
94: 91(int64_t) Constant 1 0
95: TypeTensorARM 81(int8_t) 7
96: TypePointer UniformConstant 95
97(ut8): 96(ptr) Variable UniformConstant
101: TypeTensorARM 85(int16_t) 7
102: TypePointer UniformConstant 101
103(ut16): 102(ptr) Variable UniformConstant
107: TypeTensorARM 6(int) 7
108: TypePointer UniformConstant 107
109(ut32): 108(ptr) Variable UniformConstant
113: TypeTensorARM 91(int64_t) 7
114: TypePointer UniformConstant 113
115(ut64): 114(ptr) Variable UniformConstant
119: TypeArray 6(int) 53
120: TypePointer Function 119
122: 119 ConstantComposite 7 7 7 7
146: TypeFloat 32
147: TypePointer Function 146(float)
149: 146(float) Constant 1065353216
150: TypeFloat 16
151: TypePointer Function 150(float16_t)
153:150(float16_t) Constant 15360
154: TypeFloat 64
155: TypePointer Function 154(float64_t)
157:154(float64_t) Constant 0 1072693248
158: TypeTensorARM 150(float16_t) 7
159: TypePointer UniformConstant 158
160(ft16): 159(ptr) Variable UniformConstant
164: TypeTensorARM 146(float) 7
165: TypePointer UniformConstant 164
166(ft32): 165(ptr) Variable UniformConstant
170: TypeTensorARM 154(float64_t) 7
171: TypePointer UniformConstant 170
172(ft64): 171(ptr) Variable UniformConstant
176: TypeArray 146(float) 53
177: TypePointer Function 176
179: 176 ConstantComposite 149 149 149 149
199: TypeFloat 16 0
200: TypePointer Function 199(bfloat16_t)
202:199(bfloat16_t) Constant 16256
203: TypeFloat 8 4215
204: TypePointer Function 203(floate5m2_t)
206:203(floate5m2_t) Constant 60
207: TypeFloat 8 4214
208: TypePointer Function 207(floate4m3_t)
210:207(floate4m3_t) Constant 56
211: TypeTensorARM 199(bfloat16_t) 7
212: TypePointer UniformConstant 211
213(bft16): 212(ptr) Variable UniformConstant
217: TypeTensorARM 203(floate5m2_t) 7
218: TypePointer UniformConstant 217
219(fte5m2): 218(ptr) Variable UniformConstant
223: TypeTensorARM 207(floate4m3_t) 7
224: TypePointer UniformConstant 223
225(fte4m3): 224(ptr) Variable UniformConstant
229: TypeArray 199(bfloat16_t) 53
230: TypePointer Function 229
232: 229 ConstantComposite 202 202 202 202
236: TypeArray 203(floate5m2_t) 53
237: TypePointer Function 236
239: 236 ConstantComposite 206 206 206 206
244: TypeArray 207(floate4m3_t) 53
245: TypePointer Function 244
4(main): 2 Function None 3
5: Label
10(coords): 9(ptr) Variable Function
15(iw8): 14(ptr) Variable Function
19(iw16): 18(ptr) Variable Function
23(iw): 22(ptr) Variable Function
27(iw64): 26(ptr) Variable Function
56(iwv): 55(ptr) Variable Function
63(ir8): 14(ptr) Variable Function
67(ir16): 18(ptr) Variable Function
71(ir): 22(ptr) Variable Function
75(ir64): 26(ptr) Variable Function
79(irv): 55(ptr) Variable Function
83(uw8): 82(ptr) Variable Function
87(uw16): 86(ptr) Variable Function
90(uw): 89(ptr) Variable Function
93(uw64): 92(ptr) Variable Function
121(uwv): 120(ptr) Variable Function
128(ur8): 82(ptr) Variable Function
132(ur16): 86(ptr) Variable Function
136(ur): 89(ptr) Variable Function
140(ur64): 92(ptr) Variable Function
144(urv): 120(ptr) Variable Function
148(fw): 147(ptr) Variable Function
152(fw16): 151(ptr) Variable Function
156(fw64): 155(ptr) Variable Function
178(fwv): 177(ptr) Variable Function
185(fr16): 151(ptr) Variable Function
189(fr): 147(ptr) Variable Function
193(fr64): 155(ptr) Variable Function
197(frv): 177(ptr) Variable Function
201(bf16w): 200(ptr) Variable Function
205(fe5m2w): 204(ptr) Variable Function
209(fe4m3w): 208(ptr) Variable Function
231(bf16wv): 230(ptr) Variable Function
238(fe5m2wv): 237(ptr) Variable Function
243(fe4m3one): 208(ptr) Variable Function
246(fe4m3wv): 245(ptr) Variable Function
254(bf16r): 200(ptr) Variable Function
258(fe5m2r): 204(ptr) Variable Function
262(fe4m3r): 208(ptr) Variable Function
266(bf16rv): 230(ptr) Variable Function
270(fe5m2rv): 237(ptr) Variable Function
274(fe4m3rv): 245(ptr) Variable Function
Store 10(coords) 12
Store 15(iw8) 16
Store 19(iw16) 20
Store 23(iw) 24
Store 27(iw64) 28
32: 29 Load 31(it8)
33: 8 Load 10(coords)
34: 13(int8_t) Load 15(iw8)
TensorWriteARM 32 33 34
38: 35 Load 37(it16)
39: 8 Load 10(coords)
40: 17(int16_t) Load 19(iw16)
TensorWriteARM 38 39 40
44: 41 Load 43(it32)
45: 8 Load 10(coords)
46: 21(int) Load 23(iw)
TensorWriteARM 44 45 46
50: 47 Load 49(it64)
51: 8 Load 10(coords)
52: 25(int64_t) Load 27(iw64)
TensorWriteARM 50 51 52
Store 56(iwv) 57
58: 41 Load 43(it32)
59: 8 Load 10(coords)
60: 54 Load 56(iwv)
TensorWriteARM 58 59 60
61: 29 Load 31(it8)
62: 8 Load 10(coords)
64: 13(int8_t) TensorReadARM 61 62
Store 63(ir8) 64
65: 35 Load 37(it16)
66: 8 Load 10(coords)
68: 17(int16_t) TensorReadARM 65 66
Store 67(ir16) 68
69: 41 Load 43(it32)
70: 8 Load 10(coords)
72: 21(int) TensorReadARM 69 70
Store 71(ir) 72
73: 47 Load 49(it64)
74: 8 Load 10(coords)
76: 25(int64_t) TensorReadARM 73 74
Store 75(ir64) 76
77: 41 Load 43(it32)
78: 8 Load 10(coords)
80: 54 TensorReadARM 77 78
Store 79(irv) 80
Store 83(uw8) 84
Store 87(uw16) 88
Store 90(uw) 7
Store 93(uw64) 94
98: 95 Load 97(ut8)
99: 8 Load 10(coords)
100: 81(int8_t) Load 83(uw8)
TensorWriteARM 98 99 100
104: 101 Load 103(ut16)
105: 8 Load 10(coords)
106: 85(int16_t) Load 87(uw16)
TensorWriteARM 104 105 106
110: 107 Load 109(ut32)
111: 8 Load 10(coords)
112: 6(int) Load 90(uw)
TensorWriteARM 110 111 112
116: 113 Load 115(ut64)
117: 8 Load 10(coords)
118: 91(int64_t) Load 93(uw64)
TensorWriteARM 116 117 118
Store 121(uwv) 122
123: 107 Load 109(ut32)
124: 8 Load 10(coords)
125: 119 Load 121(uwv)
TensorWriteARM 123 124 125
126: 95 Load 97(ut8)
127: 8 Load 10(coords)
129: 81(int8_t) TensorReadARM 126 127
Store 128(ur8) 129
130: 101 Load 103(ut16)
131: 8 Load 10(coords)
133: 85(int16_t) TensorReadARM 130 131
Store 132(ur16) 133
134: 107 Load 109(ut32)
135: 8 Load 10(coords)
137: 6(int) TensorReadARM 134 135
Store 136(ur) 137
138: 113 Load 115(ut64)
139: 8 Load 10(coords)
141: 91(int64_t) TensorReadARM 138 139
Store 140(ur64) 141
142: 107 Load 109(ut32)
143: 8 Load 10(coords)
145: 119 TensorReadARM 142 143
Store 144(urv) 145
Store 148(fw) 149
Store 152(fw16) 153
Store 156(fw64) 157
161: 158 Load 160(ft16)
162: 8 Load 10(coords)
163:150(float16_t) Load 152(fw16)
TensorWriteARM 161 162 163
167: 164 Load 166(ft32)
168: 8 Load 10(coords)
169: 146(float) Load 148(fw)
TensorWriteARM 167 168 169
173: 170 Load 172(ft64)
174: 8 Load 10(coords)
175:154(float64_t) Load 156(fw64)
TensorWriteARM 173 174 175
Store 178(fwv) 179
180: 164 Load 166(ft32)
181: 8 Load 10(coords)
182: 176 Load 178(fwv)
TensorWriteARM 180 181 182
183: 158 Load 160(ft16)
184: 8 Load 10(coords)
186:150(float16_t) TensorReadARM 183 184
Store 185(fr16) 186
187: 164 Load 166(ft32)
188: 8 Load 10(coords)
190: 146(float) TensorReadARM 187 188
Store 189(fr) 190
191: 170 Load 172(ft64)
192: 8 Load 10(coords)
194:154(float64_t) TensorReadARM 191 192
Store 193(fr64) 194
195: 164 Load 166(ft32)
196: 8 Load 10(coords)
198: 176 TensorReadARM 195 196
Store 197(frv) 198
Store 201(bf16w) 202
Store 205(fe5m2w) 206
Store 209(fe4m3w) 210
214: 211 Load 213(bft16)
215: 8 Load 10(coords)
216:199(bfloat16_t) Load 201(bf16w)
TensorWriteARM 214 215 216
220: 217 Load 219(fte5m2)
221: 8 Load 10(coords)
222:203(floate5m2_t) Load 205(fe5m2w)
TensorWriteARM 220 221 222
226: 223 Load 225(fte4m3)
227: 8 Load 10(coords)
228:207(floate4m3_t) Load 209(fe4m3w)
TensorWriteARM 226 227 228
Store 231(bf16wv) 232
233: 211 Load 213(bft16)
234: 8 Load 10(coords)
235: 229 Load 231(bf16wv)
TensorWriteARM 233 234 235
Store 238(fe5m2wv) 239
240: 217 Load 219(fte5m2)
241: 8 Load 10(coords)
242: 236 Load 238(fe5m2wv)
TensorWriteARM 240 241 242
Store 243(fe4m3one) 210
247:207(floate4m3_t) Load 243(fe4m3one)
248: 244 CompositeConstruct 247 247 247 247
Store 246(fe4m3wv) 248
249: 223 Load 225(fte4m3)
250: 8 Load 10(coords)
251: 244 Load 246(fe4m3wv)
TensorWriteARM 249 250 251
252: 211 Load 213(bft16)
253: 8 Load 10(coords)
255:199(bfloat16_t) TensorReadARM 252 253
Store 254(bf16r) 255
256: 217 Load 219(fte5m2)
257: 8 Load 10(coords)
259:203(floate5m2_t) TensorReadARM 256 257
Store 258(fe5m2r) 259
260: 223 Load 225(fte4m3)
261: 8 Load 10(coords)
263:207(floate4m3_t) TensorReadARM 260 261
Store 262(fe4m3r) 263
264: 211 Load 213(bft16)
265: 8 Load 10(coords)
267: 229 TensorReadARM 264 265
Store 266(bf16rv) 267
268: 217 Load 219(fte5m2)
269: 8 Load 10(coords)
271: 236 TensorReadARM 268 269
Store 270(fe5m2rv) 271
272: 223 Load 225(fte4m3)
273: 8 Load 10(coords)
275: 244 TensorReadARM 272 273
Store 274(fe4m3rv) 275
Return
FunctionEnd