Commit a1ca690
authored
[AArch64] recognise zip1/zip2 with flipped operands (#167235)
Currently, the following two snippets get treated very differently from
each other (https://godbolt.org/z/rYGj9TGz6):
```LLVM
define <8 x i8> @foo(<8 x i8> %x, <8 x i8> %y) local_unnamed_addr #0 {
entry:
%0 = shufflevector <8 x i8> %x, <8 x i8> %y, <8 x i32>
<i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11>
ret <8 x i8> %0
}
define <8 x i8> @bar(<8 x i8> %x, <8 x i8> %y) local_unnamed_addr #0 {
entry:
%0 = shufflevector <8 x i8> %x, <8 x i8> %y, <8 x i32>
<i32 8, i32 0, i32 9, i32 1, i32 10, i32 2, i32 11, i32 3>
ret <8 x i8> %0
}
```
```
foo: // @foo
zip1 v0.8b, v0.8b, v1.8b
ret
.LCPI1_0:
.byte 8 // 0x8
.byte 0 // 0x0
.byte 9 // 0x9
.byte 1 // 0x1
.byte 10 // 0xa
.byte 2 // 0x2
.byte 11 // 0xb
.byte 3 // 0x3
bar: // @bar
adrp x8, .LCPI1_0
mov v0.d[1], v1.d[0]
ldr d1, [x8, :lo12:.LCPI1_0]
tbl v0.8b, { v0.16b }, v1.8b
ret
```
The reason is that `isZIPMask` does not recognise the pattern when the
operands are flipped.
This PR fixes `isZIPMask` so that both `foo` and `bar` get compiled as
expected:
```
foo: // @foo
zip1 v0.8b, v0.8b, v1.8b
ret
bar: // @bar
zip1 v0.8b, v1.8b, v0.8b
ret
```
I intend to open a similar follow-up PR for `isTRNMask`, which seems to
have the same problem.
I noticed this while working on
#137447, though the change
does not on itself fix that issue.1 parent e3a28c0 commit a1ca690
File tree
10 files changed
+207
-220
lines changed- llvm
- lib/Target/AArch64
- GISel
- test/CodeGen/AArch64
10 files changed
+207
-220
lines changed| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
14805 | 14805 | | |
14806 | 14806 | | |
14807 | 14807 | | |
14808 | | - | |
| 14808 | + | |
| 14809 | + | |
14809 | 14810 | | |
14810 | | - | |
| 14811 | + | |
| 14812 | + | |
14811 | 14813 | | |
14812 | 14814 | | |
14813 | 14815 | | |
| |||
16529 | 16531 | | |
16530 | 16532 | | |
16531 | 16533 | | |
16532 | | - | |
| 16534 | + | |
16533 | 16535 | | |
16534 | 16536 | | |
16535 | 16537 | | |
| |||
31576 | 31578 | | |
31577 | 31579 | | |
31578 | 31580 | | |
31579 | | - | |
| 31581 | + | |
| 31582 | + | |
| 31583 | + | |
31580 | 31584 | | |
31581 | 31585 | | |
31582 | | - | |
| 31586 | + | |
| 31587 | + | |
| 31588 | + | |
| 31589 | + | |
31583 | 31590 | | |
31584 | 31591 | | |
31585 | 31592 | | |
| |||
31624 | 31631 | | |
31625 | 31632 | | |
31626 | 31633 | | |
31627 | | - | |
| 31634 | + | |
| 31635 | + | |
31628 | 31636 | | |
31629 | 31637 | | |
31630 | | - | |
| 31638 | + | |
| 31639 | + | |
| 31640 | + | |
| 31641 | + | |
31631 | 31642 | | |
31632 | 31643 | | |
31633 | 31644 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
6622 | 6622 | | |
6623 | 6623 | | |
6624 | 6624 | | |
6625 | | - | |
6626 | | - | |
| 6625 | + | |
| 6626 | + | |
| 6627 | + | |
| 6628 | + | |
6627 | 6629 | | |
6628 | | - | |
| 6630 | + | |
6629 | 6631 | | |
6630 | 6632 | | |
6631 | | - | |
6632 | | - | |
6633 | | - | |
6634 | | - | |
6635 | | - | |
6636 | | - | |
6637 | | - | |
6638 | | - | |
6639 | | - | |
6640 | | - | |
6641 | | - | |
6642 | | - | |
6643 | | - | |
6644 | 6633 | | |
| 6634 | + | |
| 6635 | + | |
| 6636 | + | |
| 6637 | + | |
| 6638 | + | |
| 6639 | + | |
6645 | 6640 | | |
6646 | | - | |
6647 | 6641 | | |
6648 | | - | |
6649 | | - | |
6650 | | - | |
6651 | | - | |
| 6642 | + | |
| 6643 | + | |
| 6644 | + | |
| 6645 | + | |
| 6646 | + | |
| 6647 | + | |
| 6648 | + | |
| 6649 | + | |
| 6650 | + | |
| 6651 | + | |
| 6652 | + | |
| 6653 | + | |
| 6654 | + | |
| 6655 | + | |
| 6656 | + | |
| 6657 | + | |
| 6658 | + | |
| 6659 | + | |
| 6660 | + | |
| 6661 | + | |
| 6662 | + | |
| 6663 | + | |
6652 | 6664 | | |
6653 | | - | |
| 6665 | + | |
| 6666 | + | |
| 6667 | + | |
| 6668 | + | |
| 6669 | + | |
| 6670 | + | |
6654 | 6671 | | |
6655 | 6672 | | |
6656 | 6673 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
6067 | 6067 | | |
6068 | 6068 | | |
6069 | 6069 | | |
6070 | | - | |
| 6070 | + | |
6071 | 6071 | | |
6072 | 6072 | | |
6073 | 6073 | | |
| |||
Lines changed: 4 additions & 3 deletions
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
252 | 252 | | |
253 | 253 | | |
254 | 254 | | |
| 255 | + | |
255 | 256 | | |
256 | 257 | | |
257 | 258 | | |
258 | | - | |
| 259 | + | |
259 | 260 | | |
260 | 261 | | |
261 | | - | |
262 | | - | |
| 262 | + | |
| 263 | + | |
263 | 264 | | |
264 | 265 | | |
265 | 266 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
355 | 355 | | |
356 | 356 | | |
357 | 357 | | |
358 | | - | |
359 | 358 | | |
360 | | - | |
361 | | - | |
362 | | - | |
363 | | - | |
364 | | - | |
365 | | - | |
366 | | - | |
367 | | - | |
368 | | - | |
369 | | - | |
370 | | - | |
371 | | - | |
372 | | - | |
373 | | - | |
374 | | - | |
375 | | - | |
376 | | - | |
| 359 | + | |
| 360 | + | |
| 361 | + | |
| 362 | + | |
| 363 | + | |
| 364 | + | |
377 | 365 | | |
378 | 366 | | |
379 | 367 | | |
380 | 368 | | |
381 | 369 | | |
382 | | - | |
383 | 370 | | |
384 | | - | |
385 | | - | |
386 | | - | |
387 | | - | |
388 | | - | |
389 | | - | |
390 | | - | |
391 | | - | |
392 | | - | |
393 | | - | |
394 | | - | |
395 | | - | |
396 | | - | |
397 | | - | |
398 | | - | |
399 | | - | |
400 | | - | |
| 371 | + | |
| 372 | + | |
| 373 | + | |
| 374 | + | |
| 375 | + | |
| 376 | + | |
401 | 377 | | |
402 | 378 | | |
403 | 379 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
8 | 8 | | |
9 | 9 | | |
10 | 10 | | |
| 11 | + | |
11 | 12 | | |
12 | | - | |
13 | | - | |
| 13 | + | |
14 | 14 | | |
15 | 15 | | |
16 | 16 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
66 | 66 | | |
67 | 67 | | |
68 | 68 | | |
| 69 | + | |
69 | 70 | | |
70 | | - | |
71 | 71 | | |
72 | | - | |
| 72 | + | |
| 73 | + | |
73 | 74 | | |
74 | | - | |
75 | | - | |
76 | | - | |
| 75 | + | |
| 76 | + | |
| 77 | + | |
77 | 78 | | |
78 | | - | |
79 | | - | |
80 | | - | |
| 79 | + | |
| 80 | + | |
81 | 81 | | |
82 | | - | |
83 | | - | |
84 | | - | |
| 82 | + | |
| 83 | + | |
| 84 | + | |
85 | 85 | | |
86 | | - | |
87 | | - | |
88 | | - | |
89 | | - | |
90 | | - | |
| 86 | + | |
| 87 | + | |
| 88 | + | |
| 89 | + | |
| 90 | + | |
| 91 | + | |
91 | 92 | | |
92 | | - | |
93 | | - | |
94 | | - | |
95 | | - | |
| 93 | + | |
96 | 94 | | |
| 95 | + | |
| 96 | + | |
97 | 97 | | |
98 | | - | |
| 98 | + | |
| 99 | + | |
| 100 | + | |
99 | 101 | | |
100 | | - | |
101 | | - | |
| 102 | + | |
| 103 | + | |
102 | 104 | | |
103 | | - | |
104 | | - | |
105 | 105 | | |
106 | 106 | | |
107 | | - | |
108 | | - | |
109 | | - | |
110 | | - | |
| 107 | + | |
| 108 | + | |
| 109 | + | |
111 | 110 | | |
112 | 111 | | |
113 | | - | |
114 | | - | |
115 | | - | |
| 112 | + | |
| 113 | + | |
| 114 | + | |
| 115 | + | |
116 | 116 | | |
117 | | - | |
118 | | - | |
| 117 | + | |
119 | 118 | | |
| 119 | + | |
120 | 120 | | |
121 | 121 | | |
122 | 122 | | |
| |||
125 | 125 | | |
126 | 126 | | |
127 | 127 | | |
128 | | - | |
129 | | - | |
| 128 | + | |
| 129 | + | |
130 | 130 | | |
131 | 131 | | |
132 | 132 | | |
| |||
0 commit comments