|
1 |
| -# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 5 |
2 |
| -# RUN: llc -mtriple=amdgcn -mcpu=gfx908 -verify-machineinstrs --start-before=greedy,2 --stop-after=greedy,2 %s -o - | FileCheck %s |
| 1 | +# RUN: not llc -mtriple=amdgcn -mcpu=gfx908 -verify-machineinstrs -start-before=greedy,1 -stop-after=virtregrewriter,2 -o - -verify-regalloc %s 2> %t.err | FileCheck %s |
| 2 | +# RUN: FileCheck -check-prefix=ERR %s < %t.err |
3 | 3 |
|
4 |
| -# Make sure there's no machine verifier error |
| 4 | +# Make sure there's no machine verifier error after failure. |
5 | 5 |
|
6 |
| -# If RA is unable to find a register to allocate, then cleanupFailedVReg will do ad-hoc rewriting and will insert undefs to make the LiveRanges workable. |
7 |
| -# %30:av_128 = COPY undef $vgpr0_vgpr1_vgpr2_vgpr3 is an example of such a rewrite / undef. If we were to want to spill %30, we should not be inserting |
8 |
| -# actual spill code, as the source operand is undef. |
9 |
| -# Check that there are no verfier issues with the LiveRange of $vgpr0_vgpr1_vgpr2_vgpr3 / that we do not insert spill code for %30. |
| 6 | +# ERR: error: inline assembly requires more registers than available |
| 7 | +# ERR: error: inline assembly requires more registers than available |
| 8 | +# ERR: error: inline assembly requires more registers than available |
| 9 | +# ERR: error: inline assembly requires more registers than available |
10 | 10 |
|
| 11 | +# This testcase cannot be compiled with the enforced register |
| 12 | +# budget. Previously, tryLastChanceRecoloring would assert here. It |
| 13 | +# was attempting to recolor a superregister with an overlapping |
| 14 | +# subregister over the same range. |
11 | 15 |
|
12 | 16 | --- |
|
13 |
| - define void @foo() #0 { |
| 17 | + define void @dead_copy() #0 { |
14 | 18 | ret void
|
15 | 19 | }
|
16 | 20 |
|
17 |
| - attributes #0 = { "amdgpu-waves-per-eu"="8,8" } |
| 21 | + define void @copy_kill() #0 { |
| 22 | + ret void |
| 23 | + } |
| 24 | + |
| 25 | + define void @copy_subreg() #0 { |
| 26 | + ret void |
| 27 | + } |
| 28 | + |
| 29 | + define void @copy_subreg2() #0 { |
| 30 | + ret void |
| 31 | + } |
| 32 | + |
| 33 | + attributes #0 = { "amdgpu-num-vgpr"="6" } |
| 34 | + |
| 35 | +... |
| 36 | + |
| 37 | +# CHECK-LABEL: name: dead_copy |
| 38 | +# CHECK: renamable $agpr0_agpr1_agpr2 = IMPLICIT_DEF |
| 39 | +# CHECK: dead renamable $vgpr0_vgpr1_vgpr2 = COPY renamable $agpr0_agpr1_agpr2 |
| 40 | + |
| 41 | +--- |
| 42 | +name: dead_copy |
| 43 | +tracksRegLiveness: true |
| 44 | +machineFunctionInfo: |
| 45 | + scratchRSrcReg: '$sgpr0_sgpr1_sgpr2_sgpr3' |
| 46 | + frameOffsetReg: '$sgpr33' |
| 47 | + stackPtrOffsetReg: '$sgpr32' |
| 48 | +body: | |
| 49 | + bb.0: |
| 50 | +
|
| 51 | + INLINEASM &"; def $0 $1 $2 $3 $4", 1 /* sideeffect attdialect */, 11534346 /* regdef:VReg_512 */, def %0:vreg_512, 10158090 /* regdef:VReg_256 */, def %1:vreg_256, 4784138 /* regdef:VReg_128 */, def %2:vreg_128, 3670026 /* regdef:VReg_96 */, def %3:vreg_96, 3670026 /* regdef:VReg_96 */, def %4:vreg_96 |
| 52 | + %5:vreg_96 = COPY %3 |
| 53 | + INLINEASM &"; use $0", 1 /* sideeffect attdialect */, 3670025 /* reguse:VReg_96 */, %3 |
| 54 | + SI_RETURN |
| 55 | +
|
| 56 | +... |
| 57 | + |
| 58 | + |
| 59 | +# CHECK-LABEL: name: copy_kill |
| 60 | +# CHECK: renamable $vgpr0_vgpr1_vgpr2 = IMPLICIT_DEF |
18 | 61 |
|
| 62 | +--- |
| 63 | +name: copy_kill |
| 64 | +tracksRegLiveness: true |
| 65 | +machineFunctionInfo: |
| 66 | + scratchRSrcReg: '$sgpr0_sgpr1_sgpr2_sgpr3' |
| 67 | + frameOffsetReg: '$sgpr33' |
| 68 | + stackPtrOffsetReg: '$sgpr32' |
| 69 | +body: | |
| 70 | + bb.0: |
| 71 | +
|
| 72 | + INLINEASM &"; def $0 $1 $2 $3 $4", 1 /* sideeffect attdialect */, 11534346 /* regdef:VReg_512 */, def %0:vreg_512, 10158090 /* regdef:VReg_256 */, def %1:vreg_256, 4784138 /* regdef:VReg_128 */, def %2:vreg_128, 3670026 /* regdef:VReg_96 */, def %3:vreg_96, 3670026 /* regdef:VReg_96 */, def %4:vreg_96 |
| 73 | + %5:vreg_96 = COPY %3 |
| 74 | + INLINEASM &"; use $0", 1 /* sideeffect attdialect */, 3670025 /* reguse:VReg_96 */, %5 |
| 75 | + SI_RETURN |
19 | 76 | ...
|
20 | 77 |
|
| 78 | +# CHECK-LABEL: name: copy_subreg |
| 79 | +# CHECK: renamable $vgpr1_vgpr2 = IMPLICIT_DEF |
| 80 | +# CHECK: renamable $vgpr0 = COPY renamable $vgpr1 |
21 | 81 | ---
|
22 |
| -name: foo |
| 82 | +name: copy_subreg |
23 | 83 | tracksRegLiveness: true
|
24 |
| -stack: |
25 |
| - - { id: 0, type: spill-slot, size: 32, alignment: 4 } |
26 | 84 | machineFunctionInfo:
|
27 |
| - maxKernArgAlign: 4 |
28 |
| - isEntryFunction: true |
29 |
| - waveLimiter: true |
30 |
| - scratchRSrcReg: '$sgpr96_sgpr97_sgpr98_sgpr99' |
| 85 | + scratchRSrcReg: '$sgpr0_sgpr1_sgpr2_sgpr3' |
| 86 | + frameOffsetReg: '$sgpr33' |
31 | 87 | stackPtrOffsetReg: '$sgpr32'
|
32 |
| - frameOffsetReg: '$sgpr33' |
33 |
| - hasSpilledVGPRs: true |
34 |
| - argumentInfo: |
35 |
| - privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
36 |
| - dispatchPtr: { reg: '$sgpr4_sgpr5' } |
37 |
| - kernargSegmentPtr: { reg: '$sgpr6_sgpr7' } |
38 |
| - workGroupIDX: { reg: '$sgpr8' } |
39 |
| - privateSegmentWaveByteOffset: { reg: '$sgpr9' } |
40 | 88 | body: |
|
41 | 89 | bb.0:
|
42 |
| - ; CHECK-LABEL: name: foo |
43 |
| - ; CHECK: INLINEASM &"; def $0 $1 $2 $3 $4", 1 /* sideeffect attdialect */, 10 /* regdef */, def %10, 10 /* regdef */, def %1, 10 /* regdef */, def %2, 10 /* regdef */, def $vgpr0_vgpr1_vgpr2_vgpr3, 10 /* regdef */, implicit-def $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15 |
44 |
| - ; CHECK-NEXT: [[COPY:%[0-9]+]]:av_128 = COPY undef $vgpr0_vgpr1_vgpr2_vgpr3 |
45 |
| - ; CHECK-NEXT: SI_SPILL_AV128_SAVE [[COPY]], %stack.2, $sgpr32, 0, implicit $exec :: (store (s128) into %stack.2, align 4, addrspace 5) |
46 |
| - ; CHECK-NEXT: SI_SPILL_AV160_SAVE %2, %stack.1, $sgpr32, 0, implicit $exec :: (store (s160) into %stack.1, align 4, addrspace 5) |
47 |
| - ; CHECK-NEXT: SI_SPILL_AV256_SAVE %1, %stack.3, $sgpr32, 0, implicit $exec :: (store (s256) into %stack.3, align 4, addrspace 5) |
48 |
| - ; CHECK-NEXT: [[COPY1:%[0-9]+]]:vreg_512 = COPY %10 |
49 |
| - ; CHECK-NEXT: SI_SPILL_V512_SAVE [[COPY1]], %stack.0, $sgpr32, 0, implicit $exec :: (store (s512) into %stack.0, align 4, addrspace 5) |
50 |
| - ; CHECK-NEXT: [[COPY2:%[0-9]+]]:vreg_512 = COPY $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15 |
51 |
| - ; CHECK-NEXT: SI_SPILL_V512_SAVE [[COPY2]], %stack.6, $sgpr32, 0, implicit $exec :: (store (s512) into %stack.6, align 4, addrspace 5) |
52 |
| - ; CHECK-NEXT: INLINEASM &"; clobber", 1 /* sideeffect attdialect */, 10 /* regdef */, implicit-def early-clobber $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7_vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15_vgpr16_vgpr17_vgpr18_vgpr19_vgpr20_vgpr21_vgpr22_vgpr23_vgpr24_vgpr25_vgpr26_vgpr27_vgpr28_vgpr29_vgpr30_vgpr31 |
53 |
| - ; CHECK-NEXT: [[SI_SPILL_V512_RESTORE:%[0-9]+]]:vreg_512 = SI_SPILL_V512_RESTORE %stack.6, $sgpr32, 0, implicit $exec :: (load (s512) from %stack.6, align 4, addrspace 5) |
54 |
| - ; CHECK-NEXT: $agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15_agpr16 = COPY [[SI_SPILL_V512_RESTORE]] |
55 |
| - ; CHECK-NEXT: [[SI_SPILL_V512_RESTORE1:%[0-9]+]]:vreg_512 = SI_SPILL_V512_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s512) from %stack.0, align 4, addrspace 5) |
56 |
| - ; CHECK-NEXT: SI_SPILL_V512_SAVE [[SI_SPILL_V512_RESTORE1]], %stack.4, $sgpr32, 0, implicit $exec :: (store (s512) into %stack.4, align 4, addrspace 5) |
57 |
| - ; CHECK-NEXT: [[SI_SPILL_AV256_RESTORE:%[0-9]+]]:vreg_256 = SI_SPILL_AV256_RESTORE %stack.3, $sgpr32, 0, implicit $exec :: (load (s256) from %stack.3, align 4, addrspace 5) |
58 |
| - ; CHECK-NEXT: SI_SPILL_V256_SAVE [[SI_SPILL_AV256_RESTORE]], %stack.5, $sgpr32, 0, implicit $exec :: (store (s256) into %stack.5, align 4, addrspace 5) |
59 |
| - ; CHECK-NEXT: [[SI_SPILL_AV160_RESTORE:%[0-9]+]]:vreg_160 = SI_SPILL_AV160_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s160) from %stack.1, align 4, addrspace 5) |
60 |
| - ; CHECK-NEXT: $vgpr0_vgpr1_vgpr2_vgpr3 = SI_SPILL_AV128_RESTORE %stack.2, $sgpr32, 0, implicit $exec :: (load (s128) from %stack.2, align 4, addrspace 5) |
61 |
| - ; CHECK-NEXT: [[SI_SPILL_AV512_RESTORE:%[0-9]+]]:av_512 = SI_SPILL_AV512_RESTORE %stack.4, $sgpr32, 0, implicit $exec :: (load (s512) from %stack.4, align 4, addrspace 5) |
62 |
| - ; CHECK-NEXT: [[SI_SPILL_V256_RESTORE:%[0-9]+]]:vreg_256 = SI_SPILL_V256_RESTORE %stack.5, $sgpr32, 0, implicit $exec :: (load (s256) from %stack.5, align 4, addrspace 5) |
63 |
| - ; CHECK-NEXT: INLINEASM &"; use $0 $1 $2 $3 $4", 1 /* sideeffect attdialect */, 9 /* reguse */, [[SI_SPILL_AV512_RESTORE]], 9 /* reguse */, [[SI_SPILL_V256_RESTORE]], 9 /* reguse */, [[SI_SPILL_AV160_RESTORE]], 9 /* reguse */, undef $vgpr0_vgpr1_vgpr2_vgpr3, 9 /* reguse */, $agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15_agpr16 |
64 |
| - ; CHECK-NEXT: SI_RETURN |
65 |
| - INLINEASM &"; def $0 $1 $2 $3 $4", 1 /* sideeffect attdialect */, 10, def %22:vreg_512, 10, def %25:vreg_256, 10, def %28:vreg_160, 10, def $vgpr0_vgpr1_vgpr2_vgpr3, 10, implicit-def $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15 |
66 |
| - %30:av_128 = COPY undef $vgpr0_vgpr1_vgpr2_vgpr3 |
67 |
| - %27:av_160 = COPY %28:vreg_160 |
68 |
| - %24:av_256 = COPY %25:vreg_256 |
69 |
| - SI_SPILL_V512_SAVE %22:vreg_512, %stack.0, $sgpr32, 0, implicit $exec :: (store (s512) into %stack.0, align 4, addrspace 5) |
70 |
| - %18:vreg_512 = COPY $agpr0_agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15 |
71 |
| - INLINEASM &"; clobber", 1 /* sideeffect attdialect */, 10, implicit-def early-clobber $vgpr0_vgpr1_vgpr2_vgpr3_vgpr4_vgpr5_vgpr6_vgpr7_vgpr8_vgpr9_vgpr10_vgpr11_vgpr12_vgpr13_vgpr14_vgpr15_vgpr16_vgpr17_vgpr18_vgpr19_vgpr20_vgpr21_vgpr22_vgpr23_vgpr24_vgpr25_vgpr26_vgpr27_vgpr28_vgpr29_vgpr30_vgpr31 |
72 |
| - $agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15_agpr16 = COPY %18:vreg_512 |
73 |
| - %23:vreg_512 = SI_SPILL_V512_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s512) from %stack.0, align 4, addrspace 5) |
74 |
| - %26:vreg_256 = COPY %24:av_256 |
75 |
| - %29:vreg_160 = COPY %27:av_160 |
76 |
| - $vgpr0_vgpr1_vgpr2_vgpr3 = COPY %30:av_128 |
77 |
| - INLINEASM &"; use $0 $1 $2 $3 $4", 1 /* sideeffect attdialect */, 9, %23:vreg_512, 9, %26:vreg_256, 9, %29:vreg_160, 9, undef $vgpr0_vgpr1_vgpr2_vgpr3, 9, $agpr1_agpr2_agpr3_agpr4_agpr5_agpr6_agpr7_agpr8_agpr9_agpr10_agpr11_agpr12_agpr13_agpr14_agpr15_agpr16 |
| 90 | +
|
| 91 | + INLINEASM &"; def $0 $1 $2 $3 $4", 1 /* sideeffect attdialect */, 11534346 /* regdef:VReg_512 */, def %0:vreg_512, 10158090 /* regdef:VReg_256 */, def %1:vreg_256, 4784138 /* regdef:VReg_128 */, def %2:vreg_128, 3670026 /* regdef:VReg_96 */, def %3:vreg_96, 3670026 /* regdef:VReg_96 */, def %4:vreg_96 |
| 92 | + %3.sub0 = COPY %3.sub1 |
| 93 | + INLINEASM &"; use $0", 1 /* sideeffect attdialect */, 3670025 /* reguse:VReg_96 */, %3 |
78 | 94 | SI_RETURN
|
| 95 | +... |
| 96 | + |
| 97 | +# CHECK-LABEL: name: copy_subreg2 |
| 98 | +# CHECK: renamable $vgpr0_vgpr1_vgpr2 = IMPLICIT_DEF |
79 | 99 |
|
| 100 | +--- |
| 101 | +name: copy_subreg2 |
| 102 | +tracksRegLiveness: true |
| 103 | +machineFunctionInfo: |
| 104 | + scratchRSrcReg: '$sgpr0_sgpr1_sgpr2_sgpr3' |
| 105 | + frameOffsetReg: '$sgpr33' |
| 106 | + stackPtrOffsetReg: '$sgpr32' |
| 107 | +body: | |
| 108 | + bb.0: |
| 109 | +
|
| 110 | + INLINEASM &"; def $0 $1 $2 $3 $4", 1 /* sideeffect attdialect */, 11534346 /* regdef:VReg_512 */, def %0:vreg_512, 10158090 /* regdef:VReg_256 */, def %1:vreg_256, 4784138 /* regdef:VReg_128 */, def %2:vreg_128, 3670026 /* regdef:VReg_96 */, def %3:vreg_96, 3670026 /* regdef:VReg_96 */, def %4:vreg_96 |
| 111 | + undef %5.sub0:vreg_96 = COPY %3.sub0 |
| 112 | + %5.sub1_sub2:vreg_96 = COPY %3.sub1_sub2 |
| 113 | + INLINEASM &"; use $0", 1 /* sideeffect attdialect */, 3670025 /* reguse:VReg_96 */, %5 |
| 114 | + SI_RETURN |
80 | 115 | ...
|
0 commit comments