You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
317 lines
11 KiB
317 lines
11 KiB
# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
|
|
# RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -run-pass=amdgpu-postlegalizer-combiner -verify-machineinstrs %s -o - | FileCheck %s
|
|
|
|
# A 1-byte G_ZEXTLOAD widened to s32 is ANDed with the constant 255.
# The CHECK lines expect the G_AND and its mask constant to disappear, with
# $vgpr0 copied directly from %load (presumably because the zero-extending
# byte load already leaves every bit above bit 7 clear).
---
|
|
name: remove_and_255_zextload
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1
|
|
; CHECK-LABEL: name: remove_and_255_zextload
|
|
; CHECK: liveins: $vgpr0_vgpr1
|
|
; CHECK: %ptr:_(p1) = COPY $vgpr0_vgpr1
|
|
; CHECK: %load:_(s32) = G_ZEXTLOAD %ptr(p1) :: (load 1, addrspace 1)
|
|
; CHECK: $vgpr0 = COPY %load(s32)
|
|
%ptr:_(p1) = COPY $vgpr0_vgpr1
|
|
%load:_(s32) = G_ZEXTLOAD %ptr :: (load 1, addrspace 1, align 1)
|
|
%mask:_(s32) = G_CONSTANT i32 255
|
|
%and:_(s32) = G_AND %load, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# G_SMIN of two 1-byte G_ZEXTLOAD results, then G_AND with 255.
# Both G_SMIN operands are zero-extended byte loads; the CHECK lines expect
# the G_AND and its mask constant to be removed and $vgpr0 to be copied
# directly from %smin.
---
|
|
name: remove_and_255_smin_zextload
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK-LABEL: name: remove_and_255_smin_zextload
|
|
; CHECK: liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK: %ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
; CHECK: %ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
; CHECK: %load0:_(s32) = G_ZEXTLOAD %ptr0(p1) :: (load 1, addrspace 1)
|
|
; CHECK: %load1:_(s32) = G_ZEXTLOAD %ptr1(p1) :: (load 1, addrspace 1)
|
|
; CHECK: %smin:_(s32) = G_SMIN %load0, %load1
|
|
; CHECK: $vgpr0 = COPY %smin(s32)
|
|
%ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
%ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
%load0:_(s32) = G_ZEXTLOAD %ptr0 :: (load 1, addrspace 1, align 1)
|
|
%load1:_(s32) = G_ZEXTLOAD %ptr1 :: (load 1, addrspace 1, align 1)
|
|
%smin:_(s32) = G_SMIN %load0, %load1
|
|
%mask:_(s32) = G_CONSTANT i32 255
|
|
%and:_(s32) = G_AND %smin, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# G_SMAX of two 1-byte G_ZEXTLOAD results, then G_AND with 255.
# Same shape as the G_SMIN variant: the CHECK lines expect the G_AND and its
# mask constant to be removed and $vgpr0 to be copied directly from %smax.
---
|
|
name: remove_and_255_smax_zextload
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK-LABEL: name: remove_and_255_smax_zextload
|
|
; CHECK: liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK: %ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
; CHECK: %ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
; CHECK: %load0:_(s32) = G_ZEXTLOAD %ptr0(p1) :: (load 1, addrspace 1)
|
|
; CHECK: %load1:_(s32) = G_ZEXTLOAD %ptr1(p1) :: (load 1, addrspace 1)
|
|
; CHECK: %smax:_(s32) = G_SMAX %load0, %load1
|
|
; CHECK: $vgpr0 = COPY %smax(s32)
|
|
%ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
%ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
%load0:_(s32) = G_ZEXTLOAD %ptr0 :: (load 1, addrspace 1, align 1)
|
|
%load1:_(s32) = G_ZEXTLOAD %ptr1 :: (load 1, addrspace 1, align 1)
|
|
%smax:_(s32) = G_SMAX %load0, %load1
|
|
%mask:_(s32) = G_CONSTANT i32 255
|
|
%and:_(s32) = G_AND %smax, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# G_UMIN of two 1-byte G_ZEXTLOAD results, then G_AND with 255.
# Unsigned counterpart of the G_SMIN test: the CHECK lines expect the G_AND
# and its mask constant to be removed and $vgpr0 to be copied directly from
# %umin.
---
|
|
name: remove_and_255_umin_zextload
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK-LABEL: name: remove_and_255_umin_zextload
|
|
; CHECK: liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK: %ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
; CHECK: %ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
; CHECK: %load0:_(s32) = G_ZEXTLOAD %ptr0(p1) :: (load 1, addrspace 1)
|
|
; CHECK: %load1:_(s32) = G_ZEXTLOAD %ptr1(p1) :: (load 1, addrspace 1)
|
|
; CHECK: %umin:_(s32) = G_UMIN %load0, %load1
|
|
; CHECK: $vgpr0 = COPY %umin(s32)
|
|
%ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
%ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
%load0:_(s32) = G_ZEXTLOAD %ptr0 :: (load 1, addrspace 1, align 1)
|
|
%load1:_(s32) = G_ZEXTLOAD %ptr1 :: (load 1, addrspace 1, align 1)
|
|
%umin:_(s32) = G_UMIN %load0, %load1
|
|
%mask:_(s32) = G_CONSTANT i32 255
|
|
%and:_(s32) = G_AND %umin, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# G_UMAX of two 1-byte G_ZEXTLOAD results, then G_AND with 255.
# Unsigned counterpart of the G_SMAX test: the CHECK lines expect the G_AND
# and its mask constant to be removed and $vgpr0 to be copied directly from
# %umax.
---
|
|
name: remove_and_255_umax_zextload
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK-LABEL: name: remove_and_255_umax_zextload
|
|
; CHECK: liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK: %ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
; CHECK: %ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
; CHECK: %load0:_(s32) = G_ZEXTLOAD %ptr0(p1) :: (load 1, addrspace 1)
|
|
; CHECK: %load1:_(s32) = G_ZEXTLOAD %ptr1(p1) :: (load 1, addrspace 1)
|
|
; CHECK: %umax:_(s32) = G_UMAX %load0, %load1
|
|
; CHECK: $vgpr0 = COPY %umax(s32)
|
|
%ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
%ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
%load0:_(s32) = G_ZEXTLOAD %ptr0 :: (load 1, addrspace 1, align 1)
|
|
%load1:_(s32) = G_ZEXTLOAD %ptr1 :: (load 1, addrspace 1, align 1)
|
|
%umax:_(s32) = G_UMAX %load0, %load1
|
|
%mask:_(s32) = G_CONSTANT i32 255
|
|
%and:_(s32) = G_AND %umax, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# Negative test: there are not enough known bits for the lhs of the G_SMIN.
# Here %load0 (the first G_SMIN operand) is a plain 4-byte G_LOAD instead of a
# 1-byte G_ZEXTLOAD, while %load1 is still a 1-byte G_ZEXTLOAD. The CHECK
# lines expect the G_AND with 255 and its mask constant to be kept.
|
|
---
|
|
name: remove_and_255_smin_fail_lhs
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK-LABEL: name: remove_and_255_smin_fail_lhs
|
|
; CHECK: liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK: %ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
; CHECK: %ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
; CHECK: %load0:_(s32) = G_LOAD %ptr0(p1) :: (load 4, addrspace 1)
|
|
; CHECK: %load1:_(s32) = G_ZEXTLOAD %ptr1(p1) :: (load 1, addrspace 1)
|
|
; CHECK: %smin:_(s32) = G_SMIN %load0, %load1
|
|
; CHECK: %mask:_(s32) = G_CONSTANT i32 255
|
|
; CHECK: %and:_(s32) = G_AND %smin, %mask
|
|
; CHECK: $vgpr0 = COPY %and(s32)
|
|
%ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
%ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
%load0:_(s32) = G_LOAD %ptr0 :: (load 4, addrspace 1, align 4)
|
|
%load1:_(s32) = G_ZEXTLOAD %ptr1 :: (load 1, addrspace 1, align 1)
|
|
%smin:_(s32) = G_SMIN %load0, %load1
|
|
%mask:_(s32) = G_CONSTANT i32 255
|
|
%and:_(s32) = G_AND %smin, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# Negative test: there are not enough known bits for the rhs of the G_SMIN.
# Here %load1 (the second G_SMIN operand) is a plain 4-byte G_LOAD instead of
# a 1-byte G_ZEXTLOAD, while %load0 is still a 1-byte G_ZEXTLOAD. The CHECK
# lines expect the G_AND with 255 and its mask constant to be kept.
|
|
---
|
|
name: remove_and_255_smin_fail_rhs
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK-LABEL: name: remove_and_255_smin_fail_rhs
|
|
; CHECK: liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
|
|
; CHECK: %ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
; CHECK: %ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
; CHECK: %load0:_(s32) = G_ZEXTLOAD %ptr0(p1) :: (load 1, addrspace 1)
|
|
; CHECK: %load1:_(s32) = G_LOAD %ptr1(p1) :: (load 4, addrspace 1)
|
|
; CHECK: %smin:_(s32) = G_SMIN %load0, %load1
|
|
; CHECK: %mask:_(s32) = G_CONSTANT i32 255
|
|
; CHECK: %and:_(s32) = G_AND %smin, %mask
|
|
; CHECK: $vgpr0 = COPY %and(s32)
|
|
%ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
%ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
%load0:_(s32) = G_ZEXTLOAD %ptr0 :: (load 1, addrspace 1, align 1)
|
|
%load1:_(s32) = G_LOAD %ptr1 :: (load 4, addrspace 1, align 4)
|
|
%smin:_(s32) = G_SMIN %load0, %load1
|
|
%mask:_(s32) = G_CONSTANT i32 255
|
|
%and:_(s32) = G_AND %smin, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# Test that the known bits for groupstaticsize are bounded by the maximum LDS
# size.
# This case ANDs the intrinsic result with 65535 (0xffff, the low 16 bits).
# NOTE(review): despite the "remove_and_" prefix in the test name, the CHECK
# lines expect the G_AND and its mask constant to be KEPT here; compare
# remove_and_131071_groupstaticsize, where the G_AND is expected to be
# removed. Confirm whether the name should carry a "no_" prefix (the
# CHECK-LABEL would have to change with it).
# %ptr is defined but not used by any later instruction, and it does not
# appear in the CHECK lines.
|
|
---
|
|
name: remove_and_65535_groupstaticsize
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1
|
|
; CHECK-LABEL: name: remove_and_65535_groupstaticsize
|
|
; CHECK: liveins: $vgpr0_vgpr1
|
|
; CHECK: %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
|
|
; CHECK: %mask:_(s32) = G_CONSTANT i32 65535
|
|
; CHECK: %and:_(s32) = G_AND %lds_size, %mask
|
|
; CHECK: $vgpr0 = COPY %and(s32)
|
|
%ptr:_(p1) = COPY $vgpr0_vgpr1
|
|
%lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
|
|
%mask:_(s32) = G_CONSTANT i32 65535
|
|
%and:_(s32) = G_AND %lds_size, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# groupstaticsize ANDed with 131071 (0x1ffff, the low 17 bits).
# The CHECK lines expect the G_AND and its mask constant to be removed and
# $vgpr0 to be copied directly from %lds_size.
# %ptr is defined but not used by any later instruction, and it does not
# appear in the CHECK lines.
---
|
|
name: remove_and_131071_groupstaticsize
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1
|
|
; CHECK-LABEL: name: remove_and_131071_groupstaticsize
|
|
; CHECK: liveins: $vgpr0_vgpr1
|
|
; CHECK: %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
|
|
; CHECK: $vgpr0 = COPY %lds_size(s32)
|
|
%ptr:_(p1) = COPY $vgpr0_vgpr1
|
|
%lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
|
|
%mask:_(s32) = G_CONSTANT i32 131071
|
|
%and:_(s32) = G_AND %lds_size, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# Negative test: groupstaticsize ANDed with 65536 (0x10000, only bit 16 set).
# The constant is a single bit rather than a run of low bits; the CHECK lines
# expect the G_AND and its mask constant to be kept.
# %ptr is defined but not used by any later instruction, and it does not
# appear in the CHECK lines.
---
|
|
name: no_remove_and_65536_groupstaticsize
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1
|
|
; CHECK-LABEL: name: no_remove_and_65536_groupstaticsize
|
|
; CHECK: liveins: $vgpr0_vgpr1
|
|
; CHECK: %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
|
|
; CHECK: %mask:_(s32) = G_CONSTANT i32 65536
|
|
; CHECK: %and:_(s32) = G_AND %lds_size, %mask
|
|
; CHECK: $vgpr0 = COPY %and(s32)
|
|
%ptr:_(p1) = COPY $vgpr0_vgpr1
|
|
%lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
|
|
%mask:_(s32) = G_CONSTANT i32 65536
|
|
%and:_(s32) = G_AND %lds_size, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# Negative test: groupstaticsize ANDed with 32767 (0x7fff, the low 15 bits).
# The CHECK lines expect the G_AND and its mask constant to be kept.
# %ptr is defined but not used by any later instruction, and it does not
# appear in the CHECK lines.
---
|
|
name: no_remove_and_32767_groupstaticsize
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1
|
|
; CHECK-LABEL: name: no_remove_and_32767_groupstaticsize
|
|
; CHECK: liveins: $vgpr0_vgpr1
|
|
; CHECK: %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
|
|
; CHECK: %mask:_(s32) = G_CONSTANT i32 32767
|
|
; CHECK: %and:_(s32) = G_AND %lds_size, %mask
|
|
; CHECK: $vgpr0 = COPY %and(s32)
|
|
%ptr:_(p1) = COPY $vgpr0_vgpr1
|
|
%lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
|
|
%mask:_(s32) = G_CONSTANT i32 32767
|
|
%and:_(s32) = G_AND %lds_size, %mask
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# For G_UMIN, the number of known bits can be concluded from only one operand.
# Here one G_UMIN operand is the constant 255 and the other (%val) is a plain
# copy of $vgpr4. The result is then ANDed with the same %k255 constant; the
# CHECK lines expect that G_AND to be removed while %k255 stays alive as a
# G_UMIN operand.
# NOTE(review): the constant is the second (rhs) operand of G_UMIN in this
# test even though the name says "lhs_only"; confirm the intended naming
# against the sibling remove_and_umin_rhs_only.
# %ptr0 and %ptr1 are defined but not used by any later instruction, and they
# do not appear in the CHECK lines.
|
|
---
|
|
name: remove_and_umin_lhs_only
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1, $vgpr2_vgpr3, $vgpr4
|
|
|
|
; CHECK-LABEL: name: remove_and_umin_lhs_only
|
|
; CHECK: liveins: $vgpr0_vgpr1, $vgpr2_vgpr3, $vgpr4
|
|
; CHECK: %val:_(s32) = COPY $vgpr4
|
|
; CHECK: %k255:_(s32) = G_CONSTANT i32 255
|
|
; CHECK: %umin0:_(s32) = G_UMIN %val, %k255
|
|
; CHECK: $vgpr0 = COPY %umin0(s32)
|
|
%ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
%ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
%val:_(s32) = COPY $vgpr4
|
|
%k255:_(s32) = G_CONSTANT i32 255
|
|
%umin0:_(s32) = G_UMIN %val, %k255
|
|
%and:_(s32) = G_AND %umin0, %k255
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|
|
|
|
# Operand-swapped variant of the one-known-operand G_UMIN test.
# Here the constant 255 is the first G_UMIN operand and %val (a plain copy of
# $vgpr4) is the second. The result is ANDed with the same %k255 constant;
# the CHECK lines expect that G_AND to be removed while %k255 stays alive as a
# G_UMIN operand.
# NOTE(review): the constant is the first (lhs) operand of G_UMIN in this test
# even though the name says "rhs_only"; confirm the intended naming.
# %ptr0 and %ptr1 are defined but not used by any later instruction, and they
# do not appear in the CHECK lines.
---
|
|
name: remove_and_umin_rhs_only
|
|
legalized: true
|
|
tracksRegLiveness: true
|
|
body: |
|
|
bb.0:
|
|
liveins: $vgpr0_vgpr1, $vgpr2_vgpr3, $vgpr4
|
|
|
|
; CHECK-LABEL: name: remove_and_umin_rhs_only
|
|
; CHECK: liveins: $vgpr0_vgpr1, $vgpr2_vgpr3, $vgpr4
|
|
; CHECK: %val:_(s32) = COPY $vgpr4
|
|
; CHECK: %k255:_(s32) = G_CONSTANT i32 255
|
|
; CHECK: %umin0:_(s32) = G_UMIN %k255, %val
|
|
; CHECK: $vgpr0 = COPY %umin0(s32)
|
|
%ptr0:_(p1) = COPY $vgpr0_vgpr1
|
|
%ptr1:_(p1) = COPY $vgpr2_vgpr3
|
|
%val:_(s32) = COPY $vgpr4
|
|
%k255:_(s32) = G_CONSTANT i32 255
|
|
%umin0:_(s32) = G_UMIN %k255, %val
|
|
%and:_(s32) = G_AND %umin0, %k255
|
|
$vgpr0 = COPY %and
|
|
|
|
...
|