277 lines
10 KiB
LLVM
277 lines
10 KiB
LLVM
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
|
||
|
; RUN: opt -S -instcombine %s -o - | FileCheck %s
|
||
|
target datalayout = "e-p:32:32:32-p1:64:64:64-p2:8:8:8-p3:16:16:16-p4:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:32"
|
||
|
|
||
|
@g = addrspace(3) global i32 89
|
||
|
|
||
|
@const_zero_i8_as1 = addrspace(1) constant i8 0
|
||
|
@const_zero_i32_as1 = addrspace(1) constant i32 0
|
||
|
|
||
|
@const_zero_i8_as2 = addrspace(2) constant i8 0
|
||
|
@const_zero_i32_as2 = addrspace(2) constant i32 0
|
||
|
|
||
|
@const_zero_i8_as3 = addrspace(3) constant i8 0
|
||
|
@const_zero_i32_as3 = addrspace(3) constant i32 0
|
||
|
|
||
|
; Test constant folding of inttoptr (ptrtoint constantexpr)
|
||
|
; The intermediate integer size is the same as the pointer size
|
||
|
define i32 addrspace(3)* @test_constant_fold_inttoptr_as_pointer_same_size() {
|
||
|
; CHECK-LABEL: @test_constant_fold_inttoptr_as_pointer_same_size(
|
||
|
; CHECK-NEXT: ret i32 addrspace(3)* @const_zero_i32_as3
|
||
|
;
|
||
|
%x = ptrtoint i32 addrspace(3)* @const_zero_i32_as3 to i32
|
||
|
%y = inttoptr i32 %x to i32 addrspace(3)*
|
||
|
ret i32 addrspace(3)* %y
|
||
|
}
|
||
|
|
||
|
; The intermediate integer size is larger than the pointer size
|
||
|
define i32 addrspace(2)* @test_constant_fold_inttoptr_as_pointer_smaller() {
|
||
|
; CHECK-LABEL: @test_constant_fold_inttoptr_as_pointer_smaller(
|
||
|
; CHECK-NEXT: ret i32 addrspace(2)* @const_zero_i32_as2
|
||
|
;
|
||
|
%x = ptrtoint i32 addrspace(2)* @const_zero_i32_as2 to i16
|
||
|
%y = inttoptr i16 %x to i32 addrspace(2)*
|
||
|
ret i32 addrspace(2)* %y
|
||
|
}
|
||
|
|
||
|
; Different address spaces that are the same size, but they are
|
||
|
; different so nothing should happen
|
||
|
define i32 addrspace(4)* @test_constant_fold_inttoptr_as_pointer_smaller_different_as() {
|
||
|
; CHECK-LABEL: @test_constant_fold_inttoptr_as_pointer_smaller_different_as(
|
||
|
; CHECK-NEXT: ret i32 addrspace(4)* inttoptr (i16 ptrtoint (i32 addrspace(3)* @const_zero_i32_as3 to i16) to i32 addrspace(4)*)
|
||
|
;
|
||
|
%x = ptrtoint i32 addrspace(3)* @const_zero_i32_as3 to i16
|
||
|
%y = inttoptr i16 %x to i32 addrspace(4)*
|
||
|
ret i32 addrspace(4)* %y
|
||
|
}
|
||
|
|
||
|
; Make sure we don't introduce a bitcast between different sized
|
||
|
; address spaces when folding this
|
||
|
define i32 addrspace(2)* @test_constant_fold_inttoptr_as_pointer_smaller_different_size_as() {
|
||
|
; CHECK-LABEL: @test_constant_fold_inttoptr_as_pointer_smaller_different_size_as(
|
||
|
; CHECK-NEXT: ret i32 addrspace(2)* inttoptr (i32 ptrtoint (i32 addrspace(3)* @const_zero_i32_as3 to i32) to i32 addrspace(2)*)
|
||
|
;
|
||
|
%x = ptrtoint i32 addrspace(3)* @const_zero_i32_as3 to i32
|
||
|
%y = inttoptr i32 %x to i32 addrspace(2)*
|
||
|
ret i32 addrspace(2)* %y
|
||
|
}
|
||
|
|
||
|
; The intermediate integer size is too small, nothing should happen
|
||
|
define i32 addrspace(3)* @test_constant_fold_inttoptr_as_pointer_larger() {
|
||
|
; CHECK-LABEL: @test_constant_fold_inttoptr_as_pointer_larger(
|
||
|
; CHECK-NEXT: ret i32 addrspace(3)* inttoptr (i8 ptrtoint (i32 addrspace(3)* @const_zero_i32_as3 to i8) to i32 addrspace(3)*)
|
||
|
;
|
||
|
%x = ptrtoint i32 addrspace(3)* @const_zero_i32_as3 to i8
|
||
|
%y = inttoptr i8 %x to i32 addrspace(3)*
|
||
|
ret i32 addrspace(3)* %y
|
||
|
}
|
||
|
|
||
|
define i8 @const_fold_ptrtoint() {
|
||
|
; CHECK-LABEL: @const_fold_ptrtoint(
|
||
|
; CHECK-NEXT: ret i8 4
|
||
|
;
|
||
|
ret i8 ptrtoint (i32 addrspace(2)* inttoptr (i4 4 to i32 addrspace(2)*) to i8)
|
||
|
}
|
||
|
|
||
|
; Test that mask happens when the destination pointer is smaller than
|
||
|
; the original
|
||
|
define i8 @const_fold_ptrtoint_mask() {
|
||
|
; CHECK-LABEL: @const_fold_ptrtoint_mask(
|
||
|
; CHECK-NEXT: ret i8 1
|
||
|
;
|
||
|
ret i8 ptrtoint (i32 addrspace(3)* inttoptr (i32 257 to i32 addrspace(3)*) to i8)
|
||
|
}
|
||
|
|
||
|
; Address space 0 is too small for the correct mask, should mask with
|
||
|
; 64-bits instead of 32
|
||
|
define i64 @const_fold_ptrtoint_mask_small_as0() {
|
||
|
; CHECK-LABEL: @const_fold_ptrtoint_mask_small_as0(
|
||
|
; CHECK-NEXT: ret i64 -1
|
||
|
;
|
||
|
ret i64 ptrtoint (i32 addrspace(1)* inttoptr (i128 -1 to i32 addrspace(1)*) to i64)
|
||
|
}
|
||
|
|
||
|
define i32 addrspace(3)* @const_inttoptr() {
|
||
|
; CHECK-LABEL: @const_inttoptr(
|
||
|
; CHECK-NEXT: ret i32 addrspace(3)* inttoptr (i16 4 to i32 addrspace(3)*)
|
||
|
;
|
||
|
%p = inttoptr i16 4 to i32 addrspace(3)*
|
||
|
ret i32 addrspace(3)* %p
|
||
|
}
|
||
|
|
||
|
define i16 @const_ptrtoint() {
|
||
|
; CHECK-LABEL: @const_ptrtoint(
|
||
|
; CHECK-NEXT: ret i16 ptrtoint (i32 addrspace(3)* @g to i16)
|
||
|
;
|
||
|
%i = ptrtoint i32 addrspace(3)* @g to i16
|
||
|
ret i16 %i
|
||
|
}
|
||
|
|
||
|
define i16 @const_inttoptr_ptrtoint() {
|
||
|
; CHECK-LABEL: @const_inttoptr_ptrtoint(
|
||
|
; CHECK-NEXT: ret i16 9
|
||
|
;
|
||
|
ret i16 ptrtoint (i32 addrspace(3)* inttoptr (i16 9 to i32 addrspace(3)*) to i16)
|
||
|
}
|
||
|
|
||
|
define i1 @constant_fold_cmp_constantexpr_inttoptr() {
|
||
|
; CHECK-LABEL: @constant_fold_cmp_constantexpr_inttoptr(
|
||
|
; CHECK-NEXT: ret i1 true
|
||
|
;
|
||
|
%x = icmp eq i32 addrspace(3)* inttoptr (i16 0 to i32 addrspace(3)*), null
|
||
|
ret i1 %x
|
||
|
}
|
||
|
|
||
|
define i1 @constant_fold_inttoptr_null(i16 %i) {
|
||
|
; CHECK-LABEL: @constant_fold_inttoptr_null(
|
||
|
; CHECK-NEXT: ret i1 false
|
||
|
;
|
||
|
%x = icmp eq i32 addrspace(3)* inttoptr (i16 99 to i32 addrspace(3)*), inttoptr (i16 0 to i32 addrspace(3)*)
|
||
|
ret i1 %x
|
||
|
}
|
||
|
|
||
|
define i1 @constant_fold_ptrtoint_null() {
|
||
|
; CHECK-LABEL: @constant_fold_ptrtoint_null(
|
||
|
; CHECK-NEXT: ret i1 icmp eq (i32 addrspace(3)* @g, i32 addrspace(3)* null)
|
||
|
;
|
||
|
%x = icmp eq i16 ptrtoint (i32 addrspace(3)* @g to i16), ptrtoint (i32 addrspace(3)* null to i16)
|
||
|
ret i1 %x
|
||
|
}
|
||
|
|
||
|
define i1 @constant_fold_ptrtoint_null_2() {
|
||
|
; CHECK-LABEL: @constant_fold_ptrtoint_null_2(
|
||
|
; CHECK-NEXT: ret i1 icmp eq (i32 addrspace(3)* @g, i32 addrspace(3)* null)
|
||
|
;
|
||
|
%x = icmp eq i16 ptrtoint (i32 addrspace(3)* null to i16), ptrtoint (i32 addrspace(3)* @g to i16)
|
||
|
ret i1 %x
|
||
|
}
|
||
|
|
||
|
define i1 @constant_fold_ptrtoint() {
|
||
|
; CHECK-LABEL: @constant_fold_ptrtoint(
|
||
|
; CHECK-NEXT: ret i1 true
|
||
|
;
|
||
|
%x = icmp eq i16 ptrtoint (i32 addrspace(3)* @g to i16), ptrtoint (i32 addrspace(3)* @g to i16)
|
||
|
ret i1 %x
|
||
|
}
|
||
|
|
||
|
define i1 @constant_fold_inttoptr() {
|
||
|
; CHECK-LABEL: @constant_fold_inttoptr(
|
||
|
; CHECK-NEXT: ret i1 false
|
||
|
;
|
||
|
%x = icmp eq i32 addrspace(3)* inttoptr (i16 99 to i32 addrspace(3)*), inttoptr (i16 27 to i32 addrspace(3)*)
|
||
|
ret i1 %x
|
||
|
}
|
||
|
|
||
|
@g_float_as3 = addrspace(3) global float zeroinitializer
|
||
|
@g_v4f_as3 = addrspace(3) global <4 x float> zeroinitializer
|
||
|
|
||
|
define float @constant_fold_bitcast_ftoi_load() {
|
||
|
; CHECK-LABEL: @constant_fold_bitcast_ftoi_load(
|
||
|
; CHECK-NEXT: [[A:%.*]] = load float, float addrspace(3)* bitcast (i32 addrspace(3)* @g to float addrspace(3)*), align 4
|
||
|
; CHECK-NEXT: ret float [[A]]
|
||
|
;
|
||
|
%a = load float, float addrspace(3)* bitcast (i32 addrspace(3)* @g to float addrspace(3)*), align 4
|
||
|
ret float %a
|
||
|
}
|
||
|
|
||
|
define i32 @constant_fold_bitcast_itof_load() {
|
||
|
; CHECK-LABEL: @constant_fold_bitcast_itof_load(
|
||
|
; CHECK-NEXT: [[A:%.*]] = load i32, i32 addrspace(3)* bitcast (float addrspace(3)* @g_float_as3 to i32 addrspace(3)*), align 4
|
||
|
; CHECK-NEXT: ret i32 [[A]]
|
||
|
;
|
||
|
%a = load i32, i32 addrspace(3)* bitcast (float addrspace(3)* @g_float_as3 to i32 addrspace(3)*), align 4
|
||
|
ret i32 %a
|
||
|
}
|
||
|
|
||
|
define <4 x float> @constant_fold_bitcast_vector_as() {
|
||
|
; CHECK-LABEL: @constant_fold_bitcast_vector_as(
|
||
|
; CHECK-NEXT: [[A:%.*]] = load <4 x float>, <4 x float> addrspace(3)* @g_v4f_as3, align 16
|
||
|
; CHECK-NEXT: ret <4 x float> [[A]]
|
||
|
;
|
||
|
%a = load <4 x float>, <4 x float> addrspace(3)* bitcast (<4 x i32> addrspace(3)* bitcast (<4 x float> addrspace(3)* @g_v4f_as3 to <4 x i32> addrspace(3)*) to <4 x float> addrspace(3)*), align 4
|
||
|
ret <4 x float> %a
|
||
|
}
|
||
|
|
||
|
@i32_array_as3 = addrspace(3) global [10 x i32] zeroinitializer
|
||
|
|
||
|
define i32 @test_cast_gep_small_indices_as() {
|
||
|
; CHECK-LABEL: @test_cast_gep_small_indices_as(
|
||
|
; CHECK-NEXT: [[X:%.*]] = load i32, i32 addrspace(3)* getelementptr inbounds ([10 x i32], [10 x i32] addrspace(3)* @i32_array_as3, i16 0, i16 0), align 16
|
||
|
; CHECK-NEXT: ret i32 [[X]]
|
||
|
;
|
||
|
%p = getelementptr [10 x i32], [10 x i32] addrspace(3)* @i32_array_as3, i7 0, i7 0
|
||
|
%x = load i32, i32 addrspace(3)* %p, align 4
|
||
|
ret i32 %x
|
||
|
}
|
||
|
|
||
|
%struct.foo = type { float, float, [4 x i32], i32 addrspace(3)* }
|
||
|
|
||
|
@constant_fold_global_ptr = addrspace(3) global %struct.foo {
|
||
|
float 0.0,
|
||
|
float 0.0,
|
||
|
[4 x i32] zeroinitializer,
|
||
|
i32 addrspace(3)* getelementptr ([10 x i32], [10 x i32] addrspace(3)* @i32_array_as3, i64 0, i64 0)
|
||
|
}
|
||
|
|
||
|
define i32 @test_cast_gep_large_indices_as() {
|
||
|
; CHECK-LABEL: @test_cast_gep_large_indices_as(
|
||
|
; CHECK-NEXT: [[X:%.*]] = load i32, i32 addrspace(3)* getelementptr inbounds ([10 x i32], [10 x i32] addrspace(3)* @i32_array_as3, i16 0, i16 0), align 16
|
||
|
; CHECK-NEXT: ret i32 [[X]]
|
||
|
;
|
||
|
%p = getelementptr [10 x i32], [10 x i32] addrspace(3)* @i32_array_as3, i64 0, i64 0
|
||
|
%x = load i32, i32 addrspace(3)* %p, align 4
|
||
|
ret i32 %x
|
||
|
}
|
||
|
|
||
|
define i32 @test_constant_cast_gep_struct_indices_as() {
|
||
|
; CHECK-LABEL: @test_constant_cast_gep_struct_indices_as(
|
||
|
; CHECK-NEXT: [[Y:%.*]] = load i32, i32 addrspace(3)* getelementptr inbounds (%struct.foo, [[STRUCT_FOO:%.*]] addrspace(3)* @constant_fold_global_ptr, i16 0, i32 2, i16 2), align 16
|
||
|
; CHECK-NEXT: ret i32 [[Y]]
|
||
|
;
|
||
|
%x = getelementptr %struct.foo, %struct.foo addrspace(3)* @constant_fold_global_ptr, i18 0, i32 2, i12 2
|
||
|
%y = load i32, i32 addrspace(3)* %x, align 4
|
||
|
ret i32 %y
|
||
|
}
|
||
|
|
||
|
@constant_data_as3 = addrspace(3) constant [5 x i32] [i32 1, i32 2, i32 3, i32 4, i32 5]
|
||
|
|
||
|
define i32 @test_read_data_from_global_as3() {
|
||
|
; CHECK-LABEL: @test_read_data_from_global_as3(
|
||
|
; CHECK-NEXT: ret i32 2
|
||
|
;
|
||
|
%x = getelementptr [5 x i32], [5 x i32] addrspace(3)* @constant_data_as3, i32 0, i32 1
|
||
|
%y = load i32, i32 addrspace(3)* %x, align 4
|
||
|
ret i32 %y
|
||
|
}
|
||
|
|
||
|
@a = addrspace(1) constant i32 9
|
||
|
@b = addrspace(1) constant i32 23
|
||
|
@c = addrspace(1) constant i32 34
|
||
|
@d = addrspace(1) constant i32 99
|
||
|
|
||
|
@ptr_array = addrspace(2) constant [4 x i32 addrspace(1)*] [ i32 addrspace(1)* @a, i32 addrspace(1)* @b, i32 addrspace(1)* @c, i32 addrspace(1)* @d]
|
||
|
@indirect = addrspace(0) constant i32 addrspace(1)* addrspace(2)* getelementptr inbounds ([4 x i32 addrspace(1)*], [4 x i32 addrspace(1)*] addrspace(2)* @ptr_array, i1 0, i32 2)
|
||
|
|
||
|
define i32 @constant_through_array_as_ptrs() {
|
||
|
; CHECK-LABEL: @constant_through_array_as_ptrs(
|
||
|
; CHECK-NEXT: ret i32 34
|
||
|
;
|
||
|
%p = load i32 addrspace(1)* addrspace(2)*, i32 addrspace(1)* addrspace(2)* addrspace(0)* @indirect, align 4
|
||
|
%a = load i32 addrspace(1)*, i32 addrspace(1)* addrspace(2)* %p, align 4
|
||
|
%b = load i32, i32 addrspace(1)* %a, align 4
|
||
|
ret i32 %b
|
||
|
}
|
||
|
|
||
|
@shared_mem = external addrspace(3) global [0 x i8]
|
||
|
|
||
|
define float @canonicalize_addrspacecast(i32 %i) {
|
||
|
; CHECK-LABEL: @canonicalize_addrspacecast(
|
||
|
; CHECK-NEXT: [[P:%.*]] = getelementptr inbounds float, float* addrspacecast (float addrspace(3)* bitcast ([0 x i8] addrspace(3)* @shared_mem to float addrspace(3)*) to float*), i32 [[I:%.*]]
|
||
|
; CHECK-NEXT: [[V:%.*]] = load float, float* [[P]], align 4
|
||
|
; CHECK-NEXT: ret float [[V]]
|
||
|
;
|
||
|
%p = getelementptr inbounds float, float* addrspacecast ([0 x i8] addrspace(3)* @shared_mem to float*), i32 %i
|
||
|
%v = load float, float* %p
|
||
|
ret float %v
|
||
|
}
|