300 lines
12 KiB
C
300 lines
12 KiB
C
|
// RUN: %clang_cc1 -triple x86_64-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix=LINUX
|
||
|
// RUN: %clang_cc1 -triple x86_64-windows-pc -emit-llvm %s -o - | FileCheck %s --check-prefix=WINDOWS
|
||
|
|
||
|
int __attribute__((target("sse4.2"))) foo(void) { return 0; }
|
||
|
int __attribute__((target("arch=sandybridge"))) foo(void);
|
||
|
int __attribute__((target("arch=ivybridge"))) foo(void) {return 1;}
|
||
|
int __attribute__((target("arch=goldmont"))) foo(void) {return 3;}
|
||
|
int __attribute__((target("arch=goldmont-plus"))) foo(void) {return 4;}
|
||
|
int __attribute__((target("arch=tremont"))) foo(void) {return 5;}
|
||
|
int __attribute__((target("arch=icelake-client"))) foo(void) {return 6;}
|
||
|
int __attribute__((target("arch=icelake-server"))) foo(void) {return 7;}
|
||
|
int __attribute__((target("arch=cooperlake"))) foo(void) {return 8;}
|
||
|
int __attribute__((target("arch=tigerlake"))) foo(void) {return 9;}
|
||
|
int __attribute__((target("arch=sapphirerapids"))) foo(void) {return 10;}
|
||
|
int __attribute__((target("arch=alderlake"))) foo(void) {return 11;}
|
||
|
int __attribute__((target("default"))) foo(void) { return 2; }
|
||
|
|
||
|
int bar() {
|
||
|
return foo();
|
||
|
}
|
||
|
|
||
|
inline int __attribute__((target("sse4.2"))) foo_inline(void) { return 0; }
|
||
|
inline int __attribute__((target("arch=sandybridge"))) foo_inline(void);
|
||
|
inline int __attribute__((target("arch=ivybridge"))) foo_inline(void) {return 1;}
|
||
|
inline int __attribute__((target("default"))) foo_inline(void) { return 2; }
|
||
|
|
||
|
int bar2() {
|
||
|
return foo_inline();
|
||
|
}
|
||
|
|
||
|
inline __attribute__((target("default"))) void foo_decls(void);
|
||
|
inline __attribute__((target("sse4.2"))) void foo_decls(void);
|
||
|
void bar3() {
|
||
|
foo_decls();
|
||
|
}
|
||
|
inline __attribute__((target("default"))) void foo_decls(void) {}
|
||
|
inline __attribute__((target("sse4.2"))) void foo_decls(void) {}
|
||
|
|
||
|
inline __attribute__((target("default"))) void foo_multi(int i, double d) {}
|
||
|
inline __attribute__((target("avx,sse4.2"))) void foo_multi(int i, double d) {}
|
||
|
inline __attribute__((target("sse4.2,fma4"))) void foo_multi(int i, double d) {}
|
||
|
inline __attribute__((target("arch=ivybridge,fma4,sse4.2"))) void foo_multi(int i, double d) {}
|
||
|
void bar4() {
|
||
|
foo_multi(1, 5.0);
|
||
|
}
|
||
|
|
||
|
int fwd_decl_default(void);
|
||
|
int __attribute__((target("default"))) fwd_decl_default(void) { return 2; }
|
||
|
|
||
|
int fwd_decl_avx(void);
|
||
|
int __attribute__((target("avx"))) fwd_decl_avx(void) { return 2; }
|
||
|
int __attribute__((target("default"))) fwd_decl_avx(void) { return 2; }
|
||
|
|
||
|
void bar5() {
|
||
|
fwd_decl_default();
|
||
|
fwd_decl_avx();
|
||
|
}
|
||
|
|
||
|
int __attribute__((target("avx"))) changed_to_mv(void) { return 0;}
|
||
|
int __attribute__((target("fma4"))) changed_to_mv(void) { return 1;}
|
||
|
|
||
|
__attribute__((target("default"), used)) inline void foo_used(int i, double d) {}
|
||
|
__attribute__((target("avx,sse4.2"))) inline void foo_used(int i, double d) {}
|
||
|
|
||
|
__attribute__((target("default"))) inline void foo_used2(int i, double d) {}
|
||
|
__attribute__((target("avx,sse4.2"), used)) inline void foo_used2(int i, double d) {}
|
||
|
|
||
|
// LINUX: @llvm.used = appending global [2 x i8*] [i8* bitcast (void (i32, double)* @foo_used to i8*), i8* bitcast (void (i32, double)* @foo_used2.avx_sse4.2 to i8*)], section "llvm.metadata"
|
||
|
// WINDOWS: @llvm.used = appending global [2 x i8*] [i8* bitcast (void (i32, double)* @foo_used to i8*), i8* bitcast (void (i32, double)* @foo_used2.avx_sse4.2 to i8*)], section "llvm.metadata"
|
||
|
|
||
|
// LINUX: @foo.ifunc = weak_odr ifunc i32 (), i32 ()* ()* @foo.resolver
|
||
|
// LINUX: @foo_inline.ifunc = weak_odr ifunc i32 (), i32 ()* ()* @foo_inline.resolver
|
||
|
// LINUX: @foo_decls.ifunc = weak_odr ifunc void (), void ()* ()* @foo_decls.resolver
|
||
|
// LINUX: @foo_multi.ifunc = weak_odr ifunc void (i32, double), void (i32, double)* ()* @foo_multi.resolver
|
||
|
// LINUX: @fwd_decl_default.ifunc = weak_odr ifunc i32 (), i32 ()* ()* @fwd_decl_default.resolver
|
||
|
// LINUX: @fwd_decl_avx.ifunc = weak_odr ifunc i32 (), i32 ()* ()* @fwd_decl_avx.resolver
|
||
|
|
||
|
// LINUX: define{{.*}} i32 @foo.sse4.2()
|
||
|
// LINUX: ret i32 0
|
||
|
// LINUX: define{{.*}} i32 @foo.arch_ivybridge()
|
||
|
// LINUX: ret i32 1
|
||
|
// LINUX: define{{.*}} i32 @foo.arch_goldmont()
|
||
|
// LINUX: ret i32 3
|
||
|
// LINUX: define{{.*}} i32 @foo.arch_goldmont-plus()
|
||
|
// LINUX: ret i32 4
|
||
|
// LINUX: define{{.*}} i32 @foo.arch_tremont()
|
||
|
// LINUX: ret i32 5
|
||
|
// LINUX: define{{.*}} i32 @foo.arch_icelake-client()
|
||
|
// LINUX: ret i32 6
|
||
|
// LINUX: define{{.*}} i32 @foo.arch_icelake-server()
|
||
|
// LINUX: ret i32 7
|
||
|
// LINUX: define{{.*}} i32 @foo.arch_cooperlake()
|
||
|
// LINUX: ret i32 8
|
||
|
// LINUX: define{{.*}} i32 @foo.arch_tigerlake()
|
||
|
// LINUX: ret i32 9
|
||
|
// LINUX: define{{.*}} i32 @foo.arch_sapphirerapids()
|
||
|
// LINUX: ret i32 10
|
||
|
// LINUX: define{{.*}} i32 @foo.arch_alderlake()
|
||
|
// LINUX: ret i32 11
|
||
|
// LINUX: define{{.*}} i32 @foo()
|
||
|
// LINUX: ret i32 2
|
||
|
// LINUX: define{{.*}} i32 @bar()
|
||
|
// LINUX: call i32 @foo.ifunc()
|
||
|
|
||
|
// WINDOWS: define dso_local i32 @foo.sse4.2()
|
||
|
// WINDOWS: ret i32 0
|
||
|
// WINDOWS: define dso_local i32 @foo.arch_ivybridge()
|
||
|
// WINDOWS: ret i32 1
|
||
|
// WINDOWS: define dso_local i32 @foo.arch_goldmont()
|
||
|
// WINDOWS: ret i32 3
|
||
|
// WINDOWS: define dso_local i32 @foo.arch_goldmont-plus()
|
||
|
// WINDOWS: ret i32 4
|
||
|
// WINDOWS: define dso_local i32 @foo.arch_tremont()
|
||
|
// WINDOWS: ret i32 5
|
||
|
// WINDOWS: define dso_local i32 @foo.arch_icelake-client()
|
||
|
// WINDOWS: ret i32 6
|
||
|
// WINDOWS: define dso_local i32 @foo.arch_icelake-server()
|
||
|
// WINDOWS: ret i32 7
|
||
|
// WINDOWS: define dso_local i32 @foo()
|
||
|
// WINDOWS: ret i32 2
|
||
|
// WINDOWS: define dso_local i32 @bar()
|
||
|
// WINDOWS: call i32 @foo.resolver()
|
||
|
|
||
|
// LINUX: define weak_odr i32 ()* @foo.resolver() comdat
|
||
|
// LINUX: call void @__cpu_indicator_init()
|
||
|
// LINUX: ret i32 ()* @foo.arch_sandybridge
|
||
|
// LINUX: ret i32 ()* @foo.arch_ivybridge
|
||
|
// LINUX: ret i32 ()* @foo.sse4.2
|
||
|
// LINUX: ret i32 ()* @foo
|
||
|
|
||
|
// WINDOWS: define weak_odr dso_local i32 @foo.resolver() comdat
|
||
|
// WINDOWS: call void @__cpu_indicator_init()
|
||
|
// WINDOWS: call i32 @foo.arch_sandybridge
|
||
|
// WINDOWS: call i32 @foo.arch_ivybridge
|
||
|
// WINDOWS: call i32 @foo.sse4.2
|
||
|
// WINDOWS: call i32 @foo
|
||
|
|
||
|
// LINUX: define{{.*}} i32 @bar2()
|
||
|
// LINUX: call i32 @foo_inline.ifunc()
|
||
|
|
||
|
// WINDOWS: define dso_local i32 @bar2()
|
||
|
// WINDOWS: call i32 @foo_inline.resolver()
|
||
|
|
||
|
// LINUX: define weak_odr i32 ()* @foo_inline.resolver() comdat
|
||
|
// LINUX: call void @__cpu_indicator_init()
|
||
|
// LINUX: ret i32 ()* @foo_inline.arch_sandybridge
|
||
|
// LINUX: ret i32 ()* @foo_inline.arch_ivybridge
|
||
|
// LINUX: ret i32 ()* @foo_inline.sse4.2
|
||
|
// LINUX: ret i32 ()* @foo_inline
|
||
|
|
||
|
// WINDOWS: define weak_odr dso_local i32 @foo_inline.resolver() comdat
|
||
|
// WINDOWS: call void @__cpu_indicator_init()
|
||
|
// WINDOWS: call i32 @foo_inline.arch_sandybridge
|
||
|
// WINDOWS: call i32 @foo_inline.arch_ivybridge
|
||
|
// WINDOWS: call i32 @foo_inline.sse4.2
|
||
|
// WINDOWS: call i32 @foo_inline
|
||
|
|
||
|
// LINUX: define{{.*}} void @bar3()
|
||
|
// LINUX: call void @foo_decls.ifunc()
|
||
|
|
||
|
// WINDOWS: define dso_local void @bar3()
|
||
|
// WINDOWS: call void @foo_decls.resolver()
|
||
|
|
||
|
// LINUX: define weak_odr void ()* @foo_decls.resolver() comdat
|
||
|
// LINUX: ret void ()* @foo_decls.sse4.2
|
||
|
// LINUX: ret void ()* @foo_decls
|
||
|
|
||
|
// WINDOWS: define weak_odr dso_local void @foo_decls.resolver() comdat
|
||
|
// WINDOWS: call void @foo_decls.sse4.2
|
||
|
// WINDOWS: call void @foo_decls
|
||
|
|
||
|
// LINUX: define{{.*}} void @bar4()
|
||
|
// LINUX: call void @foo_multi.ifunc(i32 1, double 5.{{[0+e]*}})
|
||
|
|
||
|
// WINDOWS: define dso_local void @bar4()
|
||
|
// WINDOWS: call void @foo_multi.resolver(i32 1, double 5.{{[0+e]*}})
|
||
|
|
||
|
// LINUX: define weak_odr void (i32, double)* @foo_multi.resolver() comdat
|
||
|
// LINUX: and i32 %{{.*}}, 4352
|
||
|
// LINUX: icmp eq i32 %{{.*}}, 4352
|
||
|
// LINUX: ret void (i32, double)* @foo_multi.fma4_sse4.2
|
||
|
// LINUX: icmp eq i32 %{{.*}}, 12
|
||
|
// LINUX: and i32 %{{.*}}, 4352
|
||
|
// LINUX: icmp eq i32 %{{.*}}, 4352
|
||
|
// LINUX: ret void (i32, double)* @foo_multi.arch_ivybridge_fma4_sse4.2
|
||
|
// LINUX: and i32 %{{.*}}, 768
|
||
|
// LINUX: icmp eq i32 %{{.*}}, 768
|
||
|
// LINUX: ret void (i32, double)* @foo_multi.avx_sse4.2
|
||
|
// LINUX: ret void (i32, double)* @foo_multi
|
||
|
|
||
|
// WINDOWS: define weak_odr dso_local void @foo_multi.resolver(i32 %0, double %1) comdat
|
||
|
// WINDOWS: and i32 %{{.*}}, 4352
|
||
|
// WINDOWS: icmp eq i32 %{{.*}}, 4352
|
||
|
// WINDOWS: call void @foo_multi.fma4_sse4.2(i32 %0, double %1)
|
||
|
// WINDOWS-NEXT: ret void
|
||
|
// WINDOWS: icmp eq i32 %{{.*}}, 12
|
||
|
// WINDOWS: and i32 %{{.*}}, 4352
|
||
|
// WINDOWS: icmp eq i32 %{{.*}}, 4352
|
||
|
// WINDOWS: call void @foo_multi.arch_ivybridge_fma4_sse4.2(i32 %0, double %1)
|
||
|
// WINDOWS-NEXT: ret void
|
||
|
// WINDOWS: and i32 %{{.*}}, 768
|
||
|
// WINDOWS: icmp eq i32 %{{.*}}, 768
|
||
|
// WINDOWS: call void @foo_multi.avx_sse4.2(i32 %0, double %1)
|
||
|
// WINDOWS-NEXT: ret void
|
||
|
// WINDOWS: call void @foo_multi(i32 %0, double %1)
|
||
|
// WINDOWS-NEXT: ret void
|
||
|
|
||
|
// LINUX: define{{.*}} i32 @fwd_decl_default()
|
||
|
// LINUX: ret i32 2
|
||
|
// LINUX: define{{.*}} i32 @fwd_decl_avx.avx()
|
||
|
// LINUX: ret i32 2
|
||
|
// LINUX: define{{.*}} i32 @fwd_decl_avx()
|
||
|
// LINUX: ret i32 2
|
||
|
|
||
|
// WINDOWS: define dso_local i32 @fwd_decl_default()
|
||
|
// WINDOWS: ret i32 2
|
||
|
// WINDOWS: define dso_local i32 @fwd_decl_avx.avx()
|
||
|
// WINDOWS: ret i32 2
|
||
|
// WINDOWS: define dso_local i32 @fwd_decl_avx()
|
||
|
// WINDOWS: ret i32 2
|
||
|
|
||
|
// LINUX: define{{.*}} void @bar5()
|
||
|
// LINUX: call i32 @fwd_decl_default.ifunc()
|
||
|
// LINUX: call i32 @fwd_decl_avx.ifunc()
|
||
|
|
||
|
// WINDOWS: define dso_local void @bar5()
|
||
|
// WINDOWS: call i32 @fwd_decl_default.resolver()
|
||
|
// WINDOWS: call i32 @fwd_decl_avx.resolver()
|
||
|
|
||
|
// LINUX: define weak_odr i32 ()* @fwd_decl_default.resolver() comdat
|
||
|
// LINUX: call void @__cpu_indicator_init()
|
||
|
// LINUX: ret i32 ()* @fwd_decl_default
|
||
|
// LINUX: define weak_odr i32 ()* @fwd_decl_avx.resolver() comdat
|
||
|
// LINUX: call void @__cpu_indicator_init()
|
||
|
// LINUX: ret i32 ()* @fwd_decl_avx.avx
|
||
|
// LINUX: ret i32 ()* @fwd_decl_avx
|
||
|
|
||
|
// WINDOWS: define weak_odr dso_local i32 @fwd_decl_default.resolver() comdat
|
||
|
// WINDOWS: call void @__cpu_indicator_init()
|
||
|
// WINDOWS: call i32 @fwd_decl_default
|
||
|
// WINDOWS: define weak_odr dso_local i32 @fwd_decl_avx.resolver() comdat
|
||
|
// WINDOWS: call void @__cpu_indicator_init()
|
||
|
// WINDOWS: call i32 @fwd_decl_avx.avx
|
||
|
// WINDOWS: call i32 @fwd_decl_avx
|
||
|
|
||
|
// LINUX: define{{.*}} i32 @changed_to_mv.avx()
|
||
|
// LINUX: define{{.*}} i32 @changed_to_mv.fma4()
|
||
|
|
||
|
// WINDOWS: define dso_local i32 @changed_to_mv.avx()
|
||
|
// WINDOWS: define dso_local i32 @changed_to_mv.fma4()
|
||
|
|
||
|
// LINUX: define linkonce void @foo_used(i32 %{{.*}}, double %{{.*}})
|
||
|
// LINUX-NOT: @foo_used.avx_sse4.2(
|
||
|
// LINUX-NOT: @foo_used2(
|
||
|
// LINUX: define linkonce void @foo_used2.avx_sse4.2(i32 %{{.*}}, double %{{.*}})
|
||
|
|
||
|
// WINDOWS: define linkonce_odr dso_local void @foo_used(i32 %{{.*}}, double %{{.*}})
|
||
|
// WINDOWS-NOT: @foo_used.avx_sse4.2(
|
||
|
// WINDOWS-NOT: @foo_used2(
|
||
|
// WINDOWS: define linkonce_odr dso_local void @foo_used2.avx_sse4.2(i32 %{{.*}}, double %{{.*}})
|
||
|
|
||
|
// LINUX: declare i32 @foo.arch_sandybridge()
|
||
|
// WINDOWS: declare dso_local i32 @foo.arch_sandybridge()
|
||
|
|
||
|
// LINUX: define linkonce i32 @foo_inline.sse4.2()
|
||
|
// LINUX: ret i32 0
|
||
|
|
||
|
// WINDOWS: define linkonce_odr dso_local i32 @foo_inline.sse4.2()
|
||
|
// WINDOWS: ret i32 0
|
||
|
|
||
|
// LINUX: declare i32 @foo_inline.arch_sandybridge()
|
||
|
|
||
|
// WINDOWS: declare dso_local i32 @foo_inline.arch_sandybridge()
|
||
|
|
||
|
// LINUX: define linkonce i32 @foo_inline.arch_ivybridge()
|
||
|
// LINUX: ret i32 1
|
||
|
// LINUX: define linkonce i32 @foo_inline()
|
||
|
// LINUX: ret i32 2
|
||
|
|
||
|
// WINDOWS: define linkonce_odr dso_local i32 @foo_inline.arch_ivybridge()
|
||
|
// WINDOWS: ret i32 1
|
||
|
// WINDOWS: define linkonce_odr dso_local i32 @foo_inline()
|
||
|
// WINDOWS: ret i32 2
|
||
|
|
||
|
// LINUX: define linkonce void @foo_decls()
|
||
|
// LINUX: define linkonce void @foo_decls.sse4.2()
|
||
|
|
||
|
// WINDOWS: define linkonce_odr dso_local void @foo_decls()
|
||
|
// WINDOWS: define linkonce_odr dso_local void @foo_decls.sse4.2()
|
||
|
|
||
|
// LINUX: define linkonce void @foo_multi(i32 %{{[^,]+}}, double %{{[^\)]+}})
|
||
|
// LINUX: define linkonce void @foo_multi.avx_sse4.2(i32 %{{[^,]+}}, double %{{[^\)]+}})
|
||
|
// LINUX: define linkonce void @foo_multi.fma4_sse4.2(i32 %{{[^,]+}}, double %{{[^\)]+}})
|
||
|
// LINUX: define linkonce void @foo_multi.arch_ivybridge_fma4_sse4.2(i32 %{{[^,]+}}, double %{{[^\)]+}})
|
||
|
|
||
|
// WINDOWS: define linkonce_odr dso_local void @foo_multi(i32 %{{[^,]+}}, double %{{[^\)]+}})
|
||
|
// WINDOWS: define linkonce_odr dso_local void @foo_multi.avx_sse4.2(i32 %{{[^,]+}}, double %{{[^\)]+}})
|
||
|
// WINDOWS: define linkonce_odr dso_local void @foo_multi.fma4_sse4.2(i32 %{{[^,]+}}, double %{{[^\)]+}})
|
||
|
// WINDOWS: define linkonce_odr dso_local void @foo_multi.arch_ivybridge_fma4_sse4.2(i32 %{{[^,]+}}, double %{{[^\)]+}})
|