// RUN: %clang_cc1 -triple x86_64-linux-gnu -emit-llvm -o - %s | FileCheck %s --check-prefixes=CHECK,LINUX // RUN: %clang_cc1 -triple x86_64-apple-macos -emit-llvm -o - %s | FileCheck %s --check-prefixes=CHECK,LINUX // RUN: %clang_cc1 -triple x86_64-windows-pc -fms-compatibility -emit-llvm -o - %s | FileCheck %s --check-prefixes=CHECK,WINDOWS #ifdef _WIN64 #define ATTR(X) __declspec(X) #else #define ATTR(X) __attribute__((X)) #endif // _WIN64 // Each version should have an IFunc and an alias. // LINUX: @SingleVersion = weak_odr alias void (), ptr @SingleVersion.ifunc // LINUX: @TwoVersions = weak_odr alias void (), ptr @TwoVersions.ifunc // LINUX: @OrderDispatchUsageSpecific = weak_odr alias void (), ptr @OrderDispatchUsageSpecific.ifunc // LINUX: @TwoVersionsSameAttr = weak_odr alias void (), ptr @TwoVersionsSameAttr.ifunc // LINUX: @ThreeVersionsSameAttr = weak_odr alias void (), ptr @ThreeVersionsSameAttr.ifunc // LINUX: @OrderSpecificUsageDispatch = weak_odr alias void (), ptr @OrderSpecificUsageDispatch.ifunc // LINUX: @NoSpecifics = weak_odr alias void (), ptr @NoSpecifics.ifunc // LINUX: @HasGeneric = weak_odr alias void (), ptr @HasGeneric.ifunc // LINUX: @HasParams = weak_odr alias void (i32, double), ptr @HasParams.ifunc // LINUX: @HasParamsAndReturn = weak_odr alias i32 (i32, double), ptr @HasParamsAndReturn.ifunc // LINUX: @GenericAndPentium = weak_odr alias i32 (i32, double), ptr @GenericAndPentium.ifunc // LINUX: @DispatchFirst = weak_odr alias i32 (), ptr @DispatchFirst.ifunc // LINUX: @SingleVersion.ifunc = weak_odr ifunc void (), ptr @SingleVersion.resolver // LINUX: @TwoVersions.ifunc = weak_odr ifunc void (), ptr @TwoVersions.resolver // LINUX: @OrderDispatchUsageSpecific.ifunc = weak_odr ifunc void (), ptr @OrderDispatchUsageSpecific.resolver // LINUX: @TwoVersionsSameAttr.ifunc = weak_odr ifunc void (), ptr @TwoVersionsSameAttr.resolver // LINUX: @ThreeVersionsSameAttr.ifunc = weak_odr ifunc void (), ptr @ThreeVersionsSameAttr.resolver // LINUX: @OrderSpecificUsageDispatch.ifunc = weak_odr ifunc void (), ptr @OrderSpecificUsageDispatch.resolver // LINUX: @NoSpecifics.ifunc = weak_odr ifunc void (), ptr @NoSpecifics.resolver // LINUX: @HasGeneric.ifunc = weak_odr ifunc void (), ptr @HasGeneric.resolver // LINUX: @HasParams.ifunc = weak_odr ifunc void (i32, double), ptr @HasParams.resolver // LINUX: @HasParamsAndReturn.ifunc = weak_odr ifunc i32 (i32, double), ptr @HasParamsAndReturn.resolver // LINUX: @GenericAndPentium.ifunc = weak_odr ifunc i32 (i32, double), ptr @GenericAndPentium.resolver // LINUX: @DispatchFirst.ifunc = weak_odr ifunc i32 (), ptr @DispatchFirst.resolver ATTR(cpu_specific(ivybridge)) void SingleVersion(void){} // LINUX: define{{.*}} void @SingleVersion.S() #[[S:[0-9]+]] // WINDOWS: define dso_local void @SingleVersion.S() #[[S:[0-9]+]] ATTR(cpu_dispatch(ivybridge)) void SingleVersion(void); // LINUX: define weak_odr ptr @SingleVersion.resolver() // LINUX: call void @__cpu_indicator_init // LINUX: %[[FEAT_INIT:.+]] = load i32, ptr getelementptr inbounds ({ i32, i32, i32, [1 x i32] }, ptr @__cpu_model, i32 0, i32 3, i32 0), align 4 // LINUX: %[[FEAT_JOIN:.+]] = and i32 %[[FEAT_INIT]], 525311 // LINUX: %[[FEAT_CHECK:.+]] = icmp eq i32 %[[FEAT_JOIN]], 525311 // LINUX: ret ptr @SingleVersion.S // LINUX: call void @llvm.trap // LINUX: unreachable // WINDOWS: define weak_odr dso_local void @SingleVersion() comdat // WINDOWS: call void @__cpu_indicator_init() // WINDOWS: %[[FEAT_INIT:.+]] = load i32, ptr getelementptr inbounds ({ i32, i32, i32, [1 x i32] }, ptr @__cpu_model, i32 0, i32 3, i32 0), align 4 // WINDOWS: %[[FEAT_JOIN:.+]] = and i32 %[[FEAT_INIT]], 525311 // WINDOWS: %[[FEAT_CHECK:.+]] = icmp eq i32 %[[FEAT_JOIN]], 525311 // WINDOWS: call void @SingleVersion.S() // WINDOWS-NEXT: ret void // WINDOWS: call void @llvm.trap // WINDOWS: unreachable ATTR(cpu_specific(ivybridge)) void NotCalled(void){} // LINUX: define{{.*}} void @NotCalled.S() #[[S]] // WINDOWS: define dso_local void @NotCalled.S() #[[S:[0-9]+]] // Done before any of the implementations. Also has an undecorated forward // declaration. void TwoVersions(void); ATTR(cpu_dispatch(ivybridge, knl)) void TwoVersions(void); // LINUX: define weak_odr ptr @TwoVersions.resolver() // LINUX: call void @__cpu_indicator_init // LINUX: %[[FEAT_INIT:.+]] = load i32, ptr getelementptr inbounds ({ i32, i32, i32, [1 x i32] }, ptr @__cpu_model, i32 0, i32 3, i32 0), align 4 // LINUX: %[[FEAT_JOIN:.+]] = and i32 %[[FEAT_INIT]], 59754495 // LINUX: %[[FEAT_CHECK:.+]] = icmp eq i32 %[[FEAT_JOIN]], 59754495 // LINUX: ret ptr @TwoVersions.Z // LINUX: ret ptr @TwoVersions.S // LINUX: call void @llvm.trap // LINUX: unreachable // WINDOWS: define weak_odr dso_local void @TwoVersions() comdat // WINDOWS: call void @__cpu_indicator_init() // WINDOWS: %[[FEAT_INIT:.+]] = load i32, ptr getelementptr inbounds ({ i32, i32, i32, [1 x i32] }, ptr @__cpu_model, i32 0, i32 3, i32 0), align 4 // WINDOWS: %[[FEAT_JOIN:.+]] = and i32 %[[FEAT_INIT]], 59754495 // WINDOWS: %[[FEAT_CHECK:.+]] = icmp eq i32 %[[FEAT_JOIN]], 59754495 // WINDOWS: call void @TwoVersions.Z() // WINDOWS-NEXT: ret void // WINDOWS: call void @TwoVersions.S() // WINDOWS-NEXT: ret void // WINDOWS: call void @llvm.trap // WINDOWS: unreachable ATTR(cpu_specific(ivybridge)) void TwoVersions(void){} // CHECK: define {{.*}}void @TwoVersions.S() #[[S]] ATTR(cpu_specific(knl)) void TwoVersions(void){} // CHECK: define {{.*}}void @TwoVersions.Z() #[[K:[0-9]+]] ATTR(cpu_specific(ivybridge, knl)) void TwoVersionsSameAttr(void){} // CHECK: define {{.*}}void @TwoVersionsSameAttr.S() #[[S]] // CHECK: define {{.*}}void @TwoVersionsSameAttr.Z() #[[K]] ATTR(cpu_specific(atom, ivybridge, knl)) void ThreeVersionsSameAttr(void){} // CHECK: define {{.*}}void @ThreeVersionsSameAttr.O() #[[O:[0-9]+]] // CHECK: define {{.*}}void @ThreeVersionsSameAttr.S() #[[S]] // CHECK: define {{.*}}void @ThreeVersionsSameAttr.Z() #[[K]] ATTR(cpu_specific(knl)) void CpuSpecificNoDispatch(void) {} // CHECK: define {{.*}}void @CpuSpecificNoDispatch.Z() #[[K:[0-9]+]] ATTR(cpu_dispatch(knl)) void OrderDispatchUsageSpecific(void); // LINUX: define weak_odr ptr @OrderDispatchUsageSpecific.resolver() // LINUX: call void @__cpu_indicator_init // LINUX: ret ptr @OrderDispatchUsageSpecific.Z // LINUX: call void @llvm.trap // LINUX: unreachable // WINDOWS: define weak_odr dso_local void @OrderDispatchUsageSpecific() comdat // WINDOWS: call void @__cpu_indicator_init() // WINDOWS: call void @OrderDispatchUsageSpecific.Z() // WINDOWS-NEXT: ret void // WINDOWS: call void @llvm.trap // WINDOWS: unreachable // CHECK: define {{.*}}void @OrderDispatchUsageSpecific.Z() ATTR(cpu_specific(knl)) void OrderSpecificUsageDispatch(void) {} // CHECK: define {{.*}}void @OrderSpecificUsageDispatch.Z() #[[K:[0-9]+]] void usages(void) { SingleVersion(); // LINUX: @SingleVersion.ifunc() // WINDOWS: @SingleVersion() TwoVersions(); // LINUX: @TwoVersions.ifunc() // WINDOWS: @TwoVersions() TwoVersionsSameAttr(); // LINUX: @TwoVersionsSameAttr.ifunc() // WINDOWS: @TwoVersionsSameAttr() ThreeVersionsSameAttr(); // LINUX: @ThreeVersionsSameAttr.ifunc() // WINDOWS: @ThreeVersionsSameAttr() CpuSpecificNoDispatch(); // LINUX: @CpuSpecificNoDispatch.ifunc() // WINDOWS: @CpuSpecificNoDispatch() OrderDispatchUsageSpecific(); // LINUX: @OrderDispatchUsageSpecific.ifunc() // WINDOWS: @OrderDispatchUsageSpecific() OrderSpecificUsageDispatch(); // LINUX: @OrderSpecificUsageDispatch.ifunc() // WINDOWS: @OrderSpecificUsageDispatch() } // LINUX: declare void @CpuSpecificNoDispatch.ifunc() // has an extra config to emit! ATTR(cpu_dispatch(ivybridge, knl, atom)) void TwoVersionsSameAttr(void); // LINUX: define weak_odr ptr @TwoVersionsSameAttr.resolver() // LINUX: ret ptr @TwoVersionsSameAttr.Z // LINUX: ret ptr @TwoVersionsSameAttr.S // LINUX: ret ptr @TwoVersionsSameAttr.O // LINUX: call void @llvm.trap // LINUX: unreachable // WINDOWS: define weak_odr dso_local void @TwoVersionsSameAttr() comdat // WINDOWS: call void @TwoVersionsSameAttr.Z // WINDOWS-NEXT: ret void // WINDOWS: call void @TwoVersionsSameAttr.S // WINDOWS-NEXT: ret void // WINDOWS: call void @TwoVersionsSameAttr.O // WINDOWS-NEXT: ret void // WINDOWS: call void @llvm.trap // WINDOWS: unreachable ATTR(cpu_dispatch(atom, ivybridge, knl)) void ThreeVersionsSameAttr(void){} // LINUX: define weak_odr ptr @ThreeVersionsSameAttr.resolver() // LINUX: call void @__cpu_indicator_init // LINUX: ret ptr @ThreeVersionsSameAttr.Z // LINUX: ret ptr @ThreeVersionsSameAttr.S // LINUX: ret ptr @ThreeVersionsSameAttr.O // LINUX: call void @llvm.trap // LINUX: unreachable // WINDOWS: define weak_odr dso_local void @ThreeVersionsSameAttr() comdat // WINDOWS: call void @__cpu_indicator_init // WINDOWS: call void @ThreeVersionsSameAttr.Z // WINDOWS-NEXT: ret void // WINDOWS: call void @ThreeVersionsSameAttr.S // WINDOWS-NEXT: ret void // WINDOWS: call void @ThreeVersionsSameAttr.O // WINDOWS-NEXT: ret void // WINDOWS: call void @llvm.trap // WINDOWS: unreachable ATTR(cpu_dispatch(knl)) void OrderSpecificUsageDispatch(void); // LINUX: define weak_odr ptr @OrderSpecificUsageDispatch.resolver() // LINUX: ret ptr @OrderSpecificUsageDispatch.Z // WINDOWS: define weak_odr dso_local void @OrderSpecificUsageDispatch() comdat // WINDOWS: call void @__cpu_indicator_init // WINDOWS: call void @OrderSpecificUsageDispatch.Z // WINDOWS-NEXT: ret void // No Cpu Specific options. ATTR(cpu_dispatch(atom, ivybridge, knl)) void NoSpecifics(void); // LINUX: define weak_odr ptr @NoSpecifics.resolver() // LINUX: call void @__cpu_indicator_init // LINUX: ret ptr @NoSpecifics.Z // LINUX: ret ptr @NoSpecifics.S // LINUX: ret ptr @NoSpecifics.O // LINUX: call void @llvm.trap // LINUX: unreachable // WINDOWS: define weak_odr dso_local void @NoSpecifics() comdat // WINDOWS: call void @__cpu_indicator_init // WINDOWS: call void @NoSpecifics.Z // WINDOWS-NEXT: ret void // WINDOWS: call void @NoSpecifics.S // WINDOWS-NEXT: ret void // WINDOWS: call void @NoSpecifics.O // WINDOWS-NEXT: ret void // WINDOWS: call void @llvm.trap // WINDOWS: unreachable ATTR(cpu_dispatch(atom, generic, ivybridge, knl)) void HasGeneric(void); // LINUX: define weak_odr ptr @HasGeneric.resolver() // LINUX: call void @__cpu_indicator_init // LINUX: ret ptr @HasGeneric.Z // LINUX: ret ptr @HasGeneric.S // LINUX: ret ptr @HasGeneric.O // LINUX: ret ptr @HasGeneric.A // LINUX-NOT: call void @llvm.trap // WINDOWS: define weak_odr dso_local void @HasGeneric() comdat // WINDOWS: call void @__cpu_indicator_init // WINDOWS: call void @HasGeneric.Z // WINDOWS-NEXT: ret void // WINDOWS: call void @HasGeneric.S // WINDOWS-NEXT: ret void // WINDOWS: call void @HasGeneric.O // WINDOWS-NEXT: ret void // WINDOWS: call void @HasGeneric.A // WINDOWS-NEXT: ret void // WINDOWS-NOT: call void @llvm.trap ATTR(cpu_dispatch(atom, generic, ivybridge, knl)) void HasParams(int i, double d); // LINUX: define weak_odr ptr @HasParams.resolver() // LINUX: call void @__cpu_indicator_init // LINUX: ret ptr @HasParams.Z // LINUX: ret ptr @HasParams.S // LINUX: ret ptr @HasParams.O // LINUX: ret ptr @HasParams.A // LINUX-NOT: call void @llvm.trap // WINDOWS: define weak_odr dso_local void @HasParams(i32 %0, double %1) comdat // WINDOWS: call void @__cpu_indicator_init // WINDOWS: call void @HasParams.Z(i32 %0, double %1) // WINDOWS-NEXT: ret void // WINDOWS: call void @HasParams.S(i32 %0, double %1) // WINDOWS-NEXT: ret void // WINDOWS: call void @HasParams.O(i32 %0, double %1) // WINDOWS-NEXT: ret void // WINDOWS: call void @HasParams.A(i32 %0, double %1) // WINDOWS-NEXT: ret void // WINDOWS-NOT: call void @llvm.trap ATTR(cpu_dispatch(atom, generic, ivybridge, knl)) int HasParamsAndReturn(int i, double d); // LINUX: define weak_odr ptr @HasParamsAndReturn.resolver() // LINUX: call void @__cpu_indicator_init // LINUX: ret ptr @HasParamsAndReturn.Z // LINUX: ret ptr @HasParamsAndReturn.S // LINUX: ret ptr @HasParamsAndReturn.O // LINUX: ret ptr @HasParamsAndReturn.A // LINUX-NOT: call void @llvm.trap // WINDOWS: define weak_odr dso_local i32 @HasParamsAndReturn(i32 %0, double %1) comdat // WINDOWS: call void @__cpu_indicator_init // WINDOWS: %[[RET:.+]] = musttail call i32 @HasParamsAndReturn.Z(i32 %0, double %1) // WINDOWS-NEXT: ret i32 %[[RET]] // WINDOWS: %[[RET:.+]] = musttail call i32 @HasParamsAndReturn.S(i32 %0, double %1) // WINDOWS-NEXT: ret i32 %[[RET]] // WINDOWS: %[[RET:.+]] = musttail call i32 @HasParamsAndReturn.O(i32 %0, double %1) // WINDOWS-NEXT: ret i32 %[[RET]] // WINDOWS: %[[RET:.+]] = musttail call i32 @HasParamsAndReturn.A(i32 %0, double %1) // WINDOWS-NEXT: ret i32 %[[RET]] // WINDOWS-NOT: call void @llvm.trap ATTR(cpu_dispatch(atom, generic, pentium)) int GenericAndPentium(int i, double d); // LINUX: define weak_odr ptr @GenericAndPentium.resolver() // LINUX: call void @__cpu_indicator_init // LINUX: ret ptr @GenericAndPentium.O // LINUX: ret ptr @GenericAndPentium.B // LINUX-NOT: ret ptr @GenericAndPentium.A // LINUX-NOT: call void @llvm.trap // WINDOWS: define weak_odr dso_local i32 @GenericAndPentium(i32 %0, double %1) comdat // WINDOWS: call void @__cpu_indicator_init // WINDOWS: %[[RET:.+]] = musttail call i32 @GenericAndPentium.O(i32 %0, double %1) // WINDOWS-NEXT: ret i32 %[[RET]] // WINDOWS: %[[RET:.+]] = musttail call i32 @GenericAndPentium.B(i32 %0, double %1) // WINDOWS-NEXT: ret i32 %[[RET]] // WINDOWS-NOT: call i32 @GenericAndPentium.A // WINDOWS-NOT: call void @llvm.trap ATTR(cpu_dispatch(atom, pentium)) int DispatchFirst(void); // LINUX: define weak_odr ptr @DispatchFirst.resolver // LINUX: ret ptr @DispatchFirst.O // LINUX: ret ptr @DispatchFirst.B // WINDOWS: define weak_odr dso_local i32 @DispatchFirst() comdat // WINDOWS: %[[RET:.+]] = musttail call i32 @DispatchFirst.O() // WINDOWS-NEXT: ret i32 %[[RET]] // WINDOWS: %[[RET:.+]] = musttail call i32 @DispatchFirst.B() // WINDOWS-NEXT: ret i32 %[[RET]] ATTR(cpu_specific(atom)) int DispatchFirst(void) {return 0;} // LINUX: define{{.*}} i32 @DispatchFirst.O // LINUX: ret i32 0 // WINDOWS: define dso_local i32 @DispatchFirst.O() // WINDOWS: ret i32 0 ATTR(cpu_specific(pentium)) int DispatchFirst(void) {return 1;} // LINUX: define{{.*}} i32 @DispatchFirst.B // LINUX: ret i32 1 // WINDOWS: define dso_local i32 @DispatchFirst.B // WINDOWS: ret i32 1 ATTR(cpu_specific(knl)) void OrderDispatchUsageSpecific(void) {} // CHECK: attributes #[[S]] = {{.*}}"target-features"="+avx,+cmov,+crc32,+cx16,+cx8,+f16c,+fsgsbase,+fxsr,+mmx,+pclmul,+popcnt,+rdrnd,+sahf,+sse,+sse2,+sse3,+sse4.1,+sse4.2,+ssse3,+x87,+xsave,+xsaveopt" // CHECK-SAME: "tune-cpu"="ivybridge" // CHECK: attributes #[[K]] = {{.*}}"target-features"="+adx,+aes,+avx,+avx2,+avx512cd,+avx512er,+avx512f,+avx512pf,+bmi,+bmi2,+cmov,+crc32,+cx16,+cx8,+evex512,+f16c,+fma,+fsgsbase,+fxsr,+invpcid,+lzcnt,+mmx,+movbe,+pclmul,+popcnt,+prefetchwt1,+prfchw,+rdrnd,+rdseed,+sahf,+sse,+sse2,+sse3,+sse4.1,+sse4.2,+ssse3,+x87,+xsave,+xsaveopt" // CHECK-SAME: "tune-cpu"="knl" // CHECK: attributes #[[O]] = {{.*}}"target-features"="+cmov,+cx16,+cx8,+fxsr,+mmx,+movbe,+sahf,+sse,+sse2,+sse3,+ssse3,+x87" // CHECK-SAME: "tune-cpu"="atom"