mirror of
https://github.com/Gericom/teak-llvm.git
synced 2025-06-19 11:35:51 -04:00

MSVC 2013 would refuse to pass highly aligned things (typically vectors and aggregates) by value. Users would receive this error: t.cpp(11) : error C2719: 'w': formal parameter with __declspec(align('32')) won't be aligned t.cpp(11) : error C2719: 'q': formal parameter with __declspec(align('32')) won't be aligned However, in MSVC 2015, this behavior was changed, and highly aligned things are now passed indirectly. To avoid breaking backwards incompatibility, objects that do not have a *required* high alignment (i.e. double) are still passed directly, even though they are not naturally aligned. This change implements the new behavior of passing things indirectly. The new behavior is: - up to three vector parameters can be passed in [XYZ]MM0-2 - remaining arguments with required alignment greater than 4 bytes are passed indirectly Previously, MSVC never passed things truly indirectly, meaning clang would always apply the byval attribute to indirect arguments. We had to go to the trouble of adding inalloca so that non-trivially copyable C++ types could be passed in place without copying the object representation. When inalloca was added, we asserted that all arguments passed indirectly must use byval. With this change, that assert no longer holds, and I had to update inalloca to handle that case. The implicit sret pointer parameter was already handled this way, and this change generalizes some of that logic to arguments. There are two cases that this change leaves unfixed: 1. objects that are non-trivially copyable *and* overaligned 2. vectorcall + inalloca + vectors For case 1, I need to touch C++ ABI code in MicrosoftCXXABI.cpp, so I want to do it in a follow-up. For case 2, my fix is one line, but it will require updating IR tests to use lots of inreg, so I wanted to separate it out. Related to D71915 and D72110 Fixes most of PR44395 Reviewed By: rjmccall, craig.topper, erichkeane Differential Revision: https://reviews.llvm.org/D72114
80 lines
3.6 KiB
C++
80 lines
3.6 KiB
C++
// RUN: %clang_cc1 -w -triple i686-pc-win32 -emit-llvm -o - %s | FileCheck %s
|
|
|
|
// PR44395
|
|
// MSVC passes up to three vectors in registers, and the rest indirectly. Check
|
|
// that both are compatible with an inalloca prototype.
|
|
|
|
struct NonTrivial {
|
|
NonTrivial();
|
|
NonTrivial(const NonTrivial &o);
|
|
unsigned handle;
|
|
};
|
|
|
|
typedef float __m128 __attribute__((__vector_size__(16), __aligned__(16)));
|
|
__m128 gv128;
|
|
|
|
// nt, w, and q will be in the inalloca pack.
|
|
void receive_vec_128(NonTrivial nt, __m128 x, __m128 y, __m128 z, __m128 w, __m128 q) {
|
|
gv128 = x + y + z + w + q;
|
|
}
|
|
// CHECK-LABEL: define dso_local void @"?receive_vec_128@@YAXUNonTrivial@@T__m128@@1111@Z"
|
|
// CHECK-SAME: (<4 x float> inreg %x,
|
|
// CHECK-SAME: <4 x float> inreg %y,
|
|
// CHECK-SAME: <4 x float> inreg %z,
|
|
// CHECK-SAME: <{ %struct.NonTrivial, <4 x float>*, <4 x float>* }>* inalloca %0)
|
|
|
|
void pass_vec_128() {
|
|
__m128 z = {0};
|
|
receive_vec_128(NonTrivial(), z, z, z, z, z);
|
|
}
|
|
// CHECK-LABEL: define dso_local void @"?pass_vec_128@@YAXXZ"()
|
|
// CHECK: getelementptr inbounds <{ %struct.NonTrivial, <4 x float>*, <4 x float>* }>, <{ %struct.NonTrivial, <4 x float>*, <4 x float>* }>* %{{[^,]*}}, i32 0, i32 0
|
|
// CHECK: call x86_thiscallcc %struct.NonTrivial* @"??0NonTrivial@@QAE@XZ"(%struct.NonTrivial* %{{.*}})
|
|
|
|
// Store q, store temp alloca.
|
|
// CHECK: store <4 x float> %{{[^,]*}}, <4 x float>* %{{[^,]*}}, align 16
|
|
// CHECK: getelementptr inbounds <{ %struct.NonTrivial, <4 x float>*, <4 x float>* }>, <{ %struct.NonTrivial, <4 x float>*, <4 x float>* }>* %{{[^,]*}}, i32 0, i32 1
|
|
// CHECK: store <4 x float>* %{{[^,]*}}, <4 x float>** %{{[^,]*}}, align 4
|
|
|
|
// Store w, store temp alloca.
|
|
// CHECK: store <4 x float> %{{[^,]*}}, <4 x float>* %{{[^,]*}}, align 16
|
|
// CHECK: getelementptr inbounds <{ %struct.NonTrivial, <4 x float>*, <4 x float>* }>, <{ %struct.NonTrivial, <4 x float>*, <4 x float>* }>* %{{[^,]*}}, i32 0, i32 2
|
|
// CHECK: store <4 x float>* %{{[^,]*}}, <4 x float>** %{{[^,]*}}, align 4
|
|
|
|
// CHECK: call void @"?receive_vec_128@@YAXUNonTrivial@@T__m128@@1111@Z"
|
|
// CHECK-SAME: (<4 x float> inreg %{{[^,]*}},
|
|
// CHECK-SAME: <4 x float> inreg %{{[^,]*}},
|
|
// CHECK-SAME: <4 x float> inreg %{{[^,]*}},
|
|
// CHECK-SAME: <{ %struct.NonTrivial, <4 x float>*, <4 x float>* }>* inalloca %{{[^,]*}})
|
|
|
|
// w will be passed indirectly by register, and q will be passed indirectly, but
|
|
// the pointer will be in memory.
|
|
void __fastcall fastcall_receive_vec(__m128 x, __m128 y, __m128 z, __m128 w, int edx, __m128 q, NonTrivial nt) {
|
|
gv128 = x + y + z + w + q;
|
|
}
|
|
// CHECK-LABEL: define dso_local x86_fastcallcc void @"?fastcall_receive_vec@@Y{{[^"]*}}"
|
|
// CHECK-SAME: (<4 x float> inreg %x,
|
|
// CHECK-SAME: <4 x float> inreg %y,
|
|
// CHECK-SAME: <4 x float> inreg %z,
|
|
// CHECK-SAME: <4 x float>* inreg %0,
|
|
// CHECK-SAME: i32 inreg %edx,
|
|
// CHECK-SAME: <{ <4 x float>*, %struct.NonTrivial }>* inalloca %1)
|
|
|
|
|
|
void __vectorcall vectorcall_receive_vec(double xmm0, double xmm1, double xmm2,
|
|
__m128 x, __m128 y, __m128 z,
|
|
__m128 w, int edx, __m128 q, NonTrivial nt) {
|
|
gv128 = x + y + z + w + q;
|
|
}
|
|
// FIXME: Enable these checks, clang generates wrong IR.
|
|
// CHECK-LABEL: define dso_local x86_vectorcallcc void @"?vectorcall_receive_vec@@Y{{[^"]*}}"
|
|
// CHECKX-SAME: (double inreg %xmm0,
|
|
// CHECKX-SAME: double inreg %xmm1,
|
|
// CHECKX-SAME: double inreg %xmm2,
|
|
// CHECKX-SAME: <4 x float> inreg %x,
|
|
// CHECKX-SAME: <4 x float> inreg %y,
|
|
// CHECKX-SAME: <4 x float> inreg %z,
|
|
// CHECKX-SAME: <4 x float>* inreg %0,
|
|
// CHECKX-SAME: i32 inreg %edx,
|
|
// CHECKX-SAME: <{ <4 x float>*, %struct.NonTrivial }>* inalloca %1)
|