2015-05-24 06:55:12 +02:00
|
|
|
// Copyright 2008 Dolphin Emulator Project
|
2021-07-05 03:22:19 +02:00
|
|
|
// SPDX-License-Identifier: GPL-2.0-or-later
|
2008-12-14 19:25:33 +01:00
|
|
|
|
2014-02-17 11:18:15 +01:00
|
|
|
#include "Common/x64ABI.h"
|
2021-12-10 03:22:16 +01:00
|
|
|
|
2014-09-08 03:06:58 +02:00
|
|
|
#include "Common/CommonTypes.h"
|
2014-02-17 11:18:15 +01:00
|
|
|
#include "Common/x64Emitter.h"
|
2008-12-08 06:30:24 +01:00
|
|
|
|
2008-07-31 22:22:35 +02:00
|
|
|
using namespace Gen;
|
2008-12-08 06:30:24 +01:00
|
|
|
|
2008-11-23 18:46:14 +01:00
|
|
|
// Shared code between Win64 and Unix64
|
2008-12-08 06:30:24 +01:00
|
|
|
|
2014-10-17 04:21:55 +02:00
|
|
|
void XEmitter::ABI_CalculateFrameSize(BitSet32 mask, size_t rsp_alignment, size_t needed_frame_size,
|
|
|
|
size_t* shadowp, size_t* subtractionp, size_t* xmm_offsetp)
|
2013-09-30 04:51:07 +02:00
|
|
|
{
|
Improve code and clarify parameters to ABI_Push/PopRegistersAndAdjustStack.
- Factor common work into a helper function.
- Replace confusingly named "noProlog" with "rsp_alignment". Now that
x86 is not supported, we can just specify it explicitly as 8 for
clarity.
- Add the option to include more frame size, which I'll need later.
- Revert a change by magumagu in March which replaced MOVAPD with MOVUPD
on account of 32-bit Windows, since it's no longer supported. True,
apparently recent processors don't execute the former any faster if the
pointer is, in fact, aligned, but there's no point using MOVUPD for
something that's guaranteed to be aligned...
(I discovered that GenFrsqrte and GenFres were incorrectly passing false
to noProlog - they were, in fact, functions without prologs, the
original meaning of the parameter - which caused the previous change to
break. This is now fixed.)
2014-09-07 20:06:48 +02:00
|
|
|
size_t shadow = 0;
|
2014-08-03 20:42:06 +02:00
|
|
|
#if defined(_WIN32)
|
2013-09-30 04:51:07 +02:00
|
|
|
shadow = 0x20;
|
|
|
|
#endif
|
Improve code and clarify parameters to ABI_Push/PopRegistersAndAdjustStack.
- Factor common work into a helper function.
- Replace confusingly named "noProlog" with "rsp_alignment". Now that
x86 is not supported, we can just specify it explicitly as 8 for
clarity.
- Add the option to include more frame size, which I'll need later.
- Revert a change by magumagu in March which replaced MOVAPD with MOVUPD
on account of 32-bit Windows, since it's no longer supported. True,
apparently recent processors don't execute the former any faster if the
pointer is, in fact, aligned, but there's no point using MOVUPD for
something that's guaranteed to be aligned...
(I discovered that GenFrsqrte and GenFres were incorrectly passing false
to noProlog - they were, in fact, functions without prologs, the
original meaning of the parameter - which caused the previous change to
break. This is now fixed.)
2014-09-07 20:06:48 +02:00
|
|
|
|
2014-10-17 04:21:55 +02:00
|
|
|
int count = (mask & ABI_ALL_GPRS).Count();
|
Improve code and clarify parameters to ABI_Push/PopRegistersAndAdjustStack.
- Factor common work into a helper function.
- Replace confusingly named "noProlog" with "rsp_alignment". Now that
x86 is not supported, we can just specify it explicitly as 8 for
clarity.
- Add the option to include more frame size, which I'll need later.
- Revert a change by magumagu in March which replaced MOVAPD with MOVUPD
on account of 32-bit Windows, since it's no longer supported. True,
apparently recent processors don't execute the former any faster if the
pointer is, in fact, aligned, but there's no point using MOVUPD for
something that's guaranteed to be aligned...
(I discovered that GenFrsqrte and GenFres were incorrectly passing false
to noProlog - they were, in fact, functions without prologs, the
original meaning of the parameter - which caused the previous change to
break. This is now fixed.)
2014-09-07 20:06:48 +02:00
|
|
|
rsp_alignment -= count * 8;
|
|
|
|
size_t subtraction = 0;
|
2014-10-17 04:21:55 +02:00
|
|
|
int fpr_count = (mask & ABI_ALL_FPRS).Count();
|
|
|
|
if (fpr_count)
|
Improve code and clarify parameters to ABI_Push/PopRegistersAndAdjustStack.
- Factor common work into a helper function.
- Replace confusingly named "noProlog" with "rsp_alignment". Now that
x86 is not supported, we can just specify it explicitly as 8 for
clarity.
- Add the option to include more frame size, which I'll need later.
- Revert a change by magumagu in March which replaced MOVAPD with MOVUPD
on account of 32-bit Windows, since it's no longer supported. True,
apparently recent processors don't execute the former any faster if the
pointer is, in fact, aligned, but there's no point using MOVUPD for
something that's guaranteed to be aligned...
(I discovered that GenFrsqrte and GenFres were incorrectly passing false
to noProlog - they were, in fact, functions without prologs, the
original meaning of the parameter - which caused the previous change to
break. This is now fixed.)
2014-09-07 20:06:48 +02:00
|
|
|
{
|
|
|
|
// If we have any XMMs to save, we must align the stack here.
|
|
|
|
subtraction = rsp_alignment & 0xf;
|
|
|
|
}
|
2014-10-17 04:21:55 +02:00
|
|
|
subtraction += 16 * fpr_count;
|
Improve code and clarify parameters to ABI_Push/PopRegistersAndAdjustStack.
- Factor common work into a helper function.
- Replace confusingly named "noProlog" with "rsp_alignment". Now that
x86 is not supported, we can just specify it explicitly as 8 for
clarity.
- Add the option to include more frame size, which I'll need later.
- Revert a change by magumagu in March which replaced MOVAPD with MOVUPD
on account of 32-bit Windows, since it's no longer supported. True,
apparently recent processors don't execute the former any faster if the
pointer is, in fact, aligned, but there's no point using MOVUPD for
something that's guaranteed to be aligned...
(I discovered that GenFrsqrte and GenFres were incorrectly passing false
to noProlog - they were, in fact, functions without prologs, the
original meaning of the parameter - which caused the previous change to
break. This is now fixed.)
2014-09-07 20:06:48 +02:00
|
|
|
size_t xmm_base_subtraction = subtraction;
|
|
|
|
subtraction += needed_frame_size;
|
|
|
|
subtraction += shadow;
|
|
|
|
// Final alignment.
|
|
|
|
rsp_alignment -= subtraction;
|
|
|
|
subtraction += rsp_alignment & 0xf;
|
|
|
|
|
|
|
|
*shadowp = shadow;
|
|
|
|
*subtractionp = subtraction;
|
|
|
|
*xmm_offsetp = subtraction - xmm_base_subtraction;
|
|
|
|
}
|
|
|
|
|
2014-10-17 04:21:55 +02:00
|
|
|
// Emits code that saves the registers selected by `mask` and reserves the stack frame
// described by ABI_CalculateFrameSize.
//
// Emission order: PUSH for every GPR in the mask, one SUB on RSP for the rest of the frame
// (skipped when the frame is empty), then a MOVAPD store per XMM register in the mask.
//
// Returns the shadow space size reported by ABI_CalculateFrameSize.
size_t XEmitter::ABI_PushRegistersAndAdjustStack(BitSet32 mask, size_t rsp_alignment,
                                                 size_t needed_frame_size)
{
  size_t shadow_bytes, frame_bytes, xmm_slot;
  ABI_CalculateFrameSize(mask, rsp_alignment, needed_frame_size, &shadow_bytes, &frame_bytes,
                         &xmm_slot);

  for (int gpr : mask & ABI_ALL_GPRS)
    PUSH(static_cast<X64Reg>(gpr));

  if (frame_bytes != 0)
  {
    // Frames below 0x80 bytes use the 8-bit immediate form, larger ones the 32-bit form.
    if (frame_bytes >= 0x80)
      SUB(64, R(RSP), Imm32(static_cast<u32>(frame_bytes)));
    else
      SUB(64, R(RSP), Imm8(static_cast<u8>(frame_bytes)));
  }

  for (int fpr : mask & ABI_ALL_FPRS)
  {
    // FPR entries in the mask are biased by 16 relative to the XMM register number.
    MOVAPD(MDisp(RSP, static_cast<int>(xmm_slot)), static_cast<X64Reg>(fpr - 16));
    xmm_slot += 16;
  }

  return shadow_bytes;
}
|
|
|
|
|
2014-10-17 04:21:55 +02:00
|
|
|
// Emits the counterpart of ABI_PushRegistersAndAdjustStack: reloads the XMM registers in
// `mask` with MOVAPD, releases the frame with one ADD on RSP (skipped when the frame is
// empty), and finally POPs the masked registers, walking register numbers from 15 down to 0.
//
// The same mask, rsp_alignment and needed_frame_size must be supplied as for the matching
// push so that ABI_CalculateFrameSize reproduces the same layout.
void XEmitter::ABI_PopRegistersAndAdjustStack(BitSet32 mask, size_t rsp_alignment,
                                              size_t needed_frame_size)
{
  size_t shadow_bytes, frame_bytes, xmm_slot;
  ABI_CalculateFrameSize(mask, rsp_alignment, needed_frame_size, &shadow_bytes, &frame_bytes,
                         &xmm_slot);

  for (int fpr : mask & ABI_ALL_FPRS)
  {
    // FPR entries in the mask are biased by 16 relative to the XMM register number.
    MOVAPD(static_cast<X64Reg>(fpr - 16), MDisp(RSP, static_cast<int>(xmm_slot)));
    xmm_slot += 16;
  }

  if (frame_bytes != 0)
  {
    // Frames below 0x80 bytes use the 8-bit immediate form, larger ones the 32-bit form.
    if (frame_bytes >= 0x80)
      ADD(64, R(RSP), Imm32(static_cast<u32>(frame_bytes)));
    else
      ADD(64, R(RSP), Imm8(static_cast<u8>(frame_bytes)));
  }

  // Pop from the highest register number downwards.
  for (int gpr = 15; gpr >= 0; --gpr)
  {
    if (!mask[gpr])
      continue;
    POP(static_cast<X64Reg>(gpr));
  }
}
|
|
|
|
|
2015-01-03 00:32:23 +01:00
|
|
|
void XEmitter::MOVTwo(int bits, Gen::X64Reg dst1, Gen::X64Reg src1, s32 offset1, Gen::X64Reg dst2,
|
|
|
|
Gen::X64Reg src2)
|
2014-09-04 07:02:21 +02:00
|
|
|
{
|
|
|
|
if (dst1 == src2 && dst2 == src1)
|
|
|
|
{
|
2014-09-11 07:17:38 +02:00
|
|
|
XCHG(bits, R(src1), R(src2));
|
2015-01-03 00:32:23 +01:00
|
|
|
if (offset1)
|
|
|
|
ADD(bits, R(dst1), Imm32(offset1));
|
2014-09-04 07:02:21 +02:00
|
|
|
}
|
2014-09-11 07:17:38 +02:00
|
|
|
else if (src2 != dst1)
|
2014-09-04 07:02:21 +02:00
|
|
|
{
|
2015-01-03 00:32:23 +01:00
|
|
|
if (dst1 != src1 && offset1)
|
|
|
|
LEA(bits, dst1, MDisp(src1, offset1));
|
|
|
|
else if (dst1 != src1)
|
2014-09-04 07:02:21 +02:00
|
|
|
MOV(bits, R(dst1), R(src1));
|
2015-01-03 00:32:23 +01:00
|
|
|
else if (offset1)
|
|
|
|
ADD(bits, R(dst1), Imm32(offset1));
|
2014-09-04 07:02:21 +02:00
|
|
|
if (dst2 != src2)
|
|
|
|
MOV(bits, R(dst2), R(src2));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
if (dst2 != src2)
|
|
|
|
MOV(bits, R(dst2), R(src2));
|
2015-01-03 00:32:23 +01:00
|
|
|
if (dst1 != src1 && offset1)
|
|
|
|
LEA(bits, dst1, MDisp(src1, offset1));
|
|
|
|
else if (dst1 != src1)
|
2014-09-04 07:02:21 +02:00
|
|
|
MOV(bits, R(dst1), R(src1));
|
2015-01-03 00:32:23 +01:00
|
|
|
else if (offset1)
|
|
|
|
ADD(bits, R(dst1), Imm32(offset1));
|
2014-09-04 07:02:21 +02:00
|
|
|
}
|
|
|
|
}
|