Implement some ARM32 memory instructions and CMP (#565)
* Implement ARM32 memory instructions: LDM, LDR, LDRB, LDRD, LDRH, LDRSB, LDRSH, STM, STR, STRB, STRD, STRH (immediate and register + immediate variants), implement CMP (immediate and register shifted by immediate variants)
* Rename some opcode classes and flag masks for consistency
* Fix a few suboptimal ARM32 codegen issues, only loads should be considered on decoder when checking if Rt == PC, and only NZCV flags should be considered for comparison optimizations
* Take into account Rt2 for LDRD instructions aswell when checking if the instruction changes PC
* Re-align arm32 instructions on the opcode table
2019-01-29 13:06:11 -03:00
|
|
|
using ChocolArm64.Decoders;
|
2019-04-26 01:55:12 -03:00
|
|
|
using ChocolArm64.IntermediateRepresentation;
|
Implement some ARM32 memory instructions and CMP (#565)
* Implement ARM32 memory instructions: LDM, LDR, LDRB, LDRD, LDRH, LDRSB, LDRSH, STM, STR, STRB, STRD, STRH (immediate and register + immediate variants), implement CMP (immediate and register shifted by immediate variants)
* Rename some opcode classes and flag masks for consistency
* Fix a few suboptimal ARM32 codegen issues, only loads should be considered on decoder when checking if Rt == PC, and only NZCV flags should be considered for comparison optimizations
* Take into account Rt2 for LDRD instructions aswell when checking if the instruction changes PC
* Re-align arm32 instructions on the opcode table
2019-01-29 13:06:11 -03:00
|
|
|
using ChocolArm64.State;
|
|
|
|
using ChocolArm64.Translation;
|
|
|
|
using System;
|
|
|
|
using System.Reflection.Emit;
|
|
|
|
|
|
|
|
using static ChocolArm64.Instructions.InstEmit32Helper;
|
|
|
|
using static ChocolArm64.Instructions.InstEmitMemoryHelper;
|
|
|
|
|
|
|
|
namespace ChocolArm64.Instructions
|
|
|
|
{
|
|
|
|
static partial class InstEmit32
|
|
|
|
{
|
|
|
|
private const int ByteSizeLog2 = 0;
|
|
|
|
private const int HWordSizeLog2 = 1;
|
|
|
|
private const int WordSizeLog2 = 2;
|
|
|
|
private const int DWordSizeLog2 = 3;
|
|
|
|
|
|
|
|
[Flags]
|
|
|
|
enum AccessType
|
|
|
|
{
|
|
|
|
Store = 0,
|
|
|
|
Signed = 1,
|
|
|
|
Load = 2,
|
|
|
|
|
|
|
|
LoadZx = Load,
|
|
|
|
LoadSx = Load | Signed,
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Ldm(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
OpCode32MemMult op = (OpCode32MemMult)context.CurrOp;
|
|
|
|
|
|
|
|
EmitLoadFromRegister(context, op.Rn);
|
|
|
|
|
|
|
|
bool writesToPc = (op.RegisterMask & (1 << RegisterAlias.Aarch32Pc)) != 0;
|
|
|
|
|
|
|
|
bool writeBack = op.PostOffset != 0 && (op.Rn != RegisterAlias.Aarch32Pc || !writesToPc);
|
|
|
|
|
|
|
|
if (writeBack)
|
|
|
|
{
|
|
|
|
context.Emit(OpCodes.Dup);
|
|
|
|
}
|
|
|
|
|
|
|
|
context.EmitLdc_I4(op.Offset);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
context.EmitSttmp();
|
|
|
|
|
|
|
|
if (writeBack)
|
|
|
|
{
|
|
|
|
context.EmitLdc_I4(op.PostOffset);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
EmitStoreToRegister(context, op.Rn);
|
|
|
|
}
|
|
|
|
|
|
|
|
int mask = op.RegisterMask;
|
|
|
|
int offset = 0;
|
|
|
|
|
|
|
|
for (int register = 0; mask != 0; mask >>= 1, register++)
|
|
|
|
{
|
|
|
|
if ((mask & 1) != 0)
|
|
|
|
{
|
|
|
|
context.EmitLdtmp();
|
|
|
|
context.EmitLdc_I4(offset);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
EmitReadZxCall(context, WordSizeLog2);
|
|
|
|
|
|
|
|
EmitStoreToRegister(context, register);
|
|
|
|
|
|
|
|
offset += 4;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Ldr(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
EmitLoadOrStore(context, WordSizeLog2, AccessType.LoadZx);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Ldrb(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
EmitLoadOrStore(context, ByteSizeLog2, AccessType.LoadZx);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Ldrd(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
EmitLoadOrStore(context, DWordSizeLog2, AccessType.LoadZx);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Ldrh(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
EmitLoadOrStore(context, HWordSizeLog2, AccessType.LoadZx);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Ldrsb(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
EmitLoadOrStore(context, ByteSizeLog2, AccessType.LoadSx);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Ldrsh(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
EmitLoadOrStore(context, HWordSizeLog2, AccessType.LoadSx);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Stm(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
OpCode32MemMult op = (OpCode32MemMult)context.CurrOp;
|
|
|
|
|
|
|
|
EmitLoadFromRegister(context, op.Rn);
|
|
|
|
|
|
|
|
context.EmitLdc_I4(op.Offset);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
context.EmitSttmp();
|
|
|
|
|
|
|
|
int mask = op.RegisterMask;
|
|
|
|
int offset = 0;
|
|
|
|
|
|
|
|
for (int register = 0; mask != 0; mask >>= 1, register++)
|
|
|
|
{
|
|
|
|
if ((mask & 1) != 0)
|
|
|
|
{
|
|
|
|
context.EmitLdtmp();
|
|
|
|
context.EmitLdc_I4(offset);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
EmitLoadFromRegister(context, register);
|
|
|
|
|
|
|
|
EmitWriteCall(context, WordSizeLog2);
|
|
|
|
|
2019-07-01 21:39:22 -05:00
|
|
|
// Note: If Rn is also specified on the register list,
|
|
|
|
// and Rn is the first register on this list, then the
|
|
|
|
// value that is written to memory is the unmodified value,
|
|
|
|
// before the write back. If it is on the list, but it's
|
|
|
|
// not the first one, then the value written to memory
|
|
|
|
// varies between CPUs.
|
Implement some ARM32 memory instructions and CMP (#565)
* Implement ARM32 memory instructions: LDM, LDR, LDRB, LDRD, LDRH, LDRSB, LDRSH, STM, STR, STRB, STRD, STRH (immediate and register + immediate variants), implement CMP (immediate and register shifted by immediate variants)
* Rename some opcode classes and flag masks for consistency
* Fix a few suboptimal ARM32 codegen issues, only loads should be considered on decoder when checking if Rt == PC, and only NZCV flags should be considered for comparison optimizations
* Take into account Rt2 for LDRD instructions aswell when checking if the instruction changes PC
* Re-align arm32 instructions on the opcode table
2019-01-29 13:06:11 -03:00
|
|
|
if (offset == 0 && op.PostOffset != 0)
|
|
|
|
{
|
2019-07-01 21:39:22 -05:00
|
|
|
// Emit write back after the first write.
|
Implement some ARM32 memory instructions and CMP (#565)
* Implement ARM32 memory instructions: LDM, LDR, LDRB, LDRD, LDRH, LDRSB, LDRSH, STM, STR, STRB, STRD, STRH (immediate and register + immediate variants), implement CMP (immediate and register shifted by immediate variants)
* Rename some opcode classes and flag masks for consistency
* Fix a few suboptimal ARM32 codegen issues, only loads should be considered on decoder when checking if Rt == PC, and only NZCV flags should be considered for comparison optimizations
* Take into account Rt2 for LDRD instructions aswell when checking if the instruction changes PC
* Re-align arm32 instructions on the opcode table
2019-01-29 13:06:11 -03:00
|
|
|
EmitLoadFromRegister(context, op.Rn);
|
|
|
|
|
|
|
|
context.EmitLdc_I4(op.PostOffset);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
EmitStoreToRegister(context, op.Rn);
|
|
|
|
}
|
|
|
|
|
|
|
|
offset += 4;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Str(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
EmitLoadOrStore(context, WordSizeLog2, AccessType.Store);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Strb(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
EmitLoadOrStore(context, ByteSizeLog2, AccessType.Store);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Strd(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
EmitLoadOrStore(context, DWordSizeLog2, AccessType.Store);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Strh(ILEmitterCtx context)
|
|
|
|
{
|
|
|
|
EmitLoadOrStore(context, HWordSizeLog2, AccessType.Store);
|
|
|
|
}
|
|
|
|
|
|
|
|
private static void EmitLoadOrStore(ILEmitterCtx context, int size, AccessType accType)
|
|
|
|
{
|
|
|
|
OpCode32Mem op = (OpCode32Mem)context.CurrOp;
|
|
|
|
|
|
|
|
if (op.Index || op.WBack)
|
|
|
|
{
|
|
|
|
EmitLoadFromRegister(context, op.Rn);
|
|
|
|
|
|
|
|
context.EmitLdc_I4(op.Imm);
|
|
|
|
|
|
|
|
context.Emit(op.Add ? OpCodes.Add : OpCodes.Sub);
|
|
|
|
|
|
|
|
context.EmitSttmp();
|
|
|
|
}
|
|
|
|
|
|
|
|
if (op.Index)
|
|
|
|
{
|
|
|
|
context.EmitLdtmp();
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitLoadFromRegister(context, op.Rn);
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((accType & AccessType.Load) != 0)
|
|
|
|
{
|
|
|
|
if ((accType & AccessType.Signed) != 0)
|
|
|
|
{
|
|
|
|
EmitReadSx32Call(context, size);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitReadZxCall(context, size);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (op.WBack)
|
|
|
|
{
|
|
|
|
context.EmitLdtmp();
|
|
|
|
|
|
|
|
EmitStoreToRegister(context, op.Rn);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (size == DWordSizeLog2)
|
|
|
|
{
|
|
|
|
context.Emit(OpCodes.Dup);
|
|
|
|
|
|
|
|
context.EmitLdflg((int)PState.EBit);
|
|
|
|
|
|
|
|
ILLabel lblBigEndian = new ILLabel();
|
|
|
|
ILLabel lblEnd = new ILLabel();
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Brtrue_S, lblBigEndian);
|
|
|
|
|
2019-07-01 21:39:22 -05:00
|
|
|
// Little endian mode.
|
Implement some ARM32 memory instructions and CMP (#565)
* Implement ARM32 memory instructions: LDM, LDR, LDRB, LDRD, LDRH, LDRSB, LDRSH, STM, STR, STRB, STRD, STRH (immediate and register + immediate variants), implement CMP (immediate and register shifted by immediate variants)
* Rename some opcode classes and flag masks for consistency
* Fix a few suboptimal ARM32 codegen issues, only loads should be considered on decoder when checking if Rt == PC, and only NZCV flags should be considered for comparison optimizations
* Take into account Rt2 for LDRD instructions aswell when checking if the instruction changes PC
* Re-align arm32 instructions on the opcode table
2019-01-29 13:06:11 -03:00
|
|
|
context.Emit(OpCodes.Conv_U4);
|
|
|
|
|
|
|
|
EmitStoreToRegister(context, op.Rt);
|
|
|
|
|
|
|
|
context.EmitLsr(32);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Conv_U4);
|
|
|
|
|
|
|
|
EmitStoreToRegister(context, op.Rt | 1);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Br_S, lblEnd);
|
|
|
|
|
2019-07-01 21:39:22 -05:00
|
|
|
// Big endian mode.
|
Implement some ARM32 memory instructions and CMP (#565)
* Implement ARM32 memory instructions: LDM, LDR, LDRB, LDRD, LDRH, LDRSB, LDRSH, STM, STR, STRB, STRD, STRH (immediate and register + immediate variants), implement CMP (immediate and register shifted by immediate variants)
* Rename some opcode classes and flag masks for consistency
* Fix a few suboptimal ARM32 codegen issues, only loads should be considered on decoder when checking if Rt == PC, and only NZCV flags should be considered for comparison optimizations
* Take into account Rt2 for LDRD instructions aswell when checking if the instruction changes PC
* Re-align arm32 instructions on the opcode table
2019-01-29 13:06:11 -03:00
|
|
|
context.MarkLabel(lblBigEndian);
|
|
|
|
|
|
|
|
context.EmitLsr(32);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Conv_U4);
|
|
|
|
|
|
|
|
EmitStoreToRegister(context, op.Rt);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Conv_U4);
|
|
|
|
|
|
|
|
EmitStoreToRegister(context, op.Rt | 1);
|
|
|
|
|
|
|
|
context.MarkLabel(lblEnd);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitStoreToRegister(context, op.Rt);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
if (op.WBack)
|
|
|
|
{
|
|
|
|
context.EmitLdtmp();
|
|
|
|
|
|
|
|
EmitStoreToRegister(context, op.Rn);
|
|
|
|
}
|
|
|
|
|
|
|
|
EmitLoadFromRegister(context, op.Rt);
|
|
|
|
|
|
|
|
if (size == DWordSizeLog2)
|
|
|
|
{
|
|
|
|
context.Emit(OpCodes.Conv_U8);
|
|
|
|
|
|
|
|
context.EmitLdflg((int)PState.EBit);
|
|
|
|
|
|
|
|
ILLabel lblBigEndian = new ILLabel();
|
|
|
|
ILLabel lblEnd = new ILLabel();
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Brtrue_S, lblBigEndian);
|
|
|
|
|
2019-07-01 21:39:22 -05:00
|
|
|
// Little endian mode.
|
Implement some ARM32 memory instructions and CMP (#565)
* Implement ARM32 memory instructions: LDM, LDR, LDRB, LDRD, LDRH, LDRSB, LDRSH, STM, STR, STRB, STRD, STRH (immediate and register + immediate variants), implement CMP (immediate and register shifted by immediate variants)
* Rename some opcode classes and flag masks for consistency
* Fix a few suboptimal ARM32 codegen issues, only loads should be considered on decoder when checking if Rt == PC, and only NZCV flags should be considered for comparison optimizations
* Take into account Rt2 for LDRD instructions aswell when checking if the instruction changes PC
* Re-align arm32 instructions on the opcode table
2019-01-29 13:06:11 -03:00
|
|
|
EmitLoadFromRegister(context, op.Rt | 1);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Conv_U8);
|
|
|
|
|
|
|
|
context.EmitLsl(32);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Or);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Br_S, lblEnd);
|
|
|
|
|
2019-07-01 21:39:22 -05:00
|
|
|
// Big endian mode.
|
Implement some ARM32 memory instructions and CMP (#565)
* Implement ARM32 memory instructions: LDM, LDR, LDRB, LDRD, LDRH, LDRSB, LDRSH, STM, STR, STRB, STRD, STRH (immediate and register + immediate variants), implement CMP (immediate and register shifted by immediate variants)
* Rename some opcode classes and flag masks for consistency
* Fix a few suboptimal ARM32 codegen issues, only loads should be considered on decoder when checking if Rt == PC, and only NZCV flags should be considered for comparison optimizations
* Take into account Rt2 for LDRD instructions aswell when checking if the instruction changes PC
* Re-align arm32 instructions on the opcode table
2019-01-29 13:06:11 -03:00
|
|
|
context.MarkLabel(lblBigEndian);
|
|
|
|
|
|
|
|
context.EmitLsl(32);
|
|
|
|
|
|
|
|
EmitLoadFromRegister(context, op.Rt | 1);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Conv_U8);
|
|
|
|
|
|
|
|
context.Emit(OpCodes.Or);
|
|
|
|
|
|
|
|
context.MarkLabel(lblEnd);
|
|
|
|
}
|
|
|
|
|
|
|
|
EmitWriteCall(context, size);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|