|
|
|
@ -972,6 +972,16 @@ typedef struct _smlal_inst { |
|
|
|
unsigned int RdLo; |
|
|
|
} smlal_inst; |
|
|
|
|
|
|
|
typedef struct smlald_inst { |
|
|
|
unsigned int RdLo; |
|
|
|
unsigned int RdHi; |
|
|
|
unsigned int Rm; |
|
|
|
unsigned int Rn; |
|
|
|
unsigned int swap; |
|
|
|
unsigned int op1; |
|
|
|
unsigned int op2; |
|
|
|
} smlald_inst; |
|
|
|
|
|
|
|
typedef struct _mla_inst { |
|
|
|
unsigned int S; |
|
|
|
unsigned int Rn; |
|
|
|
@ -2360,9 +2370,32 @@ ARM_INST_PTR INTERPRETER_TRANSLATE(smlal)(unsigned int inst, int index) |
|
|
|
} |
|
|
|
|
|
|
|
ARM_INST_PTR INTERPRETER_TRANSLATE(smlalxy)(unsigned int inst, int index) { UNIMPLEMENTED_INSTRUCTION("SMLALXY"); } |
|
|
|
ARM_INST_PTR INTERPRETER_TRANSLATE(smlald)(unsigned int inst, int index) { UNIMPLEMENTED_INSTRUCTION("SMLALD"); } |
|
|
|
ARM_INST_PTR INTERPRETER_TRANSLATE(smlaw)(unsigned int inst, int index) { UNIMPLEMENTED_INSTRUCTION("SMLAW"); } |
|
|
|
ARM_INST_PTR INTERPRETER_TRANSLATE(smlsld)(unsigned int inst, int index) { UNIMPLEMENTED_INSTRUCTION("SMLSLD"); } |
|
|
|
|
|
|
|
ARM_INST_PTR INTERPRETER_TRANSLATE(smlald)(unsigned int inst, int index) |
|
|
|
{ |
|
|
|
arm_inst* const inst_base = (arm_inst*)AllocBuffer(sizeof(arm_inst) + sizeof(smlald_inst)); |
|
|
|
smlald_inst* const inst_cream = (smlald_inst*)inst_base->component; |
|
|
|
|
|
|
|
inst_base->cond = BITS(inst, 28, 31); |
|
|
|
inst_base->idx = index; |
|
|
|
inst_base->br = NON_BRANCH; |
|
|
|
inst_base->load_r15 = 0; |
|
|
|
|
|
|
|
inst_cream->Rm = BITS(inst, 8, 11); |
|
|
|
inst_cream->Rn = BITS(inst, 0, 3); |
|
|
|
inst_cream->RdLo = BITS(inst, 12, 15); |
|
|
|
inst_cream->RdHi = BITS(inst, 16, 19); |
|
|
|
inst_cream->swap = BIT(inst, 5); |
|
|
|
inst_cream->op1 = BITS(inst, 20, 22); |
|
|
|
inst_cream->op2 = BITS(inst, 5, 7); |
|
|
|
|
|
|
|
return inst_base; |
|
|
|
} |
|
|
|
ARM_INST_PTR INTERPRETER_TRANSLATE(smlsld)(unsigned int inst, int index) |
|
|
|
{ |
|
|
|
return INTERPRETER_TRANSLATE(smlald)(inst, index); |
|
|
|
} |
|
|
|
|
|
|
|
ARM_INST_PTR INTERPRETER_TRANSLATE(smmla)(unsigned int inst, int index) |
|
|
|
{ |
|
|
|
@ -5519,9 +5552,45 @@ unsigned InterpreterMainLoop(ARMul_State* state) { |
|
|
|
} |
|
|
|
|
|
|
|
SMLALXY_INST: |
|
|
|
SMLALD_INST: |
|
|
|
SMLAW_INST: |
|
|
|
|
|
|
|
SMLALD_INST: |
|
|
|
SMLSLD_INST: |
|
|
|
{ |
|
|
|
if (inst_base->cond == 0xE || CondPassed(cpu, inst_base->cond)) { |
|
|
|
smlald_inst* const inst_cream = (smlald_inst*)inst_base->component; |
|
|
|
|
|
|
|
const bool do_swap = (inst_cream->swap == 1); |
|
|
|
const u32 rdlo_val = RDLO; |
|
|
|
const u32 rdhi_val = RDHI; |
|
|
|
const u32 rn_val = RN; |
|
|
|
u32 rm_val = RM; |
|
|
|
|
|
|
|
if (do_swap) |
|
|
|
rm_val = (((rm_val & 0xFFFF) << 16) | (rm_val >> 16)); |
|
|
|
|
|
|
|
const s32 product1 = (s16)(rn_val & 0xFFFF) * (s16)(rm_val & 0xFFFF); |
|
|
|
const s32 product2 = (s16)((rn_val >> 16) & 0xFFFF) * (s16)((rm_val >> 16) & 0xFFFF); |
|
|
|
s64 result; |
|
|
|
|
|
|
|
// SMLALD
|
|
|
|
if (BIT(inst_cream->op2, 1) == 0) { |
|
|
|
result = (product1 + product2) + (s64)(rdlo_val | ((s64)rdhi_val << 32)); |
|
|
|
} |
|
|
|
// SMLSLD
|
|
|
|
else { |
|
|
|
result = (product1 - product2) + (s64)(rdlo_val | ((s64)rdhi_val << 32)); |
|
|
|
} |
|
|
|
|
|
|
|
RDLO = (result & 0xFFFFFFFF); |
|
|
|
RDHI = ((result >> 32) & 0xFFFFFFFF); |
|
|
|
} |
|
|
|
|
|
|
|
cpu->Reg[15] += GET_INST_SIZE(cpu); |
|
|
|
INC_PC(sizeof(smlald_inst)); |
|
|
|
FETCH_INST; |
|
|
|
GOTO_NEXT_INST; |
|
|
|
} |
|
|
|
|
|
|
|
SMMLA_INST: |
|
|
|
SMMLS_INST: |
|
|
|
|