From f5174d12aa0f9aef7fce3ef6263df0f08d2e8c75 Mon Sep 17 00:00:00 2001 From: Yang Liu Date: Mon, 10 Feb 2025 18:44:35 +0800 Subject: [LA64_DYNAREC] Added preliminary optimization for REP MOVSB (#2340) --- src/dynarec/la64/dynarec_la64_00.c | 14 ++++++++++++++ src/dynarec/la64/dynarec_la64_66.c | 14 ++++++++++++++ 2 files changed, 28 insertions(+) (limited to 'src') diff --git a/src/dynarec/la64/dynarec_la64_00.c b/src/dynarec/la64/dynarec_la64_00.c index 1751c759..a342fb53 100644 --- a/src/dynarec/la64/dynarec_la64_00.c +++ b/src/dynarec/la64/dynarec_la64_00.c @@ -1291,6 +1291,20 @@ uintptr_t dynarec64_00(dynarec_la64_t* dyn, uintptr_t addr, uintptr_t ip, int ni CBZ_NEXT(xRCX); ANDI(x1, xFlags, 1 << F_DF); BNEZ_MARK2(x1); + // special optim for large RCX value on forward case only + OR(x1, xRSI, xRDI); + ANDI(x1, x1, 7); + BNEZ_MARK(x1); + ADDI_D(x6, xZR, 8); + MARK3; + BLT_MARK(xRCX, x6); + LD_D(x1, xRSI, 0); + ST_D(x1, xRDI, 0); + ADDI_D(xRSI, xRSI, 8); + ADDI_D(xRDI, xRDI, 8); + ADDI_D(xRCX, xRCX, -8); + BNEZ_MARK3(xRCX); + B_NEXT_nocond; MARK; // Part with DF==0 LD_BU(x1, xRSI, 0); ST_B(x1, xRDI, 0); diff --git a/src/dynarec/la64/dynarec_la64_66.c b/src/dynarec/la64/dynarec_la64_66.c index 8d3ae2e5..5e9e0a3b 100644 --- a/src/dynarec/la64/dynarec_la64_66.c +++ b/src/dynarec/la64/dynarec_la64_66.c @@ -542,6 +542,20 @@ uintptr_t dynarec64_66(dynarec_la64_t* dyn, uintptr_t addr, uintptr_t ip, int ni CBZ_NEXT(xRCX); ANDI(x1, xFlags, 1 << F_DF); BNEZ_MARK2(x1); + // special optim for large RCX value on forward case only + OR(x1, xRSI, xRDI); + ANDI(x1, x1, 7); + BNEZ_MARK(x1); + ADDI_D(x6, xZR, 8); + MARK3; + BLT_MARK(xRCX, x6); + LD_D(x1, xRSI, 0); + ST_D(x1, xRDI, 0); + ADDI_D(xRSI, xRSI, 8); + ADDI_D(xRDI, xRDI, 8); + ADDI_D(xRCX, xRCX, -8); + BNEZ_MARK3(xRCX); + B_NEXT_nocond; MARK; // Part with DF==0 LD_BU(x1, xRSI, 0); ST_B(x1, xRDI, 0); -- cgit 1.4.1