[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
[Qemu-ppc] [PULL 45/66] ppc: Speed up load/store multiple
From: David Gibson
Subject: [Qemu-ppc] [PULL 45/66] ppc: Speed up load/store multiple
Date: Tue, 6 Sep 2016 13:42:55 +1000
From: Benjamin Herrenschmidt <address@hidden>
Use a single address translation when the access does not cross a page
boundary, and avoid going through layers of helpers. MacOS uses these
instructions a lot, as does OpenBIOS.
Signed-off-by: Benjamin Herrenschmidt <address@hidden>
Signed-off-by: David Gibson <address@hidden>
---
target-ppc/mem_helper.c | 69 +++++++++++++++++++++++++++++++++++++++++++++++++
1 file changed, 69 insertions(+)
diff --git a/target-ppc/mem_helper.c b/target-ppc/mem_helper.c
index 6548715..bf6c44a 100644
--- a/target-ppc/mem_helper.c
+++ b/target-ppc/mem_helper.c
@@ -53,8 +53,48 @@ static inline target_ulong addr_add(CPUPPCState *env,
target_ulong addr,
}
}
+/* Shorten len so addr + len stays in addr's page (not if CONFIG_USER_ONLY). */
+static inline uint64_t adj_len_to_page(uint64_t len, uint64_t addr)
+{
+#ifndef CONFIG_USER_ONLY
+ if ((addr & ~TARGET_PAGE_MASK) + len - 1 >= TARGET_PAGE_SIZE) {
+ return -addr & ~TARGET_PAGE_MASK;
+ }
+#endif
+ return len;
+}
+
void helper_lmw(CPUPPCState *env, target_ulong addr, uint32_t reg)
{
+ uint32_t *src;
+ uint64_t len, adjlen;
+
+ if ((addr & 3)) {
+ goto fallback;
+ }
+ len = (32 - reg) << 2;
+ while (len) {
+ src = tlb_vaddr_to_host(env, addr, MMU_DATA_LOAD, env->dmmu_idx);
+ if (!src) {
+ goto fallback;
+ }
+ adjlen = adj_len_to_page(len, addr);
+ len -= adjlen;
+#if defined(HOST_WORDS_BIGENDIAN)
+ memcpy(&env->gpr[reg], src, adjlen);
+ reg += (adjlen >> 2);
+ addr = addr_add(env, addr, adjlen);
+#else
+ while(adjlen) {
+ env->gpr[reg++] = bswap32(*(src++));
+ adjlen -= 4;
+ addr = addr_add(env, addr, 4);
+ }
+#endif
+ }
+ return;
+
+ fallback:
for (; reg < 32; reg++) {
if (needs_byteswap(env)) {
env->gpr[reg] = bswap32(cpu_ldl_data_ra(env, addr, GETPC()));
@@ -67,6 +107,35 @@ void helper_lmw(CPUPPCState *env, target_ulong addr,
uint32_t reg)
void helper_stmw(CPUPPCState *env, target_ulong addr, uint32_t reg)
{
+ uint32_t *dst;
+ uint64_t len, adjlen;
+
+ if ((addr & 3)) {
+ goto fallback;
+ }
+ len = (32 - reg) << 2;
+ while (len) {
+ dst = tlb_vaddr_to_host(env, addr, MMU_DATA_STORE, env->dmmu_idx);
+ if (!dst) {
+ goto fallback;
+ }
+ adjlen = adj_len_to_page(len, addr);
+ len -= adjlen;
+#if defined(HOST_WORDS_BIGENDIAN)
+ memcpy(dst, &env->gpr[reg], adjlen);
+ reg += (adjlen >> 2);
+ addr = addr_add(env, addr, adjlen);
+#else
+ while(adjlen) {
+ *(dst++) = bswap32(env->gpr[reg++]);
+ adjlen -= 4;
+ addr = addr_add(env, addr, 4);
+ }
+#endif
+ }
+ return;
+
+ fallback:
for (; reg < 32; reg++) {
if (needs_byteswap(env)) {
cpu_stl_data_ra(env, addr, bswap32((uint32_t)env->gpr[reg]),
--
2.7.4
- [Qemu-ppc] [PULL 11/66] target-ppc: add cmpeqb instruction, (continued)
- [Qemu-ppc] [PULL 11/66] target-ppc: add cmpeqb instruction, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 29/66] ppc: Make tlb_fill() use new exception helper, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 31/66] ppc: Fix source NIP on SLB related interrupts, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 25/66] ppc: Don't update the NIP in floating point generated code, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 19/66] ppc: Move DFP ops out of translate.c, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 22/66] ppc: Rename fload_invalid_op_excp to float_invalid_op_excp, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 40/66] ppc: Speed up dcbz, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 30/66] ppc: Rework NIP updates vs. exception generation, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 47/66] target-ppc: implement branch-less divd[o][.], David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 56/66] hw/ppc: add a ppc_create_page_sizes_prop() helper routine, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 45/66] ppc: Speed up load/store multiple, David Gibson <=
- [Qemu-ppc] [PULL 50/66] target-ppc: add vcmpnez[b, h, w][.] instructions, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 65/66] tests: Resort check-qtest entries in Makefile.include, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 64/66] spapr: implement H_CHANGE_LOGICAL_LAN_MAC h_call, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 35/66] ppc: Don't update NIP on conditional trap instructions, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 52/66] target-ppc: add vsrv instruction, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 41/66] ppc: Fix CFAR updates, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 66/66] tests: Check serial output of firmware boot of some machines, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 20/66] ppc: Move VMX ops out of translate.c, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 21/66] ppc: Move VSX ops out of translate.c, David Gibson, 2016/09/05
- [Qemu-ppc] [PULL 18/66] ppc: Move embedded spe ops out of translate.c, David Gibson, 2016/09/05