summaryrefslogtreecommitdiff
path: root/src/arch/arm/isa/insts/ldr64.isa
diff options
context:
space:
mode:
authorMitch Hayenga <mitch.hayenga@arm.com>2014-09-03 07:42:52 -0400
committerMitch Hayenga <mitch.hayenga@arm.com>2014-09-03 07:42:52 -0400
commit8f95144e161ef7bdb264eb572108a98f215785c0 (patch)
treefed971653335ef0ee3db72d372ae3b465e10b5cd /src/arch/arm/isa/insts/ldr64.isa
parentf6f63ec0aa68f631691d9eccc18739722a0a9f17 (diff)
downloadgem5-8f95144e161ef7bdb264eb572108a98f215785c0.tar.xz
arm: Make memory ops work on 64bit/128-bit quantities
Multiple instructions assume only 32-bit load operations are available, this patch increases load sizes to 64-bit or 128-bit for many load pair and load multiple instructions.
Diffstat (limited to 'src/arch/arm/isa/insts/ldr64.isa')
-rw-r--r--src/arch/arm/isa/insts/ldr64.isa90
1 files changed, 47 insertions, 43 deletions
diff --git a/src/arch/arm/isa/insts/ldr64.isa b/src/arch/arm/isa/insts/ldr64.isa
index 78460f661..eea925e66 100644
--- a/src/arch/arm/isa/insts/ldr64.isa
+++ b/src/arch/arm/isa/insts/ldr64.isa
@@ -1,6 +1,6 @@
// -*- mode:c++ -*-
-// Copyright (c) 2011-2013 ARM Limited
+// Copyright (c) 2011-2014 ARM Limited
// All rights reserved
//
// The license below extends only to copyright in the software and shall
@@ -187,35 +187,32 @@ let {{
AA64FpDestP2_uw = 0;
AA64FpDestP3_uw = 0;
'''
- elif self.size == 8 or (self.size == 16 and not self.top):
+ elif self.size == 8:
accCode = '''
uint64_t data = cSwap(Mem%s,
isBigEndian64(xc->tcBase()));
AA64FpDestP0_uw = (uint32_t)data;
AA64FpDestP1_uw = (data >> 32);
+ AA64FpDestP2_uw = 0;
+ AA64FpDestP3_uw = 0;
'''
- # Only zero out the other half if this isn't part of a
- # pair of 8 byte loads implementing a 16 byte load.
- if self.size == 8:
- accCode += '''
- AA64FpDestP2_uw = 0;
- AA64FpDestP3_uw = 0;
- '''
- elif self.size == 16 and self.top:
+ elif self.size == 16:
accCode = '''
- uint64_t data = cSwap(Mem%s,
- isBigEndian64(xc->tcBase()));
- AA64FpDestP2_uw = (uint32_t)data;
- AA64FpDestP3_uw = (data >> 32);
+ Twin64_t data = cSwap(Mem%s,
+ isBigEndian64(xc->tcBase()));
+
+
+ AA64FpDestP0_uw = (uint32_t)data.a;
+ AA64FpDestP1_uw = (data.a >> 32);
+ AA64FpDestP2_uw = (uint32_t)data.b;
+ AA64FpDestP3_uw = (data.b >> 32);
'''
elif self.flavor == "widen" or self.size == 8:
accCode = "XDest = cSwap(Mem%s, isBigEndian64(xc->tcBase()));"
else:
accCode = "WDest = cSwap(Mem%s, isBigEndian64(xc->tcBase()));"
- if self.size == 16:
- accCode = accCode % buildMemSuffix(self.sign, 8)
- else:
- accCode = accCode % buildMemSuffix(self.sign, self.size)
+
+ accCode = accCode % buildMemSuffix(self.sign, self.size)
self.codeBlobs["memacc_code"] = accCode
@@ -231,17 +228,29 @@ let {{
# Code that actually handles the access
if self.flavor == "fp":
- accCode = '''
- uint64_t data = cSwap(Mem_ud, isBigEndian64(xc->tcBase()));
- AA64FpDestP0_uw = (uint32_t)data;
- AA64FpDestP1_uw = 0;
- AA64FpDestP2_uw = 0;
- AA64FpDestP3_uw = 0;
- AA64FpDest2P0_uw = (data >> 32);
- AA64FpDest2P1_uw = 0;
- AA64FpDest2P2_uw = 0;
- AA64FpDest2P3_uw = 0;
- '''
+ if self.size == 4:
+ accCode = '''
+ uint64_t data = cSwap(Mem_ud, isBigEndian64(xc->tcBase()));
+ AA64FpDestP0_uw = (uint32_t)data;
+ AA64FpDestP1_uw = 0;
+ AA64FpDestP2_uw = 0;
+ AA64FpDestP3_uw = 0;
+ AA64FpDest2P0_uw = (data >> 32);
+ AA64FpDest2P1_uw = 0;
+ AA64FpDest2P2_uw = 0;
+ AA64FpDest2P3_uw = 0;
+ '''
+ elif self.size == 8:
+ accCode = '''
+ AA64FpDestP0_uw = (uint32_t)Mem_tud.a;
+ AA64FpDestP1_uw = (uint32_t)(Mem_tud.a >> 32);
+ AA64FpDestP2_uw = 0;
+ AA64FpDestP3_uw = 0;
+ AA64FpDest2P0_uw = (uint32_t)Mem_tud.b;
+ AA64FpDest2P1_uw = (uint32_t)(Mem_tud.b >> 32);
+ AA64FpDest2P2_uw = 0;
+ AA64FpDest2P3_uw = 0;
+ '''
else:
if self.sign:
if self.size == 4:
@@ -253,8 +262,8 @@ let {{
'''
elif self.size == 8:
accCode = '''
- XDest = sext<64>(Mem_tud.a);
- XDest2 = sext<64>(Mem_tud.b);
+ XDest = Mem_tud.a;
+ XDest2 = Mem_tud.b;
'''
else:
if self.size == 4:
@@ -416,6 +425,11 @@ let {{
decConstBase = 'LoadStoreLitU64'
micro = True
+ LoadImmDU64("ldp_uop", "MicroLdPairUop", 8).emit()
+ LoadImmDU64("ldp_fp8_uop", "MicroLdPairFp8Uop", 8, flavor="fp").emit()
+ LoadImmU64("ldfp16_uop", "MicroLdFp16Uop", 16, flavor="fp").emit()
+ LoadReg64("ldfp16reg_uop", "MicroLdFp16RegUop", 16, flavor="fp").emit()
+
LoadImmDouble64("ldaxp", "LDAXPW64", 4, flavor="acexp").emit()
LoadImmDouble64("ldaxp", "LDAXPX64", 8, flavor="acexp").emit()
LoadImmDouble64("ldxp", "LDXPW64", 4, flavor="exp").emit()
@@ -428,18 +442,8 @@ let {{
LoadRegU64("ldrfpxr_uop", "MicroLdrFpXRegUop", 8, flavor="fp").emit()
LoadLitU64("ldrfpxl_uop", "MicroLdrFpXLitUop", 8, literal=True,
flavor="fp").emit()
- LoadImmU64("ldrqbfpxi_uop", "MicroLdrQBFpXImmUop",
- 16, flavor="fp", top = False).emit()
- LoadRegU64("ldrqbfpxr_uop", "MicroLdrQBFpXRegUop",
- 16, flavor="fp", top = False).emit()
- LoadLitU64("ldrqbfpxl_uop", "MicroLdrQBFpXLitUop",
- 16, literal=True, flavor="fp", top = False).emit()
- LoadImmU64("ldrqtfpxi_uop", "MicroLdrQTFpXImmUop",
- 16, flavor="fp", top = True).emit()
- LoadRegU64("ldrqtfpxr_uop", "MicroLdrQTFpXRegUop",
- 16, flavor="fp", top = True).emit()
- LoadLitU64("ldrqtfpxl_uop", "MicroLdrQTFpXLitUop",
- 16, literal=True, flavor="fp", top = True).emit()
+ LoadLitU64("ldfp16_lit__uop", "MicroLdFp16LitUop",
+ 16, literal=True, flavor="fp").emit()
LoadImmDU64("ldrduxi_uop", "MicroLdrDUXImmUop", 4, sign=False).emit()
LoadImmDU64("ldrdsxi_uop", "MicroLdrDSXImmUop", 4, sign=True).emit()
LoadImmDU64("ldrdfpxi_uop", "MicroLdrDFpXImmUop", 4, flavor="fp").emit()