summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorGabe Black <gblack@eecs.umich.edu>2009-08-02 08:39:29 -0700
committerGabe Black <gblack@eecs.umich.edu>2009-08-02 08:39:29 -0700
commitaff57202b4665b997ea257609dee0f9e68169b0f (patch)
tree0d77a1d8b7c8117ec017498b3ec79d17c81d4d03
parenta13a706a207296b40dbe43576fad423cf5f4679a (diff)
downloadgem5-aff57202b4665b997ea257609dee0f9e68169b0f.tar.xz
X86: Fix the high result of mul1s, and removed undefined shifts from the mult microops.
-rw-r--r--src/arch/x86/isa/microops/regop.isa34
1 files changed, 19 insertions, 15 deletions
diff --git a/src/arch/x86/isa/microops/regop.isa b/src/arch/x86/isa/microops/regop.isa
index cabdc2172..698216139 100644
--- a/src/arch/x86/isa/microops/regop.isa
+++ b/src/arch/x86/isa/microops/regop.isa
@@ -517,34 +517,38 @@ let {{
class Xor(LogicRegOp):
code = 'DestReg = merge(DestReg, psrc1 ^ op2, dataSize)'
- # Neither of these is quite correct because it assumes that right shifting
- # a signed or unsigned value does sign or zero extension respectively.
- # The C standard says that what happens on a right shift with a 1 in the
- # MSB position is undefined. On x86 and under likely most compilers the
- # "right thing" happens, but this isn't a guarantee.
class Mul1s(WrRegOp):
code = '''
ProdLow = psrc1 * op2;
int halfSize = (dataSize * 8) / 2;
- int64_t spsrc1_h = spsrc1 >> halfSize;
- int64_t spsrc1_l = spsrc1 & mask(halfSize);
- int64_t spsrc2_h = sop2 >> halfSize;
- int64_t spsrc2_l = sop2 & mask(halfSize);
- ProdHi = ((spsrc1_l * spsrc2_h + spsrc1_h * spsrc2_l +
- ((spsrc1_l * spsrc2_l) >> halfSize)) >> halfSize) +
- spsrc1_h * spsrc2_h;
+ uint64_t shifter = (1ULL << halfSize);
+ uint64_t hiResult;
+ uint64_t psrc1_h = psrc1 / shifter;
+ uint64_t psrc1_l = psrc1 & mask(halfSize);
+ uint64_t psrc2_h = op2 / shifter;
+ uint64_t psrc2_l = op2 & mask(halfSize);
+ hiResult = ((psrc1_l * psrc2_h + psrc1_h * psrc2_l +
+ ((psrc1_l * psrc2_l) / shifter)) /shifter) +
+ psrc1_h * psrc2_h;
+ if (spsrc1 < 0)
+ hiResult -= op2;
+ int64_t bigSop2 = sop2;
+ if (bigSop2 < 0)
+ hiResult -= psrc1;
+ ProdHi = hiResult;
'''
class Mul1u(WrRegOp):
code = '''
ProdLow = psrc1 * op2;
int halfSize = (dataSize * 8) / 2;
- uint64_t psrc1_h = psrc1 >> halfSize;
+ uint64_t shifter = (1ULL << halfSize);
+ uint64_t psrc1_h = psrc1 / shifter;
uint64_t psrc1_l = psrc1 & mask(halfSize);
- uint64_t psrc2_h = op2 >> halfSize;
+ uint64_t psrc2_h = op2 / shifter;
uint64_t psrc2_l = op2 & mask(halfSize);
ProdHi = ((psrc1_l * psrc2_h + psrc1_h * psrc2_l +
- ((psrc1_l * psrc2_l) >> halfSize)) >> halfSize) +
+ ((psrc1_l * psrc2_l) / shifter)) / shifter) +
psrc1_h * psrc2_h;
'''