summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorPouya Fotouhi <Pouya.Fotouhi@amd.com>2019-08-26 17:59:36 -0500
committerPouya Fotouhi <pfotouhi@ucdavis.edu>2019-09-20 04:03:24 +0000
commit67e310836baa0e652ae7a3b4ebd00263a52239c2 (patch)
treec50907ddbc27ecf8533a2b34a1fbe316848d6dcd
parentdc2db5cf9b5f782912569fd2be8be69fa71da33c (diff)
downloadgem5-67e310836baa0e652ae7a3b4ebd00263a52239c2.tar.xz
arch-x86: ignore non-temporal hint for movntps/movntpd SSE insts
Making the implementation of movntps/movntpd consistent with other non-temporal instructions. We are ignoring the hint here, and implementing those instructions as cacheable instructions. This change adds a warning to let user know about this workaround. Also, this change add the address check for second part of move. Change-Id: I811652b24cf39ca2f5c5d4c9e9e417f69190b55c Reviewed-on: https://gem5-review.googlesource.com/c/public/gem5/+/20408 Reviewed-by: Jason Lowe-Power <jason@lowepower.com> Reviewed-by: Gabe Black <gabeblack@google.com> Maintainer: Jason Lowe-Power <jason@lowepower.com> Tested-by: kokoro <noreply+kokoro@google.com>
-rw-r--r--src/arch/x86/isa/decoder/two_byte_opcodes.isa4
-rw-r--r--src/arch/x86/isa/insts/simd128/floating_point/data_transfer/move_non_temporal.py28
2 files changed, 22 insertions, 10 deletions
diff --git a/src/arch/x86/isa/decoder/two_byte_opcodes.isa b/src/arch/x86/isa/decoder/two_byte_opcodes.isa
index 348bff32e..dfb748efb 100644
--- a/src/arch/x86/isa/decoder/two_byte_opcodes.isa
+++ b/src/arch/x86/isa/decoder/two_byte_opcodes.isa
@@ -383,6 +383,8 @@
0x0: MOVAPS(Vq,Wq);
0x1: MOVAPS(Wq,Vq);
0x2: CVTPI2PS(Vq,Qq);
+ //Non-temporal hint is ignored since we don't have
+ //proper support for it in the memory system.
0x3: MOVNTPS(Mq,Vq);
0x4: CVTTPS2PI(Pq,Wq);
0x5: CVTPS2PI(Pq,Wq);
@@ -401,6 +403,8 @@
0x0: MOVAPD(Vo,Wo);
0x1: MOVAPD(Wo,Vo);
0x2: CVTPI2PD(Vo,Qq);
+ //Non-temporal hint is ignored since we don't have
+ //proper support for it in the memory system.
0x3: MOVNTPD(Mq,Vq);
0x4: CVTTPD2PI(Pq,Wo);
0x5: CVTPD2PI(Pq,Wo);
diff --git a/src/arch/x86/isa/insts/simd128/floating_point/data_transfer/move_non_temporal.py b/src/arch/x86/isa/insts/simd128/floating_point/data_transfer/move_non_temporal.py
index a6e392ffd..06dba5975 100644
--- a/src/arch/x86/isa/insts/simd128/floating_point/data_transfer/move_non_temporal.py
+++ b/src/arch/x86/isa/insts/simd128/floating_point/data_transfer/move_non_temporal.py
@@ -40,29 +40,37 @@
microcode = '''
# movntps is basically the same as movaps, excepting the caching hint and
# ordering constraints
+# We are ignoring the non-temporal hint.
def macroop MOVNTPS_M_XMM {
- # Check low address.
- stfp xmmh, seg, sib, "DISPLACEMENT + 8", dataSize=8, uncacheable=True
- stfp xmml, seg, sib, disp, dataSize=8, uncacheable=True
+ warn_once "MOVNTPS: Ignoring non-temporal hint, modeling as cacheable!"
+ cda seg, sib, "DISPLACEMENT + 8", dataSize=8
+ stfp xmmh, seg, sib, "DISPLACEMENT + 8", dataSize=8
+ stfp xmml, seg, sib, disp, dataSize=8
};
def macroop MOVNTPS_P_XMM {
+ warn_once "MOVNTPS_P: Ignoring non-temporal hint, modeling as cacheable!"
rdip t7
- # Check low address.
- stfp xmmh, seg, riprel, "DISPLACEMENT + 8", dataSize=8, uncacheable=True
- stfp xmml, seg, riprel, disp, dataSize=8, uncacheable=True
+ cda seg, riprel, "DISPLACEMENT + 8", dataSize=8
+ stfp xmmh, seg, riprel, "DISPLACEMENT + 8", dataSize=8
+ stfp xmml, seg, riprel, disp, dataSize=8
};
# movntpd is basically the same as movapd, excepting the caching hint and
# ordering constraints
+# We are ignoring the non-temporal hint.
def macroop MOVNTPD_M_XMM {
- stfp xmml, seg, sib, "DISPLACEMENT", dataSize=8, uncacheable=True
- stfp xmmh, seg, sib, "DISPLACEMENT + 8", dataSize=8, uncacheable=True
+ warn_once "MOVNTPD: Ignoring non-temporal hint, modeling as cacheable!"
+ cda seg, sib, "DISPLACEMENT + 8", dataSize=8
+ stfp xmml, seg, sib, "DISPLACEMENT", dataSize=8
+ stfp xmmh, seg, sib, "DISPLACEMENT + 8", dataSize=8
};
def macroop MOVNTPD_P_XMM {
+ warn_once "MOVNTPD_P: Ignoring non-temporal hint, modeling as cacheable!"
rdip t7
- stfp xmml, seg, riprel, "DISPLACEMENT", dataSize=8, uncacheable=True
- stfp xmmh, seg, riprel, "DISPLACEMENT + 8", dataSize=8, uncacheable=True
+ cda seg, riprel, "DISPLACEMENT + 8", dataSize=8
+ stfp xmml, seg, riprel, "DISPLACEMENT", dataSize=8
+ stfp xmmh, seg, riprel, "DISPLACEMENT + 8", dataSize=8
};
'''