From 389abade01f44ce7204776c0d71f89c8d3177d9d Mon Sep 17 00:00:00 2001
From: Gabe Black <gblack@eecs.umich.edu>
Date: Thu, 6 Sep 2007 16:18:34 -0700
Subject: X86: Add a square root microop and the SSE sqrt instruction.

--HG--
extra : convert_revision : ddc6e7e95111189d43f75bf84cd3d82433d982b3
---
 src/arch/x86/isa/decoder/two_byte_opcodes.isa | 12 +++--
 src/arch/x86/isa/insts/sse/__init__.py        |  3 +-
 src/arch/x86/isa/insts/sse/square_root.py     | 71 +++++++++++++++++++++++++++
 src/arch/x86/isa/microops/regop.isa           |  3 ++
 4 files changed, 83 insertions(+), 6 deletions(-)
 create mode 100644 src/arch/x86/isa/insts/sse/square_root.py

diff --git a/src/arch/x86/isa/decoder/two_byte_opcodes.isa b/src/arch/x86/isa/decoder/two_byte_opcodes.isa
index ae2318899..eae994706 100644
--- a/src/arch/x86/isa/decoder/two_byte_opcodes.isa
+++ b/src/arch/x86/isa/decoder/two_byte_opcodes.isa
@@ -283,12 +283,14 @@
                     0x7: Inst::XORPD(Vq,Wq);
                     default: Inst::UD2();
                 }
-                // repne (0xF2)
-                0x8: decode OPCODE_OP_BOTTOM3 {
-                    0x1: sqrtsd_Vq_Wq();
-                    default: Inst::UD2();
+                format Inst {
+                    // repne (0xF2): only OPCODE_OP_BOTTOM3 == 0x1 (SQRTSD) is decoded; all other cases here are UD2.
+                    0x8: decode OPCODE_OP_BOTTOM3 {
+                        0x1: SQRTSD(Vq,Wq);
+                        default: UD2();
+                    }
+                    default: UD2();
                 }
-                default: Inst::UD2();
             }
             0x0B: decode LEGACY_DECODEVAL {
                 // no prefix
diff --git a/src/arch/x86/isa/insts/sse/__init__.py b/src/arch/x86/isa/insts/sse/__init__.py
index 05c306885..7985a124f 100644
--- a/src/arch/x86/isa/insts/sse/__init__.py
+++ b/src/arch/x86/isa/insts/sse/__init__.py
@@ -58,7 +58,8 @@ categories = ["move",
               "add_and_subtract",
               "multiply_and_divide",
               "logical",
-              "compare"]
+              "compare",
+              "square_root"]
 
 microcode = '''
 # SSE instructions
diff --git a/src/arch/x86/isa/insts/sse/square_root.py b/src/arch/x86/isa/insts/sse/square_root.py
new file mode 100644
index 000000000..473292386
--- /dev/null
+++ b/src/arch/x86/isa/insts/sse/square_root.py
@@ -0,0 +1,71 @@
+# Copyright (c) 2007 The Hewlett-Packard Development Company
+# All rights reserved.
+#
+# Redistribution and use of this software in source and binary forms,
+# with or without modification, are permitted provided that the
+# following conditions are met:
+#
+# The software must be used only for Non-Commercial Use which means any
+# use which is NOT directed to receiving any direct monetary
+# compensation for, or commercial advantage from such use.  Illustrative
+# examples of non-commercial use are academic research, personal study,
+# teaching, education and corporate research & development.
+# Illustrative examples of commercial use are distributing products for
+# commercial advantage and providing services using the software for
+# commercial advantage.
+#
+# If you wish to use this software or functionality therein that may be
+# covered by patents for commercial use, please contact:
+#     Director of Intellectual Property Licensing
+#     Office of Strategy and Technology
+#     Hewlett-Packard Company
+#     1501 Page Mill Road
+#     Palo Alto, California  94304
+#
+# Redistributions of source code must retain the above copyright notice,
+# this list of conditions and the following disclaimer.  Redistributions
+# in binary form must reproduce the above copyright notice, this list of
+# conditions and the following disclaimer in the documentation and/or
+# other materials provided with the distribution.  Neither the name of
+# the COPYRIGHT HOLDER(s), HEWLETT-PACKARD COMPANY, nor the names of its
+# contributors may be used to endorse or promote products derived from
+# this software without specific prior written permission.  No right of
+# sublicense is granted herewith.  Derivatives of the software and
+# output created using the software may be prepared, but only for
+# Non-Commercial Uses.  Derivatives of the software may be shared with
+# others provided: (i) the others agree to abide by the list of
+# conditions herein which includes the Non-Commercial Use restrictions;
+# and (ii) such Derivatives of the software include the above copyright
+# notice to acknowledge the contribution from this software where
+# applicable, this list of conditions and the disclaimer below.
+#
+# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+#
+# Authors: Gabe Black
+
+microcode = '''
+def macroop SQRTSD_R_R {
+    sqrtfp xmml, xmml, xmmlm
+};
+
+def macroop SQRTSD_R_M {
+    ldfp ufp1, seg, sib, disp
+    sqrtfp xmml, xmml, ufp1
+};
+
+def macroop SQRTSD_R_P {
+    rdip t7
+    ldfp ufp1, seg, riprel, disp
+    sqrtfp xmml, xmml, ufp1
+};
+'''
diff --git a/src/arch/x86/isa/microops/regop.isa b/src/arch/x86/isa/microops/regop.isa
index ec6f49424..57edbb606 100644
--- a/src/arch/x86/isa/microops/regop.isa
+++ b/src/arch/x86/isa/microops/regop.isa
@@ -656,6 +656,9 @@ let {{
     class Xorfp(RegOp):
         code = 'FpDestReg.uqw = FpSrcReg1.uqw ^ FpSrcReg2.uqw;'
 
+    class Sqrtfp(RegOp):  # FP square root microop: the code string reads only FpSrcReg2 and writes FpDestReg.
+        code = 'FpDestReg = sqrt(FpSrcReg2);'
+
     class Movfp(CondRegOp):
         code = 'FpDestReg.uqw = FpSrcReg2.uqw;'
         else_code = 'FpDestReg.uqw = FpDestReg.uqw;'
-- 
cgit v1.2.3