x86: Make fprem like the fprem on a real x87

author Andreas Sandberg <andreas@sandberg.pp.se>

Tue, 18 Jun 2013 14:10:42 +0000 (16:10 +0200)

committer Andreas Sandberg <andreas@sandberg.pp.se>

Tue, 18 Jun 2013 14:10:42 +0000 (16:10 +0200)
author Andreas Sandberg <andreas@sandberg.pp.se>
Tue, 18 Jun 2013 14:10:42 +0000 (16:10 +0200)
committer Andreas Sandberg <andreas@sandberg.pp.se>
Tue, 18 Jun 2013 14:10:42 +0000 (16:10 +0200)
diff --git a/src/arch/x86/isa/insts/x87/arithmetic/partial_remainder.py b/src/arch/x86/isa/insts/x87/arithmetic/partial_remainder.py

index b02184e1a1291c1d933cd27b6146beadd8fa8f19..42aabfdf68370284eed94cef68f9af73949e660f 100644 (file)
--- a/src/arch/x86/isa/insts/x87/arithmetic/partial_remainder.py
+++ b/src/arch/x86/isa/insts/x87/arithmetic/partial_remainder.py
@@ -37,10 +37,10 @@
  
  microcode = '''
  def macroop FPREM {
-    premfp st(0), st(1), st(0)
+    premfp st(0), st(1), st(0), SetStatus=True
  };
  
  def macroop FPREM1 {
-    premfp st(0), st(1), st(0)
+    premfp st(0), st(1), st(0), SetStatus=True
  };
  '''
diff --git a/src/arch/x86/isa/microops/fpop.isa b/src/arch/x86/isa/microops/fpop.isa

index e6372ba6be891e75432c89316ba787801b3fc794..22d6fbcdad60f127d9a474847068fa10e71a35b5 100644 (file)
--- a/src/arch/x86/isa/microops/fpop.isa
+++ b/src/arch/x86/isa/microops/fpop.isa
@@ -330,11 +330,34 @@ let {{
  
      class PremFp(FpBinaryOp):
          code = '''
-            FpDestReg = fmod(FpSrcReg1, FpSrcReg2);
-            DPRINTF(X86, "src1: %lf, src2: %lf, dest: %lf\\n", FpSrcReg1, FpSrcReg2, FpDestReg);
+            MiscReg new_fsw(FSW);
+            int src1_exp;
+            int src2_exp;
+            std::frexp(FpSrcReg1, &src1_exp);
+            std::frexp(FpSrcReg2, &src2_exp);
+
+            const int d(src2_exp - src1_exp);
+            if (d < 64) {
+                const int64_t q(std::trunc(FpSrcReg2 / FpSrcReg1));
+                FpDestReg = FpSrcReg2 - FpSrcReg1 * q;
+                new_fsw &= ~(CC0Bit | CC1Bit | CC2Bit | CC2Bit);
+                new_fsw |= (q & 0x1) ? CC1Bit : 0;
+                new_fsw |= (q & 0x2) ? CC3Bit : 0;
+                new_fsw |= (q & 0x4) ? CC0Bit : 0;
+            } else {
+                const int n(42);
+                const int64_t qq(std::trunc(
+                    FpSrcReg2 / std::ldexp(FpSrcReg1, d - n)));
+                FpDestReg = FpSrcReg2 - std::ldexp(FpSrcReg1 * qq, d - n);
+                new_fsw |= CC2Bit;
+            }
+            DPRINTF(X86, "src1: %lf, src2: %lf, dest: %lf, FSW: 0x%x\\n",
+                    FpSrcReg1, FpSrcReg2, FpDestReg, new_fsw);
          '''
          op_class = 'FloatDivOp'
  
+        flag_code = 'FSW = new_fsw;'
+
      class Compfp(FpBinaryOp):
          def __init__(self, src1, src2, spm=0, setStatus=False, \
                  dataSize="env.dataSize"):
author	Andreas Sandberg <andreas@sandberg.pp.se>
	Tue, 18 Jun 2013 14:10:42 +0000 (16:10 +0200)
committer	Andreas Sandberg <andreas@sandberg.pp.se>
	Tue, 18 Jun 2013 14:10:42 +0000 (16:10 +0200)
src/arch/x86/isa/insts/x87/arithmetic/partial_remainder.py		patch \| blob \| history
src/arch/x86/isa/microops/fpop.isa		patch \| blob \| history