n64: raise unimplemented-operation instead of invalid-operation for FPU conversions

invertego · LukeUsher · commit 4e36ce7ad5cb · 2022-10-30T21:38:48.000Z
diff --git a/ares/n64/cpu/cpu.hpp b/ares/n64/cpu/cpu.hpp
@@ -656,7 +656,7 @@ struct CPU : Thread {
   template<typename T> auto fgr(u32) -> T&;
   auto getControlRegisterFPU(n5) -> u32;
   auto setControlRegisterFPU(n5, n32) -> void;
-  auto checkFPUExceptions() -> bool;
+  template<bool CVT> auto checkFPUExceptions() -> bool;
   auto fpeDivisionByZero() -> bool;
   auto fpeInexact() -> bool;
   auto fpeUnderflow() -> bool;
diff --git a/ares/n64/cpu/interpreter-fpu.cpp b/ares/n64/cpu/interpreter-fpu.cpp
@@ -175,6 +175,7 @@ auto CPU::fpeUnimplemented() -> bool {
   return true;
 }
 
+template<bool CVT>
 auto CPU::checkFPUExceptions() -> bool {
   u32 exc = fenv.testExcept(float_env::divByZero
                           | float_env::inexact
@@ -183,6 +184,13 @@ auto CPU::checkFPUExceptions() -> bool {
                           | float_env::invalid);
   if (!exc) return false;
 
+  if constexpr(CVT) {
+    if(exc & float_env::invalid) {
+      if(fpeUnimplemented()) exception.floatingPoint();
+      return true;
+    }
+  }
+
   if(exc & float_env::underflow) {
     if(!fpu.csr.flushSubnormals || fpu.csr.enable.underflow || fpu.csr.enable.inexact) {
       if(fpeUnimplemented()) exception.floatingPoint();
@@ -200,13 +208,16 @@ auto CPU::checkFPUExceptions() -> bool {
   return raise;
 }
 
-#define CHECK_FPE(type, operation) ({ \
+#define CHECK_FPE_IMPL(type, operation, convert) ({ \
   fenv.clearExcept(); \
   type res = [&]() noinline -> type { return operation; }(); \
-  if (checkFPUExceptions()) return; \
+  if (checkFPUExceptions<convert>()) return; \
   (res); \
 })
 
+#define CHECK_FPE(type, operation)      CHECK_FPE_IMPL(type, operation, false)
+#define CHECK_FPE_CONV(type, operation) CHECK_FPE_IMPL(type, operation, true)
+
 auto f32repr(f32 f) -> n32 {
   uint32_t v; memcpy(&v, &f, 4);
   return n32(v);
@@ -444,15 +455,15 @@ auto CPU::FCEIL_W_S(u8 fd, u8 fs) -> void {
   if(!fpuCheckStart()) return;
   auto ffs = FS(f32);
   if(!fpuCheckInputConv<s32>(ffs)) return;
-  auto ffd = CHECK_FPE(s32, roundCeil<s32>(ffs));
+  auto ffd = CHECK_FPE_CONV(s32, roundCeil<s32>(ffs));
   FD(s32) = ffd;
 }
 
 auto CPU::FCEIL_W_D(u8 fd, u8 fs) -> void {
   if(!fpuCheckStart()) return;
   auto ffs = FS(f64);
   if(!fpuCheckInputConv<s32>(ffs)) return;
-  auto ffd = CHECK_FPE(s32, roundCeil<s32>(ffs));
+  auto ffd = CHECK_FPE_CONV(s32, roundCeil<s32>(ffs));
   FD(s32) = ffd;
 }
 
@@ -719,15 +730,15 @@ auto CPU::FCVT_W_S(u8 fd, u8 fs) -> void {
   if(!fpuCheckStart()) return;
   auto ffs = FS(f32);
   if(!fpuCheckInputConv<s32>(ffs)) return;
-  auto ffd = CHECK_FPE(s32, roundCurrent<s32>(ffs));
+  auto ffd = CHECK_FPE_CONV(s32, roundCurrent<s32>(ffs));
   FD(s32) = ffd;
 }
 
 auto CPU::FCVT_W_D(u8 fd, u8 fs) -> void {
   if(!fpuCheckStart()) return;
   auto ffs = FS(f64);
   if(!fpuCheckInputConv<s32>(ffs)) return;
-  auto ffd = CHECK_FPE(s32, roundCurrent<s32>(ffs));
+  auto ffd = CHECK_FPE_CONV(s32, roundCurrent<s32>(ffs));
   FD(s32) = ffd;
 }
 
@@ -771,15 +782,15 @@ auto CPU::FFLOOR_W_S(u8 fd, u8 fs) -> void {
   if(!fpuCheckStart()) return;
   auto ffs = FS(f32);
   if(!fpuCheckInputConv<s32>(ffs)) return;
-  auto ffd = CHECK_FPE(s32, roundFloor<s32>(ffs));
+  auto ffd = CHECK_FPE_CONV(s32, roundFloor<s32>(ffs));
   FD(s32) = ffd;
 }
 
 auto CPU::FFLOOR_W_D(u8 fd, u8 fs) -> void {
   if(!fpuCheckStart()) return;
   auto ffs = FS(f64);
   if(!fpuCheckInputConv<s32>(ffs)) return;
-  auto ffd = CHECK_FPE(s32, roundFloor<s32>(ffs));
+  auto ffd = CHECK_FPE_CONV(s32, roundFloor<s32>(ffs));
   FD(s32) = ffd;
 }
 
@@ -853,7 +864,7 @@ auto CPU::FROUND_W_S(u8 fd, u8 fs) -> void {
   if(!fpuCheckStart()) return;
   auto ffs = FS(f32);
   if(!fpuCheckInputConv<s32>(ffs)) return;
-  auto ffd = CHECK_FPE(s32, roundNearest<s32>(ffs));
+  auto ffd = CHECK_FPE_CONV(s32, roundNearest<s32>(ffs));
   if(ffd != ffs && fpeInexact()) return exception.floatingPoint();
   FD(s32) = ffd;
 }
@@ -862,7 +873,7 @@ auto CPU::FROUND_W_D(u8 fd, u8 fs) -> void {
   if(!fpuCheckStart()) return;
   auto ffs = FS(f64);
   if(!fpuCheckInputConv<s32>(ffs)) return;
-  auto ffd = CHECK_FPE(s32, roundNearest<s32>(ffs));
+  auto ffd = CHECK_FPE_CONV(s32, roundNearest<s32>(ffs));
   if(ffd != ffs && fpeInexact()) return exception.floatingPoint();
   FD(s32) = ffd;
 }
@@ -927,7 +938,7 @@ auto CPU::FTRUNC_W_S(u8 fd, u8 fs) -> void {
   if(!fpuCheckStart()) return;
   auto ffs = FS(f32);
   if(!fpuCheckInputConv<s32>(ffs)) return;
-  auto ffd = CHECK_FPE(s32, roundTrunc<s32>(ffs));
+  auto ffd = CHECK_FPE_CONV(s32, roundTrunc<s32>(ffs));
   if((f32)ffd != ffs && fpeInexact()) return exception.floatingPoint();
   FD(s32) = ffd;
 }
@@ -936,7 +947,7 @@ auto CPU::FTRUNC_W_D(u8 fd, u8 fs) -> void {
   if(!fpuCheckStart()) return;
   auto ffs = FS(f64);
   if(!fpuCheckInputConv<s32>(ffs)) return;
-  auto ffd = CHECK_FPE(s32, roundTrunc<s32>(ffs));
+  auto ffd = CHECK_FPE_CONV(s32, roundTrunc<s32>(ffs));
   if((f64)ffd != ffs && fpeInexact()) return exception.floatingPoint();
   FD(s32) = ffd;
 }