math/big: fix known bug in Float.Float64

- handle exponent over- and underflow - handle denormalized numbers - added test cases Change-Id: I1bbb9904b0c104f54696944e1f57559881f6eeeb Reviewed-on: https://go-review.googlesource.com/7982 Reviewed-by: Alan Donovan <adonovan@google.com>
author: Robert Griesemer <gri@golang.org> 2015-03-23 17:31:25 -0700
committer: Robert Griesemer <gri@golang.org> 2015-03-24 20:34:14 +0000
commit: 2c4cf2f6f2ccfb43869b9e6b881f29699bc29bfd (patch)
tree: 043d9d7ee115be6038237d5fe7d932f9bf24904c /src/math/big/float.go
parent: 0e55f201d618b082b725c1792715d723b0783b5f (diff)
download: go-2c4cf2f6f2ccfb43869b9e6b881f29699bc29bfd.tar.xz
1 files changed, 58 insertions, 13 deletions
diff --git a/src/math/big/float.go b/src/math/big/float.go
index a86471e2a5..fa3751d0c7 100644
--- a/src/math/big/float.go
+++ b/src/math/big/float.go
@@ -872,9 +872,14 @@ func (x *Float) Int64() (int64, Accuracy) {
 	panic("unreachable")
 }
 
-// Float64 returns the closest float64 value of x
-// by rounding to nearest with 53 bits precision.
-// BUG(gri) Float.Float64 doesn't handle exponent overflow.
+// Float64 returns the float64 value nearest to x by rounding ToNearestEven
+// with 53 bits of precision.
+// If x is too small to be represented by a float64
+// (|x| < math.SmallestNonzeroFloat64), the result is (0, Below) or
+// (-0, Above), respectively, depending on the sign of x.
+// If x is too large to be represented by a float64 (|x| > math.MaxFloat64),
+// the result is (+Inf, Above) or (-Inf, Below), depending on the sign of x.
+// The result is (NaN, Undef) for NaNs.
 func (x *Float) Float64() (float64, Accuracy) {
 	if debugFloat {
 		x.validate()
@@ -886,27 +891,67 @@ func (x *Float) Float64() (float64, Accuracy) {
 		var r Float
 		r.prec = 53
 		r.Set(x)
-		var s uint64
+
+		// Rounding via Set may have caused r to overflow
+		// to ±Inf (rounding never causes underflows to 0).
+		if r.form == inf {
+			r.exp = 10000 // cause overflow below
+		}
+
+		// see also implementation of math.Ldexp
+
+		e := int64(r.exp) + 1022
+		if e <= -52 {
+			// underflow
+			if x.neg {
+				z := 0.0
+				return -z, Above
+			}
+			return 0.0, Below
+		}
+		// e > -52
+
+		if e >= 2047 {
+			// overflow
+			if x.neg {
+				return math.Inf(-1), Below
+			}
+			return math.Inf(+1), Above
+		}
+		// -52 < e < 2047
+
+		denormal := false
+		if e < 0 {
+			denormal = true
+			e += 52
+		}
+		// 0 < e < 2047
+
+		s := uint64(0)
 		if r.neg {
 			s = 1 << 63
 		}
-		e := uint64(1022+r.exp) & 0x7ff // TODO(gri) check for overflow
-		m := high64(r.mant) >> 11 & (1<<52 - 1)
-		return math.Float64frombits(s | e<<52 | m), r.acc
+		m := high64(r.mant) >> 11 & (1<<52 - 1) // cut off msb (implicit 1 bit)
+		z := math.Float64frombits(s | uint64(e)<<52 | m)
+		if denormal {
+			// adjust for denormal
+			// TODO(gri) does this change accuracy?
+			z /= 1 << 52
+		}
+		return z, r.acc
 
 	case zero:
-		z := 0.0
 		if x.neg {
-			z = -z
+			z := 0.0
+			return -z, Exact
 		}
-		return z, Exact
+		return 0.0, Exact
 
 	case inf:
-		sign := +1
 		if x.neg {
-			sign = -1
+			return math.Inf(-1), Exact
 		}
-		return math.Inf(sign), Exact
+		return math.Inf(+1), Exact
 
 	case nan:
 		return math.NaN(), Undef
author	Robert Griesemer <gri@golang.org>	2015-03-23 17:31:25 -0700
committer	Robert Griesemer <gri@golang.org>	2015-03-24 20:34:14 +0000
commit	2c4cf2f6f2ccfb43869b9e6b881f29699bc29bfd (patch)
tree	043d9d7ee115be6038237d5fe7d932f9bf24904c /src/math/big/float.go
parent	0e55f201d618b082b725c1792715d723b0783b5f (diff)
download	go-2c4cf2f6f2ccfb43869b9e6b881f29699bc29bfd.tar.xz