math/big: implement Rat.FloatPrec

[gostls13.git] / src / math / big / ratconv.go
diff --git a/src/math/big/ratconv.go b/src/math/big/ratconv.go

index 5656280e84dabcfb0b7f4754c91ed8fc236692c7..9fb5711ff9e182aee87b9cd8aeb66811134af6e0 100644 (file)
--- a/src/math/big/ratconv.go
+++ b/src/math/big/ratconv.go
@@ -38,10 +38,23 @@ func (z *Rat) Scan(s fmt.ScanState, ch rune) error {
  }
  
  // SetString sets z to the value of s and returns z and a boolean indicating
-// success. s can be given as a fraction "a/b" or as a decimal floating-point
-// number optionally followed by an exponent. The entire string (not just a prefix)
-// must be valid for success. If the operation failed, the value of z is
-// undefined but the returned value is nil.
+// success. s can be given as a (possibly signed) fraction "a/b", or as a
+// floating-point number optionally followed by an exponent.
+// If a fraction is provided, both the dividend and the divisor may be a
+// decimal integer or independently use a prefix of “0b”, “0” or “0o”,
+// or “0x” (or their upper-case variants) to denote a binary, octal, or
+// hexadecimal integer, respectively. The divisor may not be signed.
+// If a floating-point number is provided, it may be in decimal form or
+// use any of the same prefixes as above but for “0” to denote a non-decimal
+// mantissa. A leading “0” is considered a decimal leading 0; it does not
+// indicate octal representation in this case.
+// An optional base-10 “e” or base-2 “p” (or their upper-case variants)
+// exponent may be provided as well, except for hexadecimal floats which
+// only accept an (optional) “p” exponent (because an “e” or “E” cannot
+// be distinguished from a mantissa digit). If the exponent's absolute value
+// is too large, the operation may fail.
+// The entire string, not just a prefix, must be valid for success. If the
+// operation failed, the value of z is undefined but the returned value is nil.
  func (z *Rat) SetString(s string) (*Rat, bool) {
         if len(s) == 0 {
                 return nil, false
@@ -78,16 +91,17 @@ func (z *Rat) SetString(s string) (*Rat, bool) {
         }
  
         // mantissa
-       // TODO(gri) allow other bases besides 10 for mantissa and exponent? (issue #29799)
-       var ecorr int
-       z.a.abs, _, ecorr, err = z.a.abs.scan(r, 10, true)
+       var base int
+       var fcount int // fractional digit count; valid if <= 0
+       z.a.abs, base, fcount, err = z.a.abs.scan(r, 0, true)
         if err != nil {
                 return nil, false
         }
  
         // exponent
         var exp int64
-       exp, _, err = scanExponent(r, false)
+       var ebase int
+       exp, ebase, err = scanExponent(r, true, true)
         if err != nil {
                 return nil, false
         }
@@ -99,105 +113,187 @@ func (z *Rat) SetString(s string) (*Rat, bool) {
  
         // special-case 0 (see also issue #16176)
         if len(z.a.abs) == 0 {
-               return z, true
+               return z.norm(), true
         }
         // len(z.a.abs) > 0
  
-       // correct exponent
-       if ecorr < 0 {
-               exp += int64(ecorr)
+       // The mantissa may have a radix point (fcount <= 0) and there
+       // may be a nonzero exponent exp. The radix point amounts to a
+       // division by base**(-fcount), which equals a multiplication by
+       // base**fcount. An exponent means multiplication by ebase**exp.
+       // Multiplications are commutative, so we can apply them in any
+       // order. We only have powers of 2 and 10, and we split powers
+       // of 10 into the product of the same powers of 2 and 5. This
+       // may reduce the size of shift/multiplication factors or
+       // divisors required to create the final fraction, depending
+       // on the actual floating-point value.
+
+       // determine binary or decimal exponent contribution of radix point
+       var exp2, exp5 int64
+       if fcount < 0 {
+               // The mantissa has a radix point ddd.dddd; and
+               // -fcount is the number of digits to the right
+               // of '.'. Adjust relevant exponent accordingly.
+               d := int64(fcount)
+               switch base {
+               case 10:
+                       exp5 = d
+                       fallthrough // 10**e == 5**e * 2**e
+               case 2:
+                       exp2 = d
+               case 8:
+                       exp2 = d * 3 // octal digits are 3 bits each
+               case 16:
+                       exp2 = d * 4 // hexadecimal digits are 4 bits each
+               default:
+                       panic("unexpected mantissa base")
+               }
+               // fcount consumed - not needed anymore
         }
  
-       // compute exponent power
-       expabs := exp
-       if expabs < 0 {
-               expabs = -expabs
+       // take actual exponent into account
+       switch ebase {
+       case 10:
+               exp5 += exp
+               fallthrough // see fallthrough above
+       case 2:
+               exp2 += exp
+       default:
+               panic("unexpected exponent base")
         }
-       powTen := nat(nil).expNN(natTen, nat(nil).setWord(Word(expabs)), nil)
-
-       // complete fraction
-       if exp < 0 {
-               z.b.abs = powTen
-               z.norm()
+       // exp consumed - not needed anymore
+
+       // apply exp5 contributions
+       // (start with exp5 so the numbers to multiply are smaller)
+       if exp5 != 0 {
+               n := exp5
+               if n < 0 {
+                       n = -n
+                       if n < 0 {
+                               // This can occur if -n overflows. -(-1 << 63) would become
+                               // -1 << 63, which is still negative.
+                               return nil, false
+                       }
+               }
+               if n > 1e6 {
+                       return nil, false // avoid excessively large exponents
+               }
+               pow5 := z.b.abs.expNN(natFive, nat(nil).setWord(Word(n)), nil, false) // use underlying array of z.b.abs
+               if exp5 > 0 {
+                       z.a.abs = z.a.abs.mul(z.a.abs, pow5)
+                       z.b.abs = z.b.abs.setWord(1)
+               } else {
+                       z.b.abs = pow5
+               }
         } else {
-               z.a.abs = z.a.abs.mul(z.a.abs, powTen)
-               z.b.abs = z.b.abs[:0]
+               z.b.abs = z.b.abs.setWord(1)
+       }
+
+       // apply exp2 contributions
+       if exp2 < -1e7 || exp2 > 1e7 {
+               return nil, false // avoid excessively large exponents
+       }
+       if exp2 > 0 {
+               z.a.abs = z.a.abs.shl(z.a.abs, uint(exp2))
+       } else if exp2 < 0 {
+               z.b.abs = z.b.abs.shl(z.b.abs, uint(-exp2))
         }
  
         z.a.neg = neg && len(z.a.abs) > 0 // 0 has no sign
  
-       return z, true
+       return z.norm(), true
  }
  
-// scanExponent scans the longest possible prefix of r representing a decimal
-// ('e', 'E') or binary ('p') exponent, if any. It returns the exponent, the
-// exponent base (10 or 2), or a read or syntax error, if any.
+// scanExponent scans the longest possible prefix of r representing a base 10
+// (“e”, “E”) or a base 2 (“p”, “P”) exponent, if any. It returns the
+// exponent, the exponent base (10 or 2), or a read or syntax error, if any.
  //
-//     exponent = ( "E" | "e" | "p" ) [ sign ] digits .
+// If sepOk is set, an underscore character “_” may appear between successive
+// exponent digits; such underscores do not change the value of the exponent.
+// Incorrect placement of underscores is reported as an error if there are no
+// other errors. If sepOk is not set, underscores are not recognized and thus
+// terminate scanning like any other character that is not a valid digit.
+//
+//     exponent = ( "e" | "E" | "p" | "P" ) [ sign ] digits .
  //     sign     = "+" | "-" .
-//     digits   = digit { digit } .
+//     digits   = digit { [ '_' ] digit } .
  //     digit    = "0" ... "9" .
  //
-// A binary exponent is only permitted if binExpOk is set.
-func scanExponent(r io.ByteScanner, binExpOk bool) (exp int64, base int, err error) {
-       base = 10
-
-       var ch byte
-       if ch, err = r.ReadByte(); err != nil {
+// A base 2 exponent is only permitted if base2ok is set.
+func scanExponent(r io.ByteScanner, base2ok, sepOk bool) (exp int64, base int, err error) {
+       // one char look-ahead
+       ch, err := r.ReadByte()
+       if err != nil {
                 if err == io.EOF {
-                       err = nil // no exponent; same as e0
+                       err = nil
                 }
-               return
+               return 0, 10, err
         }
  
+       // exponent char
         switch ch {
         case 'e', 'E':
-               // ok
-       case 'p':
-               if binExpOk {
+               base = 10
+       case 'p', 'P':
+               if base2ok {
                         base = 2
                         break // ok
                 }
                 fallthrough // binary exponent not permitted
         default:
-               r.UnreadByte()
-               return // no exponent; same as e0
-       }
-
-       var neg bool
-       if neg, err = scanSign(r); err != nil {
-               return
+               r.UnreadByte() // ch does not belong to exponent anymore
+               return 0, 10, nil
         }
  
+       // sign
         var digits []byte
-       if neg {
-               digits = append(digits, '-')
+       ch, err = r.ReadByte()
+       if err == nil && (ch == '+' || ch == '-') {
+               if ch == '-' {
+                       digits = append(digits, '-')
+               }
+               ch, err = r.ReadByte()
         }
  
-       // no need to use nat.scan for exponent digits
-       // since we only care about int64 values - the
-       // from-scratch scan is easy enough and faster
-       for i := 0; ; i++ {
-               if ch, err = r.ReadByte(); err != nil {
-                       if err != io.EOF || i == 0 {
-                               return
-                       }
-                       err = nil
-                       break // i > 0
-               }
-               if ch < '0' || '9' < ch {
-                       if i == 0 {
-                               r.UnreadByte()
-                               err = fmt.Errorf("invalid exponent (missing digits)")
-                               return
+       // prev encodes the previously seen char: it is one
+       // of '_', '0' (a digit), or '.' (anything else). A
+       // valid separator '_' may only occur after a digit.
+       prev := '.'
+       invalSep := false
+
+       // exponent value
+       hasDigits := false
+       for err == nil {
+               if '0' <= ch && ch <= '9' {
+                       digits = append(digits, ch)
+                       prev = '0'
+                       hasDigits = true
+               } else if ch == '_' && sepOk {
+                       if prev != '0' {
+                               invalSep = true
                         }
-                       break // i > 0
+                       prev = '_'
+               } else {
+                       r.UnreadByte() // ch does not belong to number anymore
+                       break
                 }
-               digits = append(digits, ch)
+               ch, err = r.ReadByte()
+       }
+
+       if err == io.EOF {
+               err = nil
+       }
+       if err == nil && !hasDigits {
+               err = errNoDigits
+       }
+       if err == nil {
+               exp, err = strconv.ParseInt(string(digits), 10, 64)
+       }
+       // other errors take precedence over invalid separators
+       if err == nil && (invalSep || prev == '_') {
+               err = errInvalSep
         }
-       // i > 0 => we have at least one digit
  
-       exp, err = strconv.ParseInt(string(digits), 10, 64)
         return
  }
  
@@ -229,7 +325,7 @@ func (x *Rat) RatString() string {
  }
  
  // FloatString returns a string representation of x in decimal form with prec
-// digits of precision after the decimal point. The last digit is rounded to
+// digits of precision after the radix point. The last digit is rounded to
  // nearest, with halves rounded away from zero.
  func (x *Rat) FloatString(prec int) string {
         var buf []byte
@@ -250,7 +346,7 @@ func (x *Rat) FloatString(prec int) string {
  
         p := natOne
         if prec > 0 {
-               p = nat(nil).expNN(natTen, nat(nil).setUint64(uint64(prec)), nil)
+               p = nat(nil).expNN(natTen, nat(nil).setUint64(uint64(prec)), nil, false)
         }
  
         r = r.mul(r, p)
@@ -282,3 +378,99 @@ func (x *Rat) FloatString(prec int) string {
  
         return string(buf)
  }
+
+// Note: FloatPrec (below) is in this file rather than rat.go because
+//       its results are relevant for decimal representation/printing.
+
+// FloatPrec returns the number n of non-repeating digits immediately
+// following the decimal point of the decimal representation of x.
+// The boolean result indicates whether a decimal representation of x
+// with that many fractional digits is exact or rounded.
+//
+// Examples:
+//
+//     x      n    exact    decimal representation n fractional digits
+//     0      0    true     0
+//     1      0    true     1
+//     1/2    1    true     0.5
+//     1/3    0    false    0       (0.333... rounded)
+//     1/4    2    true     0.25
+//     1/6    1    false    0.2     (0.166... rounded)
+func (x *Rat) FloatPrec() (n int, exact bool) {
+       // Determine q and largest p2, p5 such that d = q·2^p2·5^p5.
+       // The results n, exact are:
+       //
+       //     n = max(p2, p5)
+       //     exact = q == 1
+       //
+       // See https://en.wikipedia.org/wiki/Repeating_decimal for
+       // details.
+       d := x.Denom().abs // d >= 1
+
+       // Determine p2 by counting factors of 2.
+       // p2 corresponds to the trailing zero bits in d.
+       // Do this first to reduce q as much as possible.
+       var q nat
+       p2 := d.trailingZeroBits()
+       q = q.shr(d, p2)
+
+       // Determine p5 by counting factors of 5.
+
+       // Build a table starting with an initial power of 5,
+       // and using repeated squaring until the factor doesn't
+       // divide q anymore. Then use the table to determine
+       // the power of 5 in q.
+       //
+       // Setting the table limit to 0 turns this off;
+       // a limit of 1 uses just one factor 5^fp.
+       // Larger values build up a more comprehensive table.
+       const fp = 13        // f == 5^fp
+       const limit = 100    // table size limit
+       var tab []nat        // tab[i] == 5^(fp·2^i)
+       f := nat{1220703125} // == 5^fp (must fit into a uint32 Word)
+       var t, r nat         // temporaries
+       for len(tab) < limit {
+               if _, r = t.div(r, q, f); len(r) != 0 {
+                       break // f doesn't divide q evenly
+               }
+               tab = append(tab, f)
+               f = f.sqr(f)
+       }
+
+       // TODO(gri) Optimization: don't waste the successful
+       //           division q/f above; instead reduce q and
+       //           count the multiples.
+
+       // Factor q using the table entries, if any.
+       var p5, p uint
+       for i := len(tab) - 1; i >= 0; i-- {
+               q, p = multiples(q, tab[i])
+               p5 += p << i * fp
+       }
+
+       q, p = multiples(q, natFive)
+       p5 += p
+
+       return int(max(p2, p5)), q.cmp(natOne) == 0
+}
+
+// multiples returns d and largest p such that x = d·f^p.
+// x and f must not be 0.
+func multiples(x, f nat) (d nat, p uint) {
+       // Determine p through repeated division.
+       d = d.set(x)
+       // p == 0
+       var q, r nat
+       for {
+               // invariant x == d·f^p
+               q, r = q.div(r, d, f)
+               if len(r) != 0 {
+                       return
+               }
+               // q == d/f
+               // x == q·f·f^p
+               p++
+               // x == q·f^p
+               d = d.set(q)
+       }
+}