]> git.saurik.com Git - apple/javascriptcore.git/blame - wtf/dtoa.cpp
JavaScriptCore-554.1.tar.gz
[apple/javascriptcore.git] / wtf / dtoa.cpp
CommitLineData
9dae56ea
A
1/****************************************************************
2 *
3 * The author of this software is David M. Gay.
4 *
5 * Copyright (c) 1991, 2000, 2001 by Lucent Technologies.
6 * Copyright (C) 2002, 2005, 2006, 2007, 2008 Apple Inc. All rights reserved.
7 *
8 * Permission to use, copy, modify, and distribute this software for any
9 * purpose without fee is hereby granted, provided that this entire notice
10 * is included in all copies of any software which is or includes a copy
11 * or modification of this software and in all copies of the supporting
12 * documentation for such software.
13 *
14 * THIS SOFTWARE IS BEING PROVIDED "AS IS", WITHOUT ANY EXPRESS OR IMPLIED
15 * WARRANTY. IN PARTICULAR, NEITHER THE AUTHOR NOR LUCENT MAKES ANY
16 * REPRESENTATION OR WARRANTY OF ANY KIND CONCERNING THE MERCHANTABILITY
17 * OF THIS SOFTWARE OR ITS FITNESS FOR ANY PARTICULAR PURPOSE.
18 *
19 ***************************************************************/
20
21/* Please send bug reports to
22 David M. Gay
23 Bell Laboratories, Room 2C-463
24 600 Mountain Avenue
25 Murray Hill, NJ 07974-0636
26 U.S.A.
27 dmg@bell-labs.com
28 */
29
30/* On a machine with IEEE extended-precision registers, it is
31 * necessary to specify double-precision (53-bit) rounding precision
32 * before invoking strtod or dtoa. If the machine uses (the equivalent
33 * of) Intel 80x87 arithmetic, the call
34 * _control87(PC_53, MCW_PC);
35 * does this with many compilers. Whether this or another call is
36 * appropriate depends on the compiler; for this to work, it may be
37 * necessary to #include "float.h" or another system-dependent header
38 * file.
39 */
40
41/* strtod for IEEE-arithmetic machines.
42 *
43 * This strtod returns a nearest machine number to the input decimal
44 * string (or sets errno to ERANGE). With IEEE arithmetic, ties are
45 * broken by the IEEE round-even rule. Otherwise ties are broken by
46 * biased rounding (add half and chop).
47 *
48 * Inspired loosely by William D. Clinger's paper "How to Read Floating
49 * Point Numbers Accurately" [Proc. ACM SIGPLAN '90, pp. 92-101].
50 *
51 * Modifications:
52 *
53 * 1. We only require IEEE.
54 * 2. We get by with floating-point arithmetic in a case that
55 * Clinger missed -- when we're computing d * 10^n
56 * for a small integer d and the integer n is not too
57 * much larger than 22 (the maximum integer k for which
58 * we can represent 10^k exactly), we may be able to
59 * compute (d*10^k) * 10^(e-k) with just one roundoff.
60 * 3. Rather than a bit-at-a-time adjustment of the binary
61 * result in the hard case, we use floating-point
62 * arithmetic to determine the adjustment to within
63 * one bit; only in really hard cases do we need to
64 * compute a second residual.
65 * 4. Because of 3., we don't need a large table of powers of 10
66 * for ten-to-e (just some small tables, e.g. of 10^k
67 * for 0 <= k <= 22).
68 */
69
70/*
71 * #define IEEE_8087 for IEEE-arithmetic machines where the least
72 * significant byte has the lowest address.
73 * #define IEEE_MC68k for IEEE-arithmetic machines where the most
74 * significant byte has the lowest address.
75 * #define No_leftright to omit left-right logic in fast floating-point
76 * computation of dtoa.
77 * #define Check_FLT_ROUNDS if FLT_ROUNDS can assume the values 2 or 3
78 * and Honor_FLT_ROUNDS is not #defined.
79 * #define Inaccurate_Divide for IEEE-format with correctly rounded
80 * products but inaccurate quotients, e.g., for Intel i860.
81 * #define USE_LONG_LONG on machines that have a "long long"
82 * integer type (of >= 64 bits), and performance testing shows that
83 * it is faster than 32-bit fallback (which is often not the case
84 * on 32-bit machines). On such machines, you can #define Just_16
85 * to store 16 bits per 32-bit int32_t when doing high-precision integer
86 * arithmetic. Whether this speeds things up or slows things down
87 * depends on the machine and the number being converted.
88 * #define Bad_float_h if your system lacks a float.h or if it does not
89 * define some or all of DBL_DIG, DBL_MAX_10_EXP, DBL_MAX_EXP,
90 * FLT_RADIX, FLT_ROUNDS, and DBL_MAX.
91 * #define INFNAN_CHECK on IEEE systems to cause strtod to check for
92 * Infinity and NaN (case insensitively). On some systems (e.g.,
93 * some HP systems), it may be necessary to #define NAN_WORD0
94 * appropriately -- to the most significant word of a quiet NaN.
95 * (On HP Series 700/800 machines, -DNAN_WORD0=0x7ff40000 works.)
96 * When INFNAN_CHECK is #defined and No_Hex_NaN is not #defined,
97 * strtod also accepts (case insensitively) strings of the form
98 * NaN(x), where x is a string of hexadecimal digits and spaces;
99 * if there is only one string of hexadecimal digits, it is taken
100 * for the 52 fraction bits of the resulting NaN; if there are two
101 * or more strings of hex digits, the first is for the high 20 bits,
102 * the second and subsequent for the low 32 bits, with intervening
103 * white space ignored; but if this results in none of the 52
104 * fraction bits being on (an IEEE Infinity symbol), then NAN_WORD0
105 * and NAN_WORD1 are used instead.
106 * #define NO_IEEE_Scale to disable new (Feb. 1997) logic in strtod that
107 * avoids underflows on inputs whose result does not underflow.
108 * If you #define NO_IEEE_Scale on a machine that uses IEEE-format
109 * floating-point numbers and flushes underflows to zero rather
110 * than implementing gradual underflow, then you must also #define
111 * Sudden_Underflow.
112 * #define YES_ALIAS to permit aliasing certain double values with
113 * arrays of ULongs. This leads to slightly better code with
114 * some compilers and was always used prior to 19990916, but it
115 * is not strictly legal and can cause trouble with aggressively
116 * optimizing compilers (e.g., gcc 2.95.1 under -O2).
117 * #define SET_INEXACT if IEEE arithmetic is being used and extra
118 * computation should be done to set the inexact flag when the
119 * result is inexact and avoid setting inexact when the result
120 * is exact. In this case, dtoa.c must be compiled in
121 * an environment, perhaps provided by #include "dtoa.c" in a
122 * suitable wrapper, that defines two functions,
123 * int get_inexact(void);
124 * void clear_inexact(void);
125 * such that get_inexact() returns a nonzero value if the
126 * inexact bit is already set, and clear_inexact() sets the
127 * inexact bit to 0. When SET_INEXACT is #defined, strtod
128 * also does extra computations to set the underflow and overflow
129 * flags when appropriate (i.e., when the result is tiny and
130 * inexact or when it is a numeric value rounded to +-infinity).
131 * #define NO_ERRNO if strtod should not assign errno = ERANGE when
132 * the result overflows to +-Infinity or underflows to 0.
133 */
134
135#include "config.h"
136#include "dtoa.h"
137
138#if HAVE(ERRNO_H)
139#include <errno.h>
140#else
141#define NO_ERRNO
142#endif
143#include <float.h>
144#include <math.h>
145#include <stdint.h>
146#include <stdlib.h>
147#include <string.h>
148#include <wtf/AlwaysInline.h>
149#include <wtf/Assertions.h>
150#include <wtf/FastMalloc.h>
ba379fdc 151#include <wtf/Vector.h>
9dae56ea
A
152#include <wtf/Threading.h>
153
ba379fdc
A
154#include <stdio.h>
155
9dae56ea
A
156#if COMPILER(MSVC)
157#pragma warning(disable: 4244)
158#pragma warning(disable: 4245)
159#pragma warning(disable: 4554)
160#endif
161
162#if PLATFORM(BIG_ENDIAN)
163#define IEEE_MC68k
164#elif PLATFORM(MIDDLE_ENDIAN)
165#define IEEE_ARM
166#else
167#define IEEE_8087
168#endif
169
170#define INFNAN_CHECK
171
172#if defined(IEEE_8087) + defined(IEEE_MC68k) + defined(IEEE_ARM) != 1
173Exactly one of IEEE_8087, IEEE_ARM or IEEE_MC68k should be defined.
174#endif
175
176namespace WTF {
177
178#if ENABLE(JSC_MULTIPLE_THREADS)
179Mutex* s_dtoaP5Mutex;
180#endif
181
182typedef union { double d; uint32_t L[2]; } U;
183
184#ifdef YES_ALIAS
185#define dval(x) x
186#ifdef IEEE_8087
187#define word0(x) ((uint32_t*)&x)[1]
188#define word1(x) ((uint32_t*)&x)[0]
189#else
190#define word0(x) ((uint32_t*)&x)[0]
191#define word1(x) ((uint32_t*)&x)[1]
192#endif
193#else
194#ifdef IEEE_8087
ba379fdc
A
195#define word0(x) (x)->L[1]
196#define word1(x) (x)->L[0]
9dae56ea 197#else
ba379fdc
A
198#define word0(x) (x)->L[0]
199#define word1(x) (x)->L[1]
9dae56ea 200#endif
ba379fdc 201#define dval(x) (x)->d
9dae56ea
A
202#endif
203
204/* The following definition of Storeinc is appropriate for MIPS processors.
205 * An alternative that might be better on some machines is
206 * #define Storeinc(a,b,c) (*a++ = b << 16 | c & 0xffff)
207 */
208#if defined(IEEE_8087) || defined(IEEE_ARM)
209#define Storeinc(a,b,c) (((unsigned short*)a)[1] = (unsigned short)b, ((unsigned short*)a)[0] = (unsigned short)c, a++)
210#else
211#define Storeinc(a,b,c) (((unsigned short*)a)[0] = (unsigned short)b, ((unsigned short*)a)[1] = (unsigned short)c, a++)
212#endif
213
214#define Exp_shift 20
215#define Exp_shift1 20
216#define Exp_msk1 0x100000
217#define Exp_msk11 0x100000
218#define Exp_mask 0x7ff00000
219#define P 53
220#define Bias 1023
221#define Emin (-1022)
222#define Exp_1 0x3ff00000
223#define Exp_11 0x3ff00000
224#define Ebits 11
225#define Frac_mask 0xfffff
226#define Frac_mask1 0xfffff
227#define Ten_pmax 22
228#define Bletch 0x10
229#define Bndry_mask 0xfffff
230#define Bndry_mask1 0xfffff
231#define LSB 1
232#define Sign_bit 0x80000000
233#define Log2P 1
234#define Tiny0 0
235#define Tiny1 1
236#define Quick_max 14
237#define Int_max 14
238
239#if !defined(NO_IEEE_Scale)
240#undef Avoid_Underflow
241#define Avoid_Underflow
242#endif
243
244#if !defined(Flt_Rounds)
245#if defined(FLT_ROUNDS)
246#define Flt_Rounds FLT_ROUNDS
247#else
248#define Flt_Rounds 1
249#endif
250#endif /*Flt_Rounds*/
251
252
253#define rounded_product(a,b) a *= b
254#define rounded_quotient(a,b) a /= b
255
256#define Big0 (Frac_mask1 | Exp_msk1 * (DBL_MAX_EXP + Bias - 1))
257#define Big1 0xffffffff
258
ba379fdc
A
259
260// FIXME: we should remove non-Pack_32 mode since it is unused and unmaintained
9dae56ea
A
261#ifndef Pack_32
262#define Pack_32
263#endif
264
265#if PLATFORM(PPC64) || PLATFORM(X86_64)
266// 64-bit emulation provided by the compiler is likely to be slower than dtoa own code on 32-bit hardware.
267#define USE_LONG_LONG
268#endif
269
270#ifndef USE_LONG_LONG
271#ifdef Just_16
272#undef Pack_32
273/* When Pack_32 is not defined, we store 16 bits per 32-bit int32_t.
274 * This makes some inner loops simpler and sometimes saves work
275 * during multiplications, but it often seems to make things slightly
276 * slower. Hence the default is now to store 32 bits per int32_t.
277 */
278#endif
279#endif
280
281#define Kmax 15
282
ba379fdc
A
283struct BigInt {
284 BigInt() : sign(0) { }
285 int sign;
9dae56ea 286
ba379fdc
A
287 void clear()
288 {
289 sign = 0;
290 m_words.clear();
291 }
292
293 size_t size() const
294 {
295 return m_words.size();
296 }
9dae56ea 297
ba379fdc
A
298 void resize(size_t s)
299 {
300 m_words.resize(s);
301 }
302
303 uint32_t* words()
304 {
305 return m_words.data();
306 }
9dae56ea 307
ba379fdc
A
308 const uint32_t* words() const
309 {
310 return m_words.data();
311 }
312
313 void append(uint32_t w)
314 {
315 m_words.append(w);
316 }
317
318 Vector<uint32_t, 16> m_words;
319};
9dae56ea 320
ba379fdc 321static void multadd(BigInt& b, int m, int a) /* multiply by m and add a */
9dae56ea
A
322{
323#ifdef USE_LONG_LONG
324 unsigned long long carry;
325#else
326 uint32_t carry;
327#endif
328
ba379fdc
A
329 int wds = b.size();
330 uint32_t* x = b.words();
9dae56ea
A
331 int i = 0;
332 carry = a;
333 do {
334#ifdef USE_LONG_LONG
335 unsigned long long y = *x * (unsigned long long)m + carry;
336 carry = y >> 32;
337 *x++ = (uint32_t)y & 0xffffffffUL;
338#else
339#ifdef Pack_32
340 uint32_t xi = *x;
341 uint32_t y = (xi & 0xffff) * m + carry;
342 uint32_t z = (xi >> 16) * m + (y >> 16);
343 carry = z >> 16;
344 *x++ = (z << 16) + (y & 0xffff);
345#else
346 uint32_t y = *x * m + carry;
347 carry = y >> 16;
348 *x++ = y & 0xffff;
349#endif
350#endif
351 } while (++i < wds);
352
ba379fdc
A
353 if (carry)
354 b.append((uint32_t)carry);
9dae56ea
A
355}
356
ba379fdc 357static void s2b(BigInt& b, const char* s, int nd0, int nd, uint32_t y9)
9dae56ea
A
358{
359 int k;
360 int32_t y;
361 int32_t x = (nd + 8) / 9;
362
363 for (k = 0, y = 1; x > y; y <<= 1, k++) { }
364#ifdef Pack_32
ba379fdc
A
365 b.sign = 0;
366 b.resize(1);
367 b.words()[0] = y9;
9dae56ea 368#else
ba379fdc
A
369 b.sign = 0;
370 b.resize((b->x[1] = y9 >> 16) ? 2 : 1);
371 b.words()[0] = y9 & 0xffff;
9dae56ea
A
372#endif
373
374 int i = 9;
375 if (9 < nd0) {
376 s += 9;
377 do {
ba379fdc 378 multadd(b, 10, *s++ - '0');
9dae56ea
A
379 } while (++i < nd0);
380 s++;
381 } else
382 s += 10;
383 for (; i < nd; i++)
ba379fdc 384 multadd(b, 10, *s++ - '0');
9dae56ea
A
385}
386
387static int hi0bits(uint32_t x)
388{
389 int k = 0;
390
391 if (!(x & 0xffff0000)) {
392 k = 16;
393 x <<= 16;
394 }
395 if (!(x & 0xff000000)) {
396 k += 8;
397 x <<= 8;
398 }
399 if (!(x & 0xf0000000)) {
400 k += 4;
401 x <<= 4;
402 }
403 if (!(x & 0xc0000000)) {
404 k += 2;
405 x <<= 2;
406 }
407 if (!(x & 0x80000000)) {
408 k++;
409 if (!(x & 0x40000000))
410 return 32;
411 }
412 return k;
413}
414
415static int lo0bits (uint32_t* y)
416{
417 int k;
418 uint32_t x = *y;
419
420 if (x & 7) {
421 if (x & 1)
422 return 0;
423 if (x & 2) {
424 *y = x >> 1;
425 return 1;
426 }
427 *y = x >> 2;
428 return 2;
429 }
430 k = 0;
431 if (!(x & 0xffff)) {
432 k = 16;
433 x >>= 16;
434 }
435 if (!(x & 0xff)) {
436 k += 8;
437 x >>= 8;
438 }
439 if (!(x & 0xf)) {
440 k += 4;
441 x >>= 4;
442 }
443 if (!(x & 0x3)) {
444 k += 2;
445 x >>= 2;
446 }
447 if (!(x & 1)) {
448 k++;
449 x >>= 1;
450 if (!x & 1)
451 return 32;
452 }
453 *y = x;
454 return k;
455}
456
ba379fdc 457static void i2b(BigInt& b, int i)
9dae56ea 458{
ba379fdc
A
459 b.sign = 0;
460 b.resize(1);
461 b.words()[0] = i;
9dae56ea
A
462}
463
ba379fdc 464static void mult(BigInt& aRef, const BigInt& bRef)
9dae56ea 465{
ba379fdc
A
466 const BigInt* a = &aRef;
467 const BigInt* b = &bRef;
468 BigInt c;
469 int wa, wb, wc;
470 const uint32_t *x = 0, *xa, *xb, *xae, *xbe;
471 uint32_t *xc, *xc0;
9dae56ea
A
472 uint32_t y;
473#ifdef USE_LONG_LONG
474 unsigned long long carry, z;
475#else
476 uint32_t carry, z;
477#endif
478
ba379fdc
A
479 if (a->size() < b->size()) {
480 const BigInt* tmp = a;
9dae56ea 481 a = b;
ba379fdc 482 b = tmp;
9dae56ea 483 }
ba379fdc
A
484
485 wa = a->size();
486 wb = b->size();
9dae56ea 487 wc = wa + wb;
ba379fdc
A
488 c.resize(wc);
489
490 for (xc = c.words(), xa = xc + wc; xc < xa; xc++)
491 *xc = 0;
492 xa = a->words();
9dae56ea 493 xae = xa + wa;
ba379fdc 494 xb = b->words();
9dae56ea 495 xbe = xb + wb;
ba379fdc 496 xc0 = c.words();
9dae56ea
A
497#ifdef USE_LONG_LONG
498 for (; xb < xbe; xc0++) {
499 if ((y = *xb++)) {
500 x = xa;
501 xc = xc0;
502 carry = 0;
503 do {
504 z = *x++ * (unsigned long long)y + *xc + carry;
505 carry = z >> 32;
506 *xc++ = (uint32_t)z & 0xffffffffUL;
507 } while (x < xae);
508 *xc = (uint32_t)carry;
509 }
510 }
511#else
512#ifdef Pack_32
513 for (; xb < xbe; xb++, xc0++) {
514 if ((y = *xb & 0xffff)) {
515 x = xa;
516 xc = xc0;
517 carry = 0;
518 do {
519 z = (*x & 0xffff) * y + (*xc & 0xffff) + carry;
520 carry = z >> 16;
521 uint32_t z2 = (*x++ >> 16) * y + (*xc >> 16) + carry;
522 carry = z2 >> 16;
523 Storeinc(xc, z2, z);
524 } while (x < xae);
525 *xc = carry;
526 }
527 if ((y = *xb >> 16)) {
528 x = xa;
529 xc = xc0;
530 carry = 0;
531 uint32_t z2 = *xc;
532 do {
533 z = (*x & 0xffff) * y + (*xc >> 16) + carry;
534 carry = z >> 16;
535 Storeinc(xc, z, z2);
536 z2 = (*x++ >> 16) * y + (*xc & 0xffff) + carry;
537 carry = z2 >> 16;
538 } while (x < xae);
539 *xc = z2;
540 }
541 }
542#else
543 for(; xb < xbe; xc0++) {
544 if ((y = *xb++)) {
545 x = xa;
546 xc = xc0;
547 carry = 0;
548 do {
549 z = *x++ * y + *xc + carry;
550 carry = z >> 16;
551 *xc++ = z & 0xffff;
552 } while (x < xae);
553 *xc = carry;
554 }
555 }
556#endif
557#endif
ba379fdc
A
558 for (xc0 = c.words(), xc = xc0 + wc; wc > 0 && !*--xc; --wc) { }
559 c.resize(wc);
560 aRef = c;
9dae56ea
A
561}
562
ba379fdc
A
563struct P5Node {
564 BigInt val;
565 P5Node* next;
566};
567
568static P5Node* p5s;
9dae56ea
A
569static int p5s_count;
570
ba379fdc 571static ALWAYS_INLINE void pow5mult(BigInt& b, int k)
9dae56ea
A
572{
573 static int p05[3] = { 5, 25, 125 };
574
575 if (int i = k & 3)
ba379fdc 576 multadd(b, p05[i - 1], 0);
9dae56ea
A
577
578 if (!(k >>= 2))
ba379fdc 579 return;
9dae56ea
A
580
581#if ENABLE(JSC_MULTIPLE_THREADS)
582 s_dtoaP5Mutex->lock();
583#endif
ba379fdc
A
584 P5Node* p5 = p5s;
585
9dae56ea
A
586 if (!p5) {
587 /* first time */
ba379fdc
A
588 p5 = new P5Node;
589 i2b(p5->val, 625);
590 p5->next = 0;
591 p5s = p5;
9dae56ea
A
592 p5s_count = 1;
593 }
ba379fdc 594
9dae56ea
A
595 int p5s_count_local = p5s_count;
596#if ENABLE(JSC_MULTIPLE_THREADS)
597 s_dtoaP5Mutex->unlock();
598#endif
599 int p5s_used = 0;
600
601 for (;;) {
ba379fdc
A
602 if (k & 1)
603 mult(b, p5->val);
604
9dae56ea
A
605 if (!(k >>= 1))
606 break;
607
608 if (++p5s_used == p5s_count_local) {
609#if ENABLE(JSC_MULTIPLE_THREADS)
610 s_dtoaP5Mutex->lock();
611#endif
612 if (p5s_used == p5s_count) {
613 ASSERT(!p5->next);
ba379fdc
A
614 p5->next = new P5Node;
615 p5->next->next = 0;
616 p5->next->val = p5->val;
617 mult(p5->next->val, p5->next->val);
9dae56ea
A
618 ++p5s_count;
619 }
620
621 p5s_count_local = p5s_count;
622#if ENABLE(JSC_MULTIPLE_THREADS)
623 s_dtoaP5Mutex->unlock();
624#endif
625 }
626 p5 = p5->next;
627 }
9dae56ea
A
628}
629
ba379fdc 630static ALWAYS_INLINE void lshift(BigInt& b, int k)
9dae56ea 631{
9dae56ea
A
632#ifdef Pack_32
633 int n = k >> 5;
634#else
635 int n = k >> 4;
636#endif
637
ba379fdc
A
638 int origSize = b.size();
639 int n1 = n + origSize + 1;
9dae56ea 640
ba379fdc
A
641 if (k &= 0x1f)
642 b.resize(b.size() + n + 1);
643 else
644 b.resize(b.size() + n);
645
646 const uint32_t* srcStart = b.words();
647 uint32_t* dstStart = b.words();
648 const uint32_t* src = srcStart + origSize - 1;
9dae56ea
A
649 uint32_t* dst = dstStart + n1 - 1;
650#ifdef Pack_32
ba379fdc 651 if (k) {
9dae56ea
A
652 uint32_t hiSubword = 0;
653 int s = 32 - k;
654 for (; src >= srcStart; --src) {
655 *dst-- = hiSubword | *src >> s;
656 hiSubword = *src << k;
657 }
658 *dst = hiSubword;
659 ASSERT(dst == dstStart + n);
ba379fdc
A
660
661 b.resize(origSize + n + (b.words()[n1 - 1] != 0));
9dae56ea
A
662 }
663#else
664 if (k &= 0xf) {
665 uint32_t hiSubword = 0;
666 int s = 16 - k;
667 for (; src >= srcStart; --src) {
668 *dst-- = hiSubword | *src >> s;
669 hiSubword = (*src << k) & 0xffff;
670 }
671 *dst = hiSubword;
672 ASSERT(dst == dstStart + n);
673 result->wds = b->wds + n + (result->x[n1 - 1] != 0);
674 }
675 #endif
676 else {
677 do {
678 *--dst = *src--;
679 } while (src >= srcStart);
9dae56ea
A
680 }
681 for (dst = dstStart + n; dst != dstStart; )
682 *--dst = 0;
683
ba379fdc 684 ASSERT(b.size() <= 1 || b.words()[b.size() - 1]);
9dae56ea
A
685}
686
ba379fdc 687static int cmp(const BigInt& a, const BigInt& b)
9dae56ea 688{
ba379fdc 689 const uint32_t *xa, *xa0, *xb, *xb0;
9dae56ea
A
690 int i, j;
691
ba379fdc
A
692 i = a.size();
693 j = b.size();
694 ASSERT(i <= 1 || a.words()[i - 1]);
695 ASSERT(j <= 1 || b.words()[j - 1]);
9dae56ea
A
696 if (i -= j)
697 return i;
ba379fdc 698 xa0 = a.words();
9dae56ea 699 xa = xa0 + j;
ba379fdc 700 xb0 = b.words();
9dae56ea
A
701 xb = xb0 + j;
702 for (;;) {
703 if (*--xa != *--xb)
704 return *xa < *xb ? -1 : 1;
705 if (xa <= xa0)
706 break;
707 }
708 return 0;
709}
710
ba379fdc 711static ALWAYS_INLINE void diff(BigInt& c, const BigInt& aRef, const BigInt& bRef)
9dae56ea 712{
ba379fdc
A
713 const BigInt* a = &aRef;
714 const BigInt* b = &bRef;
9dae56ea 715 int i, wa, wb;
ba379fdc 716 uint32_t *xc;
9dae56ea 717
ba379fdc 718 i = cmp(*a, *b);
9dae56ea 719 if (!i) {
ba379fdc
A
720 c.sign = 0;
721 c.resize(1);
722 c.words()[0] = 0;
723 return;
9dae56ea
A
724 }
725 if (i < 0) {
ba379fdc 726 const BigInt* tmp = a;
9dae56ea 727 a = b;
ba379fdc 728 b = tmp;
9dae56ea
A
729 i = 1;
730 } else
731 i = 0;
ba379fdc
A
732
733 wa = a->size();
734 const uint32_t* xa = a->words();
735 const uint32_t* xae = xa + wa;
736 wb = b->size();
737 const uint32_t* xb = b->words();
738 const uint32_t* xbe = xb + wb;
739
740 c.resize(wa);
741 c.sign = i;
742 xc = c.words();
9dae56ea
A
743#ifdef USE_LONG_LONG
744 unsigned long long borrow = 0;
745 do {
746 unsigned long long y = (unsigned long long)*xa++ - *xb++ - borrow;
747 borrow = y >> 32 & (uint32_t)1;
748 *xc++ = (uint32_t)y & 0xffffffffUL;
749 } while (xb < xbe);
750 while (xa < xae) {
751 unsigned long long y = *xa++ - borrow;
752 borrow = y >> 32 & (uint32_t)1;
753 *xc++ = (uint32_t)y & 0xffffffffUL;
754 }
755#else
756 uint32_t borrow = 0;
757#ifdef Pack_32
758 do {
759 uint32_t y = (*xa & 0xffff) - (*xb & 0xffff) - borrow;
760 borrow = (y & 0x10000) >> 16;
761 uint32_t z = (*xa++ >> 16) - (*xb++ >> 16) - borrow;
762 borrow = (z & 0x10000) >> 16;
763 Storeinc(xc, z, y);
764 } while (xb < xbe);
765 while (xa < xae) {
766 uint32_t y = (*xa & 0xffff) - borrow;
767 borrow = (y & 0x10000) >> 16;
768 uint32_t z = (*xa++ >> 16) - borrow;
769 borrow = (z & 0x10000) >> 16;
770 Storeinc(xc, z, y);
771 }
772#else
773 do {
774 uint32_t y = *xa++ - *xb++ - borrow;
775 borrow = (y & 0x10000) >> 16;
776 *xc++ = y & 0xffff;
777 } while (xb < xbe);
778 while (xa < xae) {
779 uint32_t y = *xa++ - borrow;
780 borrow = (y & 0x10000) >> 16;
781 *xc++ = y & 0xffff;
782 }
783#endif
784#endif
785 while (!*--xc)
786 wa--;
ba379fdc 787 c.resize(wa);
9dae56ea
A
788}
789
ba379fdc 790static double ulp(U *x)
9dae56ea
A
791{
792 register int32_t L;
ba379fdc 793 U u;
9dae56ea
A
794
795 L = (word0(x) & Exp_mask) - (P - 1) * Exp_msk1;
796#ifndef Avoid_Underflow
797#ifndef Sudden_Underflow
798 if (L > 0) {
799#endif
800#endif
ba379fdc
A
801 word0(&u) = L;
802 word1(&u) = 0;
9dae56ea
A
803#ifndef Avoid_Underflow
804#ifndef Sudden_Underflow
805 } else {
806 L = -L >> Exp_shift;
807 if (L < Exp_shift) {
ba379fdc
A
808 word0(&u) = 0x80000 >> L;
809 word1(&u) = 0;
9dae56ea 810 } else {
ba379fdc 811 word0(&u) = 0;
9dae56ea 812 L -= Exp_shift;
ba379fdc 813 word1(&u) = L >= 31 ? 1 : 1 << 31 - L;
9dae56ea
A
814 }
815 }
816#endif
817#endif
ba379fdc 818 return dval(&u);
9dae56ea
A
819}
820
ba379fdc 821static double b2d(const BigInt& a, int* e)
9dae56ea 822{
ba379fdc
A
823 const uint32_t* xa;
824 const uint32_t* xa0;
9dae56ea
A
825 uint32_t w;
826 uint32_t y;
827 uint32_t z;
828 int k;
ba379fdc 829 U d;
9dae56ea 830
ba379fdc
A
831#define d0 word0(&d)
832#define d1 word1(&d)
9dae56ea 833
ba379fdc
A
834 xa0 = a.words();
835 xa = xa0 + a.size();
9dae56ea
A
836 y = *--xa;
837 ASSERT(y);
838 k = hi0bits(y);
839 *e = 32 - k;
840#ifdef Pack_32
841 if (k < Ebits) {
ba379fdc 842 d0 = Exp_1 | (y >> (Ebits - k));
9dae56ea 843 w = xa > xa0 ? *--xa : 0;
ba379fdc 844 d1 = (y << (32 - Ebits + k)) | (w >> (Ebits - k));
9dae56ea
A
845 goto ret_d;
846 }
847 z = xa > xa0 ? *--xa : 0;
848 if (k -= Ebits) {
ba379fdc 849 d0 = Exp_1 | (y << k) | (z >> (32 - k));
9dae56ea 850 y = xa > xa0 ? *--xa : 0;
ba379fdc 851 d1 = (z << k) | (y >> (32 - k));
9dae56ea
A
852 } else {
853 d0 = Exp_1 | y;
854 d1 = z;
855 }
856#else
857 if (k < Ebits + 16) {
858 z = xa > xa0 ? *--xa : 0;
859 d0 = Exp_1 | y << k - Ebits | z >> Ebits + 16 - k;
860 w = xa > xa0 ? *--xa : 0;
861 y = xa > xa0 ? *--xa : 0;
862 d1 = z << k + 16 - Ebits | w << k - Ebits | y >> 16 + Ebits - k;
863 goto ret_d;
864 }
865 z = xa > xa0 ? *--xa : 0;
866 w = xa > xa0 ? *--xa : 0;
867 k -= Ebits + 16;
868 d0 = Exp_1 | y << k + 16 | z << k | w >> 16 - k;
869 y = xa > xa0 ? *--xa : 0;
870 d1 = w << k + 16 | y << k;
871#endif
872ret_d:
873#undef d0
874#undef d1
ba379fdc 875 return dval(&d);
9dae56ea
A
876}
877
ba379fdc 878static ALWAYS_INLINE void d2b(BigInt& b, U* d, int* e, int* bits)
9dae56ea 879{
9dae56ea
A
880 int de, k;
881 uint32_t *x, y, z;
882#ifndef Sudden_Underflow
883 int i;
884#endif
885#define d0 word0(d)
886#define d1 word1(d)
887
ba379fdc 888 b.sign = 0;
9dae56ea 889#ifdef Pack_32
ba379fdc 890 b.resize(1);
9dae56ea 891#else
ba379fdc 892 b.resize(2);
9dae56ea 893#endif
ba379fdc 894 x = b.words();
9dae56ea
A
895
896 z = d0 & Frac_mask;
897 d0 &= 0x7fffffff; /* clear sign bit, which we ignore */
898#ifdef Sudden_Underflow
899 de = (int)(d0 >> Exp_shift);
900#else
901 if ((de = (int)(d0 >> Exp_shift)))
902 z |= Exp_msk1;
903#endif
904#ifdef Pack_32
905 if ((y = d1)) {
906 if ((k = lo0bits(&y))) {
ba379fdc 907 x[0] = y | (z << (32 - k));
9dae56ea
A
908 z >>= k;
909 } else
910 x[0] = y;
ba379fdc
A
911 if (z) {
912 b.resize(2);
913 x[1] = z;
914 }
915
9dae56ea 916#ifndef Sudden_Underflow
ba379fdc 917 i = b.size();
9dae56ea 918#endif
9dae56ea
A
919 } else {
920 k = lo0bits(&z);
921 x[0] = z;
922#ifndef Sudden_Underflow
ba379fdc 923 i = 1;
9dae56ea 924#endif
ba379fdc 925 b.resize(1);
9dae56ea
A
926 k += 32;
927 }
928#else
929 if ((y = d1)) {
930 if ((k = lo0bits(&y))) {
931 if (k >= 16) {
932 x[0] = y | z << 32 - k & 0xffff;
933 x[1] = z >> k - 16 & 0xffff;
934 x[2] = z >> k;
935 i = 2;
936 } else {
937 x[0] = y & 0xffff;
938 x[1] = y >> 16 | z << 16 - k & 0xffff;
939 x[2] = z >> k & 0xffff;
940 x[3] = z >> k + 16;
941 i = 3;
942 }
943 } else {
944 x[0] = y & 0xffff;
945 x[1] = y >> 16;
946 x[2] = z & 0xffff;
947 x[3] = z >> 16;
948 i = 3;
949 }
950 } else {
951 k = lo0bits(&z);
952 if (k >= 16) {
953 x[0] = z;
954 i = 0;
955 } else {
956 x[0] = z & 0xffff;
957 x[1] = z >> 16;
958 i = 1;
959 }
960 k += 32;
961 } while (!x[i])
962 --i;
ba379fdc 963 b->resize(i + 1);
9dae56ea
A
964#endif
965#ifndef Sudden_Underflow
966 if (de) {
967#endif
968 *e = de - Bias - (P - 1) + k;
969 *bits = P - k;
970#ifndef Sudden_Underflow
971 } else {
972 *e = de - Bias - (P - 1) + 1 + k;
973#ifdef Pack_32
974 *bits = (32 * i) - hi0bits(x[i - 1]);
975#else
976 *bits = (i + 2) * 16 - hi0bits(x[i]);
977#endif
978 }
979#endif
9dae56ea
A
980}
981#undef d0
982#undef d1
983
ba379fdc 984static double ratio(const BigInt& a, const BigInt& b)
9dae56ea 985{
ba379fdc 986 U da, db;
9dae56ea
A
987 int k, ka, kb;
988
ba379fdc
A
989 dval(&da) = b2d(a, &ka);
990 dval(&db) = b2d(b, &kb);
9dae56ea 991#ifdef Pack_32
ba379fdc 992 k = ka - kb + 32 * (a.size() - b.size());
9dae56ea 993#else
ba379fdc 994 k = ka - kb + 16 * (a.size() - b.size());
9dae56ea
A
995#endif
996 if (k > 0)
ba379fdc 997 word0(&da) += k * Exp_msk1;
9dae56ea
A
998 else {
999 k = -k;
ba379fdc 1000 word0(&db) += k * Exp_msk1;
9dae56ea 1001 }
ba379fdc 1002 return dval(&da) / dval(&db);
9dae56ea
A
1003}
1004
1005static const double tens[] = {
1006 1e0, 1e1, 1e2, 1e3, 1e4, 1e5, 1e6, 1e7, 1e8, 1e9,
1007 1e10, 1e11, 1e12, 1e13, 1e14, 1e15, 1e16, 1e17, 1e18, 1e19,
1008 1e20, 1e21, 1e22
1009};
1010
1011static const double bigtens[] = { 1e16, 1e32, 1e64, 1e128, 1e256 };
1012static const double tinytens[] = { 1e-16, 1e-32, 1e-64, 1e-128,
1013#ifdef Avoid_Underflow
1014 9007199254740992. * 9007199254740992.e-256
1015 /* = 2^106 * 1e-53 */
1016#else
1017 1e-256
1018#endif
1019};
1020
1021/* The factor of 2^53 in tinytens[4] helps us avoid setting the underflow */
1022/* flag unnecessarily. It leads to a song and dance at the end of strtod. */
1023#define Scale_Bit 0x10
1024#define n_bigtens 5
1025
1026#if defined(INFNAN_CHECK)
1027
1028#ifndef NAN_WORD0
1029#define NAN_WORD0 0x7ff80000
1030#endif
1031
1032#ifndef NAN_WORD1
1033#define NAN_WORD1 0
1034#endif
1035
1036static int match(const char** sp, const char* t)
1037{
1038 int c, d;
1039 const char* s = *sp;
1040
1041 while ((d = *t++)) {
1042 if ((c = *++s) >= 'A' && c <= 'Z')
1043 c += 'a' - 'A';
1044 if (c != d)
1045 return 0;
1046 }
1047 *sp = s + 1;
1048 return 1;
1049}
1050
1051#ifndef No_Hex_NaN
ba379fdc 1052static void hexnan(U* rvp, const char** sp)
9dae56ea
A
1053{
1054 uint32_t c, x[2];
1055 const char* s;
1056 int havedig, udx0, xshift;
1057
1058 x[0] = x[1] = 0;
1059 havedig = xshift = 0;
1060 udx0 = 1;
1061 s = *sp;
1062 while ((c = *(const unsigned char*)++s)) {
1063 if (c >= '0' && c <= '9')
1064 c -= '0';
1065 else if (c >= 'a' && c <= 'f')
1066 c += 10 - 'a';
1067 else if (c >= 'A' && c <= 'F')
1068 c += 10 - 'A';
1069 else if (c <= ' ') {
1070 if (udx0 && havedig) {
1071 udx0 = 0;
1072 xshift = 1;
1073 }
1074 continue;
1075 } else if (/*(*/ c == ')' && havedig) {
1076 *sp = s + 1;
1077 break;
1078 } else
1079 return; /* invalid form: don't change *sp */
1080 havedig = 1;
1081 if (xshift) {
1082 xshift = 0;
1083 x[0] = x[1];
1084 x[1] = 0;
1085 }
1086 if (udx0)
1087 x[0] = (x[0] << 4) | (x[1] >> 28);
1088 x[1] = (x[1] << 4) | c;
1089 }
1090 if ((x[0] &= 0xfffff) || x[1]) {
ba379fdc
A
1091 word0(rvp) = Exp_mask | x[0];
1092 word1(rvp) = x[1];
9dae56ea
A
1093 }
1094}
1095#endif /*No_Hex_NaN*/
1096#endif /* INFNAN_CHECK */
1097
1098double strtod(const char* s00, char** se)
1099{
1100#ifdef Avoid_Underflow
1101 int scale;
1102#endif
1103 int bb2, bb5, bbe, bd2, bd5, bbbits, bs2, c, dsign,
1104 e, e1, esign, i, j, k, nd, nd0, nf, nz, nz0, sign;
1105 const char *s, *s0, *s1;
ba379fdc
A
1106 double aadj, aadj1;
1107 U aadj2, adj, rv, rv0;
9dae56ea
A
1108 int32_t L;
1109 uint32_t y, z;
ba379fdc 1110 BigInt bb, bb1, bd, bd0, bs, delta;
9dae56ea
A
1111#ifdef SET_INEXACT
1112 int inexact, oldinexact;
1113#endif
1114
1115 sign = nz0 = nz = 0;
ba379fdc 1116 dval(&rv) = 0;
9dae56ea
A
1117 for (s = s00; ; s++)
1118 switch (*s) {
1119 case '-':
1120 sign = 1;
1121 /* no break */
1122 case '+':
1123 if (*++s)
1124 goto break2;
1125 /* no break */
1126 case 0:
1127 goto ret0;
1128 case '\t':
1129 case '\n':
1130 case '\v':
1131 case '\f':
1132 case '\r':
1133 case ' ':
1134 continue;
1135 default:
1136 goto break2;
1137 }
1138break2:
1139 if (*s == '0') {
1140 nz0 = 1;
1141 while (*++s == '0') { }
1142 if (!*s)
1143 goto ret;
1144 }
1145 s0 = s;
1146 y = z = 0;
1147 for (nd = nf = 0; (c = *s) >= '0' && c <= '9'; nd++, s++)
1148 if (nd < 9)
1149 y = (10 * y) + c - '0';
1150 else if (nd < 16)
1151 z = (10 * z) + c - '0';
1152 nd0 = nd;
1153 if (c == '.') {
1154 c = *++s;
1155 if (!nd) {
1156 for (; c == '0'; c = *++s)
1157 nz++;
1158 if (c > '0' && c <= '9') {
1159 s0 = s;
1160 nf += nz;
1161 nz = 0;
1162 goto have_dig;
1163 }
1164 goto dig_done;
1165 }
1166 for (; c >= '0' && c <= '9'; c = *++s) {
1167have_dig:
1168 nz++;
1169 if (c -= '0') {
1170 nf += nz;
1171 for (i = 1; i < nz; i++)
1172 if (nd++ < 9)
1173 y *= 10;
1174 else if (nd <= DBL_DIG + 1)
1175 z *= 10;
1176 if (nd++ < 9)
1177 y = (10 * y) + c;
1178 else if (nd <= DBL_DIG + 1)
1179 z = (10 * z) + c;
1180 nz = 0;
1181 }
1182 }
1183 }
1184dig_done:
1185 e = 0;
1186 if (c == 'e' || c == 'E') {
1187 if (!nd && !nz && !nz0) {
1188 goto ret0;
1189 }
1190 s00 = s;
1191 esign = 0;
1192 switch (c = *++s) {
1193 case '-':
1194 esign = 1;
1195 case '+':
1196 c = *++s;
1197 }
1198 if (c >= '0' && c <= '9') {
1199 while (c == '0')
1200 c = *++s;
1201 if (c > '0' && c <= '9') {
1202 L = c - '0';
1203 s1 = s;
1204 while ((c = *++s) >= '0' && c <= '9')
1205 L = (10 * L) + c - '0';
1206 if (s - s1 > 8 || L > 19999)
1207 /* Avoid confusion from exponents
1208 * so large that e might overflow.
1209 */
1210 e = 19999; /* safe for 16 bit ints */
1211 else
1212 e = (int)L;
1213 if (esign)
1214 e = -e;
1215 } else
1216 e = 0;
1217 } else
1218 s = s00;
1219 }
1220 if (!nd) {
1221 if (!nz && !nz0) {
1222#ifdef INFNAN_CHECK
1223 /* Check for Nan and Infinity */
1224 switch(c) {
1225 case 'i':
1226 case 'I':
1227 if (match(&s,"nf")) {
1228 --s;
1229 if (!match(&s,"inity"))
1230 ++s;
ba379fdc
A
1231 word0(&rv) = 0x7ff00000;
1232 word1(&rv) = 0;
9dae56ea
A
1233 goto ret;
1234 }
1235 break;
1236 case 'n':
1237 case 'N':
1238 if (match(&s, "an")) {
ba379fdc
A
1239 word0(&rv) = NAN_WORD0;
1240 word1(&rv) = NAN_WORD1;
9dae56ea
A
1241#ifndef No_Hex_NaN
1242 if (*s == '(') /*)*/
1243 hexnan(&rv, &s);
1244#endif
1245 goto ret;
1246 }
1247 }
1248#endif /* INFNAN_CHECK */
1249ret0:
1250 s = s00;
1251 sign = 0;
1252 }
1253 goto ret;
1254 }
1255 e1 = e -= nf;
1256
1257 /* Now we have nd0 digits, starting at s0, followed by a
1258 * decimal point, followed by nd-nd0 digits. The number we're
1259 * after is the integer represented by those digits times
1260 * 10**e */
1261
1262 if (!nd0)
1263 nd0 = nd;
1264 k = nd < DBL_DIG + 1 ? nd : DBL_DIG + 1;
ba379fdc 1265 dval(&rv) = y;
9dae56ea
A
1266 if (k > 9) {
1267#ifdef SET_INEXACT
1268 if (k > DBL_DIG)
1269 oldinexact = get_inexact();
1270#endif
ba379fdc 1271 dval(&rv) = tens[k - 9] * dval(&rv) + z;
9dae56ea 1272 }
9dae56ea
A
1273 if (nd <= DBL_DIG && Flt_Rounds == 1) {
1274 if (!e)
1275 goto ret;
1276 if (e > 0) {
1277 if (e <= Ten_pmax) {
ba379fdc 1278 /* rv = */ rounded_product(dval(&rv), tens[e]);
9dae56ea
A
1279 goto ret;
1280 }
1281 i = DBL_DIG - nd;
1282 if (e <= Ten_pmax + i) {
1283 /* A fancier test would sometimes let us do
1284 * this for larger i values.
1285 */
1286 e -= i;
ba379fdc
A
1287 dval(&rv) *= tens[i];
1288 /* rv = */ rounded_product(dval(&rv), tens[e]);
9dae56ea
A
1289 goto ret;
1290 }
1291 }
1292#ifndef Inaccurate_Divide
1293 else if (e >= -Ten_pmax) {
ba379fdc 1294 /* rv = */ rounded_quotient(dval(&rv), tens[-e]);
9dae56ea
A
1295 goto ret;
1296 }
1297#endif
1298 }
1299 e1 += nd - k;
1300
1301#ifdef SET_INEXACT
1302 inexact = 1;
1303 if (k <= DBL_DIG)
1304 oldinexact = get_inexact();
1305#endif
1306#ifdef Avoid_Underflow
1307 scale = 0;
1308#endif
1309
1310 /* Get starting approximation = rv * 10**e1 */
1311
1312 if (e1 > 0) {
1313 if ((i = e1 & 15))
ba379fdc 1314 dval(&rv) *= tens[i];
9dae56ea
A
1315 if (e1 &= ~15) {
1316 if (e1 > DBL_MAX_10_EXP) {
1317ovfl:
1318#ifndef NO_ERRNO
1319 errno = ERANGE;
1320#endif
1321 /* Can't trust HUGE_VAL */
ba379fdc
A
1322 word0(&rv) = Exp_mask;
1323 word1(&rv) = 0;
9dae56ea
A
1324#ifdef SET_INEXACT
1325 /* set overflow bit */
ba379fdc
A
1326 dval(&rv0) = 1e300;
1327 dval(&rv0) *= dval(&rv0);
9dae56ea 1328#endif
9dae56ea
A
1329 goto ret;
1330 }
1331 e1 >>= 4;
1332 for (j = 0; e1 > 1; j++, e1 >>= 1)
1333 if (e1 & 1)
ba379fdc 1334 dval(&rv) *= bigtens[j];
9dae56ea 1335 /* The last multiplication could overflow. */
ba379fdc
A
1336 word0(&rv) -= P * Exp_msk1;
1337 dval(&rv) *= bigtens[j];
1338 if ((z = word0(&rv) & Exp_mask) > Exp_msk1 * (DBL_MAX_EXP + Bias - P))
9dae56ea
A
1339 goto ovfl;
1340 if (z > Exp_msk1 * (DBL_MAX_EXP + Bias - 1 - P)) {
1341 /* set to largest number */
1342 /* (Can't trust DBL_MAX) */
ba379fdc
A
1343 word0(&rv) = Big0;
1344 word1(&rv) = Big1;
9dae56ea 1345 } else
ba379fdc 1346 word0(&rv) += P * Exp_msk1;
9dae56ea
A
1347 }
1348 } else if (e1 < 0) {
1349 e1 = -e1;
1350 if ((i = e1 & 15))
ba379fdc 1351 dval(&rv) /= tens[i];
9dae56ea
A
1352 if (e1 >>= 4) {
1353 if (e1 >= 1 << n_bigtens)
1354 goto undfl;
1355#ifdef Avoid_Underflow
1356 if (e1 & Scale_Bit)
1357 scale = 2 * P;
1358 for (j = 0; e1 > 0; j++, e1 >>= 1)
1359 if (e1 & 1)
ba379fdc
A
1360 dval(&rv) *= tinytens[j];
1361 if (scale && (j = (2 * P) + 1 - ((word0(&rv) & Exp_mask) >> Exp_shift)) > 0) {
9dae56ea
A
1362 /* scaled rv is denormal; zap j low bits */
1363 if (j >= 32) {
ba379fdc 1364 word1(&rv) = 0;
9dae56ea 1365 if (j >= 53)
ba379fdc 1366 word0(&rv) = (P + 2) * Exp_msk1;
9dae56ea 1367 else
ba379fdc 1368 word0(&rv) &= 0xffffffff << (j - 32);
9dae56ea 1369 } else
ba379fdc 1370 word1(&rv) &= 0xffffffff << j;
9dae56ea
A
1371 }
1372#else
1373 for (j = 0; e1 > 1; j++, e1 >>= 1)
1374 if (e1 & 1)
ba379fdc 1375 dval(&rv) *= tinytens[j];
9dae56ea 1376 /* The last multiplication could underflow. */
ba379fdc
A
1377 dval(&rv0) = dval(&rv);
1378 dval(&rv) *= tinytens[j];
1379 if (!dval(&rv)) {
1380 dval(&rv) = 2. * dval(&rv0);
1381 dval(&rv) *= tinytens[j];
9dae56ea 1382#endif
ba379fdc 1383 if (!dval(&rv)) {
9dae56ea 1384undfl:
ba379fdc 1385 dval(&rv) = 0.;
9dae56ea
A
1386#ifndef NO_ERRNO
1387 errno = ERANGE;
1388#endif
9dae56ea
A
1389 goto ret;
1390 }
1391#ifndef Avoid_Underflow
ba379fdc
A
1392 word0(&rv) = Tiny0;
1393 word1(&rv) = Tiny1;
9dae56ea
A
1394 /* The refinement below will clean
1395 * this approximation up.
1396 */
1397 }
1398#endif
1399 }
1400 }
1401
1402 /* Now the hard part -- adjusting rv to the correct value.*/
1403
1404 /* Put digits into bd: true value = bd * 10^e */
1405
ba379fdc 1406 s2b(bd0, s0, nd0, nd, y);
9dae56ea
A
1407
1408 for (;;) {
ba379fdc
A
1409 bd = bd0;
1410 d2b(bb, &rv, &bbe, &bbbits); /* rv = bb * 2^bbe */
1411 i2b(bs, 1);
9dae56ea
A
1412
1413 if (e >= 0) {
1414 bb2 = bb5 = 0;
1415 bd2 = bd5 = e;
1416 } else {
1417 bb2 = bb5 = -e;
1418 bd2 = bd5 = 0;
1419 }
1420 if (bbe >= 0)
1421 bb2 += bbe;
1422 else
1423 bd2 -= bbe;
1424 bs2 = bb2;
1425#ifdef Avoid_Underflow
1426 j = bbe - scale;
1427 i = j + bbbits - 1; /* logb(rv) */
1428 if (i < Emin) /* denormal */
1429 j += P - Emin;
1430 else
1431 j = P + 1 - bbbits;
1432#else /*Avoid_Underflow*/
1433#ifdef Sudden_Underflow
1434 j = P + 1 - bbbits;
1435#else /*Sudden_Underflow*/
1436 j = bbe;
1437 i = j + bbbits - 1; /* logb(rv) */
1438 if (i < Emin) /* denormal */
1439 j += P - Emin;
1440 else
1441 j = P + 1 - bbbits;
1442#endif /*Sudden_Underflow*/
1443#endif /*Avoid_Underflow*/
1444 bb2 += j;
1445 bd2 += j;
1446#ifdef Avoid_Underflow
1447 bd2 += scale;
1448#endif
1449 i = bb2 < bd2 ? bb2 : bd2;
1450 if (i > bs2)
1451 i = bs2;
1452 if (i > 0) {
1453 bb2 -= i;
1454 bd2 -= i;
1455 bs2 -= i;
1456 }
1457 if (bb5 > 0) {
ba379fdc
A
1458 pow5mult(bs, bb5);
1459 mult(bb, bs);
9dae56ea
A
1460 }
1461 if (bb2 > 0)
ba379fdc 1462 lshift(bb, bb2);
9dae56ea 1463 if (bd5 > 0)
ba379fdc 1464 pow5mult(bd, bd5);
9dae56ea 1465 if (bd2 > 0)
ba379fdc 1466 lshift(bd, bd2);
9dae56ea 1467 if (bs2 > 0)
ba379fdc
A
1468 lshift(bs, bs2);
1469 diff(delta, bb, bd);
1470 dsign = delta.sign;
1471 delta.sign = 0;
9dae56ea
A
1472 i = cmp(delta, bs);
1473
1474 if (i < 0) {
1475 /* Error is less than half an ulp -- check for
1476 * special case of mantissa a power of two.
1477 */
ba379fdc 1478 if (dsign || word1(&rv) || word0(&rv) & Bndry_mask
9dae56ea 1479#ifdef Avoid_Underflow
ba379fdc 1480 || (word0(&rv) & Exp_mask) <= (2 * P + 1) * Exp_msk1
9dae56ea 1481#else
ba379fdc 1482 || (word0(&rv) & Exp_mask) <= Exp_msk1
9dae56ea
A
1483#endif
1484 ) {
1485#ifdef SET_INEXACT
ba379fdc 1486 if (!delta->words()[0] && delta->size() <= 1)
9dae56ea
A
1487 inexact = 0;
1488#endif
1489 break;
1490 }
ba379fdc 1491 if (!delta.words()[0] && delta.size() <= 1) {
9dae56ea
A
1492 /* exact result */
1493#ifdef SET_INEXACT
1494 inexact = 0;
1495#endif
1496 break;
1497 }
ba379fdc 1498 lshift(delta, Log2P);
9dae56ea
A
1499 if (cmp(delta, bs) > 0)
1500 goto drop_down;
1501 break;
1502 }
1503 if (i == 0) {
1504 /* exactly half-way between */
1505 if (dsign) {
ba379fdc
A
1506 if ((word0(&rv) & Bndry_mask1) == Bndry_mask1
1507 && word1(&rv) == (
9dae56ea 1508#ifdef Avoid_Underflow
ba379fdc 1509 (scale && (y = word0(&rv) & Exp_mask) <= 2 * P * Exp_msk1)
9dae56ea
A
1510 ? (0xffffffff & (0xffffffff << (2 * P + 1 - (y >> Exp_shift)))) :
1511#endif
1512 0xffffffff)) {
1513 /*boundary case -- increment exponent*/
ba379fdc
A
1514 word0(&rv) = (word0(&rv) & Exp_mask) + Exp_msk1;
1515 word1(&rv) = 0;
9dae56ea
A
1516#ifdef Avoid_Underflow
1517 dsign = 0;
1518#endif
1519 break;
1520 }
ba379fdc 1521 } else if (!(word0(&rv) & Bndry_mask) && !word1(&rv)) {
9dae56ea
A
1522drop_down:
1523 /* boundary case -- decrement exponent */
1524#ifdef Sudden_Underflow /*{{*/
ba379fdc 1525 L = word0(&rv) & Exp_mask;
9dae56ea
A
1526#ifdef Avoid_Underflow
1527 if (L <= (scale ? (2 * P + 1) * Exp_msk1 : Exp_msk1))
1528#else
1529 if (L <= Exp_msk1)
1530#endif /*Avoid_Underflow*/
1531 goto undfl;
1532 L -= Exp_msk1;
1533#else /*Sudden_Underflow}{*/
1534#ifdef Avoid_Underflow
1535 if (scale) {
ba379fdc 1536 L = word0(&rv) & Exp_mask;
9dae56ea
A
1537 if (L <= (2 * P + 1) * Exp_msk1) {
1538 if (L > (P + 2) * Exp_msk1)
1539 /* round even ==> */
1540 /* accept rv */
1541 break;
1542 /* rv = smallest denormal */
1543 goto undfl;
1544 }
1545 }
1546#endif /*Avoid_Underflow*/
ba379fdc 1547 L = (word0(&rv) & Exp_mask) - Exp_msk1;
9dae56ea 1548#endif /*Sudden_Underflow}}*/
ba379fdc
A
1549 word0(&rv) = L | Bndry_mask1;
1550 word1(&rv) = 0xffffffff;
9dae56ea
A
1551 break;
1552 }
ba379fdc 1553 if (!(word1(&rv) & LSB))
9dae56ea
A
1554 break;
1555 if (dsign)
ba379fdc 1556 dval(&rv) += ulp(&rv);
9dae56ea 1557 else {
ba379fdc 1558 dval(&rv) -= ulp(&rv);
9dae56ea 1559#ifndef Sudden_Underflow
ba379fdc 1560 if (!dval(&rv))
9dae56ea
A
1561 goto undfl;
1562#endif
1563 }
1564#ifdef Avoid_Underflow
1565 dsign = 1 - dsign;
1566#endif
1567 break;
1568 }
1569 if ((aadj = ratio(delta, bs)) <= 2.) {
1570 if (dsign)
1571 aadj = aadj1 = 1.;
ba379fdc 1572 else if (word1(&rv) || word0(&rv) & Bndry_mask) {
9dae56ea 1573#ifndef Sudden_Underflow
ba379fdc 1574 if (word1(&rv) == Tiny1 && !word0(&rv))
9dae56ea
A
1575 goto undfl;
1576#endif
1577 aadj = 1.;
1578 aadj1 = -1.;
1579 } else {
1580 /* special case -- power of FLT_RADIX to be */
1581 /* rounded down... */
1582
1583 if (aadj < 2. / FLT_RADIX)
1584 aadj = 1. / FLT_RADIX;
1585 else
1586 aadj *= 0.5;
1587 aadj1 = -aadj;
1588 }
1589 } else {
1590 aadj *= 0.5;
1591 aadj1 = dsign ? aadj : -aadj;
1592#ifdef Check_FLT_ROUNDS
1593 switch (Rounding) {
1594 case 2: /* towards +infinity */
1595 aadj1 -= 0.5;
1596 break;
1597 case 0: /* towards 0 */
1598 case 3: /* towards -infinity */
1599 aadj1 += 0.5;
1600 }
1601#else
1602 if (Flt_Rounds == 0)
1603 aadj1 += 0.5;
1604#endif /*Check_FLT_ROUNDS*/
1605 }
ba379fdc 1606 y = word0(&rv) & Exp_mask;
9dae56ea
A
1607
1608 /* Check for overflow */
1609
1610 if (y == Exp_msk1 * (DBL_MAX_EXP + Bias - 1)) {
ba379fdc
A
1611 dval(&rv0) = dval(&rv);
1612 word0(&rv) -= P * Exp_msk1;
1613 adj.d = aadj1 * ulp(&rv);
1614 dval(&rv) += adj.d;
1615 if ((word0(&rv) & Exp_mask) >= Exp_msk1 * (DBL_MAX_EXP + Bias - P)) {
1616 if (word0(&rv0) == Big0 && word1(&rv0) == Big1)
9dae56ea 1617 goto ovfl;
ba379fdc
A
1618 word0(&rv) = Big0;
1619 word1(&rv) = Big1;
9dae56ea
A
1620 goto cont;
1621 } else
ba379fdc 1622 word0(&rv) += P * Exp_msk1;
9dae56ea
A
1623 } else {
1624#ifdef Avoid_Underflow
1625 if (scale && y <= 2 * P * Exp_msk1) {
1626 if (aadj <= 0x7fffffff) {
1627 if ((z = (uint32_t)aadj) <= 0)
1628 z = 1;
1629 aadj = z;
1630 aadj1 = dsign ? aadj : -aadj;
1631 }
ba379fdc
A
1632 dval(&aadj2) = aadj1;
1633 word0(&aadj2) += (2 * P + 1) * Exp_msk1 - y;
1634 aadj1 = dval(&aadj2);
9dae56ea 1635 }
ba379fdc
A
1636 adj.d = aadj1 * ulp(&rv);
1637 dval(&rv) += adj.d;
9dae56ea
A
1638#else
1639#ifdef Sudden_Underflow
ba379fdc
A
1640 if ((word0(&rv) & Exp_mask) <= P * Exp_msk1) {
1641 dval(&rv0) = dval(&rv);
1642 word0(&rv) += P * Exp_msk1;
1643 adj.d = aadj1 * ulp(&rv);
1644 dval(&rv) += adj.d;
1645 if ((word0(&rv) & Exp_mask) <= P * Exp_msk1)
9dae56ea 1646 {
ba379fdc 1647 if (word0(&rv0) == Tiny0 && word1(&rv0) == Tiny1)
9dae56ea 1648 goto undfl;
ba379fdc
A
1649 word0(&rv) = Tiny0;
1650 word1(&rv) = Tiny1;
9dae56ea
A
1651 goto cont;
1652 }
1653 else
ba379fdc 1654 word0(&rv) -= P * Exp_msk1;
9dae56ea 1655 } else {
ba379fdc
A
1656 adj.d = aadj1 * ulp(&rv);
1657 dval(&rv) += adj.d;
9dae56ea
A
1658 }
1659#else /*Sudden_Underflow*/
1660 /* Compute adj so that the IEEE rounding rules will
1661 * correctly round rv + adj in some half-way cases.
1662 * If rv * ulp(rv) is denormalized (i.e.,
1663 * y <= (P - 1) * Exp_msk1), we must adjust aadj to avoid
1664 * trouble from bits lost to denormalization;
1665 * example: 1.2e-307 .
1666 */
1667 if (y <= (P - 1) * Exp_msk1 && aadj > 1.) {
1668 aadj1 = (double)(int)(aadj + 0.5);
1669 if (!dsign)
1670 aadj1 = -aadj1;
1671 }
ba379fdc
A
1672 adj.d = aadj1 * ulp(&rv);
1673 dval(&rv) += adj.d;
9dae56ea
A
1674#endif /*Sudden_Underflow*/
1675#endif /*Avoid_Underflow*/
1676 }
ba379fdc 1677 z = word0(&rv) & Exp_mask;
9dae56ea
A
1678#ifndef SET_INEXACT
1679#ifdef Avoid_Underflow
1680 if (!scale)
1681#endif
1682 if (y == z) {
1683 /* Can we stop now? */
1684 L = (int32_t)aadj;
1685 aadj -= L;
1686 /* The tolerances below are conservative. */
ba379fdc 1687 if (dsign || word1(&rv) || word0(&rv) & Bndry_mask) {
9dae56ea
A
1688 if (aadj < .4999999 || aadj > .5000001)
1689 break;
1690 } else if (aadj < .4999999 / FLT_RADIX)
1691 break;
1692 }
1693#endif
1694cont:
ba379fdc 1695 ;
9dae56ea
A
1696 }
1697#ifdef SET_INEXACT
1698 if (inexact) {
1699 if (!oldinexact) {
ba379fdc
A
1700 word0(&rv0) = Exp_1 + (70 << Exp_shift);
1701 word1(&rv0) = 0;
1702 dval(&rv0) += 1.;
9dae56ea
A
1703 }
1704 } else if (!oldinexact)
1705 clear_inexact();
1706#endif
1707#ifdef Avoid_Underflow
1708 if (scale) {
ba379fdc
A
1709 word0(&rv0) = Exp_1 - 2 * P * Exp_msk1;
1710 word1(&rv0) = 0;
1711 dval(&rv) *= dval(&rv0);
9dae56ea
A
1712#ifndef NO_ERRNO
1713 /* try to avoid the bug of testing an 8087 register value */
ba379fdc 1714 if (word0(&rv) == 0 && word1(&rv) == 0)
9dae56ea
A
1715 errno = ERANGE;
1716#endif
1717 }
1718#endif /* Avoid_Underflow */
1719#ifdef SET_INEXACT
ba379fdc 1720 if (inexact && !(word0(&rv) & Exp_mask)) {
9dae56ea 1721 /* set underflow bit */
ba379fdc
A
1722 dval(&rv0) = 1e-300;
1723 dval(&rv0) *= dval(&rv0);
9dae56ea
A
1724 }
1725#endif
9dae56ea
A
1726ret:
1727 if (se)
1728 *se = const_cast<char*>(s);
ba379fdc 1729 return sign ? -dval(&rv) : dval(&rv);
9dae56ea
A
1730}
1731
ba379fdc 1732static ALWAYS_INLINE int quorem(BigInt& b, BigInt& S)
9dae56ea 1733{
ba379fdc 1734 size_t n;
9dae56ea
A
1735 uint32_t *bx, *bxe, q, *sx, *sxe;
1736#ifdef USE_LONG_LONG
1737 unsigned long long borrow, carry, y, ys;
1738#else
1739 uint32_t borrow, carry, y, ys;
1740#ifdef Pack_32
1741 uint32_t si, z, zs;
1742#endif
1743#endif
ba379fdc
A
1744 ASSERT(b.size() <= 1 || b.words()[b.size() - 1]);
1745 ASSERT(S.size() <= 1 || S.words()[S.size() - 1]);
9dae56ea 1746
ba379fdc
A
1747 n = S.size();
1748 ASSERT_WITH_MESSAGE(b.size() <= n, "oversize b in quorem");
1749 if (b.size() < n)
9dae56ea 1750 return 0;
ba379fdc 1751 sx = S.words();
9dae56ea 1752 sxe = sx + --n;
ba379fdc 1753 bx = b.words();
9dae56ea
A
1754 bxe = bx + n;
1755 q = *bxe / (*sxe + 1); /* ensure q <= true quotient */
1756 ASSERT_WITH_MESSAGE(q <= 9, "oversized quotient in quorem");
1757 if (q) {
1758 borrow = 0;
1759 carry = 0;
1760 do {
1761#ifdef USE_LONG_LONG
1762 ys = *sx++ * (unsigned long long)q + carry;
1763 carry = ys >> 32;
1764 y = *bx - (ys & 0xffffffffUL) - borrow;
1765 borrow = y >> 32 & (uint32_t)1;
1766 *bx++ = (uint32_t)y & 0xffffffffUL;
1767#else
1768#ifdef Pack_32
1769 si = *sx++;
1770 ys = (si & 0xffff) * q + carry;
1771 zs = (si >> 16) * q + (ys >> 16);
1772 carry = zs >> 16;
1773 y = (*bx & 0xffff) - (ys & 0xffff) - borrow;
1774 borrow = (y & 0x10000) >> 16;
1775 z = (*bx >> 16) - (zs & 0xffff) - borrow;
1776 borrow = (z & 0x10000) >> 16;
1777 Storeinc(bx, z, y);
1778#else
1779 ys = *sx++ * q + carry;
1780 carry = ys >> 16;
1781 y = *bx - (ys & 0xffff) - borrow;
1782 borrow = (y & 0x10000) >> 16;
1783 *bx++ = y & 0xffff;
1784#endif
1785#endif
1786 } while (sx <= sxe);
1787 if (!*bxe) {
ba379fdc 1788 bx = b.words();
9dae56ea
A
1789 while (--bxe > bx && !*bxe)
1790 --n;
ba379fdc 1791 b.resize(n);
9dae56ea
A
1792 }
1793 }
1794 if (cmp(b, S) >= 0) {
1795 q++;
1796 borrow = 0;
1797 carry = 0;
ba379fdc
A
1798 bx = b.words();
1799 sx = S.words();
9dae56ea
A
1800 do {
1801#ifdef USE_LONG_LONG
1802 ys = *sx++ + carry;
1803 carry = ys >> 32;
1804 y = *bx - (ys & 0xffffffffUL) - borrow;
1805 borrow = y >> 32 & (uint32_t)1;
1806 *bx++ = (uint32_t)y & 0xffffffffUL;
1807#else
1808#ifdef Pack_32
1809 si = *sx++;
1810 ys = (si & 0xffff) + carry;
1811 zs = (si >> 16) + (ys >> 16);
1812 carry = zs >> 16;
1813 y = (*bx & 0xffff) - (ys & 0xffff) - borrow;
1814 borrow = (y & 0x10000) >> 16;
1815 z = (*bx >> 16) - (zs & 0xffff) - borrow;
1816 borrow = (z & 0x10000) >> 16;
1817 Storeinc(bx, z, y);
1818#else
1819 ys = *sx++ + carry;
1820 carry = ys >> 16;
1821 y = *bx - (ys & 0xffff) - borrow;
1822 borrow = (y & 0x10000) >> 16;
1823 *bx++ = y & 0xffff;
1824#endif
1825#endif
1826 } while (sx <= sxe);
ba379fdc 1827 bx = b.words();
9dae56ea
A
1828 bxe = bx + n;
1829 if (!*bxe) {
1830 while (--bxe > bx && !*bxe)
1831 --n;
ba379fdc 1832 b.resize(n);
9dae56ea
A
1833 }
1834 }
1835 return q;
1836}
1837
9dae56ea
A
1838/* dtoa for IEEE arithmetic (dmg): convert double to ASCII string.
1839 *
1840 * Inspired by "How to Print Floating-Point Numbers Accurately" by
1841 * Guy L. Steele, Jr. and Jon L. White [Proc. ACM SIGPLAN '90, pp. 92-101].
1842 *
1843 * Modifications:
1844 * 1. Rather than iterating, we use a simple numeric overestimate
1845 * to determine k = floor(log10(d)). We scale relevant
1846 * quantities using O(log2(k)) rather than O(k) multiplications.
1847 * 2. For some modes > 2 (corresponding to ecvt and fcvt), we don't
1848 * try to generate digits strictly left to right. Instead, we
1849 * compute with fewer bits and propagate the carry if necessary
1850 * when rounding the final digit up. This is often faster.
1851 * 3. Under the assumption that input will be rounded nearest,
1852 * mode 0 renders 1e23 as 1e23 rather than 9.999999999999999e22.
1853 * That is, we allow equality in stopping tests when the
1854 * round-nearest rule will give the same floating-point value
1855 * as would satisfaction of the stopping test with strict
1856 * inequality.
1857 * 4. We remove common factors of powers of 2 from relevant
1858 * quantities.
1859 * 5. When converting floating-point integers less than 1e16,
1860 * we use floating-point arithmetic rather than resorting
1861 * to multiple-precision integers.
1862 * 6. When asked to produce fewer than 15 digits, we first try
1863 * to get by with floating-point arithmetic; we resort to
1864 * multiple-precision integer arithmetic only if we cannot
1865 * guarantee that the floating-point calculation has given
1866 * the correctly rounded result. For k requested digits and
1867 * "uniformly" distributed input, the probability is
1868 * something like 10^(k-15) that we must resort to the int32_t
1869 * calculation.
1870 */
1871
ba379fdc 1872void dtoa(char* result, double dd, int ndigits, int* decpt, int* sign, char** rve)
9dae56ea
A
1873{
1874 /*
1875 Arguments ndigits, decpt, sign are similar to those
1876 of ecvt and fcvt; trailing zeros are suppressed from
1877 the returned string. If not null, *rve is set to point
1878 to the end of the return value. If d is +-Infinity or NaN,
1879 then *decpt is set to 9999.
1880
1881 */
1882
1883 int bbits, b2, b5, be, dig, i, ieps, ilim = 0, ilim0, ilim1 = 0,
1884 j, j1, k, k0, k_check, leftright, m2, m5, s2, s5,
1885 spec_case, try_quick;
1886 int32_t L;
1887#ifndef Sudden_Underflow
1888 int denorm;
1889 uint32_t x;
1890#endif
ba379fdc
A
1891 BigInt b, b1, delta, mlo, mhi, S;
1892 U d2, eps, u;
1893 double ds;
9dae56ea
A
1894 char *s, *s0;
1895#ifdef SET_INEXACT
1896 int inexact, oldinexact;
1897#endif
1898
ba379fdc
A
1899 u.d = dd;
1900 if (word0(&u) & Sign_bit) {
9dae56ea
A
1901 /* set sign for everything, including 0's and NaNs */
1902 *sign = 1;
ba379fdc 1903 word0(&u) &= ~Sign_bit; /* clear sign bit */
9dae56ea
A
1904 } else
1905 *sign = 0;
1906
ba379fdc 1907 if ((word0(&u) & Exp_mask) == Exp_mask)
9dae56ea
A
1908 {
1909 /* Infinity or NaN */
1910 *decpt = 9999;
ba379fdc
A
1911 if (!word1(&u) && !(word0(&u) & 0xfffff))
1912 strcpy(result, "Infinity");
1913 else
1914 strcpy(result, "NaN");
1915 return;
9dae56ea 1916 }
ba379fdc 1917 if (!dval(&u)) {
9dae56ea 1918 *decpt = 1;
ba379fdc
A
1919 result[0] = '0';
1920 result[1] = '\0';
1921 return;
9dae56ea
A
1922 }
1923
1924#ifdef SET_INEXACT
1925 try_quick = oldinexact = get_inexact();
1926 inexact = 1;
1927#endif
1928
ba379fdc 1929 d2b(b, &u, &be, &bbits);
9dae56ea 1930#ifdef Sudden_Underflow
ba379fdc 1931 i = (int)(word0(&u) >> Exp_shift1 & (Exp_mask >> Exp_shift1));
9dae56ea 1932#else
ba379fdc 1933 if ((i = (int)(word0(&u) >> Exp_shift1 & (Exp_mask >> Exp_shift1)))) {
9dae56ea 1934#endif
ba379fdc
A
1935 dval(&d2) = dval(&u);
1936 word0(&d2) &= Frac_mask1;
1937 word0(&d2) |= Exp_11;
9dae56ea
A
1938
1939 /* log(x) ~=~ log(1.5) + (x-1.5)/1.5
1940 * log10(x) = log(x) / log(10)
1941 * ~=~ log(1.5)/log(10) + (x-1.5)/(1.5*log(10))
1942 * log10(d) = (i-Bias)*log(2)/log(10) + log10(d2)
1943 *
1944 * This suggests computing an approximation k to log10(d) by
1945 *
1946 * k = (i - Bias)*0.301029995663981
1947 * + ( (d2-1.5)*0.289529654602168 + 0.176091259055681 );
1948 *
1949 * We want k to be too large rather than too small.
1950 * The error in the first-order Taylor series approximation
1951 * is in our favor, so we just round up the constant enough
1952 * to compensate for any error in the multiplication of
1953 * (i - Bias) by 0.301029995663981; since |i - Bias| <= 1077,
1954 * and 1077 * 0.30103 * 2^-52 ~=~ 7.2e-14,
1955 * adding 1e-13 to the constant term more than suffices.
1956 * Hence we adjust the constant term to 0.1760912590558.
1957 * (We could get a more accurate k by invoking log10,
1958 * but this is probably not worthwhile.)
1959 */
1960
1961 i -= Bias;
1962#ifndef Sudden_Underflow
1963 denorm = 0;
1964 } else {
1965 /* d is denormalized */
1966
1967 i = bbits + be + (Bias + (P - 1) - 1);
ba379fdc
A
1968 x = (i > 32) ? (word0(&u) << (64 - i)) | (word1(&u) >> (i - 32))
1969 : word1(&u) << (32 - i);
1970 dval(&d2) = x;
1971 word0(&d2) -= 31 * Exp_msk1; /* adjust exponent */
9dae56ea
A
1972 i -= (Bias + (P - 1) - 1) + 1;
1973 denorm = 1;
1974 }
1975#endif
ba379fdc 1976 ds = (dval(&d2) - 1.5) * 0.289529654602168 + 0.1760912590558 + (i * 0.301029995663981);
9dae56ea
A
1977 k = (int)ds;
1978 if (ds < 0. && ds != k)
1979 k--; /* want k = floor(ds) */
1980 k_check = 1;
1981 if (k >= 0 && k <= Ten_pmax) {
ba379fdc 1982 if (dval(&u) < tens[k])
9dae56ea
A
1983 k--;
1984 k_check = 0;
1985 }
1986 j = bbits - i - 1;
1987 if (j >= 0) {
1988 b2 = 0;
1989 s2 = j;
1990 } else {
1991 b2 = -j;
1992 s2 = 0;
1993 }
1994 if (k >= 0) {
1995 b5 = 0;
1996 s5 = k;
1997 s2 += k;
1998 } else {
1999 b2 -= k;
2000 b5 = -k;
2001 s5 = 0;
2002 }
2003
2004#ifndef SET_INEXACT
2005#ifdef Check_FLT_ROUNDS
2006 try_quick = Rounding == 1;
2007#else
2008 try_quick = 1;
2009#endif
2010#endif /*SET_INEXACT*/
2011
2012 leftright = 1;
2013 ilim = ilim1 = -1;
2014 i = 18;
2015 ndigits = 0;
ba379fdc 2016 s = s0 = result;
9dae56ea
A
2017
2018 if (ilim >= 0 && ilim <= Quick_max && try_quick) {
2019
2020 /* Try to get by with floating-point arithmetic. */
2021
2022 i = 0;
ba379fdc 2023 dval(&d2) = dval(&u);
9dae56ea
A
2024 k0 = k;
2025 ilim0 = ilim;
2026 ieps = 2; /* conservative */
2027 if (k > 0) {
2028 ds = tens[k & 0xf];
2029 j = k >> 4;
2030 if (j & Bletch) {
2031 /* prevent overflows */
2032 j &= Bletch - 1;
ba379fdc 2033 dval(&u) /= bigtens[n_bigtens - 1];
9dae56ea
A
2034 ieps++;
2035 }
2036 for (; j; j >>= 1, i++) {
2037 if (j & 1) {
2038 ieps++;
2039 ds *= bigtens[i];
2040 }
2041 }
ba379fdc 2042 dval(&u) /= ds;
9dae56ea 2043 } else if ((j1 = -k)) {
ba379fdc 2044 dval(&u) *= tens[j1 & 0xf];
9dae56ea
A
2045 for (j = j1 >> 4; j; j >>= 1, i++) {
2046 if (j & 1) {
2047 ieps++;
ba379fdc 2048 dval(&u) *= bigtens[i];
9dae56ea
A
2049 }
2050 }
2051 }
ba379fdc 2052 if (k_check && dval(&u) < 1. && ilim > 0) {
9dae56ea
A
2053 if (ilim1 <= 0)
2054 goto fast_failed;
2055 ilim = ilim1;
2056 k--;
ba379fdc 2057 dval(&u) *= 10.;
9dae56ea
A
2058 ieps++;
2059 }
ba379fdc
A
2060 dval(&eps) = (ieps * dval(&u)) + 7.;
2061 word0(&eps) -= (P - 1) * Exp_msk1;
9dae56ea 2062 if (ilim == 0) {
ba379fdc
A
2063 S.clear();
2064 mhi.clear();
2065 dval(&u) -= 5.;
2066 if (dval(&u) > dval(&eps))
9dae56ea 2067 goto one_digit;
ba379fdc 2068 if (dval(&u) < -dval(&eps))
9dae56ea
A
2069 goto no_digits;
2070 goto fast_failed;
2071 }
2072#ifndef No_leftright
2073 if (leftright) {
2074 /* Use Steele & White method of only
2075 * generating digits needed.
2076 */
ba379fdc 2077 dval(&eps) = (0.5 / tens[ilim - 1]) - dval(&eps);
9dae56ea 2078 for (i = 0;;) {
ba379fdc
A
2079 L = (long int)dval(&u);
2080 dval(&u) -= L;
9dae56ea 2081 *s++ = '0' + (int)L;
ba379fdc
A
2082 if (dval(&u) < dval(&eps))
2083 goto ret;
2084 if (1. - dval(&u) < dval(&eps))
9dae56ea
A
2085 goto bump_up;
2086 if (++i >= ilim)
2087 break;
ba379fdc
A
2088 dval(&eps) *= 10.;
2089 dval(&u) *= 10.;
9dae56ea
A
2090 }
2091 } else {
2092#endif
2093 /* Generate ilim digits, then fix them up. */
ba379fdc
A
2094 dval(&eps) *= tens[ilim - 1];
2095 for (i = 1;; i++, dval(&u) *= 10.) {
2096 L = (int32_t)(dval(&u));
2097 if (!(dval(&u) -= L))
9dae56ea
A
2098 ilim = i;
2099 *s++ = '0' + (int)L;
2100 if (i == ilim) {
ba379fdc 2101 if (dval(&u) > 0.5 + dval(&eps))
9dae56ea 2102 goto bump_up;
ba379fdc 2103 else if (dval(&u) < 0.5 - dval(&eps)) {
9dae56ea
A
2104 while (*--s == '0') { }
2105 s++;
ba379fdc 2106 goto ret;
9dae56ea
A
2107 }
2108 break;
2109 }
2110 }
2111#ifndef No_leftright
2112 }
2113#endif
2114fast_failed:
2115 s = s0;
ba379fdc 2116 dval(&u) = dval(&d2);
9dae56ea
A
2117 k = k0;
2118 ilim = ilim0;
2119 }
2120
2121 /* Do we have a "small" integer? */
2122
2123 if (be >= 0 && k <= Int_max) {
2124 /* Yes. */
2125 ds = tens[k];
2126 if (ndigits < 0 && ilim <= 0) {
ba379fdc
A
2127 S.clear();
2128 mhi.clear();
2129 if (ilim < 0 || dval(&u) <= 5 * ds)
9dae56ea
A
2130 goto no_digits;
2131 goto one_digit;
2132 }
ba379fdc
A
2133 for (i = 1;; i++, dval(&u) *= 10.) {
2134 L = (int32_t)(dval(&u) / ds);
2135 dval(&u) -= L * ds;
9dae56ea
A
2136#ifdef Check_FLT_ROUNDS
2137 /* If FLT_ROUNDS == 2, L will usually be high by 1 */
ba379fdc 2138 if (dval(&u) < 0) {
9dae56ea 2139 L--;
ba379fdc 2140 dval(&u) += ds;
9dae56ea
A
2141 }
2142#endif
2143 *s++ = '0' + (int)L;
ba379fdc 2144 if (!dval(&u)) {
9dae56ea
A
2145#ifdef SET_INEXACT
2146 inexact = 0;
2147#endif
2148 break;
2149 }
2150 if (i == ilim) {
ba379fdc
A
2151 dval(&u) += dval(&u);
2152 if (dval(&u) > ds || (dval(&u) == ds && (L & 1))) {
9dae56ea
A
2153bump_up:
2154 while (*--s == '9')
2155 if (s == s0) {
2156 k++;
2157 *s = '0';
2158 break;
2159 }
2160 ++*s++;
2161 }
2162 break;
2163 }
2164 }
ba379fdc 2165 goto ret;
9dae56ea
A
2166 }
2167
2168 m2 = b2;
2169 m5 = b5;
ba379fdc
A
2170 mhi.clear();
2171 mlo.clear();
9dae56ea
A
2172 if (leftright) {
2173 i =
2174#ifndef Sudden_Underflow
2175 denorm ? be + (Bias + (P - 1) - 1 + 1) :
2176#endif
2177 1 + P - bbits;
2178 b2 += i;
2179 s2 += i;
ba379fdc 2180 i2b(mhi, 1);
9dae56ea
A
2181 }
2182 if (m2 > 0 && s2 > 0) {
2183 i = m2 < s2 ? m2 : s2;
2184 b2 -= i;
2185 m2 -= i;
2186 s2 -= i;
2187 }
2188 if (b5 > 0) {
2189 if (leftright) {
2190 if (m5 > 0) {
ba379fdc
A
2191 pow5mult(mhi, m5);
2192 mult(b, mhi);
9dae56ea
A
2193 }
2194 if ((j = b5 - m5))
ba379fdc 2195 pow5mult(b, j);
9dae56ea 2196 } else
ba379fdc 2197 pow5mult(b, b5);
9dae56ea 2198 }
ba379fdc 2199 i2b(S, 1);
9dae56ea 2200 if (s5 > 0)
ba379fdc 2201 pow5mult(S, s5);
9dae56ea
A
2202
2203 /* Check for special case that d is a normalized power of 2. */
2204
2205 spec_case = 0;
ba379fdc 2206 if (!word1(&u) && !(word0(&u) & Bndry_mask)
9dae56ea 2207#ifndef Sudden_Underflow
ba379fdc 2208 && word0(&u) & (Exp_mask & ~Exp_msk1)
9dae56ea
A
2209#endif
2210 ) {
2211 /* The special case */
2212 b2 += Log2P;
2213 s2 += Log2P;
2214 spec_case = 1;
2215 }
2216
2217 /* Arrange for convenient computation of quotients:
2218 * shift left if necessary so divisor has 4 leading 0 bits.
2219 *
2220 * Perhaps we should just compute leading 28 bits of S once
2221 * and for all and pass them and a shift to quorem, so it
2222 * can do shifts and ors to compute the numerator for q.
2223 */
2224#ifdef Pack_32
ba379fdc 2225 if ((i = ((s5 ? 32 - hi0bits(S.words()[S.size() - 1]) : 1) + s2) & 0x1f))
9dae56ea
A
2226 i = 32 - i;
2227#else
ba379fdc 2228 if ((i = ((s5 ? 32 - hi0bits(S.words()[S.size() - 1]) : 1) + s2) & 0xf))
9dae56ea
A
2229 i = 16 - i;
2230#endif
2231 if (i > 4) {
2232 i -= 4;
2233 b2 += i;
2234 m2 += i;
2235 s2 += i;
2236 } else if (i < 4) {
2237 i += 28;
2238 b2 += i;
2239 m2 += i;
2240 s2 += i;
2241 }
2242 if (b2 > 0)
ba379fdc 2243 lshift(b, b2);
9dae56ea 2244 if (s2 > 0)
ba379fdc 2245 lshift(S, s2);
9dae56ea
A
2246 if (k_check) {
2247 if (cmp(b,S) < 0) {
2248 k--;
ba379fdc 2249 multadd(b, 10, 0); /* we botched the k estimate */
9dae56ea 2250 if (leftright)
ba379fdc 2251 multadd(mhi, 10, 0);
9dae56ea
A
2252 ilim = ilim1;
2253 }
2254 }
2255
2256 if (leftright) {
2257 if (m2 > 0)
ba379fdc 2258 lshift(mhi, m2);
9dae56ea
A
2259
2260 /* Compute mlo -- check for special case
2261 * that d is a normalized power of 2.
2262 */
2263
2264 mlo = mhi;
2265 if (spec_case) {
ba379fdc
A
2266 mhi = mlo;
2267 lshift(mhi, Log2P);
9dae56ea
A
2268 }
2269
2270 for (i = 1;;i++) {
2271 dig = quorem(b,S) + '0';
2272 /* Do we yet have the shortest decimal string
2273 * that will round to d?
2274 */
2275 j = cmp(b, mlo);
ba379fdc
A
2276 diff(delta, S, mhi);
2277 j1 = delta.sign ? 1 : cmp(b, delta);
2278 if (j1 == 0 && !(word1(&u) & 1)) {
9dae56ea
A
2279 if (dig == '9')
2280 goto round_9_up;
2281 if (j > 0)
2282 dig++;
2283#ifdef SET_INEXACT
2284 else if (!b->x[0] && b->wds <= 1)
2285 inexact = 0;
2286#endif
2287 *s++ = dig;
2288 goto ret;
2289 }
ba379fdc
A
2290 if (j < 0 || (j == 0 && !(word1(&u) & 1))) {
2291 if (!b.words()[0] && b.size() <= 1) {
9dae56ea
A
2292#ifdef SET_INEXACT
2293 inexact = 0;
2294#endif
2295 goto accept_dig;
2296 }
2297 if (j1 > 0) {
ba379fdc 2298 lshift(b, 1);
9dae56ea 2299 j1 = cmp(b, S);
ba379fdc 2300 if ((j1 > 0 || (j1 == 0 && (dig & 1))) && dig++ == '9')
9dae56ea
A
2301 goto round_9_up;
2302 }
2303accept_dig:
2304 *s++ = dig;
2305 goto ret;
2306 }
2307 if (j1 > 0) {
2308 if (dig == '9') { /* possible if i == 1 */
2309round_9_up:
2310 *s++ = '9';
2311 goto roundoff;
2312 }
2313 *s++ = dig + 1;
2314 goto ret;
2315 }
2316 *s++ = dig;
2317 if (i == ilim)
2318 break;
ba379fdc
A
2319 multadd(b, 10, 0);
2320 multadd(mlo, 10, 0);
2321 multadd(mhi, 10, 0);
9dae56ea
A
2322 }
2323 } else
2324 for (i = 1;; i++) {
2325 *s++ = dig = quorem(b,S) + '0';
ba379fdc 2326 if (!b.words()[0] && b.size() <= 1) {
9dae56ea
A
2327#ifdef SET_INEXACT
2328 inexact = 0;
2329#endif
2330 goto ret;
2331 }
2332 if (i >= ilim)
2333 break;
ba379fdc 2334 multadd(b, 10, 0);
9dae56ea
A
2335 }
2336
2337 /* Round off last digit */
2338
ba379fdc 2339 lshift(b, 1);
9dae56ea 2340 j = cmp(b, S);
ba379fdc 2341 if (j > 0 || (j == 0 && (dig & 1))) {
9dae56ea
A
2342roundoff:
2343 while (*--s == '9')
2344 if (s == s0) {
2345 k++;
2346 *s++ = '1';
2347 goto ret;
2348 }
2349 ++*s++;
2350 } else {
2351 while (*--s == '0') { }
2352 s++;
2353 }
2354 goto ret;
2355no_digits:
2356 k = -1 - ndigits;
2357 goto ret;
2358one_digit:
2359 *s++ = '1';
2360 k++;
2361 goto ret;
2362ret:
9dae56ea
A
2363#ifdef SET_INEXACT
2364 if (inexact) {
2365 if (!oldinexact) {
ba379fdc
A
2366 word0(&u) = Exp_1 + (70 << Exp_shift);
2367 word1(&u) = 0;
2368 dval(&u) += 1.;
9dae56ea
A
2369 }
2370 } else if (!oldinexact)
2371 clear_inexact();
2372#endif
9dae56ea
A
2373 *s = 0;
2374 *decpt = k + 1;
2375 if (rve)
2376 *rve = s;
9dae56ea
A
2377}
2378
2379} // namespace WTF