[1.9:Feature] faster bignum multiplication by karatsuba method

Yusuke_ENDOH · December 11, 2008, 8:10pm

e$B1sF#$G$9!#e(B

Python e$B$N%=!<%9$r;29M$K$7$F!"e(Bbignum e$B$N>h;;$re(B Karatsuba
e$BK!$J$I$Ge(B
e$B9bB.2=$7$F$_$^$7$?!#e(B

e$B%Y%s%A%^!<%/$9$k$H$3$s$J46$8$G$9!#e(B

                                    e$B5le(B    e$B?7e(B

e$BG\N(e(B
x = 10 ** 10; 500000.times { x * x } 1.11s 0.99s 112.13%
x = 10 ** 20; 500000.times { x * x } 1.28s 1.25s 102.52%
x = 10 ** 30; 500000.times { x * x } 1.52s 1.36s 111.19%
x = 10 ** 1000; 10000.times { x * x } 2.42s 1.51s 159.97%
x = 31000; 50000.times { x * x } 4.25s 2.65s 160.07%
x = 230000; 50000.times { x * x } 4.49s 2.42s 185.65%
50.times { 161000000 } 4.37s 4.21s 103.72%
10.times { 10100000 } 5.06s 1.98s 255.85%
(12345 ** 12345) * (54321 ** 54321) 8.84s 2.57s 344.45%

e$B$a$C$?$K;H$o$J$5$=$&$JBg$-$JCM$GFC$K8z2L$,$“$j$^$9$,!”>.$5$Je(B
e$BCM$G$bCY$/$O$J$i$J$$$h$&$K9)IW$7$?$D$b$j$G$9!#e(B

e$B%Q%C%A$NBg$^$+$JFbMF$O0J2<$N$H$*$j$G$9!#e(B

bigadd_core e$B!"e(Bbigsub_core
- bigadd e$B$He(B bigsub e$B$N7W;;ItJ,$r$/$/$j$@$7$?$b$Ne(B
  (bigmul1_karatsuba e$B$J$I$G;H$&e(B)
bigmul1_normal(x, y)
- e$BI.;;e(B (e$B=>Mh$HF1$8e(B)
bigmul1_balance(x, y)
- y e$B$N7e$re(B x e$B$N7e?t$GJ,3d$7$F!"8D!9$K>h;;$7$?7k2L$rB-$9e(B
bigmul1_karatsuba(x, y)
- Karatsuba e$BK!$K$h$k>h;;e(B
  (カラツバ法 - Wikipedia)
bigsqr_fast(x)
- e$BI.;;$h$je(B 2 e$BG\B.$$Fs>he(B
  (Handbook of Applied Cryptography, Algorithm 14.16
  Centre For Applied Cryptographic Research: The University of Waterloo)
big_sparse_p(x)
- sparse e$B$+$I$&$+$rH=CG$9$ke(B
  (e$B7e$re(B 3 e$B$D%i%s%@%`Cj=P$7!"e(B0 e$B$N?t$,e(B 1
  e$B8D0J2<$J$ie(B sparse)
bigmul0(x, y)
- x e$B$+e(B y e$B$,e(B KARATSUBA_MUL_DIGITS (= 70)
  e$B7e$h$j>.$5$1$l$Pe(B
  bigsqr_fast e$B$^$?$Oe(B bigmul1_normal
- x e$B$+e(B y e$B$,e(B sparse (e$B$[$H$s$I$N7e$,e(B 0) e$B$G$be(B
  bigsqr_fast e$B$^$?$Oe(B
  bigmul1_normal
- x e$B$He(B y e$B$N7e?t$N:9$,FsG\0J>e$J$ie(B bigmul1_balance
- e$B$=$l0J30$J$ie(B bigmul1_karatsuba

e$B0l1~e(B make test && make test-all e$B$ODL$C$F$$$^$9e(B (bignum
e$B$N%F%9%H$Oe(B
e$B=<<B$7$F$J$$$N$G$"$^$jEv$F$K$J$i$J$$$G$9$,e(B) e$B!#e(B

e$B$I$&$G$7$g$&$+!#e(B

Index: bignum.c

— bignum.c (revision 20645)
+++ bignum.c (working copy)
@@ -17,6 +17,7 @@
#ifdef HAVE_IEEEFP_H
#include <ieeefp.h>
#endif
+#include <assert.h>

VALUE rb_cBignum;

@@ -1380,12 +1381,36 @@
return bignorm(z);
}

+static void
+bigsub_core(BDIGIT *xds, long xn, BDIGIT *yds, long yn, BDIGIT *zds,
long zn)
+{

BDIGIT_DBL_SIGNED num;
long i;
for (i = 0, num = 0; i < yn; i++) {
num += (BDIGIT_DBL_SIGNED)xds[i] - yds[i];
zds[i] = BIGLO(num);
num = BIGDN(num);
}
while (num && i < xn) {
num += xds[i];
zds[i++] = BIGLO(num);
num = BIGDN(num);
}
while (i < xn) {
zds[i] = xds[i];
i++;
}
assert(i <= zn);
while (i < zn) {
zds[i++] = 0;
}
+}

static VALUE
bigsub(VALUE x, VALUE y)
{
VALUE z = 0;

BDIGIT *zds;
BDIGIT_DBL_SIGNED num;
long i = RBIGNUM_LEN(x);

/* if x is larger than y, swap */
@@ -1406,32 +1431,52 @@
}

z = bignew(RBIGNUM_LEN(x), z==0);
zds = BDIGITS(z);

bigsub_core(BDIGITS(x), RBIGNUM_LEN(x),
BDIGITS(y), RBIGNUM_LEN(y),
BDIGITS(z), RBIGNUM_LEN(z));

for (i = 0, num = 0; i < RBIGNUM_LEN(y); i++) {
num += (BDIGIT_DBL_SIGNED)BDIGITS(x)[i] - BDIGITS(y)[i];
zds[i] = BIGLO(num);

return z;
+}

+static void
+bigadd_core(BDIGIT *xds, long xn, BDIGIT *yds, long yn, BDIGIT *zds,
long zn)
+{

BDIGIT_DBL num = 0;
long i;
if (xn > yn) {
BDIGIT *tds;
tds = xds; xds = yds; yds = tds;
i = xn; xn = yn; yn = i;
}
i = 0;
while (i < xn) {
num += (BDIGIT_DBL)xds[i] + yds[i];
zds[i++] = BIGLO(num);
num = BIGDN(num);
}

while (num && i < RBIGNUM_LEN(x)) {
num += BDIGITS(x)[i];

while (num && i < yn) {
num += yds[i];
zds[i++] = BIGLO(num);
num = BIGDN(num);
}

while (i < RBIGNUM_LEN(x)) {
zds[i] = BDIGITS(x)[i];

while (i < yn) {
zds[i] = yds[i];
i++;
}

return z;

if (num) zds[i++] = (BDIGIT)num;
assert(i <= zn);
while (i < zn) {
zds[i++] = 0;
}
}

static VALUE
bigadd(VALUE x, VALUE y, int sign)
{
VALUE z;

BDIGIT_DBL num;
long i, len;

long len;

sign = (sign == RBIGNUM_SIGN(y));
if (RBIGNUM_SIGN(x) != sign) {
@@ -1441,30 +1486,15 @@

if (RBIGNUM_LEN(x) > RBIGNUM_LEN(y)) {
len = RBIGNUM_LEN(x) + 1;

z = x; x = y; y = z;
}
else {
len = RBIGNUM_LEN(y) + 1;
}
z = bignew(len, sign);
len = RBIGNUM_LEN(x);
for (i = 0, num = 0; i < len; i++) {
num += (BDIGIT_DBL)BDIGITS(x)[i] + BDIGITS(y)[i];
BDIGITS(z)[i] = BIGLO(num);
num = BIGDN(num);
}
len = RBIGNUM_LEN(y);
while (num && i < len) {
num += BDIGITS(y)[i];
BDIGITS(z)[i++] = BIGLO(num);
num = BIGDN(num);
}
while (i < len) {
BDIGITS(z)[i] = BDIGITS(y)[i];
i++;
}
BDIGITS(z)[i] = (BDIGIT)num;

bigadd_core(BDIGITS(x), RBIGNUM_LEN(x),
BDIGITS(y), RBIGNUM_LEN(y),
BDIGITS(z), RBIGNUM_LEN(z));

return z;
}
@@ -1519,24 +1549,20 @@
}
}

-static void
-rb_big_stop(void *ptr)
+static long
+big_real_len(VALUE x)
{

VALUE stop = (VALUE)ptr;
*stop = Qtrue;

long i = RBIGNUM_LEN(x);
while (–i && !BDIGITS(x)[i]);
return i + 1;
}

-struct big_mul_struct {

VALUE x, y, z, stop;
-};

static VALUE
-bigmul1(void *ptr)
+bigmul1_normal(VALUE x, VALUE y)
{

struct big_mul_struct bms = (struct big_mul_struct)ptr;
long i, j;
BDIGIT_DBL n = 0;
VALUE x = bms->x, y = bms->y, z = bms->z;

VALUE z = bignew(RBIGNUM_LEN(x) + RBIGNUM_LEN(y) + 1,
RBIGNUM_SIGN(x)==RBIGNUM_SIGN(y));
BDIGIT *zds;

j = RBIGNUM_LEN(x) + RBIGNUM_LEN(y) + 1;
@@ -1544,7 +1570,6 @@
while (j–) zds[j] = 0;
for (i = 0; i < RBIGNUM_LEN(x); i++) {
BDIGIT_DBL dd;

if (bms->stop) return Qnil;
dd = BDIGITS(x)[i];
if (dd == 0) continue;
n = 0;
@@ -1558,45 +1583,251 @@
zds[i + j] = n;
}
}

rb_thread_check_ints();
return z;
}

+static VALUE bigmul0(VALUE x, VALUE y);
+
+/* balancing multiplication by slicing larger argument */
static VALUE
-rb_big_mul0(VALUE x, VALUE y)
+bigmul1_balance(VALUE x, VALUE y)
{

struct big_mul_struct bms;
volatile VALUE z;

VALUE z, t1, t2;
long i, xn, yn, r, n;

switch (TYPE(y)) {
```
 case T_FIXNUM:
```
y = rb_int2big(FIX2LONG(y));
break;

xn = RBIGNUM_LEN(x);
yn = RBIGNUM_LEN(y);
assert(2 * xn <= yn);

```
 case T_BIGNUM:
```
break;

z = bignew(xn + yn, RBIGNUM_SIGN(x)==RBIGNUM_SIGN(y));
t1 = bignew(xn, 1);

```
 case T_FLOAT:
```
return DBL2NUM(rb_big2dbl(x) * RFLOAT_VALUE(y));

for (i = 0; i < xn + yn; i++) BDIGITS(z)[i] = 0;

```
 default:
```
return rb_num_coerce_bin(x, y, ‘*’);

n = 0;
while (yn > 0) {
r = xn > yn ? yn : xn;
MEMCPY(BDIGITS(t1), BDIGITS(y) + n, BDIGIT, r);
RBIGNUM_SET_LEN(t1, r);
t2 = bigmul0(x, t1);
bigadd_core(BDIGITS(z) + n, RBIGNUM_LEN(z) - n,
```
   BDIGITS(t2), big_real_len(t2),
```

   BDIGITS(z) + n, RBIGNUM_LEN(z) - n);

yn -= r;
n += r;
}
rb_gc_force_recycle(t1);

bms.x = x;
bms.y = y;
bms.z = bignew(RBIGNUM_LEN(x) + RBIGNUM_LEN(y) + 1,
RBIGNUM_SIGN(x)==RBIGNUM_SIGN(y));
bms.stop = Qfalse;

return z;
+}

if (RBIGNUM_LEN(x) + RBIGNUM_LEN(y) > 10000) {
z = rb_thread_blocking_region(bigmul1, &bms, rb_big_stop, &bms.stop);
+/* split a bignum into high and low bignums */
+static void
+big_split(VALUE v, long n, VALUE *ph, VALUE *pl)
+{

long hn, ln;
VALUE h, l;
ln = RBIGNUM_LEN(v) > n ? n : RBIGNUM_LEN(v);
hn = RBIGNUM_LEN(v) - ln;
while (–hn && !BDIGITS(v)[hn + ln]);
h = bignew(++hn, 1);
MEMCPY(BDIGITS(h), BDIGITS(v) + ln, BDIGIT, hn);
while (–ln && !BDIGITS(v)[ln]);
l = bignew(++ln, 1);
MEMCPY(BDIGITS(l), BDIGITS(v), BDIGIT, ln);
*pl = l;
*ph = h;
+}

+/* multiplication by karatsuba method */
+static VALUE
+bigmul1_karatsuba(VALUE x, VALUE y)
+{

long i, n, xn, yn, t1n, t2n;
VALUE xh, xl, yh, yl, z, t1, t2, t3;
BDIGIT *zds;
xn = RBIGNUM_LEN(x);
yn = RBIGNUM_LEN(y);
n = yn / 2;
big_split(x, n, &xh, &xl);
if (x == y) {
yh = xh; yl = xl;
}
else big_split(y, n, &yh, &yl);
/* x = xh * b + xl
```
* y = yh * b + yl
```
```
*
```
```
* Karatsuba method:
```
```
*   x * y = z2 * b^2 + z1 * b + z0
```
```
*   where
```
```
*     z2 = xh * yh
```
```
*     z0 = xl * yl
```

*     z1 = (xh + xl) * (yh + yl) - x2 - x0

```
*
```

*  ref: http://en.wikipedia.org/wiki/Karatsuba_algorithm

```
*/
```
/* allocate a result bignum */
z = bignew(xn + yn, RBIGNUM_SIGN(x)==RBIGNUM_SIGN(y));
zds = BDIGITS(z);
for (i = 0; i < xn + yn; i++) zds[i] = 0xdfdfdfdf;
/* t1 ← xh * yh */
t1 = bigmul0(xh, yh);
t1n = big_real_len(t1);
/* copy t1 into high bytes of the result (z2) */
MEMCPY(zds + 2 * n, BDIGITS(t1), BDIGIT, t1n);
for (i = 2 * n + t1n; i < xn + yn; i++) BDIGITS(z)[i] = 0;
/* t2 ← xl * yl */
if (BIGZEROP(xl) || BIGZEROP(yl)) {
```
 t2 = xl;
```
t2n = 0;
}
else {

z = bigmul1(&bms);

```
 t2 = bigmul0(xl, yl);
```
```
 t2n = big_real_len(t2);
```
}
/* copy t2 into low bytes of the result (z0) */
MEMCPY(zds, BDIGITS(t2), BDIGIT, t2n);
for (i = t2n; i < 2 * n; i++) BDIGITS(z)[i] = 0;
/* subtract t2 from middle bytes of the result (z1) */
i = xn + yn - n;
bigsub_core(zds + n, i, BDIGITS(t2), t2n, zds + n, i);
bigsub_core(zds + n, i, BDIGITS(t1), t1n, zds + n, i);
rb_gc_force_recycle(t1);
if (t2n) rb_gc_force_recycle(t2);
/* t1 ← xh + xl */
t1 = bigadd(xh, xl, 1);
/* t2 ← yh + yl */
t2 = (x == y) ? t1 : bigadd(yh, yl, 1);
/* t3 ← t1 * t2 */
t3 = bigmul0(t1, t2);
rb_gc_force_recycle(t1);
if (t1 != t2) rb_gc_force_recycle(t2);
/* add t3 to middle bytes of the result (z1) */
bigadd_core(zds + n, i, BDIGITS(t3), big_real_len(t3), zds + n, i);
rb_gc_force_recycle(t3);
return z;
}

+/* efficient squaring (2 times faster than normal multiplication)

- ref: Handbook of Applied Cryptography, Algorithm 14.16

 http://www.cacr.math.uwaterloo.ca/hac/about/chap14.pdf

*/
+static VALUE
+bigsqr_fast(VALUE x)
+{
long len = RBIGNUM_LEN(x), i, j;
VALUE z = bignew(2 * len + 1, 1);
BDIGIT *xds = BDIGITS(x), *zds = BDIGITS(z);
BDIGIT_DBL c, v, w;
for (i = 2 * len + 1; i–; ) zds[i] = 0;
for (i = 0; i < len; i++) {
v = (BDIGIT_DBL)xds[i];
if (!v) continue;
c = (BDIGIT_DBL)zds[i + i] + v * v;
zds[i + i] = BIGLO(c);
c = BIGDN(c);
v *= 2;
for (j = i + 1; j < len; j++) {
```
 w = (BDIGIT_DBL)xds[j];
```

 c += (BDIGIT_DBL)zds[i + j] + BIGLO(v) * w;

```
 zds[i + j] = BIGLO(c);
```
```
 c = BIGDN(c);
```
```
 if (BIGDN(v)) c += w;
```
}
if (c) {
```
 c += (BDIGIT_DBL)zds[i + len];
```
```
 zds[i + len] = BIGLO(c);
```
```
 c = BIGDN(c);
```
}
if (c) zds[i + len + 1] += c;
}
return z;
+}

+#define KARATSUBA_MUL_DIGITS 70
+
+
+/* determine whether a bignum is sparse or not by random sampling */
+static inline VALUE
+big_sparse_p(VALUE x)
+{

long c = 0, n = RBIGNUM_LEN(x);
unsigned long rb_rand_internal(unsigned long i);
if ( BDIGITS(x)[rb_rand_internal(n / 2) + n / 4]) c++;
if (c <= 1 && BDIGITS(x)[rb_rand_internal(n / 2) + n / 4]) c++;
if (c <= 1 && BDIGITS(x)[rb_rand_internal(n / 2) + n / 4]) c++;
return (c <= 1) ? Qtrue : Qfalse;
+}

+#if 0
+static void
+dump_bignum(VALUE x)
+{

long i;
printf(“0x0”);
for (i = RBIGNUM_LEN(x); i–; ) {
```
 printf("_%08x", BDIGITS(x)[i]);
```
}
puts(“”);
+}
+#endif

+static VALUE
+bigmul0(VALUE x, VALUE y)
+{

long xn, yn;
xn = RBIGNUM_LEN(x);
yn = RBIGNUM_LEN(y);
/* make sure that y is longer than x */
if (xn > yn) {
VALUE t;
long tn;
t = x; x = y; y = t;
tn = xn; xn = yn; yn = tn;
}
assert(xn <= yn);
/* normal multiplication when x is small */
if (xn < KARATSUBA_MUL_DIGITS) {
```
 normal:
```
if (x == y) return bigsqr_fast(x);
```
 return bigmul1_normal(x, y);
```
}
/* normal multiplication when x or y is a sparse bignum */
if (big_sparse_p(x)) goto normal;
if (big_sparse_p(y)) return bigmul1_normal(y, x);
/* balance multiplication by slicing y when x is much smaller than
y */
if (2 * xn <= yn) return bigmul1_balance(x, y);
/* multiplication by karatsuba method */
return bigmul1_karatsuba(x, y);
+}

/*

call-seq:
```
big * other  => Numeric
```

@@ -1607,7 +1838,22 @@
VALUE
rb_big_mul(VALUE x, VALUE y)
{

return bignorm(rb_big_mul0(x, y));

switch (TYPE(y)) {
```
 case T_FIXNUM:
```
y = rb_int2big(FIX2LONG(y));
break;
```
 case T_BIGNUM:
```
break;
```
 case T_FLOAT:
```
return DBL2NUM(rb_big2dbl(x) * RFLOAT_VALUE(y));
```
 default:
```
return rb_num_coerce_bin(x, y, ‘*’);
}
return bignorm(bigmul0(x, y));
}

struct big_div_struct {
@@ -1661,6 +1907,13 @@
return Qnil;
}

+static void
+rb_big_stop(void *ptr)
+{

VALUE stop = (VALUE)ptr;
*stop = Qtrue;
+}

static VALUE
bigdivrem(VALUE x, VALUE y, VALUE *divp, VALUE *modp)
{
@@ -2037,7 +2290,7 @@
BDIGIT_DBL num;

 if (len < 4000 / BITSPERDIG) {

return bigtrunc(rb_big_mul0(x, x));

return bigtrunc(bigmul0(x, x));
}

a = bignew(len - k, 1);
@@ -2054,7 +2307,7 @@
}
MEMCPY(BDIGITS(z) + 2 * k, BDIGITS(a2), BDIGIT, RBIGNUM_LEN(a2));
RBIGNUM_SET_LEN(z, len);

a2 = bigtrunc(rb_big_mul0(a, b));

a2 = bigtrunc(bigmul0(a, b));
len = RBIGNUM_LEN(a2);
for (i = 0, num = 0; i < len; i++) {
num += (BDIGIT_DBL)BDIGITS(z)[i + k] + ((BDIGIT_DBL)BDIGITS(a2)[i] <<
1);
@@ -2125,7 +2378,7 @@
for (mask = FIXNUM_MAX + 1; mask; mask >>= 1) {
if (z) z = bigtrunc(bigsqr(z));
if (yy & mask) {

   z = z ? bigtrunc(rb_big_mul0(z, x)) : x;

```
   z = z ? bigtrunc(bigmul0(z, x)) : x;
```
}
}
return bignorm(z);
Index: random.c
===================================================================
— random.c (revision 20645)
+++ random.c (working copy)
@@ -452,6 +452,16 @@
return rb_big_norm((VALUE)val);
}

+unsigned long
+rb_rand_internal(unsigned long i)
+{

struct MT *mt = &default_mt.mt;
if (!genrand_initialized(mt)) {
rand_init(mt, random_seed());
}
return limited_rand(mt, i);
+}

/*

call-seq:
```
rand(max=0)    => number
```

Yusuke_ENDOH · December 12, 2008, 1:27am

e$B$^$D$b$He(B e$B$f$-$R$m$G$9e(B

In message “Re: [ruby-dev:37392] [1.9:Feature] faster bignum
multiplication by karatsuba method”
on Fri, 12 Dec 2008 04:02:42 +0900, “Yusuke ENDOH” [email protected]
writes:

|Python e$B$N%=!<%9$r;29M$K$7$F!"e(Bbignum e$B$N>h;;$re(B Karatsuba e$BK!$J$I$Ge(B
|e$B9bB.2=$7$F$_$^$7$?!#e(B

|e$B0l1~e(B make test && make test-all e$B$ODL$C$F$$$^$9e(B (bignum e$B$N%F%9%H$Oe(B
|e$B=<<B$7$F$J$$$N$G$"$^$jEv$F$K$J$i$J$$$G$9$,e(B) e$B!#e(B
|
|e$B$I$&$G$7$g$&$+!#e(B

trunke$B$K%3%_%C%H$7$F$/$@$5$$!#e(B

Yusuke_ENDOH · December 12, 2008, 5:10am

e$B:XF#$H?=$7$^$9!#e(B

On Fri, 12 Dec 2008 04:02:42 +0900
“Yusuke ENDOH” [email protected] wrote:

e$B1sF#$G$9!#e(B

Python e$B$N%=!<%9$r;29M$K$7$F!"e(Bbignum e$B$N>h;;$re(B Karatsuba e$BK!$J$I$Ge(B
e$B9bB.2=$7$F$_$^$7$?!#e(B

e$B$*$)!“$9$P$i$7$$!#$”$j$,$H$&$4$6$$$^$9!#e(B

e$B0JA0e(B[ruby-dev:32629]e$B$G=q$$$F$$$i$C$7$c$C$?e(BFFTe$BHG$HHf$Y$F$O$I$&$J$N$G$7$g$&!#e(B
e$BAG?M9M$($G$O!"N>J}6&7e$,==J,$KBg$-$$>l9g$N$h$j87$7$$>r7o2<$G$O!"e(BKaratsubae$B$+$ie(B
e$B@Z$jBX$($l$PB.$/$J$k5$$,$7$^$9!#e(B

e$B$^$D$b$H$5$s$,!V%/%j%9%^%9$r2a$.$?$i<h$j9~$`!W$H8@$C$F$=$N$^$^$G$"$k$H;W$$$^$9!#e(B

Yusuke_ENDOH · December 14, 2008, 5:09am

e$B1sF#$G$9!#e(B

2008/12/12 13:02 Tadashi S. [email protected]:

e$B0JA0e(B[ruby-dev:32629]e$B$G=q$$$F$$$i$C$7$c$C$?e(BFFTe$BHG$HHf$Y$F$O$I$&$J$N$G$7$g$&!#e(B
e$BAG?M9M$($G$O!"N>J}6&7e$,==J,$KBg$-$$>l9g$N$h$j87$7$$>r7o2<$G$O!"e(BKaratsubae$B$+$ie(B
e$B@Z$jBX$($l$PB.$/$J$k5$$,$7$^$9!#e(B

e$B3P$($F$/$l$F$$$k?M$,$$$?$H$O!#$"$j$,$H$&$4$6$$$^$9!#e(B

e$B<B$O;d<+?H$,$b$&$"$s$^$j3P$($F$J$$$s$G$9$,!“K\Ev$K7e$,Bg$-$$>l9g$Oe(B
FFT e$B$Ne(B
e$BJ}$,Aa$$$O$:$J$N$G!”;n$7$F$$$^$;$s$,B?J,$=$NJ}K!$OM-8z$@$H;W$$$^$9!#e(B

e$B$?$@$“$N%Q%C%A$O!“e(Bdouble e$B7?$,e(B IEEE754
e$B$NG@:EY$G$”$k$3$He(B (e$BFC$K2>?tIt$,e(B
52bit e$B0J>e$”$k$3$He(B)
e$B$r2>Dj$7$F$$$k$?$a!“$=$&$G$J$$JQ$J4D6-$GF0$+$J$$$N$Ge(B
e$B%@%a!”$H8@$&%3%a%s%H$,$D$$$?5-21$,$"$j$^$9e(B (ML e$B$G$J$/e(B IRC
e$B$Ge(B) e$B!#e(B

e$B%3%s%Q%$%k;~$Ke(B double e$B7?$N2>?tIt$,e(B 52 bit
e$B0J>e$+$I$&$+$rH=Dj$G$-$l$P<h$je(B
e$B9~$a$k$+$b$7$l$^$;$s$,!"e(B

e$B!VJQ$J4D6-!W$G$A$c$s$HF0$/$+%F%9%H$r$9$k$N$,Fq$7$$e(B
Karatsuba e$B>h;;$G$b$^$"==J,$+$J$H;W$&e(B
e$B:#$H$J$C$F$O$“$N%Q%C%A$K$”$^$j<+?.$,$J$$e(B
(e$B8m:9I>2A$r$I$&$d$C$?$+$H$+e(B
e$BA4$/3P$($F$J$$e(B)

e$B$N$G!“@5D>$J$H$3$m!”;d<+?H$O:n6H$9$k5$$,$J$$$G$9!#e(B

Yusuke_ENDOH · December 16, 2008, 7:45am

e$B$J$+$@$G$9!#e(B

At Sun, 14 Dec 2008 13:01:52 +0900,
Yusuke ENDOH wrote in [ruby-dev:37435]:

e$B%3%s%Q%$%k;~$Ke(B double e$B7?$N2>?tIt$,e(B 52 bit e$B0J>e$+$I$&$+$rH=Dj$G$-$l$P<h$je(B
e$B9~$a$k$+$b$7$l$^$;$s$,!"e(B

#include <float.h>
#if DBL_MANT_DIG >= 52
…
#endif

e$B$G!#e(B

Yusuke_ENDOH · December 14, 2008, 5:03am

e$B1sF#$G$9!#e(B

2008/12/12 9:19 Yukihiro M. [email protected]:

|
|e$B$I$&$G$7$g$&$+!#e(B

trunke$B$K%3%_%C%H$7$F$/$@$5$$!#e(B

e$B$"$j$,$H$&$4$6$$$^$9!#e(B
e$B4JC1$J%F%9%H$H$H$b$K%3%_%C%H$7$^$7$?!#e(B

e$B$"$H!"e(Bbigsqr(x) e$B$,$J$s$+CY$$e(B (bigmul0(x, x)
e$B$7$?J}$,B.$$e(B) e$B$3$H$K5$$E$$$?$N$G!"e(B
e$B$b$&$A$g$C$HD4$Y$F$5$i$K=$@5$9$k$H;W$$$^$9!#e(B