80ビット拡張倍精度を使った０次第１種変形ベッセル関数の計算

/** _besi0q -- the 0th-order modified Bessel function of the first kind I0
   Rev. 0.4 (Feb. 19, 2023) (c) 2023, Takayuki HOSODA
   http://www.finetune.jp/~lyuka/technote/bessel/
   _besi0q(x) returns the 0th-order modified Bessel function
   of the first kind of real argument x.
 */
long double _besi0q(long double x) {
    int                 i;
    long double         a, p, q, r, s, t;
    /* The coefficients P32, P45 and Q3 used here are attributed to
       https://www.advanpix.com/2015/11/11/rational-approximations-for-the-
       modified-bessel-function-of-the-first-kind-i0-computations-double-precision/
     */
    const long double P32[33] = {
         1.00000000000000000000000000000000000e+00L,
         2.50000000000000000000000000000000000e-01L,
         2.77777777777777777777777777777777779e-02L,
         1.73611111111111111111111111111111083e-03L,
         6.94444444444444444444444444444449108e-05L,
         1.92901234567901234567901234567853905e-06L,
         3.93675988914084152179390274631572236e-08L,
         6.15118732678256487780297303953307469e-10L,
         7.59405842812662330592959640146193002e-12L,
         7.59405842812662330592959486994771411e-14L,
         6.27608134555919281481787961562157257e-16L,
         4.35838982330499501028963901609513258e-18L,
         2.57892888952958284633290216759752759e-20L,
         1.31578004567835859498063743807352147e-22L,
         5.84791131412603820814035808275571168e-25L,
         2.28434035708048361004361404800451548e-27L,
         7.90429189301205834423041758728181758e-30L,
         2.43959626327530221779537803521876900e-32L,
         6.75788438580533320595854894826703327e-35L,
         1.68947109644654239602153081596915483e-37L,
         3.83100021886675733871724163689480203e-40L,
         7.91528970342866904594413272561413611e-43L,
         1.49627405863018698139365798878928887e-45L,
         2.59769774665516078740718557214698854e-48L,
         4.15632134882805917464119034520347550e-51L,
         6.14832848022015178960667680429552612e-54L,
         8.43488878141065428604958554806851059e-57L,
         1.07486432616861166276174172563459685e-59L,
         1.28666328289305198822024236233461582e-62L,
         1.37245729295774874628038022579554422e-65L,
         1.71642649655915754818217188454585521e-68L,
         6.42133551177881248636744515323368258e-72L,
         2.93990539325117515154720726204799338e-74L}; /* [0L,15.5): */
    const long double P45[46] = {
         3.33094095073755755465308169515679754e-01L,
        -4.87305575020532173309650536123692992e+00L,
         1.16765891025166570372673307538545807e+00L,
         2.64107028015824651013530450189957215e+03L,
         3.29947497422711739169516563125826777e+02L,
         1.85360637074230573336349486640079127e+02L,
         1.92716946160432511352351625380961688e+02L,
         2.94374157084426440123892033050844719e+02L,
         5.94369974672125230816192833403509948e+02L,
         1.49338188597066557028520330783876602e+03L,
         4.49070212230053277828526595070904928e+03L,
         1.57364639902573996182985842231707641e+04L,
         6.09475654654342361774769290134171804e+04L,
         6.74843325301108470040298999048635726e+05L,
        -6.57083582192662169318674677284026011e+07L,
         9.83172447953771800483159480192563859e+09L,
        -1.23905750827828029147738416146512108e+12L,
         1.35560883142284024977500631878243972e+14L,
        -1.29343718391927120913858066893326175e+16L,
         1.08130315540350608880516332890283373e+18L,
        -7.95087530860069987411846664771880366e+19L,
         5.15861021545066736428201155306431096e+21L,
        -2.96090425993185982903689108288073850e+23L,
         1.50651836855858836083071762402341231e+25L,
        -6.80526037590684842951323289698851799e+26L,
         2.73203132967909651102779478756247727e+28L,
        -9.75309923194275182518137234542338189e+29L,
         3.09640722254712498146426101828630546e+31L,
        -8.73913695514222641997435352487537101e+32L,
         2.19076945578257225990373580600588103e+34L,
        -4.87120899281572328851130765475319009e+35L,
         9.58810466892032483163229870526807875e+36L,
        -1.66627420459640895942341335296132587e+38L,
         2.54807715779107313134088724774425453e+39L,
        -3.41409756541742494848545251263381364e+40L,
         3.98660860345465130692055711924224814e+41L,
        -4.02958459088507064758116007151695612e+42L,
         3.49565245578103887077950778697885925e+43L,
        -2.57418585602707614088803903097321313e+44L,
         1.58622500396250248773886354120038387e+45L,
        -8.02304482873909934532998282613480285e+45L,
         3.24266546042741906420052016688464442e+46L,
        -1.00665425805861133618962888863945150e+47L,
         2.25310991683789163051367847410612888e+47L,
        -3.23574657445200742953438267415045330e+47L,
         2.23881303334352384470482998051927380e+47L}; /* [15.5L,Inf): */
    const long double Q3[4] = {
         8.34943076824502833362836053862403964e-01L,
        -1.23193072119209042422963284443456931e+01L,
         4.40809330596253724239279903622218481e+00L,
         6.62043547609998683454530303968680120e+03L}; /* [15.5L,Inf): */
    p = q = 0;
    if ((a = fabsl((long double)x)) < 15.5L) {
        s = 0.25L * a * a;
        for (i = 0, t = 1.0L; i <= 32; i++, t *= s)
            p += P32[i] * t;
        return s * p + 1.0L;
    } else {
        r = 1.0L / a;
        for (i = 0, t = 1.0L; i <= 45; i++, t *= r)
            p += P45[i] * t;
        for (i = 0, t = 1.0L; i <= 3; i++, t *= r)
            q += Q3[i] * t;
        return expl(a) * p / (q * sqrtl(a));
    }
}

上記計算範囲での最大誤差 (0 ≤ x ≤ 40.0)
- gsl_sf_bessel_I0 : 8.182e-16 (x = 19.0859375)
- nr3_i0 : 5.534e-16 (x = 15.0009765625)
- _besi0p : 6.353e-17 (x = 33.8134765625)
- _besi0q : 2.494e-18 (x = 38.1123046875)

NAME
    besi0l(x) - the 0th-order modified Bessel function of the first kind I₀

SYNOPSIS
    #include <math.h>
    #include <float.h>
    long double besi0l(long double x);

RETURN VALUE
    besi0l(x) returns the 0th-order modified Bessel function of the first kind of real argument x.

/* besi0l.h -- include files for besi0l.c
   Rev. 1.4.3 (Mar. 5, 2023) (c) 2023, Takayuki HOSODA
   http://www.finetune.co.jp/~lyuka/technote/bessel/besi0.html

   Declares _besi0l() and defines the constants and coefficient tables
   it uses.  The tables are file-local (static), so each translation
   unit that includes this header gets its own copy.
 */
#ifndef BESI0L_H
#define BESI0L_H

#include <float.h>
#include <math.h>

long double expl(long double);
long double sqrtl(long double);
long double _besi0l(long double);

/* Series terms are split into two partial sums once a term drops below
   sum / SS_BORDER. */
#define SS_BORDER       512.0L
/* Arguments up to SX_CTRL use the power series; larger ones use the
   polynomial in 1/x below. */
#define SX_CTRL         24.0L
/* Number of coefficients in SXI0INF (polynomial of degree SX_NCOEF - 1). */
#define SX_NCOEF        28

/* Coefficients, lowest order first, of the polynomial in 1/x used for
   x > SX_CTRL.  The leading coefficient equals 1/sqrt(2*pi). */
static const long double SXI0INF[SX_NCOEF] = {
    3.98942280401432677939946059934381868e-1L,
    4.98677850501790847424932574917977336e-2L,
    2.80506290907257351676524573391362251e-2L,
    2.92194053028393074663046430616002345e-2L,
    4.47422143699726895577789846880753591e-2L,
    9.06029840991946963545024439933526022e-2L,
    2.28395022416719963726974910899909685e-1L,
    6.89263549793315604818906427537227441e-1L,
    2.42319216724212517319146790931056522L,
    9.72642411573575243128241980264935207L,
    4.38904888222575828461619193594552012e1L,
    2.19951199666086295854061436789997088e2L,
    1.21202275649332969277915104231154645e3L,
    7.28379060392626017295162886004535128e3L,
    4.74096727701986041614440842765451883e4L,
    3.32262789997808550831453957304787528e5L,
    2.49456672803042201053927541382735011e6L,
    1.99748762266553644814505215121910608e7L,
    1.69925162344811260345672839253014233e8L,
    1.53044438980293825929754024300905582e9L,
    1.45487869805641818274472419351048369e10L,
    1.45574469728145176499635795791138279e11L,
    1.52935905981443426902174196828303794e12L,
    1.68312613919795075802664537270279990e13L,
    1.93647168827514230441711438973983593e14L,
    2.32473426177430833645274582488267304e15L,
    2.90703548792066153034307302428838104e16L,
    3.78049198405978622163596857649354738e17L};

/* Number of entries in EXP_POW2N. */
#define EXP_NMAX        14

/* EXP_POW2N[n] = exp(2^n) for n = 0 .. EXP_NMAX - 1, used to assemble
   exp() of the integer part of the argument bit by bit.
   NOTE(review): the largest entries need the exponent range of an
   80-bit (or wider) long double; confirm behaviour on targets where
   long double is a 64-bit double. */
static const long double EXP_POW2N[EXP_NMAX] = {
    2.71828182845904523536028747135266250L,
    7.38905609893065022723042746057500781L,
    5.45981500331442390781102612028608784e1L,
    2.98095798704172827474359209945288867e3L,
    8.88611052050787263676302374078145035e6L,
    7.89629601826806951609780226351082242e13L,
    6.23514908081161688290923870892846974e27L,
    3.88770840599459509222267368835747807e55L,
    1.51142766500410354252008966570728651e111L,
    2.28441358653975664037875151712240342e222L,
    5.21854543436743420112120953369801690e444L,
    2.72332164505571925012480592774276919e889L,
    7.41648078242898890481921050372684935e1778L,
    5.50041871961385074607498352510634209e3557L};

#endif /* BESI0L_H */

/** _besi0l - zeroth-order modified Bessel function of the first kind.
   Rev. 1.4.3 (Mar. 5, 2023) (c) 2023, Takayuki HOSODA
   http://www.finetune.co.jp/~lyuka/technote/bessel/besi0.html

   _besi0l(x) returns the 0th-order modified Bessel function
   of the first kind of real argument x.

   SX_CTRL is the threshold value for switching formulas,
   and the standard setting is 24.0.
   For x <= SX_CTRL, use the infinite series, which is the definition
   of the zeroth-order modified Bessel function of the first kind.
   For x > SX_CTRL, use a 27th order polynomial approximation.
   The maximum error for 0 <= x < 768 is 6.5e-19.
   SS_BORDER is the threshold for computing an infinite series
   into two partial sums; SS_BORDER = 512 is appropriate when SX_CTRL = 24.

   Special values: returns 1 for x == 0, NaN for a NaN argument, and
   HUGE_VALL when |x| >= 2^EXP_NMAX (including +-infinity), where the
   bitwise exp() reduction below can no longer represent the integer part.
 */
#include "besi0l.h"

long double _besi0l(long double x) {
    int n, m;
    long double sum, term, d, sub, s, r;

    /* Propagate NaN instead of converting it to int further down. */
    if (isnan(x))
        return x;
    if (0.0L == (x = fabsl(x)))
        return 1.0L;
    if (x <= SX_CTRL) {
        s = 0.25L * x * x;
        /* Major part calculation */
        for (n = 1, sum = term = 1.0L; term > sum / SS_BORDER; sum += term, n++)
            term *= s / (long double)(n * n);
        /* Minor part calculation.  The term > 0 test stops the loop once
           the term has underflowed to zero; without it "0 >= eps * 0"
           stays true and n keeps growing until n * n overflows. */
        for (sub = 0.0L; term > 0.0L && term >= (LDBL_EPSILON) * sub; sub += term, n++)
            term *= s / (long double)(n * n);
        return sum + sub;
    } else {
        /* Only bits 0 .. EXP_NMAX-1 of the integer part are covered by
           EXP_POW2N; anything larger is far beyond the range of
           long double, and converting it to int could also overflow. */
        if (x >= (long double)(1L << EXP_NMAX))
            return HUGE_VALL;
        r = 1.0L / x;
        for (n = 0, sum = 0.0L, term = 1.0L; n < SX_NCOEF; n++, term *= r)
            sum += SXI0INF[n] * term;
        /* Range reduction for expl(): exp(x) = exp(m) * exp(x - m), with
           exp(m) built from the set bits of m.
           NOTE: d can overflow to infinity slightly before the final
           result would, since the 1/sqrt(x) factor is applied afterwards. */
        m = (int)floorl(x);
        d = 1.0L;
        for (n = 0; n < EXP_NMAX; n++)
            if ((1 << n) & m)
                d *= EXP_POW2N[n];
        return d * expl(x - (long double)m) / sqrtl(x) * sum;
    }
}

#ifdef DEBUG_BESI0L
/* A compile option of -ffast-math may be needed for gcc as follows.
 * gcc -Wall -O -ffast-math -DDEBUG_BESI0L besi0l.c -o besi0
 * NOTE(review): -ffast-math lets the compiler assume no NaN/infinity,
 * which may remove the isnan() guard in _besi0l -- confirm if NaN input
 * matters.
 */
#include <stdio.h>
#include <stdlib.h>
#ifdef __FreeBSD__
#include <floatingpoint.h>
#endif

/* Command-line driver: prints _besi0l(x) for the single argument x. */
int main(int argc, char *argv[]) {
    long double x;
    char *dummy;
#ifdef __FreeBSD__
    fpsetprec(FP_PE);
    fpsetround(FP_RN);
#endif
    if (argc == 2) {
        x = strtold(argv[1], &dummy);
        printf("besi0l(%.18Lg) ~= %18.18Lg\n", x, _besi0l(x));
    } else {
        printf("%s x\n", argv[0]);
    }
    return(0);
}
#endif

計算速度の比較
- _besi0l : 1283 [ms] (0 ≤ x ≤ 15.0, ittr = 10000000)
- _besi0q : 704 [ms] (0 ≤ x ≤ 15.0, ittr = 10000000)
- _besi0l : 1246 [ms] (0 ≤ x ≤ 128.0, ittr = 10000000)
- _besi0q : 1227 [ms] (0 ≤ x ≤ 128.0, ittr = 10000000)

.L25:
        fxch    %st(2)
.L9:
        movl    %eax, -128(%rsp)
        addl    $1, %eax
        fildl   -128(%rsp)
        fdivr   %st(4), %st
        fmul    %st(0), %st
        fmulp   %st, %st(2)
        fxch    %st(2)
        fadd    %st(1), %st
        fld     %st(0)
        fmul    %st(3), %st
        fcomip  %st(2), %st
        jb      .L25

I₀ の参照値
- I₀(1) ≃ 1.266065877752008335598244625214718
- I₀(2) ≃ 2.279585302336067267437204440811533
- I₀(4) ≃ 11.30192195213633049635627018321710
- I₀(8) ≃ 427.5641157218047851773967913180829
- I₀(16) ≃ 893446.2279201050170708640309761884
- I₀(32) ≃ 5590908381350.873086500103776088605
- I₀(64) ≃ 3.115457918187897557650694682306942 ×10²⁶
- I₀(128) ≃ 1.372222546128743649356014388474097 ×10⁵⁴

チェビシェフ (Chebyshev) 近似とパデ (Padé) 近似による I₀ の計算

無限級数と多項式近似による I₀ の計算

結論

おまけ

I₀ calculator
x		I₀ (x) ≈

チェビシェフ (Chebyshev) 近似とパデ (Padé) 近似による I0 の計算

無限級数と多項式近似による I0 の計算

結論

おまけ

チェビシェフ (Chebyshev) 近似とパデ (Padé) 近似による I₀ の計算

無限級数と多項式近似による I₀ の計算