URL
https://opencores.org/ocsvn/openrisc/openrisc/trunk
Subversion Repositories openrisc
[/] [openrisc/] [trunk/] [gnu-dev/] [or1k-gcc/] [libquadmath/] [math/] [erfq.c] - Rev 792
Go to most recent revision | Compare with Previous | Blame | View Log
/*
 * ====================================================
 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
 *
 * Developed at SunPro, a Sun Microsystems, Inc. business.
 * Permission to use, copy, modify, and distribute this
 * software is freely granted, provided that this notice
 * is preserved.
 * ====================================================
 */

/* Modifications and expansions for 128-bit long double are
   Copyright (C) 2001 Stephen L. Moshier <moshier@na-net.ornl.gov>
   and are incorporated herein by permission of the author.  The author
   reserves the right to distribute this material elsewhere under different
   copying permissions.  These modifications are distributed here under
   the following terms:

    This library is free software; you can redistribute it and/or
    modify it under the terms of the GNU Lesser General Public
    License as published by the Free Software Foundation; either
    version 2.1 of the License, or (at your option) any later version.

    This library is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
    Lesser General Public License for more details.

    You should have received a copy of the GNU Lesser General Public
    License along with this library; if not, write to the Free Software
    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA */

/* double erf(double x)
 * double erfc(double x)
 *                           x
 *                    2      |\
 *     erf(x)  =  ---------  | exp(-t*t)dt
 *                 sqrt(pi) \|
 *                           0
 *
 *     erfc(x) =  1-erf(x)
 *  Note that
 *              erf(-x) = -erf(x)
 *              erfc(-x) = 2 - erfc(x)
 *
 * Method:
 *      1.  erf(x)  = x + x*R(x^2) for |x| in [0, 7/8]
 *         Remark. The formula is derived by noting
 *          erf(x) = (2/sqrt(pi))*(x - x^3/3 + x^5/10 - x^7/42 + ....)
 *         and that
 *          2/sqrt(pi) = 1.128379167095512573896158903121545171688
 *         is close to one.
 *
 *      1a. erf(x)  = 1 - erfc(x), for |x| > 1.0
 *          erfc(x) = 1 - erf(x)  if |x| < 1/4
 *
 *      2. For |x| in [7/8, 1], let s = |x| - 1, and
 *         c = 0.84506291151 rounded to single (24 bits)
 *              erf(s + c)  = sign(x) * (c  + P1(s)/Q1(s))
 *         Remark: here we use the taylor series expansion at x=1.
 *              erf(1+s) = erf(1) + s*Poly(s)
 *                       = 0.845.. + P1(s)/Q1(s)
 *         Note that |P1/Q1|< 0.078 for x in [0.84375,1.25]
 *
 *      3. For x in [1/4, 5/4],
 *              erfc(s + const)  = erfc(const)  + s P1(s)/Q1(s)
 *              for const = 1/4, 3/8, ..., 9/8
 *              and 0 <= s <= 1/8 .
 *
 *      4. For x in [5/4, 107],
 *              erfc(x) = (1/x)*exp(-x*x-0.5625 + R(z))
 *              z=1/x^2
 *         The interval is partitioned into several segments
 *         of width 1/8 in 1/x.
 *
 *      Note1:
 *         To compute exp(-x*x-0.5625+R/S), let s be a single
 *         precision number and s := x; then
 *              -x*x = -s*s + (s-x)*(s+x)
 *              exp(-x*x-0.5625+R/S) =
 *                      exp(-s*s-0.5625)*exp((s-x)*(s+x)+R/S);
 *      Note2:
 *         Here 4 and 5 make use of the asymptotic series
 *                        exp(-x*x)
 *              erfc(x) ~ ---------- * ( 1 + Poly(1/x^2) )
 *                        x*sqrt(pi)
 *
 *      5. For inf > x >= 107
 *              erf(x)  = sign(x) *(1 - tiny)  (raise inexact)
 *              erfc(x) = tiny*tiny (raise underflow) if x > 0
 *                      = 2 - tiny if x<0
 *
 *      7. Special case:
 *              erf(0)  = 0, erf(inf)  = 1, erf(-inf) = -1,
 *              erfc(0) = 1, erfc(inf) = 0, erfc(-inf) = 2,
 *              erfc/erf(NaN) is NaN
 */

#include "quadmath-imp.h"

__float128 erfcq (__float128);

/* Evaluate P[n] x^n  +  P[n-1] x^(n-1)  +  ...  +  P[0]
   by Horner's rule.  P must hold n + 1 coefficients; n == 0 yields P[0].  */

static __float128
neval (__float128 x, const __float128 *p, int n)
{
  __float128 y = p[n];

  /* Indexed loop: never touches p[-1], even for a degree-0 polynomial.  */
  while (n > 0)
    y = y * x + p[--n];
  return y;
}


/* Evaluate x^(n+1)  +  P[n] x^(n)  +  P[n-1] x^(n-1)  +  ...  +  P[0]
   (monic polynomial: the leading coefficient 1.0 is implicit).
   P must hold n + 1 coefficients; n == 0 yields x + P[0].  */

static __float128
deval (__float128 x, const __float128 *p, int n)
{
  __float128 y = x + p[n];

  /* Indexed loop: never touches p[-1], even when n == 0.  */
  while (n > 0)
    y = y * x + p[--n];
  return y;
}



static const __float128
tiny = 1e-4931Q,
  half = 0.5Q,
  one = 1.0Q,
  two = 2.0Q,
  /* 2/sqrt(pi) - 1 */
  efx = 1.2837916709551257389615890312154517168810E-1Q,
  /* 8 * (2/sqrt(pi) - 1) */
  efx8 = 1.0270333367641005911692712249723613735048E0Q;


/* erf(x)  = x  + x R(x^2)
   0 <= x <= 7/8
   Peak relative error 1.8e-35  */
#define NTN1 8
static const __float128 TN1[NTN1 + 1] =
{
 -3.858252324254637124543172907442106422373E10Q,
  9.580319248590464682316366876952214879858E10Q,
  1.302170519734879977595901236693040544854E10Q,
  2.922956950426397417800321486727032845006E9Q,
  1.764317520783319397868923218385468729799E8Q,
  1.573436014601118630105796794840834145120E7Q,
  4.028077380105721388745632295157816229289E5Q,
  1.644056806467289066852135096352853491530E4Q,
  3.390868480059991640235675479463287886081E1Q
};
#define NTD1 8
static const __float128 TD1[NTD1 + 1] =
{
  -3.005357030696532927149885530689529032152E11Q,
  -1.342602283126282827411658673839982164042E11Q,
  -2.777153893355340961288511024443668743399E10Q,
  -3.483826391033531996955620074072768276974E9Q,
  -2.906321047071299585682722511260895227921E8Q,
  -1.653347985722154162439387878512427542691E7Q,
  -6.245520581562848778466500301865173123136E5Q,
  -1.402124304177498828590239373389110545142E4Q,
  -1.209368072473510674493129989468348633579E2Q
/* 1.0E0 */
};


/* erf(z+1)  = erf_const + P(z)/Q(z)
   -.125 <= z <= 0
   Peak relative error 7.3e-36  */
static const __float128 erf_const = 0.845062911510467529296875Q;
#define NTN2 8
static const __float128 TN2[NTN2 + 1] =
{
 -4.088889697077485301010486931817357000235E1Q,
  7.157046430681808553842307502826960051036E3Q,
 -2.191561912574409865550015485451373731780E3Q,
  2.180174916555316874988981177654057337219E3Q,
  2.848578658049670668231333682379720943455E2Q,
  1.630362490952512836762810462174798925274E2Q,
  6.317712353961866974143739396865293596895E0Q,
  2.450441034183492434655586496522857578066E1Q,
  5.127662277706787664956025545897050896203E-1Q
};
#define NTD2 8
static const __float128 TD2[NTD2 + 1] =
{
  1.731026445926834008273768924015161048885E4Q,
  1.209682239007990370796112604286048173750E4Q,
  1.160950290217993641320602282462976163857E4Q,
  5.394294645127126577825507169061355698157E3Q,
  2.791239340533632669442158497532521776093E3Q,
  8.989365571337319032943005387378993827684E2Q,
  2.974016493766349409725385710897298069677E2Q,
  6.148192754590376378740261072533527271947E1Q,
  1.178502892490738445655468927408440847480E1Q
 /* 1.0E0 */
};


/* erfc(x + 0.25) = erfc(0.25) + x R(x)
   0 <= x < 0.125
   Peak relative error 1.4e-35  */
#define NRNr13 8
static const __float128 RNr13[NRNr13 + 1] =
{
 -2.353707097641280550282633036456457014829E3Q,
  3.871159656228743599994116143079870279866E2Q,
 -3.888105134258266192210485617504098426679E2Q,
 -2.129998539120061668038806696199343094971E1Q,
 -8.125462263594034672468446317145384108734E1Q,
  8.151549093983505810118308635926270319660E0Q,
 -5.033362032729207310462422357772568553670E0Q,
 -4.253956621135136090295893547735851168471E-2Q,
 -8.098602878463854789780108161581050357814E-2Q
};
#define NRDr13 7
static const __float128 RDr13[NRDr13 + 1] =
{
  2.220448796306693503549505450626652881752E3Q,
  1.899133258779578688791041599040951431383E2Q,
  1.061906712284961110196427571557149268454E3Q,
  7.497086072306967965180978101974566760042E1Q,
  2.146796115662672795876463568170441327274E2Q,
  1.120156008362573736664338015952284925592E1Q,
  2.211014952075052616409845051695042741074E1Q,
  6.469655675326150785692908453094054988938E-1Q
 /* 1.0E0 */
};
/* erfc(0.25) = C13a + C13b to extra precision.  */
static const __float128 C13a = 0.723663330078125Q;
static const __float128 C13b = 1.0279753638067014931732235184287934646022E-5Q;


/* erfc(x + 0.375) = erfc(0.375) + x R(x)
   0 <= x < 0.125
   Peak relative error 1.2e-35  */
#define NRNr14 8
static const __float128 RNr14[NRNr14 + 1] =
{
 -2.446164016404426277577283038988918202456E3Q,
  6.718753324496563913392217011618096698140E2Q,
 -4.581631138049836157425391886957389240794E2Q,
 -2.382844088987092233033215402335026078208E1Q,
 -7.119237852400600507927038680970936336458E1Q,
  1.313609646108420136332418282286454287146E1Q,
 -6.188608702082264389155862490056401365834E0Q,
 -2.787116601106678287277373011101132659279E-2Q,
 -2.230395570574153963203348263549700967918E-2Q
};
#define NRDr14 7
static const __float128 RDr14[NRDr14 + 1] =
{
  2.495187439241869732696223349840963702875E3Q,
  2.503549449872925580011284635695738412162E2Q,
  1.159033560988895481698051531263861842461E3Q,
  9.493751466542304491261487998684383688622E1Q,
  2.276214929562354328261422263078480321204E2Q,
  1.367697521219069280358984081407807931847E1Q,
  2.276988395995528495055594829206582732682E1Q,
  7.647745753648996559837591812375456641163E-1Q
 /* 1.0E0 */
};
/* erfc(0.375) = C14a + C14b to extra precision.  */
static const __float128 C14a = 0.5958709716796875Q;
static const __float128 C14b = 1.2118885490201676174914080878232469565953E-5Q;

/* erfc(x + 0.5) = erfc(0.5) + x R(x)
   0 <= x < 0.125
   Peak relative error 4.7e-36  */
#define NRNr15 8
static const __float128 RNr15[NRNr15 + 1] =
{
 -2.624212418011181487924855581955853461925E3Q,
  8.473828904647825181073831556439301342756E2Q,
 -5.286207458628380765099405359607331669027E2Q,
 -3.895781234155315729088407259045269652318E1Q,
 -6.200857908065163618041240848728398496256E1Q,
  1.469324610346924001393137895116129204737E1Q,
 -6.961356525370658572800674953305625578903E0Q,
  5.145724386641163809595512876629030548495E-3Q,
  1.990253655948179713415957791776180406812E-2Q
};
#define NRDr15 7
static const __float128 RDr15[NRDr15 + 1] =
{
  2.986190760847974943034021764693341524962E3Q,
  5.288262758961073066335410218650047725985E2Q,
  1.363649178071006978355113026427856008978E3Q,
  1.921707975649915894241864988942255320833E2Q,
  2.588651100651029023069013885900085533226E2Q,
  2.628752920321455606558942309396855629459E1Q,
  2.455649035885114308978333741080991380610E1Q,
  1.378826653595128464383127836412100939126E0Q
  /* 1.0E0 */
};
/* erfc(0.5) = C15a + C15b to extra precision.  */
static const __float128 C15a = 0.4794921875Q;
static const __float128 C15b = 7.9346869534623172533461080354712635484242E-6Q;

/* erfc(x + 0.625) = erfc(0.625) + x R(x)
   0 <= x < 0.125
   Peak relative error 5.1e-36  */
#define NRNr16 8
static const __float128 RNr16[NRNr16 + 1] =
{
 -2.347887943200680563784690094002722906820E3Q,
  8.008590660692105004780722726421020136482E2Q,
 -5.257363310384119728760181252132311447963E2Q,
 -4.471737717857801230450290232600243795637E1Q,
 -4.849540386452573306708795324759300320304E1Q,
  1.140885264677134679275986782978655952843E1Q,
 -6.731591085460269447926746876983786152300E0Q,
  1.370831653033047440345050025876085121231E-1Q,
  2.022958279982138755020825717073966576670E-2Q,
};
#define NRDr16 7
static const __float128 RDr16[NRDr16 + 1] =
{
  3.075166170024837215399323264868308087281E3Q,
  8.730468942160798031608053127270430036627E2Q,
  1.458472799166340479742581949088453244767E3Q,
  3.230423687568019709453130785873540386217E2Q,
  2.804009872719893612081109617983169474655E2Q,
  4.465334221323222943418085830026979293091E1Q,
  2.612723259683205928103787842214809134746E1Q,
  2.341526751185244109722204018543276124997E0Q,
  /* 1.0E0 */
};
/* erfc(0.625) = C16a + C16b to extra precision.  */
static const __float128 C16a = 0.3767547607421875Q;
static const __float128 C16b = 4.3570693945275513594941232097252997287766E-6Q;

/* erfc(x + 0.75) = erfc(0.75) + x R(x)
   0 <= x < 0.125
   Peak relative error 1.7e-35  */
#define NRNr17 8
static const __float128 RNr17[NRNr17 + 1] =
{
  -1.767068734220277728233364375724380366826E3Q,
  6.693746645665242832426891888805363898707E2Q,
  -4.746224241837275958126060307406616817753E2Q,
  -2.274160637728782675145666064841883803196E1Q,
  -3.541232266140939050094370552538987982637E1Q,
  6.988950514747052676394491563585179503865E0Q,
  -5.807687216836540830881352383529281215100E0Q,
  3.631915988567346438830283503729569443642E-1Q,
  -1.488945487149634820537348176770282391202E-2Q
};
#define NRDr17 7
static const __float128 RDr17[NRDr17 + 1] =
{
  2.748457523498150741964464942246913394647E3Q,
  1.020213390713477686776037331757871252652E3Q,
  1.388857635935432621972601695296561952738E3Q,
  3.903363681143817750895999579637315491087E2Q,
  2.784568344378139499217928969529219886578E2Q,
  5.555800830216764702779238020065345401144E1Q,
  2.646215470959050279430447295801291168941E1Q,
  2.984905282103517497081766758550112011265E0Q,
  /* 1.0E0 */
};
/* erfc(0.75) = C17a + C17b to extra precision.  */
static const __float128 C17a = 0.2888336181640625Q;
static const __float128 C17b = 1.0748182422368401062165408589222625794046E-5Q;


/* erfc(x + 0.875) = erfc(0.875) + x R(x)
   0 <= x < 0.125
   Peak relative error 2.2e-35  */
#define NRNr18 8
static const __float128 RNr18[NRNr18 + 1] =
{
 -1.342044899087593397419622771847219619588E3Q,
  6.127221294229172997509252330961641850598E2Q,
 -4.519821356522291185621206350470820610727E2Q,
  1.223275177825128732497510264197915160235E1Q,
 -2.730789571382971355625020710543532867692E1Q,
  4.045181204921538886880171727755445395862E0Q,
 -4.925146477876592723401384464691452700539E0Q,
  5.933878036611279244654299924101068088582E-1Q,
 -5.557645435858916025452563379795159124753E-2Q
};
#define NRDr18 7
static const __float128 RDr18[NRDr18 + 1] =
{
  2.557518000661700588758505116291983092951E3Q,
  1.070171433382888994954602511991940418588E3Q,
  1.344842834423493081054489613250688918709E3Q,
  4.161144478449381901208660598266288188426E2Q,
  2.763670252219855198052378138756906980422E2Q,
  5.998153487868943708236273854747564557632E1Q,
  2.657695108438628847733050476209037025318E1Q,
  3.252140524394421868923289114410336976512E0Q,
  /* 1.0E0 */
};
/* erfc(0.875) = C18a + C18b to extra precision.  */
static const __float128 C18a = 0.215911865234375Q;
static const __float128 C18b = 1.3073705765341685464282101150637224028267E-5Q;

/* erfc(x + 1.0) = erfc(1.0) + x R(x)
   0 <= x < 0.125
   Peak relative error 1.6e-35  */
#define NRNr19 8
static const __float128 RNr19[NRNr19 + 1] =
{
 -1.139180936454157193495882956565663294826E3Q,
  6.134903129086899737514712477207945973616E2Q,
 -4.628909024715329562325555164720732868263E2Q,
  4.165702387210732352564932347500364010833E1Q,
 -2.286979913515229747204101330405771801610E1Q,
  1.870695256449872743066783202326943667722E0Q,
 -4.177486601273105752879868187237000032364E0Q,
  7.533980372789646140112424811291782526263E-1Q,
 -8.629945436917752003058064731308767664446E-2Q
};
#define NRDr19 7
static const __float128 RDr19[NRDr19 + 1] =
{
  2.744303447981132701432716278363418643778E3Q,
  1.266396359526187065222528050591302171471E3Q,
  1.466739461422073351497972255511919814273E3Q,
  4.868710570759693955597496520298058147162E2Q,
  2.993694301559756046478189634131722579643E2Q,
  6.868976819510254139741559102693828237440E1Q,
  2.801505816247677193480190483913753613630E1Q,
  3.604439909194350263552750347742663954481E0Q,
  /* 1.0E0 */
};
/* erfc(1.0) = C19a + C19b to extra precision.  */
static const __float128 C19a = 0.15728759765625Q;
static const __float128 C19b = 1.1609394035130658779364917390740703933002E-5Q;

/* erfc(x + 1.125) = erfc(1.125) + x R(x)
   0 <= x < 0.125
   Peak relative error 3.6e-36  */
#define NRNr20 8
static const __float128 RNr20[NRNr20 + 1] =
{
 -9.652706916457973956366721379612508047640E2Q,
  5.577066396050932776683469951773643880634E2Q,
 -4.406335508848496713572223098693575485978E2Q,
  5.202893466490242733570232680736966655434E1Q,
 -1.931311847665757913322495948705563937159E1Q,
 -9.364318268748287664267341457164918090611E-2Q,
 -3.306390351286352764891355375882586201069E0Q,
  7.573806045289044647727613003096916516475E-1Q,
 -9.611744011489092894027478899545635991213E-2Q
};
#define NRDr20 7
static const __float128 RDr20[NRDr20 + 1] =
{
  3.032829629520142564106649167182428189014E3Q,
  1.659648470721967719961167083684972196891E3Q,
  1.703545128657284619402511356932569292535E3Q,
  6.393465677731598872500200253155257708763E2Q,
  3.489131397281030947405287112726059221934E2Q,
  8.848641738570783406484348434387611713070E1Q,
  3.132269062552392974833215844236160958502E1Q,
  4.430131663290563523933419966185230513168E0Q
 /* 1.0E0 */
};
/* erfc(1.125) = C20a + C20b to extra precision.  */
static const __float128 C20a = 0.111602783203125Q;
static const __float128 C20b = 8.9850951672359304215530728365232161564636E-6Q;

/* erfc(1/x) = 1/x exp (-1/x^2 - 0.5625 + R(1/x^2))
   7/8 <= 1/x < 1
   Peak relative error 1.4e-35  */
#define NRNr8 9
static const __float128 RNr8[NRNr8 + 1] =
{
  3.587451489255356250759834295199296936784E1Q,
  5.406249749087340431871378009874875889602E2Q,
  2.931301290625250886238822286506381194157E3Q,
  7.359254185241795584113047248898753470923E3Q,
  9.201031849810636104112101947312492532314E3Q,
  5.749697096193191467751650366613289284777E3Q,
  1.710415234419860825710780802678697889231E3Q,
  2.150753982543378580859546706243022719599E2Q,
  8.740953582272147335100537849981160931197E0Q,
  4.876422978828717219629814794707963640913E-2Q
};
#define NRDr8 8
static const __float128 RDr8[NRDr8 + 1] =
{
  6.358593134096908350929496535931630140282E1Q,
  9.900253816552450073757174323424051765523E2Q,
  5.642928777856801020545245437089490805186E3Q,
  1.524195375199570868195152698617273739609E4Q,
  2.113829644500006749947332935305800887345E4Q,
  1.526438562626465706267943737310282977138E4Q,
  5.561370922149241457131421914140039411782E3Q,
  9.394035530179705051609070428036834496942E2Q,
  6.147019596150394577984175188032707343615E1Q
  /* 1.0E0 */
};

/* erfc(1/x) = 1/x exp (-1/x^2 - 0.5625 + R(1/x^2))
   0.75 <= 1/x <= 0.875
   Peak relative error 2.0e-36  */
#define NRNr7 9
static const __float128 RNr7[NRNr7 + 1] =
{
 1.686222193385987690785945787708644476545E1Q,
 1.178224543567604215602418571310612066594E3Q,
 1.764550584290149466653899886088166091093E4Q,
 1.073758321890334822002849369898232811561E5Q,
 3.132840749205943137619839114451290324371E5Q,
 4.607864939974100224615527007793867585915E5Q,
 3.389781820105852303125270837910972384510E5Q,
 1.174042187110565202875011358512564753399E5Q,
 1.660013606011167144046604892622504338313E4Q,
 6.700393957480661937695573729183733234400E2Q
};
#define NRDr7 9
static const __float128 RDr7[NRDr7 + 1] =
{
-1.709305024718358874701575813642933561169E3Q,
-3.280033887481333199580464617020514788369E4Q,
-2.345284228022521885093072363418750835214E5Q,
-8.086758123097763971926711729242327554917E5Q,
-1.456900414510108718402423999575992450138E6Q,
-1.391654264881255068392389037292702041855E6Q,
-6.842360801869939983674527468509852583855E5Q,
-1.597430214446573566179675395199807533371E5Q,
-1.488876130609876681421645314851760773480E4Q,
-3.511762950935060301403599443436465645703E2Q
 /* 1.0E0 */
};

/* erfc(1/x) = 1/x exp(-1/x^2 - 0.5625 + R(1/x^2))
   5/8 <= 1/x < 3/4
   Peak relative error 1.9e-35  */
#define NRNr6 9
static const __float128 RNr6[NRNr6 + 1] =
{
 1.642076876176834390623842732352935761108E0Q,
 1.207150003611117689000664385596211076662E2Q,
 2.119260779316389904742873816462800103939E3Q,
 1.562942227734663441801452930916044224174E4Q,
 5.656779189549710079988084081145693580479E4Q,
 1.052166241021481691922831746350942786299E5Q,
 9.949798524786000595621602790068349165758E4Q,
 4.491790734080265043407035220188849562856E4Q,
 8.377074098301530326270432059434791287601E3Q,
 4.506934806567986810091824791963991057083E2Q
};
#define NRDr6 9
static const __float128 RDr6[NRDr6 + 1] =
{
-1.664557643928263091879301304019826629067E2Q,
-3.800035902507656624590531122291160668452E3Q,
-3.277028191591734928360050685359277076056E4Q,
-1.381359471502885446400589109566587443987E5Q,
-3.082204287382581873532528989283748656546E5Q,
-3.691071488256738343008271448234631037095E5Q,
-2.300482443038349815750714219117566715043E5Q,
-6.873955300927636236692803579555752171530E4Q,
-8.262158817978334142081581542749986845399E3Q,
-2.517122254384430859629423488157361983661E2Q
 /* 1.00 */
};

/* erfc(1/x) = 1/x exp(-1/x^2 - 0.5625 + R(1/x^2))
   1/2 <= 1/x < 5/8
   Peak relative error 4.6e-36  */
#define NRNr5 10
static const __float128 RNr5[NRNr5 + 1] =
{
-3.332258927455285458355550878136506961608E-3Q,
-2.697100758900280402659586595884478660721E-1Q,
-6.083328551139621521416618424949137195536E0Q,
-6.119863528983308012970821226810162441263E1Q,
-3.176535282475593173248810678636522589861E2Q,
-8.933395175080560925809992467187963260693E2Q,
-1.360019508488475978060917477620199499560E3Q,
-1.075075579828188621541398761300910213280E3Q,
-4.017346561586014822824459436695197089916E2Q,
-5.857581368145266249509589726077645791341E1Q,
-2.077715925587834606379119585995758954399E0Q
};
#define NRDr5 9
static const __float128 RDr5[NRDr5 + 1] =
{
 3.377879570417399341550710467744693125385E-1Q,
 1.021963322742390735430008860602594456187E1Q,
 1.200847646592942095192766255154827011939E2Q,
 7.118915528142927104078182863387116942836E2Q,
 2.318159380062066469386544552429625026238E3Q,
 4.238729853534009221025582008928765281620E3Q,
 4.279114907284825886266493994833515580782E3Q,
 2.257277186663261531053293222591851737504E3Q,
 5.570475501285054293371908382916063822957E2Q,
 5.142189243856288981145786492585432443560E1Q
 /* 1.0E0 */
};

/* erfc(1/x) = 1/x exp(-1/x^2 - 0.5625 + R(1/x^2))
   3/8 <= 1/x < 1/2
   Peak relative error 2.0e-36  */
#define NRNr4 10
static const __float128 RNr4[NRNr4 + 1] =
{
 3.258530712024527835089319075288494524465E-3Q,
 2.987056016877277929720231688689431056567E-1Q,
 8.738729089340199750734409156830371528862E0Q,
 1.207211160148647782396337792426311125923E2Q,
 8.997558632489032902250523945248208224445E2Q,
 3.798025197699757225978410230530640879762E3Q,
 9.113203668683080975637043118209210146846E3Q,
 1.203285891339933238608683715194034900149E4Q,
 8.100647057919140328536743641735339740855E3Q,
 2.383888249907144945837976899822927411769E3Q,
 2.127493573166454249221983582495245662319E2Q
};
#define NRDr4 10
static const __float128 RDr4[NRDr4 + 1] =
{
-3.303141981514540274165450687270180479586E-1Q,
-1.353768629363605300707949368917687066724E1Q,
-2.206127630303621521950193783894598987033E2Q,
-1.861800338758066696514480386180875607204E3Q,
-8.889048775872605708249140016201753255599E3Q,
-2.465888106627948210478692168261494857089E4Q,
-3.934642211710774494879042116768390014289E4Q,
-3.455077258242252974937480623730228841003E4Q,
-1.524083977439690284820586063729912653196E4Q,
-2.810541887397984804237552337349093953857E3Q,
-1.343929553541159933824901621702567066156E2Q
 /* 1.0E0 */
};

/* erfc(1/x) = 1/x exp(-1/x^2 - 0.5625 + R(1/x^2))
   1/4 <= 1/x < 3/8
   Peak relative error 8.4e-37  */
#define NRNr3 11
static const __float128 RNr3[NRNr3 + 1] =
{
-1.952401126551202208698629992497306292987E-6Q,
-2.130881743066372952515162564941682716125E-4Q,
-8.376493958090190943737529486107282224387E-3Q,
-1.650592646560987700661598877522831234791E-1Q,
-1.839290818933317338111364667708678163199E0Q,
-1.216278715570882422410442318517814388470E1Q,
-4.818759344462360427612133632533779091386E1Q,
-1.120994661297476876804405329172164436784E2Q,
-1.452850765662319264191141091859300126931E2Q,
-9.485207851128957108648038238656777241333E1Q,
-2.563663855025796641216191848818620020073E1Q,
-1.787995944187565676837847610706317833247E0Q
};
#define NRDr3 10
static const __float128 RDr3[NRDr3 + 1] =
{
 1.979130686770349481460559711878399476903E-4Q,
 1.156941716128488266238105813374635099057E-2Q,
 2.752657634309886336431266395637285974292E-1Q,
 3.482245457248318787349778336603569327521E0Q,
 2.569347069372696358578399521203959253162E1Q,
 1.142279000180457419740314694631879921561E2Q,
 3.056503977190564294341422623108332700840E2Q,
 4.780844020923794821656358157128719184422E2Q,
 4.105972727212554277496256802312730410518E2Q,
 1.724072188063746970865027817017067646246E2Q,
 2.815939183464818198705278118326590370435E1Q
 /* 1.0E0 */
};

/* erfc(1/x) = 1/x exp(-1/x^2 - 0.5625 + R(1/x^2))
   1/8 <= 1/x < 1/4
   Peak relative error 1.5e-36  */
#define NRNr2 11
static const __float128 RNr2[NRNr2 + 1] =
{
-2.638914383420287212401687401284326363787E-8Q,
-3.479198370260633977258201271399116766619E-6Q,
-1.783985295335697686382487087502222519983E-4Q,
-4.777876933122576014266349277217559356276E-3Q,
-7.450634738987325004070761301045014986520E-2Q,
-7.068318854874733315971973707247467326619E-1Q,
-4.113919921935944795764071670806867038732E0Q,
-1.440447573226906222417767283691888875082E1Q,
-2.883484031530718428417168042141288943905E1Q,
-2.990886974328476387277797361464279931446E1Q,
-1.325283914915104866248279787536128997331E1Q,
-1.572436106228070195510230310658206154374E0Q
};
#define NRDr2 10
static const __float128 RDr2[NRDr2 + 1] =
{
 2.675042728136731923554119302571867799673E-6Q,
 2.170997868451812708585443282998329996268E-4Q,
 7.249969752687540289422684951196241427445E-3Q,
 1.302040375859768674620410563307838448508E-1Q,
 1.380202483082910888897654537144485285549E0Q,
 8.926594113174165352623847870299170069350E0Q,
 3.521089584782616472372909095331572607185E1Q,
 8.233547427533181375185259050330809105570E1Q,
 1.072971579885803033079469639073292840135E2Q,
 6.943803113337964469736022094105143158033E1Q,
 1.775695341031607738233608307835017282662E1Q
 /* 1.0E0 */
};

/* erfc(1/x) = 1/x exp(-1/x^2 - 0.5625 + R(1/x^2))
   1/128 <= 1/x < 1/8
   Peak relative error 2.2e-36  */
#define NRNr1 9
static const __float128 RNr1[NRNr1 + 1] =
{
-4.250780883202361946697751475473042685782E-8Q,
-5.375777053288612282487696975623206383019E-6Q,
-2.573645949220896816208565944117382460452E-4Q,
-6.199032928113542080263152610799113086319E-3Q,
-8.262721198693404060380104048479916247786E-2Q,
-6.242615227257324746371284637695778043982E-1Q,
-2.609874739199595400225113299437099626386E0Q,
-5.581967563336676737146358534602770006970E0Q,
-5.124398923356022609707490956634280573882E0Q,
-1.290865243944292370661544030414667556649E0Q
};
#define NRDr1 8
static const __float128 RDr1[NRDr1 + 1] =
{
 4.308976661749509034845251315983612976224E-6Q,
 3.265390126432780184125233455960049294580E-4Q,
 9.811328839187040701901866531796570418691E-3Q,
 1.511222515036021033410078631914783519649E-1Q,
 1.289264341917429958858379585970225092274E0Q,
 6.147640356182230769548007536914983522270E0Q,
 1.573966871337739784518246317003956180750E1Q,
 1.955534123435095067199574045529218238263E1Q,
 9.472613121363135472247929109615785855865E0Q
 /* 1.0E0 */
};


/* Error function erf(x) for a 128-bit floating-point argument.
   Dispatches on the high 32 bits of X (sign, exponent, top of mantissa):
   NaN/Inf, |x| >= 1 (via erfcq), tiny |x|, |x| < 7/8, and 7/8 <= |x| < 1.  */

__float128
erfq (__float128 x)
{
  __float128 a, y, z;
  int32_t i, ix, sign;
  ieee854_float128 u;

  u.value = x;
  sign = u.words32.w0;
  ix = sign & 0x7fffffff;

  if (ix >= 0x7fff0000)
    {				/* erf(nan)=nan */
      /* 0xffff0000 is an unsigned constant, so the shift is logical:
	 i is 0 for a clear sign bit and 2 for a set one.  */
      i = ((sign & 0xffff0000) >> 31) << 1;
      return (__float128) (1 - i) + one / x;	/* erf(+-inf)=+-1 */
    }

  if (ix >= 0x3fff0000)		/* |x| >= 1.0 */
    {
      /* x >= 16: the result is 1 to working precision; returning it
	 directly avoids a spurious underflow raised inside erfcq.  */
      if (ix >= 0x40030000 && sign > 0)
	return one;
      y = erfcq (x);
      return (one - y);
      /*    return (one - erfcq (x)); */
    }

  u.words32.w0 = ix;		/* clear the sign bit */
  a = u.value;			/* a = |x| */
  z = x * x;
  if (ix < 0x3ffec000)		/* a < 0.875 */
    {
      if (ix < 0x3fc60000)	/* |x|<2**-57 */
	{
	  if (ix < 0x00080000)
	    return 0.125 * (8.0 * x + efx8 * x);	/*avoid underflow */
	  return x + efx * x;
	}
      y = a + a * neval (z, TN1, NTN1) / deval (z, TD1, NTD1);
    }
  else
    {
      a = a - one;
      y = erf_const + neval (a, TN2, NTN2) / deval (a, TD2, NTD2);
    }

  if (sign & 0x80000000)	/* x < 0 */
    y = -y;
  return( y );
}


/* Complementary error function erfc(x) = 1 - erf(x) for a 128-bit
   floating-point argument.  Dispatches on the high 32 bits of X:
   NaN/Inf, |x| < 1/4 (via erfq), 1/4 <= |x| < 5/4 (eight table segments
   of width 1/8), 5/4 <= |x| < 107 (asymptotic form), and |x| >= 107.  */

__float128
erfcq (__float128 x)
{
  __float128 y = 0.0Q, z, p, r;
  int32_t i, ix, sign;
  ieee854_float128 u;

  u.value = x;
  sign = u.words32.w0;
  ix = sign & 0x7fffffff;
  u.words32.w0 = ix;		/* u.value is now |x| */

  if (ix >= 0x7fff0000)
    {				/* erfc(nan)=nan */
      /* erfc(+-inf)=0,2 */
      return (__float128) (((uint32_t) sign >> 31) << 1) + one / x;
    }

  if (ix < 0x3ffd0000)		/* |x| <1/4 */
    {
      if (ix < 0x3f8d0000)	/* |x|<2**-114 */
	return one - x;
      return one - erfq (x);
    }

  if (ix < 0x3fff4000)		/* 1.25 */
    {
      x = u.value;
      i = 8.0 * x;		/* segment index, 2 .. 9 */
      switch (i)
	{
	case 2:
	  z = x - 0.25Q;
	  y = C13b + z * neval (z, RNr13, NRNr13) / deval (z, RDr13, NRDr13);
	  y += C13a;
	  break;
	case 3:
	  z = x - 0.375Q;
	  y = C14b + z * neval (z, RNr14, NRNr14) / deval (z, RDr14, NRDr14);
	  y += C14a;
	  break;
	case 4:
	  z = x - 0.5Q;
	  y = C15b + z * neval (z, RNr15, NRNr15) / deval (z, RDr15, NRDr15);
	  y += C15a;
	  break;
	case 5:
	  z = x - 0.625Q;
	  y = C16b + z * neval (z, RNr16, NRNr16) / deval (z, RDr16, NRDr16);
	  y += C16a;
	  break;
	case 6:
	  z = x - 0.75Q;
	  y = C17b + z * neval (z, RNr17, NRNr17) / deval (z, RDr17, NRDr17);
	  y += C17a;
	  break;
	case 7:
	  z = x - 0.875Q;
	  y = C18b + z * neval (z, RNr18, NRNr18) / deval (z, RDr18, NRDr18);
	  y += C18a;
	  break;
	case 8:
	  z = x - 1.0Q;
	  y = C19b + z * neval (z, RNr19, NRNr19) / deval (z, RDr19, NRDr19);
	  y += C19a;
	  break;
	case 9:
	  z = x - 1.125Q;
	  y = C20b + z * neval (z, RNr20, NRNr20) / deval (z, RDr20, NRDr20);
	  y += C20a;
	  break;
	}
      if (sign & 0x80000000)
	y = 2.0Q - y;		/* erfc(-x) = 2 - erfc(x) */
      return y;
    }

  /* 1.25 < |x| < 107 */
  if (ix < 0x4005ac00)
    {
      /* x < -9 */
      if ((ix >= 0x40022000) && (sign & 0x80000000))
	return two - tiny;

      x = fabsq (x);
      z = one / (x * x);
      i = 8.0 / x;		/* segment index in 1/x, width 1/8 */
      switch (i)
	{
	default:
	case 0:
	  p = neval (z, RNr1, NRNr1) / deval (z, RDr1, NRDr1);
	  break;
	case 1:
	  p = neval (z, RNr2, NRNr2) / deval (z, RDr2, NRDr2);
	  break;
	case 2:
	  p = neval (z, RNr3, NRNr3) / deval (z, RDr3, NRDr3);
	  break;
	case 3:
	  p = neval (z, RNr4, NRNr4) / deval (z, RDr4, NRDr4);
	  break;
	case 4:
	  p = neval (z, RNr5, NRNr5) / deval (z, RDr5, NRDr5);
	  break;
	case 5:
	  p = neval (z, RNr6, NRNr6) / deval (z, RDr6, NRDr6);
	  break;
	case 6:
	  p = neval (z, RNr7, NRNr7) / deval (z, RDr7, NRDr7);
	  break;
	case 7:
	  p = neval (z, RNr8, NRNr8) / deval (z, RDr8, NRDr8);
	  break;
	}
      /* Truncate x to a short mantissa (z) so that z*z is exact; the
	 remainder (z - x) * (z + x) goes into the second exponential
	 (see Note1 in the header comment).  */
      u.value = x;
      u.words32.w3 = 0;
      u.words32.w2 &= 0xfe000000;
      z = u.value;
      r = expq (-z * z - 0.5625) *
	expq ((z - x) * (z + x) + p);
      if ((sign & 0x80000000) == 0)
	return r / x;
      else
	return two - r / x;
    }
  else
    {
      if ((sign & 0x80000000) == 0)
	return tiny * tiny;	/* underflows to 0 */
      else
	return two - tiny;
    }
}
Go to most recent revision | Compare with Previous | Blame | View Log