// Series evaluation that the public wrappers in this file select for lanes
// with x <= a+1 (they call detail::gamma<MaxTerm, ...>(a, x)).
//   MaxTerms  - upper bound on the number of loop iterations.
//   Normalize - when true, lgamma(a) is folded into the final exponent.
// NOTE(review): this listing omits several body lines; the declarations of
// result_t, ap, term, sum_series and norm are not visible here.
45 template<
size_t MaxTerms,
bool Normalize,
typename TA,
typename TX>
46 inline auto gamma(
const TA& a,
const TX& x)
// Lanes with a valid argument pair: x >= 0 and a > 0.
51 auto mask = (
x >= 0) && (a > 0);
// Nothing valid to evaluate: return zero.
54 if(bbm::none(mask))
return result_t(0);
// Machine epsilon of the underlying scalar type; used as the relative
// convergence threshold below.
59 const auto epsilon = std::numeric_limits<scalar_t<result_t>>::epsilon();
// Invalid lanes start out flagged as converged so they never keep the loop alive.
66 auto converged = !mask;
// Runs at most MaxTerms times and stops early once every lane has converged;
// ap is incremented together with the counter.
67 for(
size_t m=1; m <= MaxTerms && bbm::any(!converged); ++m, ++ap)
// Multiply the running term by x/ap; lanes already converged multiply by 0.
70 term *=
bbm::select(converged, 0, x * bbm::rcp(ap));
// A lane converges once its term is below epsilon relative to the running sum.
76 converged |= bbm::abs(term) < bbm::abs(sum_series)*epsilon;
// Only the normalized variant assigns lgamma(a) to norm.
// NOTE(review): norm's initial value is set in a line not shown - presumably 0; confirm.
81 if constexpr (Normalize) norm = bbm::lgamma(
result_t(a));
// Scale the series sum by exp(-x + a*log(x) - norm).
85 sum_series *= bbm::exp(-x + a*bbm::log(x) - norm);
// Iterative evaluation that the public wrappers in this file select for lanes
// with x > a+1 (they call detail::Gamma<MaxTerm, ...>(a, x)).
//   MaxTerms  - bounds the number of loop iterations.
//   Normalize - when true, lgamma(a) is folded into the final exponent.
// NOTE(review): this listing omits several body lines; the declarations of
// result_t, Gamma, delta and norm, and the computation of delta, are not
// visible here.
101 template<
size_t MaxTerms,
bool Normalize,
typename TA,
typename TX>
102 inline auto Gamma(
const TA& a,
const TX& x)
// Lanes with a valid argument pair: x >= 0 and a > 0.
107 auto mask = (
x >= 0) && (a > 0);
// Nothing valid to evaluate: return zero.
110 if(bbm::none(mask))
return result_t(0);
// Machine epsilon of the underlying scalar type (convergence threshold).
113 const auto epsilon = std::numeric_limits<scalar_t<result_t>>::epsilon();
// Smallest normalized positive value divided by epsilon; it is consumed in
// lines not shown - presumably as a floor that avoids division by zero; confirm.
114 const auto tiny = std::numeric_limits<scalar_t<result_t>>::min() / epsilon;
// Invalid lanes start out flagged as converged so they never keep the loop alive.
122 auto converged = !mask;
// NOTE(review): the bound here is `k < MaxTerms` starting from 1 (at most
// MaxTerms-1 iterations), whereas detail::gamma loops with `m <= MaxTerms`;
// confirm the difference is intended.
123 for(
size_t k=1; k < MaxTerms && bbm::any(!converged); ++k)
// Multiply the running value by delta, leaving converged lanes untouched.
139 Gamma =
bbm::select(converged, Gamma, Gamma * delta);
// A lane converges once delta is within epsilon of 1.
142 converged |= bbm::abs(delta-1) <= epsilon;
// Only the normalized variant assigns lgamma(a) to norm.
// NOTE(review): norm's initial value is set in a line not shown - presumably 0; confirm.
147 if constexpr (Normalize) norm = bbm::lgamma(
result_t(a));
// Valid lanes get exp(-x + a*log(x) - norm) * Gamma; invalid lanes get 0.
150 return bbm::select(mask, bbm::exp(-x + a*bbm::log(x) - norm) * Gamma, 0);
// Predicate the public wrappers in this file evaluate first: lanes where it
// holds are routed to detail::gamma_large.
// NOTE(review): result_t and sigma are defined in lines not shown here.
157 template<
typename TA,
typename TX>
158 inline auto gamma_is_large(
const TA& a,
const TX& x)
// True when either
//   * a > 200 and sigma^2 < 20/a, or
//   * a > 20, sigma < 0.4 and the scalar type reports numeric_limits::digits <= 64.
162 auto result = ((a > 200) && (20/a > sigma*sigma)) || ((a > 20) && (sigma < 0.4) && (std::numeric_limits<scalar_t<result_t>>::digits <= 64));
// Evaluation used by the public wrappers for lanes where gamma_is_large holds.
//   normalize - selects between the <true> and <false> instantiations used by
//               the normalized and unnormalized wrappers respectively; its
//               effect is in lines not shown in this listing.
// NOTE(review): result_t, phi and y are defined in lines not shown here.
176 template<
bool normalize,
typename TA,
typename TX>
177 inline auto gamma_large(
const TA& a ,
const TX& x)
// z = sign(x - a) * sqrt(2*phi); it is the variable of the inner polynomials below.
186 result_t z = bbm::sign(x-a) * bbm::safe_sqrt(2*phi);
// Generic lambda evaluating a two-level polynomial: fourteen inner polynomials
// c0..c13 in z, which then serve as the coefficients of an outer polynomial in
// 1/a. IDX must supply at least 15 compile-time values: idx[0..13] are the
// template arguments of the inner bbm::poly calls and idx[14] that of the outer
// call.
// NOTE(review): idx[k] is presumably the number of leading coefficients
// bbm::poly evaluates - confirm against bbm::poly's definition. The tables
// look like the Temme-expansion coefficients also found in Boost.Math's
// igamma_temme_large - confirm provenance.
188 auto eval_poly = []<
typename T,
size_t... IDX>(
const T& a,
const T&
z, std::index_sequence<IDX...>)
// Materialize the pack so each entry can be indexed in a constant expression.
190 constexpr std::array idx{IDX...};
// Inner polynomials in z, one coefficient table per power of 1/a.
193 auto c0 = bbm::poly<idx[0]>(z,
194 T(-0.333333333333333333333333333333333333),
195 T(0.0833333333333333333333333333333333333),
196 T(-0.0148148148148148148148148148148148148),
197 T(0.00115740740740740740740740740740740741),
198 T(0.0003527336860670194003527336860670194),
199 T(-0.000178755144032921810699588477366255144),
200 T(0.391926317852243778169704095630021556e-4),
201 T(-0.218544851067999216147364295512443661e-5),
202 T(-0.185406221071515996070179883622956325e-5),
203 T(0.829671134095308600501624213166443227e-6),
204 T(-0.17665952736826079304360054245742403e-6),
205 T(0.670785354340149858036939710029613572e-8),
206 T(0.102618097842403080425739573227252951e-7),
207 T(-0.438203601845335318655297462244719123e-8),
208 T(0.914769958223679023418248817633113681e-9),
209 T(-0.255141939949462497668779537993887013e-10),
210 T(-0.583077213255042506746408945040035798e-10),
211 T(0.243619480206674162436940696707789943e-10),
212 T(-0.502766928011417558909054985925744366e-11),
213 T(0.110043920319561347708374174497293411e-12),
214 T(0.337176326240098537882769884169200185e-12),
215 T(-0.13923887224181620659193661848957998e-12),
216 T(0.285348938070474432039669099052828299e-13),
217 T(-0.513911183424257261899064580300494205e-15),
218 T(-0.197522882943494428353962401580710912e-14),
219 T(0.809952115670456133407115668702575255e-15),
220 T(-0.165225312163981618191514820265351162e-15),
221 T(0.253054300974788842327061090060267385e-17),
222 T(0.116869397385595765888230876507793475e-16),
223 T(-0.477003704982048475822167804084816597e-17),
224 T(0.969912605905623712420709685898585354e-18));
226 auto c1 = bbm::poly<idx[1]>(z,
227 T(-0.00185185185185185185185185185185185185),
228 T(-0.00347222222222222222222222222222222222),
229 T(0.0026455026455026455026455026455026455),
230 T(-0.000990226337448559670781893004115226337),
231 T(0.000205761316872427983539094650205761317),
232 T(-0.401877572016460905349794238683127572e-6),
233 T(-0.180985503344899778370285914867533523e-4),
234 T(0.76491609160811100846374214980916921e-5),
235 T(-0.16120900894563446003775221882217767e-5),
236 T(0.464712780280743434226135033938722401e-8),
237 T(0.137863344691572095931187533077488877e-6),
238 T(-0.575254560351770496402194531835048307e-7),
239 T(0.119516285997781473243076536699698169e-7),
240 T(-0.175432417197476476237547551202312502e-10),
241 T(-0.100915437106004126274577504686681675e-8),
242 T(0.416279299184258263623372347219858628e-9),
243 T(-0.856390702649298063807431562579670208e-10),
244 T(0.606721510160475861512701762169919581e-13),
245 T(0.716249896481148539007961017165545733e-11),
246 T(-0.293318664377143711740636683615595403e-11),
247 T(0.599669636568368872330374527568788909e-12),
248 T(-0.216717865273233141017100472779701734e-15),
249 T(-0.497833997236926164052815522048108548e-13),
250 T(0.202916288237134247736694804325894226e-13),
251 T(-0.413125571381061004935108332558187111e-14),
252 T(0.828651623988309644380188591057589316e-18),
253 T(0.341003088693333279336339355910600992e-15),
254 T(-0.138541953028939715357034547426313703e-15),
255 T(0.281234665322887466568860332727259483e-16));
257 auto c2 = bbm::poly<idx[2]>(z,
258 T(0.0041335978835978835978835978835978836),
259 T(-0.00268132716049382716049382716049382716),
260 T(0.000771604938271604938271604938271604938),
261 T(0.200938786008230452674897119341563786e-5),
262 T(-0.000107366532263651605215391223621676297),
263 T(0.529234488291201254164217127180090143e-4),
264 T(-0.127606351886187277133779191392360117e-4),
265 T(0.34235787340961380741902003904747389e-7),
266 T(0.137219573090629332055943852926020279e-5),
267 T(-0.629899213838005502290672234278391876e-6),
268 T(0.142806142060642417915846008822771748e-6),
269 T(-0.204770984219908660149195854409200226e-9),
270 T(-0.140925299108675210532930244154315272e-7),
271 T(0.622897408492202203356394293530327112e-8),
272 T(-0.136704883966171134992724380284402402e-8),
273 T(0.942835615901467819547711211663208075e-12),
274 T(0.128722524000893180595479368872770442e-9),
275 T(-0.556459561343633211465414765894951439e-10),
276 T(0.119759355463669810035898150310311343e-10),
277 T(-0.416897822518386350403836626692480096e-14),
278 T(-0.109406404278845944099299008640802908e-11),
279 T(0.4662239946390135746326204922464679e-12),
280 T(-0.990510576390690597844122258212382301e-13),
281 T(0.189318767683735145056885183170630169e-16),
282 T(0.885922187259112726176031067028740667e-14),
283 T(-0.373782039804640545306560251777191937e-14),
284 T(0.786883363903515525774088394065960751e-15));
286 auto c3 = bbm::poly<idx[3]>(z,
287 T(0.000649434156378600823045267489711934156),
288 T(0.000229472093621399176954732510288065844),
289 T(-0.000469189494395255712128140111679206329),
290 T(0.000267720632062838852962309752433209223),
291 T(-0.756180167188397641072538191879755666e-4),
292 T(-0.239650511386729665193314027333231723e-6),
293 T(0.110826541153473023614770299726861227e-4),
294 T(-0.567495282699159656749963105701560205e-5),
295 T(0.14230900732435883914551894470580433e-5),
296 T(-0.278610802915281422405802158211174452e-10),
297 T(-0.16958404091930277289864168795820267e-6),
298 T(0.809946490538808236335278504852724081e-7),
299 T(-0.191111684859736540606728140872727635e-7),
300 T(0.239286204398081179686413514022282056e-11),
301 T(0.206201318154887984369925818486654549e-8),
302 T(-0.946049666185513217375417988510192814e-9),
303 T(0.215410497757749078380130268468744512e-9),
304 T(-0.138882333681390304603424682490735291e-13),
305 T(-0.218947616819639394064123400466489455e-10),
306 T(0.979099895117168512568262802255883368e-11),
307 T(-0.217821918801809621153859472011393244e-11),
308 T(0.62088195734079014258166361684972205e-16),
309 T(0.212697836327973697696702537114614471e-12),
310 T(-0.934468879151743333127396765626749473e-13),
311 T(0.204536712267828493249215913063207436e-13));
313 auto c4 = bbm::poly<idx[4]>(z,
314 T(-0.000861888290916711698604702719929057378),
315 T(0.00078403922172006662747403488144228885),
316 T(-0.000299072480303190179733389609932819809),
317 T(-0.146384525788434181781232535690697556e-5),
318 T(0.664149821546512218665853782451862013e-4),
319 T(-0.396836504717943466443123507595386882e-4),
320 T(0.113757269706784190980552042885831759e-4),
321 T(0.250749722623753280165221942390057007e-9),
322 T(-0.169541495365583060147164356781525752e-5),
323 T(0.890750753220530968882898422505515924e-6),
324 T(-0.229293483400080487057216364891158518e-6),
325 T(0.295679413754404904696572852500004588e-10),
326 T(0.288658297427087836297341274604184504e-7),
327 T(-0.141897394378032193894774303903982717e-7),
328 T(0.344635804994648970659527720474194356e-8),
329 T(-0.230245171745280671320192735850147087e-12),
330 T(-0.394092330280464052750697640085291799e-9),
331 T(0.186023389685045019134258533045185639e-9),
332 T(-0.435632300505661804380678327446262424e-10),
333 T(0.127860010162962312660550463349930726e-14),
334 T(0.467927502665791946200382739991760062e-11),
335 T(-0.214924647061348285410535341910721086e-11),
336 T(0.490881561480965216323649688463984082e-12));
338 auto c5 = bbm::poly<idx[5]>(z,
339 T(-0.000336798553366358150308767592718210002),
340 T(-0.697281375836585777429398828575783308e-4),
341 T(0.00027727532449593920787336425196507501),
342 T(-0.000199325705161888477003360405280844238),
343 T(0.679778047793720783881640176604435742e-4),
344 T(0.141906292064396701483392727105575757e-6),
345 T(-0.135940481897686932784583938837504469e-4),
346 T(0.80184702563342015397192571980419684e-5),
347 T(-0.229148117650809517038048790128781806e-5),
348 T(-0.325247355129845395166230137750005047e-9),
349 T(0.346528464910852649559195496827579815e-6),
350 T(-0.184471871911713432765322367374920978e-6),
351 T(0.482409670378941807563762631738989002e-7),
352 T(-0.179894667217435153025754291716644314e-13),
353 T(-0.630619450001352343517516981425944698e-8),
354 T(0.316241762877456793773762181540969623e-8),
355 T(-0.784092425369742929000839303523267545e-9));
357 auto c6 = bbm::poly<idx[6]>(z,
358 T(0.00053130793646399222316574854297762391),
359 T(-0.000592166437353693882864836225604401187),
360 T(0.000270878209671804482771279183488328692),
361 T(0.790235323266032787212032944390816666e-6),
362 T(-0.815396936756196875092890088464682624e-4),
363 T(0.561168275310624965003775619041471695e-4),
364 T(-0.183291165828433755673259749374098313e-4),
365 T(-0.307961345060330478256414192546677006e-8),
366 T(0.346515536880360908673728529745376913e-5),
367 T(-0.202913273960586037269527254582695285e-5),
368 T(0.578879286314900370889997586203187687e-6),
369 T(0.233863067382665698933480579231637609e-12),
370 T(-0.88286007463304835250508524317926246e-7),
371 T(0.474359588804081278032150770595852426e-7),
372 T(-0.125454150207103824457130611214783073e-7));
374 auto c7 = bbm::poly<idx[7]>(z,
375 T(0.000344367606892377671254279625108523655),
376 T(0.517179090826059219337057843002058823e-4),
377 T(-0.000334931610811422363116635090580012327),
378 T(0.000281269515476323702273722110707777978),
379 T(-0.000109765822446847310235396824500789005),
380 T(-0.127410090954844853794579954588107623e-6),
381 T(0.277444515115636441570715073933712622e-4),
382 T(-0.182634888057113326614324442681892723e-4),
383 T(0.578769494973505239894178121070843383e-5),
384 T(0.493875893393627039981813418398565502e-9),
385 T(-0.105953670140260427338098566209633945e-5),
386 T(0.616671437611040747858836254004890765e-6),
387 T(-0.175629733590604619378669693914265388e-6));
389 auto c8 = bbm::poly<idx[8]>(z,
390 T(-0.000652623918595309418922034919726622692),
391 T(0.000839498720672087279993357516764983445),
392 T(-0.000438297098541721005061087953050560377),
393 T(-0.696909145842055197136911097362072702e-6),
394 T(0.00016644846642067547837384572662326101),
395 T(-0.000127835176797692185853344001461664247),
396 T(0.462995326369130429061361032704489636e-4),
397 T(0.455790986792270771162749294232219616e-8),
398 T(-0.105952711258051954718238500312872328e-4),
399 T(0.678334290486516662273073740749269432e-5),
400 T(-0.210754766662588042469972680229376445e-5));
402 auto c9 = bbm::poly<idx[9]>(z,
403 T(-0.000596761290192746250124390067179459605),
404 T(-0.720489541602001055908571930225015052e-4),
405 T(0.000678230883766732836161951166000673426),
406 T(-0.000640147526026275845100045652582354779),
407 T(0.000277501076343287044992374518205845463),
408 T(0.181970083804651510461686554030325202e-6),
409 T(-0.847950711706850318239732559632810086e-4),
410 T(0.610519208250153101764709122740859458e-4),
411 T(-0.210739201834048624082975255893773306e-4));
413 auto c10 = bbm::poly<idx[10]>(z,
414 T(0.00133244544948006563712694993432717968),
415 T(-0.00191443849856547752650089885832852254),
416 T(0.0011089369134596637339607446329267522),
417 T(0.993240412264229896742295262075817566e-6),
418 T(-0.000508745012930931989848393025305956774),
419 T(0.00042735056665392884328432271160040444),
420 T(-0.000168588537679107988033552814662382059));
422 auto c11 = bbm::poly<idx[11]>(z,
423 T(0.00157972766073083495908785631307733022),
424 T(0.000162516262783915816898635123980270998),
425 T(-0.00206334210355432762645284467690276817),
426 T(0.00213896861856890981541061922797693947),
427 T(-0.00101085593912630031708085801712479376));
429 auto c12 = bbm::poly<idx[12]>(z,
430 T(-0.00407251211951401664727281097914544601),
431 T(0.00640336283380806979482363809026579583),
432 T(-0.00404101610816766177473974858518094879));
// NOTE(review): this is the only literal in the tables carrying an `L` suffix;
// every other coefficient is a plain double literal wrapped in T(...).
434 auto c13 = bbm::poly<idx[13]>(z, T(-0.0059475779383993002845382844736066323L));
// Outer polynomial in 1/a with c0..c13 as coefficients; idx[14] is its template argument.
436 return bbm::poly<idx[14]>(bbm::rcp(a), c0, c1, c2, c3, c4, c5, c6, c7, c8, c9, c10, c11, c12, c13);
// Choose how much of each coefficient table to evaluate from the mantissa
// width (numeric_limits::digits) of the scalar type. Every index_sequence must
// hold exactly 15 entries: eval_poly reads idx[0..13] for the inner polynomials
// c0..c13 and idx[14] for the outer polynomial in 1/a.
//
// Fix: the `digits <= 24` sequence used to contain 16 entries (one padding
// zero too many), so idx[14] was 0 and the trailing 3 sat at idx[15], which is
// never read. It now has 15 entries with idx[14] == 3, matching the three
// non-zero inner polynomials (7, 5 and 3 terms) selected for this precision.
441 if constexpr (std::numeric_limits<scalar_t<result_t>>::digits <= 24) result = eval_poly(
result_t(a),
z, std::index_sequence<7,5,3,0,0,0,0,0,0,0,0,0,0,0,3>{});
442 else if constexpr (std::numeric_limits<scalar_t<result_t>>::digits <= 53) result = eval_poly(
result_t(a),
z, std::index_sequence<15,13,11,9,7,9,7,5,3,1,0,0,0,0,10>{});
443 else if constexpr (std::numeric_limits<scalar_t<result_t>>::digits <= 64) result = eval_poly(
result_t(a),
z, std::index_sequence<19,17,15,13,11,9,11,9,7,5,3,5,3,0,13>{});
444 else result = eval_poly(
result_t(a), z, std::index_sequence<31,29,27,25,23,17,15,13,11,9,7,5,3,1,14>{});
// Scale the polynomial by sign(x - a) * exp(-y) / sqrt(2*pi*a) ...
447 result *= bbm::sign(x-a) * bbm::exp(-y) / bbm::sqrt(std::numbers::pi * 2 * a);
// ... and add the leading term erfc(sqrt(y)) / 2.
// NOTE(review): y is defined in a line not shown in this listing.
448 result += bbm::erfc( bbm::sqrt(y)) * 0.5;
// Unnormalized incomplete lower gamma function.
// NOTE(review): the signature line (listing line 467) is missing from this
// listing; the cross-reference index at the end of the file attributes
// gamma.h:467 to tgamma_lower(const TA& a, const TX& x). The declarations and
// updates of `result` and `todo` are also not shown - todo presumably tracks
// the lanes that still need a value; confirm.
//   MaxTerm - iteration bound forwarded to the detail:: helpers (default 100).
466 template<
typename TA,
typename TX,
size_t MaxTerm=100>
469 using result_t =
decltype(a+x);
// Regime 1: lanes flagged by gamma_is_large use gamma_large<false> directly.
473 auto mask = bbm::detail::gamma_is_large(a,x);
475 if(bbm::any(mask)) result =
bbm::select(mask, bbm::detail::gamma_large<false>(a, x), result);
476 if(bbm::none(todo))
return result;
// Regime 2: remaining lanes with x <= a+1 use the series helper detail::gamma.
479 mask = todo && (x <= a+1);
481 if(bbm::any(mask)) result =
bbm::select(mask, bbm::detail::gamma<MaxTerm, false>(a, x), result);
482 if(bbm::none(todo))
return result;
// Regime 3: remaining lanes with x > a+1 take tgamma(a) minus detail::Gamma.
485 mask = todo && (x > a+1);
486 if(bbm::any(mask)) result =
bbm::select(mask, (
bbm::tgamma(a) - bbm::detail::Gamma<MaxTerm, false>(a, x)), result);
// Normalized incomplete lower gamma function.
// NOTE(review): the signature line (listing line 499) is missing from this
// listing; the cross-reference index at the end of the file attributes
// gamma.h:499 to gamma_p(const TA& a, const TX& x). The declarations and
// updates of `result` and `todo` are also not shown - todo presumably tracks
// the lanes that still need a value; confirm.
//   MaxTerm - iteration bound forwarded to the detail:: helpers (default 100).
498 template<
typename TA,
typename TX,
size_t MaxTerm=100>
501 using result_t =
decltype(a+x);
// Regime 1: lanes flagged by gamma_is_large use gamma_large<true> directly.
505 auto mask = bbm::detail::gamma_is_large(a,x);
507 if(bbm::any(mask)) result =
bbm::select(mask, bbm::detail::gamma_large<true>(a, x), result);
508 if(bbm::none(todo))
return result;
// Regime 2: remaining lanes with x <= a+1 use the normalized series helper.
511 mask = todo && (x <= a+1);
513 if(bbm::any(mask)) result =
bbm::select(mask, bbm::detail::gamma<MaxTerm, true>(a, x), result);
514 if(bbm::none(todo))
return result;
// Regime 3: remaining lanes with x > a+1 take 1 minus the normalized detail::Gamma.
517 mask = todo && (x > a+1);
518 if(bbm::any(mask)) result =
bbm::select(mask, (1 - bbm::detail::Gamma<MaxTerm, true>(a, x)), result);
// Unnormalized incomplete upper gamma function.
//   a, x    - arguments; the result type is decltype(a+x).
//   MaxTerm - iteration bound forwarded to the detail:: helpers (default 100).
// Each lane is evaluated by one of three regimes. In every regime the value is
// the complement, with respect to tgamma(a), of what the unnormalized lower
// function returns for the same lanes.
// NOTE(review): the declarations and updates of `result` and `todo` are in
// lines not shown in this listing - todo presumably tracks the lanes that
// still need a value; confirm.
531 template<
typename TA,
typename TX,
size_t MaxTerm=100>
532 inline auto tgamma(
const TA& a,
const TX& x)
534 using result_t =
decltype(a+x);
// Regime 1: lanes flagged by gamma_is_large.
// Fix: this branch used to return `1 - gamma_large<false>(a, x)`. The
// unnormalized lower function returns gamma_large<false>(a, x) for the same
// lanes, so lower + upper summed to 1 instead of tgamma(a). The complement is
// now taken against tgamma(a), as in the series branch below.
538 auto mask = bbm::detail::gamma_is_large(a,x);
540 if(bbm::any(mask)) result =
bbm::select(mask, (bbm::tgamma(a) - bbm::detail::gamma_large<false>(a, x)), result);
541 if(bbm::none(todo))
return result;
// Regime 2: remaining lanes with x <= a+1 take tgamma(a) minus the series helper.
544 mask = todo && (x <= a+1);
546 if(bbm::any(mask)) result =
bbm::select(mask, (
bbm::tgamma(a) - bbm::detail::gamma<MaxTerm, false>(a, x)), result);
547 if(bbm::none(todo))
return result;
// Regime 3: remaining lanes with x > a+1 use detail::Gamma directly.
550 mask = todo && (x > a+1);
551 if(bbm::any(mask)) result =
bbm::select(mask, bbm::detail::Gamma<MaxTerm, false>(a, x), result);
// Normalized incomplete upper gamma function.
// NOTE(review): the signature line (listing line 564) is missing from this
// listing; the cross-reference index at the end of the file attributes
// gamma.h:564 to gamma_q(const TA& a, const TX& x). The declarations and
// updates of `result` and `todo` are also not shown - todo presumably tracks
// the lanes that still need a value; confirm.
//   MaxTerm - iteration bound forwarded to the detail:: helpers (default 100).
563 template<
typename TA,
typename TX,
size_t MaxTerm=100>
566 using result_t =
decltype(a+x);
// Regime 1: lanes flagged by gamma_is_large take 1 minus gamma_large<true>.
570 auto mask = bbm::detail::gamma_is_large(a,x);
572 if(bbm::any(mask)) result =
bbm::select(mask, (1-bbm::detail::gamma_large<true>(a, x)), result);
573 if(bbm::none(todo))
return result;
// Regime 2: remaining lanes with x <= a+1 take 1 minus the normalized series helper.
576 mask = todo && (x <= a+1);
578 if(bbm::any(mask)) result =
bbm::select(mask, (1 - bbm::detail::gamma<MaxTerm, true>(a, x)), result);
579 if(bbm::none(todo))
return result;
// Regime 3: remaining lanes with x > a+1 use the normalized detail::Gamma directly.
582 mask = todo && (x > a+1);
583 if(bbm::any(mask)) result =
bbm::select(mask, bbm::detail::Gamma<MaxTerm, true>(a, x), result);
// Normalized incomplete lower and upper gamma functions computed together.
// NOTE(review): the signature line (listing line 593) is missing from this
// listing; the cross-reference index at the end of the file attributes
// gamma.h:593 to gamma_pq(const TA& a, const TX& x). The lines that store p
// and q into `result` and that maintain `todo` are also not shown.
//   MaxTerm - iteration bound forwarded to the detail:: helpers (default 100).
592 template<
typename TA,
typename TX,
size_t MaxTerm=100>
595 using result_t =
decltype(a+x);
// Result container with two named fields, "p" and "q", both initialized to 0.
596 auto result =
make_named<
"p",
"q">(result_t(0), result_t(0));
// Regime 1: lanes flagged by gamma_is_large; p comes from gamma_large<true>.
599 auto mask = bbm::detail::gamma_is_large(a,x);
603 auto p = bbm::detail::gamma_large<true>(a, x);
606 if(bbm::none(todo))
return result;
// Regime 2: remaining lanes with x <= a+1; p comes from the normalized series helper.
609 mask = todo && (x <= a+1);
613 auto p = bbm::detail::gamma<MaxTerm, true>(a, x);
616 if(bbm::none(todo))
return result;
// Regime 3: remaining lanes with x > a+1; q comes from the normalized detail::Gamma.
619 mask = todo && (x > a+1);
622 auto q = bbm::detail::Gamma<MaxTerm, true>(a, x);
typename detail::result_impl< T... >::type result_t
Determine the mathematical result type; reverts to the first argument if '+' is not defined on T...
Definition: math.h:49
auto norm(const T &a)
Definition: horizontal.h:24
auto normalize(const T &a)
Definition: horizontal.h:38
T & phi(vec2d< T > &v)
Definition: spherical.h:39
constexpr decltype(auto) y(bbm::vec3d< T > &v)
Definition: vec.h:23
constexpr decltype(auto) z(bbm::vec3d< T > &v)
Definition: vec.h:26
constexpr decltype(auto) x(bbm::vec3d< T > &v)
Definition: vec.h:20
Definition: aggregatebsdf.h:29
constexpr named< anonymize_t< T >, NAMES... > make_named(T &&t)
Make a `named` container from a gettable type (with size == #NAMES); renames if the type is already a named container.
Definition: named.h:293
auto gamma_q(const TA &a, const TX &x)
Normalized incomplete upper gamma function.
Definition: gamma.h:564
constexpr auto select(MASK &&mask, const A &a, const A &b)
Definition: backbone.h:255
auto tgamma_lower(const TA &a, const TX &x)
Unnormalized incomplete lower gamma function.
Definition: gamma.h:467
auto tgamma(const TA &a, const TX &x)
Unnormalized incomplete upper gamma function.
Definition: gamma.h:532
auto gamma_p(const TA &a, const TX &x)
Normalized incomplete lower gamma function.
Definition: gamma.h:499
auto gamma_pq(const TA &a, const TX &x)
Normalized incomplete upper and lower gamma function.
Definition: gamma.h:593
Compile time polynomial using Horner's method.
A wrapper for STL containers such as tuple, pair, and array. These containers force the programmer to...