|
345 | 345 | return Q
|
346 | 346 | end
|
347 | 347 |
|
348 |
| -@inline setindex!!(tup::Tuple, value, index) = @inbounds Base.setindex(tup, value, index) |
| 348 | +@inline setindex!!(tup::Tuple, value, index) = @inbounds index > length(tup) ? tup : Base.setindex(tup, value, index) |
349 | 349 | @inline setindex!!(tup::AbstractVector, value, index) = @inbounds Base.setindex!(tup, value, index)
|
| 350 | +@inline safe_getindex(e, eindex, elen) = (eindex ≤ elen && eindex ≤ length(e)) ? @inbounds(e[eindex]) : zero(eltype(e)) # Shewchuk's code is relying on undefined behaviour from out-of-bounds access where we call this. We need to be careful. |
350 | 351 |
|
351 | 352 | @inline function scale_expansion_zeroelim(elen::Int, e, b, ::Val{N})::Tuple{NTuple,Int} where {N}
|
352 | 353 | h = ntuple(i -> zero(typeof(e[1])), Val(N))
|
@@ -396,78 +397,72 @@ end
|
396 | 397 |
|
397 | 398 | @inline function fast_expansion_sum_zeroelim(elen::Int, e, flen::Int, f, h)
|
398 | 399 | @inbounds begin
|
399 |
| - enow = e[1] |
400 |
| - fnow = f[1] |
401 |
| - eindex = findex = 1 |
402 |
| - if ((fnow > enow) == (fnow > -enow)) |
403 |
| - Q = enow |
404 |
| - enow = e[eindex += 1] |
405 |
| - else |
406 |
| - Q = fnow |
407 |
| - fnow = f[findex += 1] |
408 |
| - end |
409 |
| - hindex = 0 |
410 |
| - if ((eindex < elen) && (findex < flen)) # still < since pre-increment |
411 |
| - if ((fnow > enow) == (fnow > -enow)) |
412 |
| - Qnew, hh = Fast_Two_Sum(enow, Q) |
413 |
| - enow = e[eindex += 1] |
| 400 | + enow = e[1] |
| 401 | + fnow = f[1] |
| 402 | + eindex = findex = 1 |
| 403 | + if (fnow > enow) == (fnow > -enow) |
| 404 | + Q = enow |
| 405 | + eindex += 1 |
| 406 | + enow = safe_getindex(e, eindex, elen) |
414 | 407 | else
|
415 |
| - Qnew, hh = Fast_Two_Sum(fnow, Q) |
416 |
| - fnow = f[findex += 1] |
| 408 | + Q = fnow |
| 409 | + findex += 1 |
| 410 | + fnow = safe_getindex(f, findex, flen) |
417 | 411 | end
|
418 |
| - Q = Qnew |
419 |
| - if hh != 0.0 |
420 |
| - #h[hindex+=1] = hh |
421 |
| - h = setindex!!(h, hh, hindex+=1) |
| 412 | + hindex = 1 |
| 413 | + if (eindex ≤ elen) && (findex ≤ flen) |
| 414 | + if (fnow > enow) == (fnow > -enow) |
| 415 | + Q, hh = Fast_Two_Sum(enow, Q) |
| 416 | + eindex += 1 |
| 417 | + enow = safe_getindex(e, eindex, elen) |
| 418 | + else |
| 419 | + Q, hh = Fast_Two_Sum(fnow, Q) |
| 420 | + findex += 1 |
| 421 | + fnow = safe_getindex(f, findex, flen) |
| 422 | + end |
| 423 | + if !iszero(hh) |
| 424 | + h = setindex!!(h, hh, hindex) |
| 425 | + hindex += 1 |
| 426 | + end |
| 427 | + while (eindex ≤ elen) && (findex ≤ flen) |
| 428 | + if (fnow > enow) == (fnow > -enow) |
| 429 | + Q, hh = Two_Sum(Q, enow) |
| 430 | + eindex += 1 |
| 431 | + enow = safe_getindex(e, eindex, elen) |
| 432 | + else |
| 433 | + Q, hh = Two_Sum(Q, fnow) |
| 434 | + findex += 1 |
| 435 | + fnow = safe_getindex(f, findex, flen) |
| 436 | + end |
| 437 | + if !iszero(hh) |
| 438 | + h = setindex!!(h, hh, hindex) |
| 439 | + hindex += 1 |
| 440 | + end |
| 441 | + end |
422 | 442 | end
|
423 |
| - |
424 |
| - while (eindex < elen) && (findex < flen) # still < since pre-increment |
425 |
| - if (fnow > enow) == (fnow > -enow) |
426 |
| - Qnew, hh = Two_Sum(Q, enow) |
427 |
| - enow = e[eindex += 1] |
428 |
| - else |
429 |
| - Qnew, hh = Two_Sum(Q, fnow) |
430 |
| - fnow = f[findex += 1] |
431 |
| - end |
432 |
| - Q = Qnew |
433 |
| - if hh != 0.0 |
434 |
| - #h[hindex += 1] = hh |
435 |
| - h = setindex!!(h, hh, hindex+=1) |
436 |
| - end |
| 443 | + while eindex ≤ elen |
| 444 | + Q, hh = Two_Sum(Q, enow) |
| 445 | + eindex += 1 |
| 446 | + enow = safe_getindex(e, eindex, elen) |
| 447 | + if !iszero(hh) |
| 448 | + h = setindex!!(h, hh, hindex) |
| 449 | + hindex += 1 |
| 450 | + end |
437 | 451 | end
|
438 |
| - end |
439 |
| - |
440 |
| - while eindex <= elen |
441 |
| - Qnew, hh = Two_Sum(Q, enow) |
442 |
| - eindex += 1 |
443 |
| - # We need an extra iteration to calculate Q |
444 |
| - # but we don't want to access e |
445 |
| - if eindex <= elen |
446 |
| - enow = e[eindex] |
| 452 | + while findex ≤ flen |
| 453 | + Q, hh = Two_Sum(Q, fnow) |
| 454 | + findex += 1 |
| 455 | + fnow = safe_getindex(f, findex, flen) |
| 456 | + if !iszero(hh) |
| 457 | + h = setindex!!(h, hh, hindex) |
| 458 | + hindex += 1 |
| 459 | + end |
447 | 460 | end
|
448 |
| - Q = Qnew |
449 |
| - if hh != 0.0 |
450 |
| - #h[hindex += 1] = hh |
451 |
| - h = setindex!!(h, hh, hindex+=1) |
| 461 | + if !iszero(Q) || isone(hindex) |
| 462 | + h = setindex!!(h, Q, hindex) |
| 463 | + hindex += 1 |
452 | 464 | end
|
453 |
| - end |
454 |
| - |
455 |
| - while findex <= flen |
456 |
| - Qnew, hh = Two_Sum(Q, fnow) |
457 |
| - findex += 1 |
458 |
| - if findex <= flen |
459 |
| - fnow = f[findex] |
460 |
| - end |
461 |
| - Q = Qnew |
462 |
| - if hh != 0.0 |
463 |
| - #h[hindex += 1] = hh |
464 |
| - h = setindex!!(h, hh, hindex+=1) |
465 |
| - end |
466 |
| - end |
467 |
| - if (Q != 0.0) || (hindex == 0) |
468 |
| - h = setindex!!(h, Q, hindex+=1) |
469 |
| - end |
470 |
| - return h, hindex |
| 465 | + return h, hindex - 1 |
471 | 466 | end
|
472 | 467 | end
|
473 | 468 |
|
@@ -518,7 +513,7 @@ function _incircleadapt_round1(pa, pb, pc, pd, permanent, cache=nothing)
|
518 | 513 | fin1, finlength = fast_expansion_sum_zeroelim(ablen, abdet, clen, cdet, Val(32))
|
519 | 514 |
|
520 | 515 | # check to make sure we haven't truncated too much
|
521 |
| - if ablen < 32 || finlength < 32 |
| 516 | + if ablen < 32 && finlength < 32 |
522 | 517 |
|
523 | 518 | det = estimate(finlength, fin1)
|
524 | 519 | errbound = iccerrboundB * permanent
|
@@ -558,7 +553,7 @@ function _incircleadapt_round1(pa, pb, pc, pd, permanent, cache=nothing)
|
558 | 553 | h48, h64, h1152_1, h1152_2 = _allocs_or_cache(cache)
|
559 | 554 |
|
560 | 555 | # if they were too short, rerun them...
|
561 |
| - if ablen == 32 || finlength == 32 |
| 556 | + if ablen >= 32 || finlength >= 32 |
562 | 557 | abdetv, ablen = fast_expansion_sum_zeroelim(alen, adet, blen, bdet, h64)
|
563 | 558 | fin1v, finlength = fast_expansion_sum_zeroelim(ablen, abdetv, clen, cdet, h1152_1)
|
564 | 559 |
|
|
0 commit comments