Legendre prime counting function: Difference between revisions

← Older edit

Legendre prime counting function (view source)

Revision as of 08:01, 3 March 2024

81,474 bytes added , 2 months ago

→‎{{header|Nim}}: Added Mojo Partial Sieving version...

GordonBGood

474

edits

Revision as of 02:48, 9 November 2022 (view source) GordonBGood (talk \| contribs) (→‎{{header\|CoffeeScript}}: add Chapel non-memoizing versions above...) ← Older edit		Latest revision as of 08:01, 3 March 2024 (view source) GordonBGood (talk \| contribs) (→‎{{header\|Nim}}: Added Mojo Partial Sieving version...)
(30 intermediate revisions by 8 users not shown)
Line 33: <br> <br> =={{header\|11l}}== {{trans\|Python}} <syntaxhighlight lang="11l"> F primes_up_to_limit(Int limit) [Int] r I limit >= 2 r.append(2) V isprime = [1B] * ((limit - 1) I/ 2) V sieveend = Int(sqrt(limit)) L(i) 0 .< isprime.len I isprime[i] Int p = i * 2 + 3 r.append(p) I i <= sieveend L(j) ((p * p - 3) >> 1 .< isprime.len).step(p) isprime[j] = 0B R r V p = primes_up_to_limit(Int(sqrt(1'000'000'000))) F phi(x, =a) F phi_cached(x, a) [(Int, Int) = Int] :cache I (x, a) C :cache R :cache[(x, a)] V r = phi(x, a) :cache[(x, a)] = r R r V res = 0 L I a == 0 \| x == 0 R x + res a-- res -= phi_cached(x I/ :p[a], a) F legpi(n) I n < 2 R 0 V a = legpi(Int(sqrt(n))) R phi(n, a) + a - 1 L(e) 10 print(‘10^’e‘ ’legpi(10 ^ e)) </syntaxhighlight> {{out}} <pre> 10^0 0 10^1 4 10^2 25 10^3 168 10^4 1229 10^5 9592 10^6 78498 10^7 664579 10^8 5761455 10^9 50847534 </pre> =={{header\|C}}== {{trans\|Vlang}} Using fixed width types so requires C99 or later. Surprisingly only half as fast as Go on the same machine (GCC -O3 Ubuntu 22.04) for a billion numbers. However, the position is reversed if we let it run through to a trillion numbers - about 100 ms for C compared to 160 ms for Go. <syntaxhighlight lang="c">#include <stdio.h> #include <math.h> #include <stdlib.h> #include <stdint.h> #include <time.h> const uint8_t masks[8] = {1, 2, 4, 8, 16, 32, 64, 128}; #define half(n) ((int64_t)((n) - 1) >> 1) #define divide(nm, d) ((uint64_t)((double)nm / (double)d)) int64_t countPrimes(uint64_t n) { if (n < 9) return (n < 2) ? 0 : ((int64_t)n + 1) / 2; uint64_t rtlmt = (uint64_t)sqrt((double)n); int64_t mxndx = (int64_t)((rtlmt - 1) / 2); int arrlen = (int)(mxndx + 1); uint32_t smalls = malloc(arrlen 4); uint32_t roughs = malloc(arrlen 4); int64_t larges = malloc(arrlen 8); for (int i = 0; i < arrlen; ++i) { smalls[i] = (uint32_t)i; roughs[i] = (uint32_t)(i + i + 1); larges[i] = (int64_t)((n/(uint64_t)(i + i + 1) - 1) / 2); } int cullbuflen = (int)((mxndx + 8) / 8); uint8_t cullbuf = calloc(cullbuflen, 1); int64_t nbps = 0; int rilmt = arrlen; for (int64_t i = 1; ; ++i) { int64_t sqri = (i + i) (i + 1); if (sqri > mxndx) break; if (cullbuf[i >> 3] & masks[i & 7]) continue; cullbuf[i >> 3] \|= masks[i & 7]; uint64_t bp = (uint64_t)(i + i + 1); for (int64_t c = sqri; c < (int64_t)arrlen; c += (int64_t)bp) { cullbuf[c >> 3] \|= masks[c & 7]; } int nri = 0; for (int ori = 0; ori < rilmt; ++ori) { uint32_t r = roughs[ori]; int64_t rci = (int64_t)(r >> 1); if (cullbuf[rci >> 3] & masks[rci & 7]) continue; uint64_t d = (uint64_t)r * bp; int64_t t = (d <= rtlmt) ? larges[(int64_t)smalls[d >> 1] - nbps] : (int64_t)smalls[half(divide(n, d))]; larges[nri] = larges[ori] - t + nbps; roughs[nri] = r; nri++; } int64_t si = mxndx; for (uint64_t pm = (rtlmt/bp - 1) \| 1; pm >= bp; pm -= 2) { uint32_t c = smalls[pm >> 1]; uint64_t e = (pm * bp) >> 1; for ( ; si >= (int64_t)e; --si) smalls[si] -= c - (uint32_t)nbps; } rilmt = nri; nbps++; } int64_t ans = larges[0] + (int64_t)((rilmt + 2(nbps - 1)) (rilmt - 1) / 2); int ri, sri; for (ri = 1; ri < rilmt; ++ri) ans -= larges[ri]; for (ri = 1; ; ++ri) { uint64_t p = (uint64_t)roughs[ri]; uint64_t m = n / p; int ei = (int)smalls[half((uint64_t)m/p)] - nbps; if (ei <= ri) break; ans -= (int64_t)((ei - ri) * (nbps + ri - 1)); for (sri = ri + 1; sri < ei + 1; ++sri) { ans += (int64_t)smalls[half(divide(m, (uint64_t)roughs[sri]))]; } } free(smalls); free(roughs); free(larges); free(cullbuf); return ans + 1; } int main() { uint64_t n; int i; clock_t start = clock(); for (i = 0, n = 1; i < 10; ++i, n = 10) { printf("10^%d %ld\n", i, countPrimes(n)); } clock_t end = clock(); printf("\nTook %f seconds\n", (double) (end - start) / CLOCKS_PER_SEC); return 0; }</syntaxhighlight> {{out}} <pre> 10^0 0 10^1 4 10^2 25 10^3 168 10^4 1229 10^5 9592 10^6 78498 10^7 664579 10^8 5761455 10^9 50847534 Took 0.003843 seconds </pre> =={{header\|C++}}== Line 626 ⟶ 804: The above function enjoys quite a large gain in speed of about a further ten times over the immediately preceding version due to not using recursion at all and the greatly reduced computational complexity of O(n(3/4)/((log n)2)) instead of the almost-linear-for-large-counting-ranges O(n/((log n)2)) for the previous two versions, although the previous two versions differ in performance by a constant factor due to the overheads of recursion and division. This version of prime counting function might be considered to be reasonably useful for counting primes up to a 1e16 in almost two minutes as long as the computer used has the required free memory of about 800 Megabytes. This Crystal version is about twice as slow as the Nim version from which it was translated because Nim's default GCC back-end is better at optimization (at least for this algorithm) than the LLVM back-end used by Crystal and also there is more numeric calculation checking such as numeric overflow used in Crystal that can't be turned off. At that, this version is about the same speed as when translated to Rust, which also uses a LLVM back-end. =={{header\|Elm}}== Currently, Elm does not have linear arrays and has no mutation whatsoever, even array content mutation protected by "monadic function chains" as for Haskell, so many algorithms can't be easily implemented such as the Legendre Partial Sieving algorithm which requires random access to linear arrays whose contents are mutated according to previous passes. However, given a prime number generator based on persistent data structures such as the List version [[https://rosettacode.org/wiki/Sieve_of_Eratosthenes#Elm\|from the Sieve of Eratosthenes task page]], one can translate the algorithm of the "bottom-up" recursive version without the "TinyPhi" Look Up Table (LUT) optmization which would need a linear array to implement, as in the following code: <syntaxhighlight lang="elm">module Main exposing (main) import Browser exposing (element) import Task exposing (Task, succeed, perform, andThen) import Html exposing (div, text) import Time exposing (now, posixToMillis) type CIS a = CIS a (() -> CIS a) -- infinite Co-Inductive Stream... uptoCIS2List : comparable -> CIS comparable -> List comparable uptoCIS2List n cis = let loop (CIS hd tl) lst = if hd > n then List.reverse lst else loop (tl()) (hd :: lst) in loop cis [] -- require a range of primes by Sieve of Eratosthenes... primesTreeFolding : () -> CIS Int primesTreeFolding() = let merge (CIS x xtl as xs) (CIS y ytl as ys) = case compare x y of LT -> CIS x <\| \ () -> merge (xtl()) ys EQ -> CIS x <\| \ () -> merge (xtl()) (ytl()) GT -> CIS y <\| \ () -> merge xs (ytl()) pmult bp = let adv = bp + bp pmlt p = CIS p <\| \ () -> pmlt (p + adv) in pmlt (bp bp) allmlts (CIS bp bptl) = CIS (pmult bp) <\| \ () -> allmlts (bptl()) pairs (CIS frst tls) = let (CIS scnd tlss) = tls() in CIS (merge frst scnd) <\| \ () -> pairs (tlss()) cmpsts (CIS (CIS hd tl) tls) = CIS hd <\| \ () -> merge (tl()) <\| cmpsts <\| pairs (tls()) testprm n (CIS hd tl as cs) = if n < hd then CIS n <\| \ () -> testprm (n + 2) cs else testprm (n + 2) (tl()) oddprms() = CIS 3 <\| \ () -> testprm 5 <\| cmpsts <\| allmlts <\| oddprms() in CIS 2 <\| \ () -> oddprms() countPrimesTo : Float -> Float -- only use integral values! countPrimesTo n = if n < 3 then if n < 2 then 0 else 1 else let nnf = toFloat (floor n) -- erase fractional part! sqrtn = sqrt nnf \|> truncate oprms = primesTreeFolding() \|> uptoCIS2List sqrtn \|> List.drop 1 opsz = List.length oprms lvl opi opilmt plst m acc = if opi >= opilmt then acc else case plst of [] -> acc -- should never happen (op :: optl) -> let opl = toFloat op nm = m * opl in if nnf <= nm * opl then acc + toFloat (opilmt - opi) else let q = nnf / nm \|> floor \|> toFloat nacc = acc + q - toFloat (floor (q / 2)) sacc = if opi <= 0 then 0 else lvl 0 opi oprms nm 0 in lvl (opi + 1) opilmt optl m (nacc - sacc) in nnf - toFloat (floor (nnf / 2)) - lvl 0 opsz oprms 1 0 + toFloat opsz -- run the required task tests... timemillis : () -> Task Never Int -- a side effect function timemillis() = now \|> andThen (\ t -> succeed (posixToMillis t)) test : () -> Cmd Msg -- side effect function chain (includes "perform")... test() = timemillis() \|> andThen (\ strt -> let rsltstrs = List.range 0 9 \|> List.map ( \ n -> "π(10^" ++ String.fromInt n ++ ") = " ++ String.fromFloat (countPrimesTo (toFloat (10^n)))) in timemillis() \|> andThen (\ stop -> succeed (List.append rsltstrs ["This took " ++ String.fromInt (stop - strt) ++ " milliseconds."]))) \|> perform Done -- following code has to do with outputting to a web page using MUV/TEA... type alias Model = List String type Msg = Done Model main : Program () Model Msg main = -- starts with empty list of strings; views model of filled list... element { init = \ _ -> ( [], test() ) , update = \ (Done mdl) _ -> ( mdl , Cmd.none ) , subscriptions = \ _ -> Sub.none , view = div [] << List.map (div [] << List.singleton << text) }</syntaxhighlight> {{out}} <pre>π(10^0) = 0 π(10^1) = 4 π(10^2) = 25 π(10^3) = 168 π(10^4) = 1229 π(10^5) = 9592 π(10^6) = 78498 π(10^7) = 664579 π(10^8) = 5761455 π(10^9) = 50847534 This took 341 milliseconds.</pre> =={{header\|Erlang}}== Line 744 ⟶ 1,031: The above time as run on an Intel i5-6500 (3.6 GHz single-threaded boost) isn't particularly fast but includes some DotNet initialization and JIT compilation overhead, and is about as fast as a highly optimized page-segmented wheel-factorized Sieve of Eratosthenes; Although this is about ten times faster than if it were using memoization (and uses much less memory), it is only reasonably usable for trivial ranges such as this (trivial in terms of prime counting functions). '''The Less Recursive "Bottom-Up" with a TinyPhi LUT Algorithm''' Just substitute the following F# code for the `countPrimes` function above to enjoy the gain in speed: Line 803 ⟶ 1,090: '''The Non-Recursive Partial Sieving Algorithm''' Just substitute the following F# code for the `countPrimes` function above to enjoy the further gain in speed; note that rather than using a recursive function loop for the partial sieving culling pass as per the above two version, this version uses a Seq iteration which is slower but more concise in expression, but as sieving is a negligible part of the total execution time, it doesn't matter and conciseness was considered to be more important; this version may appear to be recursive to those unfamiliar with Functional Programming (FP) implementations but FP generally turns all function recursions in tail-call position (which all of these are) into the same compiled code as a simple loop in other languages: {{trans\|Nim}} <syntaxhighlight lang="fsharp">let masks = Array.init 8 ((<<<) 1uy) // quick bit twiddling Line 880 ⟶ 1,167: The above function enjoys quite a large gain in speed of about a further ten times over the immediately preceding version (although one can't see that gain for these trivial ranges as it is buried in the constant overheads) due to not using recursion at all and the greatly reduced computational complexity of O(n(3/4)/((log n)2)) instead of the almost-linear-for-large-counting-ranges O(n/((log n)*2)) for the previous two versions, although the previous two versions differ in performance by a constant factor due to the overheads of recursion and division; for instance, this version can calculate the number of primes to 1e11 in about a hundred milliseconds. This version of prime counting function might be considered to be reasonably useful for counting primes up to a 1e16 in about a hundred seconds as long as the computer used has the required free memory of about 800 Megabytes. This F# version is about twice as slow as the Nim version from which it was translated due to the benefits of native code compilation and more optimizations for Nim rather than JIT compilation for F#. At that, this version is about the same speed as when translated to Rust and Crystal once the range is increased where constant overheads aren't a factor, which both use native code compilers. =={{header\|FreeBASIC}}== {{incorrect\|FreeBASIC\|This is not a Legendre prime counting function but a very inefficient trial division (`Mod`) sieve.}} <syntaxhighlight lang="vbnet">Function isPrime(n As Uinteger) As Boolean Dim As Uinteger i For i = 2 To Sqr(n) If n Mod i = 0 Then Return False Next i Return True End Function Dim As Uinteger n, i, j, count Dim Shared As Ulongint primes(1e8) n = 1 For i = 0 To 9 count = 0 For j = 2 To n If isPrime(j) Then count += 1 primes(count) = j End If Next j Print "10^"; i; " "; count n = 10 Next i Sleep</syntaxhighlight> =={{header\|Go}}== Line 1,005 ⟶ 1,321: Same as first version. </pre> ===Iterative, partial sieving=== {{trans\|Vlang}} This non-memoized, non-recursive version is much quicker than the first two versions, running in about 2 milliseconds which is the same as V. <syntaxhighlight lang="ecmascript">package main import ( ~~=={{header\|Java}}==~~ "fmt" ~~<syntaxhighlight lang="java">import java.util.;~~ "math" "time" ) var masks = [8]uint8{1, 2, 4, 8, 16, 32, 64, 128} ~~public class LegendrePrimeCounter {~~ ~~public static void main(String[] args) {~~ ~~LegendrePrimeCounter counter = new LegendrePrimeCounter(1000000000);~~ ~~for (int i = 0, n = 1; i < 10; ++i, n = 10)~~ ~~System.out.printf("10^%d\t%d\n", i, counter.primeCount((n)));~~ } func half(n int) int { return (n - 1) >> 1 } ~~private List<Integer> primes;~~ func divide(nm, d uint64) int { return int(float64(nm) / float64(d)) } ~~public LegendrePrimeCounter(int limit) {~~ ~~primes = generatePrimes((int)Math.sqrt((double)limit));~~ } func countPrimes(n uint64) int64 { ~~public int primeCount(int n) {~~ if (n < 2)9 { if n < 2 ~~return 0;~~{ ~~int~~ a = ~~primeCount((int)Math.sqrt((double)n));~~ return 0 ~~return~~} ~~phi(n,~~else ~~a) + a - 1;~~{ return (int64(n) + 1) / 2 } } rtlmt := int(math.Sqrt(float64(n))) ~~private~~mxndx ~~int~~:= ~~phi~~(~~int~~rtlmt x,- ~~int a~~1) {/ 2 arrlen := mxndx + ~~if (a == 0)~~1 smalls := make([]uint32, arrlen) ~~return x;~~ roughs := if make(~~a ==~~[]uint32, 1arrlen) larges := make([]int64, arrlen) ~~return x - (x >> 1);~~ for i ~~int pa~~ := ~~primes.get~~uint32(a0); -i 1< uint32(arrlen); i++ { ifsmalls[i] ~~(x <~~= ~~pa)~~i roughs[i] = i + ~~return~~i + 1; ~~return~~larges[i] ~~phi~~= int64(~~x, a~~(n/uint64(i+i+1) - 1) ~~- phi(x~~ / ~~pa, a - 1~~2); } cullbuflen := (mxndx + 8) / 8 cullbuf := make([]uint8, cullbuflen) ~~private static List<Integer> generatePrimes(int limit) {~~ nbps := 0 ~~boolean[] sieve = new boolean[limit >> 1];~~ rilmt := arrlen ~~Arrays.fill(sieve, true);~~ for ~~(int p~~i := ~~3, s = 9~~1; ~~s < limit~~; p i++~~= 2)~~ { sqri := (i + ifi) * (~~sieve[p~~i >>+ 1]) { if sqri > mxndx { ~~for (int q = s; q < limit; q += p << 1)~~ ~~sieve[q >> 1] = false;~~break } if (cullbuf[i>>3] & masks[i&7]) != 0 { continue } cullbuf[i>>3] \|= masks[i&7] bp := i + i + 1 for c := sqri; c < arrlen; c += bp { cullbuf[c>>3] \|= masks[c&7] } nri := 0 for ori := 0; ori < rilmt; ori++ { r := int(roughs[ori]) rci := r >> 1 if (cullbuf[rci>>3] & masks[rci&7]) != 0 { continue } d := r * bp t := int64(0) if d <= rtlmt { t = larges[int(smalls[d>>1])-nbps] } else { t = int64(smalls[half(divide(n, uint64(d)))]) } larges[nri] = larges[ori] - t + int64(nbps) roughs[nri] = uint32(r) nri++ } si := mxndx for pm := (rtlmt/bp - 1) \| 1; pm >= bp; pm -= 2 { c := smalls[pm>>1] e := (pm * bp) >> 1 for ; si >= e; si-- { smalls[si] -= (c - uint32(nbps)) } ~~s += (p + 1) << 2;~~ } ~~List<Integer> primes~~rilmt = ~~new ArrayList<>();~~nri ~~if (limit > 2)~~nbps++ } ~~primes.add(2);~~ ans := larges[0] + ~~for~~ int64(~~int~~((rilmt ~~i =~~+ 2(nbps-1;)) i <(rilmt ~~sieve.length;~~- ~~++i~~1) {/ 2)) for ri := 1; ri < rilmt; ri++ ~~if (sieve[i])~~{ ans -= ~~primes.add((i << 1) + 1);~~larges[ri] } for ri := 1; ~~return primes~~; ri++ { p := uint64(roughs[ri]) m := n / p ei := int(smalls[half(int(m/p))]) - nbps if ei <= ri { break } ans -= int64((ei - ri) * (nbps + ri - 1)) for sri := ri + 1; sri < ei+1; sri++ { ans += int64(smalls[half(divide(m, uint64(roughs[sri])))]) } } return ans + 1 } func main() { start := time.Now() for i, n := uint64(0), uint64(1); i <= 9; i, n = i+1, n10 { fmt.Printf("10^%d %d\n", i, countPrimes(n)) } elapsed := time.Since(start).Microseconds() fmt.Printf("\nTook %d microseconds\n", elapsed) }</syntaxhighlight> {{out}} <pre> 10^0 0 10^1 4 10^2 25 10^3 168 10^4 1229 10^5 9592 10^6 78498 10^7 664579 10^8 5761455 10^9 50847534 Took 1862 microseconds </pre> Line 1,314 ⟶ 1,686: '''The Non-Recursive Partial Sieving Algorithm''' Just substitute the following Haskell code for the `countPrimes` function above to enjoy the further gain in speed; this version may appear to be recursive to those unfamiliar with Functional Programming (FP) implementations but FP generally turns all function recursions in tail-call position (which all of these are) into the same compiled code as a simple loop in other languages: <syntaxhighlight lang="haskell">~~countPrimesxx~~countPrimes :: Word64 -> Int64 ~~countPrimesxx~~countPrimes n = if n < 3 then (if n < 2 then 0 else 1) else let Line 1,460 ⟶ 1,832: But we can simplify that to p:inv when we know that primes are not being tested. =={{header\|Java}}== <syntaxhighlight lang="java">import java.util.; public class LegendrePrimeCounter { public static void main(String[] args) { LegendrePrimeCounter counter = new LegendrePrimeCounter(1000000000); for (int i = 0, n = 1; i < 10; ++i, n = 10) System.out.printf("10^%d\t%d\n", i, counter.primeCount((n))); } private List<Integer> primes; public LegendrePrimeCounter(int limit) { primes = generatePrimes((int)Math.sqrt((double)limit)); } public int primeCount(int n) { if (n < 2) return 0; int a = primeCount((int)Math.sqrt((double)n)); return phi(n, a) + a - 1; } private int phi(int x, int a) { if (a == 0) return x; if (a == 1) return x - (x >> 1); int pa = primes.get(a - 1); if (x <= pa) return 1; return phi(x, a - 1) - phi(x / pa, a - 1); } private static List<Integer> generatePrimes(int limit) { boolean[] sieve = new boolean[limit >> 1]; Arrays.fill(sieve, true); for (int p = 3, s = 9; s < limit; p += 2) { if (sieve[p >> 1]) { for (int q = s; q < limit; q += p << 1) sieve[q >> 1] = false; } s += (p + 1) << 2; } List<Integer> primes = new ArrayList<>(); if (limit > 2) primes.add(2); for (int i = 1; i < sieve.length; ++i) { if (sieve[i]) primes.add((i << 1) + 1); } return primes; } }</syntaxhighlight> {{out}} <pre> 10^0 0 10^1 4 10^2 25 10^3 168 10^4 1229 10^5 9592 10^6 78498 10^7 664579 10^8 5761455 10^9 50847534 </pre> =={{header\|JavaScript}}== There doesn't seem to be much point to contributing memoized (Hash table) versions as they seem to be the result of the task author not realizing that there is a simple way of keeping the computation complexity from having exponential growth with counting range by limiting the "splitting" of the "phi" calculation when the result must be just one. Accordingly, the following JavaScript versions are [translated and improved from the non-memoizing Nim versions](https://rosettacode.org/wiki/Legendre_prime_counting_function#Non-Memoized_Versions), which explanations can be referenced for an understanding of how they work: '''The Basic Recursive Legendre Algorithm''' {{trans\|Nim}} <syntaxhighlight lang="javascript">"use strict"; function countPrimesTo(lmt) { if (lmt < 3) { if (lmt < 2) return 0; else return 1; } const sqrtlmt = Math.sqrt(lmt) >>> 0; const oprms = function() { const mxndx = (sqrtlmt - 3) >>> 1; const arr = new Float64Array(mxndx + 1); for (let i = 0 >>> 0; i <= mxndx; ++i) arr[i] = (i + i + 3) >>> 0; let bp = 3 >>> 0; while (true) { let i = (bp - 3) >>> 1; let sqri = ((i + i) (i + 3) + 3) >>> 0; if (sqri > mxndx) break; if (arr[i] != 0) for (; sqri <= mxndx; sqri += bp) arr[sqri] = 0; bp += 2; } return arr.filter(v => v != 0); }(); function phi(x, a) { if (a <= 0) return x - Math.trunc(x / 2); const na = (a - 1) >>> 0; const p = oprms[na]; if (x <= p) return 1; return phi(x, na) - phi(Math.trunc(x / p), na); } return phi(lmt, oprms.length) + oprms.length; } const start = Date.now(); for (let i = 0; i <= 9; ++i) console.log(`π(10${i}) =`, countPrimesTo(10i)); const elpsd = Date.now() - start; console.log("This took", elpsd, "milliseconds.")</syntaxhighlight> {{out}} <pre>π(100) = 0 π(101) = 4 π(102) = 25 π(103) = 168 π(104) = 1229 π(105) = 9592 π(106) = 78498 π(107) = 664579 π(108) = 5761455 π(109) = 50847534 This took 712 milliseconds.</pre> The time is as run on an Intel i5-6500 (3.6 GHz single-threaded boost) using node.js version 17.3.1. Although this is about ten times faster than if it were using memoization (and uses much less memory), it is only reasonably usable for trivial ranges such as this (trivial in terms of prime counting functions). '''The Less Recursive "Bottom-Up" with a TinyPhi LUT Algorithm''' Just substitute the following JavaScript code for the `countPrimesTo` function above to enjoy the gain in speed: {{trans\|Nim}} <syntaxhighlight lang="javascript">const TinyPhiPrimes = [ 2, 3, 5, 7, 11, 13 ]; const TinyPhiOddDegree = TinyPhiPrimes.length - 1; const TinyPhiOddCirc = TinyPhiPrimes.reduce((acc, p) => acc * p) / 2; const TinyPhiTot = TinyPhiPrimes.reduce((acc, p) => acc * (p - 1), 1) const TinyPhiLUT = function() { const arr = new Uint16Array(TinyPhiOddCirc); arr.fill(1); for (const p of TinyPhiPrimes) { if (p <= 2) continue; arr[p >> 1] = 0; for (let c = (p * p) >> 1; c < TinyPhiOddCirc; c += p) arr[c] = 0 >>> 0; } for (let i = 0 \| 0, acc = 0 \| 0; i < TinyPhiOddCirc; ++i) { acc += arr[i]; arr[i] = acc; } return arr; }(); function tinyPhi(x) { const ndx = Math.trunc(( x - 1) / 2); const numtots = Math.trunc(ndx / TinyPhiOddCirc); const rem = (ndx - numtots * TinyPhiOddCirc) >>> 0; return numtots * TinyPhiTot + TinyPhiLUT[rem]; } function countPrimesTo(lmt) { if (lmt < 169) { if (lmt < 3) { if (lmt < 2) return 0; else return 1; } // adjust for the missing "degree" base primes if (lmt <= 13) return ((lmt - 1) >>> 1) + (lmt < 9 ? 1 : 0); return 5 + TinyPhiLUT[(lmt - 1) >>> 1]; } const sqrtlmt = Math.sqrt(lmt) >>> 0; const oprms = function() { const mxndx = (sqrtlmt - 3) >>> 1; const arr = new Float64Array(mxndx + 1); for (let i = 0 >>> 0; i <= mxndx; ++i) arr[i] = (i + i + 3) >>> 0; let bp = 3 >>> 0; while (true) { let i = (bp - 3) >>> 1; let sqri = ((i + i) * (i + 3) + 3) >>> 0; if (sqri > mxndx) break; if (arr[i] != 0) for (; sqri <= mxndx; sqri += bp) arr[sqri] = 0; bp += 2; } return arr.filter(v => v != 0); }(); function lvl(pilmt, m) { let ans = 0; for (let pi = TinyPhiOddDegree; pi < pilmt; ++pi) { const p = oprms[pi]; const nm = m * p; if (lmt <= nm * p) return ans + pilmt - pi; ans += tinyPhi(Math.trunc(lmt / nm)); if (pi > TinyPhiOddDegree) ans -= lvl(pi, nm); } return ans; } return tinyPhi(lmt) - lvl(oprms.length, 1) + oprms.length; }</syntaxhighlight> Use of the above function gets a gain in speed of about a further fifteen times over the above version due to less recursion and the use of the "Tiny_Phi" Look Up Table (LUT) for smaller "degrees" of primes which greatly reduces the number of integer divisions. This version of prime counting function might be considered to be reasonably useful for counting primes up to a trillion (1e12) in a few tens of seconds. '''The Non-Recursive Partial Sieving Algorithm''' Just substitute the following JavaScript code for the `countPrimesTo` function above to enjoy the gain in speed: {{trans\|Nim}} <syntaxhighlight lang="javascript">const masks = new Uint8Array(8); // faster than bit twiddling! for (let i = 0; i < 8; ++i) masks[i] = (1 << i) >>> 0; function countPrimesTo(lmt) { if (lmt < 3) { if (lmt < 2) return 0; else return 1; } function half(x) { return (x - 1) >>> 1; } function divide(nm, d) { return (nm / d) >>> 0; } const sqrtlmt = Math.trunc(Math.sqrt(lmt)); const mxndx = (sqrtlmt - 1) >>> 1; const cbsz = (mxndx + 8) >>> 3; const cullbuf = new Uint8Array(cbsz); const smalls = new Uint32Array(mxndx + 1); for (let i = 0; i <= mxndx; ++i) smalls[i] = i >>> 0; const roughs = new Uint32Array(mxndx + 1); for (let i = 0; i <= mxndx; ++i) roughs[i] = (i + i + 1) >>> 0; const larges = new Float64Array(mxndx + 1); for (let i = 0; i <= mxndx; ++i) larges[i] = Math.trunc((Math.trunc(lmt / (i + i + 1)) - 1) / 2); // partial sieve loop, adjusting larges/smalls, compressing larges/roughs... let nobps = 0 >>> 0; let rilmt = mxndx; let bp = 3 >>> 0; while (true) { // break when square root is reached const i = bp >>> 1; let sqri = ((i + i) * (i + 1)) >>> 0; if (sqri > mxndx) break; // partial sieving pass if bp is prime: if ((cullbuf[i >> 3] & masks[i & 7]) == 0) { cullbuf[i >> 3] \|= masks[i & 7]; // cull bp! for (; sqri <= mxndx; sqri += bp) cullbuf[sqri >> 3] \|= masks[sqri & 7]; // cull bp mults! // now adjust `larges` for latest partial sieve pass... var ori = 0 // compress input rough index to output one for (let iri = 0; iri <= rilmt; ++iri) { const r = roughs[iri]; const rci = r >>> 1; // skip roughs just culled! if ((cullbuf[rci >> 3] & masks[rci & 7]) != 0) continue; const d = bp * r; larges[ori] = larges[iri] - ( (d <= sqrtlmt) ? larges[smalls[d >>> 1] - nobps] : smalls[half(divide(lmt, d))] ) + nobps; // base primes count over subtracted! roughs[ori++] = r; } let si = mxndx // and adjust `smalls` for latest partial sieve pass... for (let bpm = (sqrtlmt / bp - 1) \| 1; bpm >= bp; bpm -= 2) { const c = smalls[bpm >>> 1] - nobps; const ei = ((bpm * bp) >>> 1); while (si >= ei) smalls[si--] -= c; } nobps++; rilmt = ori - 1; } bp += 2; } // combine results to here; correcting for over subtraction in combining... let ans = larges[0]; for (let i = 1; i <= rilmt; ++i) ans -= larges[i]; ans += Math.trunc((rilmt + 1 + 2 * (nobps - 1)) * rilmt / 2); // add final adjustment for pairs of current roughs to cube root of range... let ri = 0 while (true) { // break when reaches cube root of counting range... const p = roughs[++ri]; const q = Math.trunc(lmt / p); const ei = smalls[half(divide(q, p))] - nobps; if (ei <= ri) break; // break here when no more pairs! for (let ori = ri + 1; ori <= ei; ++ori) ans += smalls[half(divide(q, roughs[ori]))]; ans -= (ei - ri) * (nobps + ri - 1); } return ans + 1; // add one for only even prime of two! }</syntaxhighlight> The above code enjoys quite a large gain in speed of about a further ten times (and increasing with range) over the immediately preceding version for larger "non-trivial" ranges (since there is an appreciable environment overhead in initialization and JIT compilation) due to not using recursion at all and the greatly reduced computational complexity of O(n(3/4)/((log n)2)) instead of the almost-linear-for-large-counting-ranges O(n/((log n)*2)) for the previous two versions, although the previous two versions differ in performance by a constant factor due to the overheads of recursion and division; for instance, this version can calculate the number of primes to 1e11 in about 125 milliseconds. This version of prime counting function might be considered to be reasonably useful for counting primes up to a 1e16 in under three minutes as long as the computer used has the required free memory of about 800 Megabytes. This JavaScript version is about three times as slow as the Nim version from which it was translated for large ranges where the initialization overhead is not significant due to being run by the JavaScript engine and JIT compiled. =={{header\|jq}}== Line 1,631 ⟶ 2,259: 0.003234 seconds (421 allocations: 14.547 KiB) </pre> === nonrecursive method === {{trans\|Nim}} <syntaxhighlight lang="julia"> function countprimes(n) n < 3 && return typeof(n)(n > 1) rtlmt = isqrt(n) mxndx = (rtlmt - 1) ÷ 2 smalls::Array{UInt32} = [i for i in 0:mxndx+1] roughs::Array{UInt32} = [i + i + 1 for i in 0:mxndx+1] larges::Array{Int64} = [(n ÷ (i + i + 1) - 1) ÷ 2 for i in 0:mxndx+1] cmpsts = falses(mxndx + 1) bp, npc, mxri = 3, 0, mxndx @inbounds while true i = bp >> 1 sqri = (i + i) (i + 1) sqri > mxndx && break if !cmpsts[i + 1] cmpsts[i + 1] = true for c in sqri:bp:mxndx cmpsts[c + 1] = true end ri = 0 for k in 0:mxri q = roughs[k + 1] qi = q >> 1 cmpsts[qi + 1] && continue d = UInt64(bp) * UInt64(q) larges[ri + 1] = larges[k + 1] + npc - (d <= rtlmt ? larges[smalls[d >> 1 + 1] - npc + 1] : smalls[(Int(floor(n / d)) - 1) >> 1 + 1]) roughs[ri + 1] = q ri += 1 end m = mxndx @simd for k in (rtlmt ÷ bp - 1) \| 1 : -2 : bp c = smalls[k >> 1 + 1] - npc ee = (k * bp) >> 1 while m >= ee smalls[m + 1] -= c m -= 1 end end mxri = ri - 1 npc += 1 end bp += 2 end result = larges[1] @simd for i in 2:mxri+1 result -= larges[i] end result += (mxri + 1 + 2 * (npc - 1)) * mxri ÷ 2 for j in 1:mxri p = UInt64(roughs[j + 1]) m = n ÷ p ee = smalls[(Int(floor(m / p)) - 1) >> 1 + 1] - npc ee <= j && break for k in j+1:ee result += smalls[(Int(floor(m / roughs[k + 1])) - 1) >> 1 + 1] end result -= (ee - j) * (npc + j - 1) end return result + 1 end for i in 0:14 println("π(10^$i) = ", countprimes(10^i)) end @time countprimes(10^13) @time countprimes(10^14) </syntaxhighlight>{{out}} <pre> π(10^0) = 0 π(10^1) = 4 π(10^2) = 25 π(10^3) = 168 π(10^4) = 1229 π(10^5) = 9592 π(10^6) = 78498 π(10^7) = 664579 π(10^8) = 5761455 π(10^9) = 50847534 π(10^10) = 455052511 π(10^11) = 4118054813 π(10^12) = 37607912018 π(10^13) = 346065536839 π(10^14) = 3204941750802 0.894891 seconds (13 allocations: 48.442 MiB, 1.06% gc time) 4.479385 seconds (13 allocations: 153.185 MiB, 0.12% gc time) </pre> =={{header\|Kotlin}}== There doesn't seem to be much point to contributing memoized (Hash table) versions as they seem to be the result of the task author not realizing that there is a simple way of keeping the computation complexity from having exponential growth with counting range by limiting the "splitting" of the "phi" calculation when the result must be just one. Accordingly, the following Kotlin versions are [translated and improved from the non-memoizing Nim versions](https://rosettacode.org/wiki/Legendre_prime_counting_function#Non-Memoized_Versions), which explanations can be referenced for an understanding of how they work: '''The Basic Recursive Legendre Algorithm''' {{trans\|Nim}} <syntaxhighlight lang="kotlin">fun countPrimes(lmt: Long): Long { if (lmt < 3) return if (lmt < 2) 0 else 1 val sqrtlmt = Math.sqrt(lmt.toDouble()).toInt() fun makePrimes(): IntArray { val mxndx = (sqrtlmt - 3) / 2 val arr = IntArray(mxndx + 1, { it + it + 3}) var i = 0 while (true) { val sqri = (i + i) * (i + 3) + 3 if (sqri > mxndx) break if (arr[i] != 0) { val bp = i + i + 3 for (c in sqri .. mxndx step bp) arr[c] = 0 } i++ } return arr.filter { it != 0 }.toIntArray() } val oprms = makePrimes() fun phi(x: Long, a: Int): Long { if (a <= 0) return x - (x shr 1) val na = a - 1; val p = oprms[na].toLong() if (x <= p) return 1 return phi(x, na) - phi(x / p, na) } return phi(lmt, oprms.size) + oprms.size.toLong() } fun main() { val strt = System.currentTimeMillis() for (i in 0 .. 9) { val arg = Math.pow(10.toDouble(), i.toDouble()).toLong() println("π(10$i) = ${countPrimes(arg)}") } val stop = System.currentTimeMillis() println("This took ${stop - strt} milliseconds.") }</syntaxhighlight> {{out}} <pre>π(100) = 0 π(101) = 4 π(102) = 25 π(103) = 168 π(104) = 1229 π(105) = 9592 π(106) = 78498 π(107) = 664579 π(108) = 5761455 π(10*9) = 50847534 This took 480 milliseconds.</pre> The time is as run on an Intel i5-6500 (3.6 GHz single-threaded boost). Although this is about ten times faster than if it were using memoization (and uses much less memory), it is only reasonably usable for trivial ranges such as this (trivial in terms of prime counting functions). '''The Less Recursive "Bottom-Up" with a TinyPhi LUT Algorithm''' Just substitute the following Kotlin code for the `countPrimes` function above to enjoy the gain in speed: {{trans\|Nim}} <syntaxhighlight lang="kotlin">val cTinyPhiPrimes = intArrayOf(2, 3, 5, 7, 11, 13) val cTinyPhiDeg = cTinyPhiPrimes.size - 1 val cTinyPhiOddCirc = cTinyPhiPrimes.reduce(Int::times) / 2 val cTinyPhiTot = cTinyPhiPrimes.fold(1) { s, p -> s (p - 1) } fun makeTPLUT(): IntArray { val arr = IntArray(cTinyPhiOddCirc) { _ -> 1 } for (bp in cTinyPhiPrimes.drop(1)) { arr[bp shr 1] = 0 for (c in ((bp * bp) shr 1) until cTinyPhiOddCirc step bp) arr[c] = 0 } var acc = 0 for (i in 0 until cTinyPhiOddCirc) { acc += arr[i]; arr[i] = acc } return arr } val cTinyPhiLUT = makeTPLUT() fun tinyPhi(x: Long): Long { val ndx = (x - 1) shr 1; val numtots = ndx / cTinyPhiOddCirc.toLong() val rem = (ndx - numtots * cTinyPhiOddCirc.toLong()).toInt() return numtots * cTinyPhiTot.toLong() + cTinyPhiLUT[rem].toLong() } fun countPrimes(lmt: Long): Long { if (lmt < 169) { if (lmt < 3) return if (lmt < 2) 0 else 1 // adjust for the missing "degree" base primes if (lmt <= 13) return ((lmt - 1).toLong() shr 1) + (if (lmt < 9) 1 else 0); return 5.toLong() + cTinyPhiLUT[(lmt - 1).toInt() shr 1].toLong(); } val sqrtlmt = Math.sqrt(lmt.toDouble()).toInt() fun makePrimes(): IntArray { val mxndx = (sqrtlmt - 3) / 2 val arr = IntArray(mxndx + 1, { it + it + 3}) var i = 0 while (true) { val sqri = (i + i) * (i + 3) + 3 if (sqri > mxndx) break if (arr[i] != 0) { val bp = i + i + 3 for (c in sqri .. mxndx step bp) arr[c] = 0 } i++ } return arr.filter { it != 0 }.toIntArray() } val oprms = makePrimes() fun lvl(pilmt: Int, m: Long): Long { var acc = 0.toLong() for (pi in cTinyPhiDeg until pilmt) { val p = oprms[pi].toLong(); val nm = m * p if (lmt <= nm * p) return acc + (pilmt - pi).toLong() val q = (lmt.toDouble() / nm.toDouble()).toLong(); acc += tinyPhi(q) if (pi > cTinyPhiDeg) acc -= lvl(pi, nm) } return acc } return tinyPhi(lmt) - lvl(oprms.size, 1) + oprms.size.toLong() }</syntaxhighlight> Use of the above function gets a gain in speed of about a further twenty times over the above version due to less recursion and the use of the "Tiny_Phi" Look Up Table (LUT) for smaller "degrees" of primes which greatly reduces the number of integer divisions, which have also been converted to floating point divisions because they are faster although with a lost of precision for counting ranges that one would likely not use this implementation for. This version of prime counting function might be considered to be reasonably useful for counting primes up to a trillion (1e12) in a few tens of seconds. '''The Non-Recursive Partial Sieving Algorithm''' The following Kotlin code enjoys the further gain in speed: {{trans\|Nim}} <syntaxhighlight lang="kotlin">import java.util.BitSet fun countPrimes(lmt: Long): Long { if (lmt < 3) return if (lmt < 2) 0 else 1 // odds only! fun half(x: Int): Int = (x - 1) shr 1 fun divide(nm: Long, d: Long): Int = (nm.toDouble() / d.toDouble()).toInt() val sqrtlmt = Math.sqrt(lmt.toDouble()).toLong() val mxndx = ((sqrtlmt - 1) shr 1).toInt() val cmpsts = BitSet(mxndx + 1) val smalls = IntArray(mxndx + 1) { it } val roughs = IntArray(mxndx + 1) { it + it + 1 } val larges = LongArray(mxndx + 1) { (lmt / (it + it + 1).toLong() - 1) shr 1 } // partial sieve loop, adjusting larges/smalls, compressing larges/roughs... var nobps = 0; var rilmt = mxndx; var bp = 3.toLong() while (true) { val i = (bp shr 1).toInt(); val sqri = (i + i) * (i + 1) if (sqri > mxndx) break if (!cmpsts.get(i)) { // condition for partial sieving pass for bp is prime cmpsts.set(i) // cull bp! for (c in sqri .. mxndx step bp.toInt()) cmpsts.set(c) // cull bp mults! // now adjust `larges` for latest partial sieve pass... var ori = 0 // compress input rough index to output one for (iri in 0 .. rilmt) { val r = roughs[iri]; val rci = (r shr 1) if (cmpsts.get(rci)) continue // skip roughs culled in this sieve pass! val d = bp * r.toLong() larges[ori] = larges[iri] - ( if (d <= sqrtlmt) larges[smalls[(d shr 1).toInt()] - nobps] else smalls[half(divide(lmt, d))].toLong() ) + nobps.toLong() // base primes count over subtracted! roughs[ori++] = r } var si = mxndx // and adjust `smalls` for latest partial sieve pass... for (bpm in (sqrtlmt / bp - 1) or 1 downTo bp step 2) { val c = smalls[(bpm shr 1).toInt()] - nobps val ei = ((bpm * bp) shr 1).toInt() while (si >= ei) smalls[si--] -= c } nobps++; rilmt = ori - 1 } bp += 2 } // combine results to here; correcting for over subtraction in combining... var ans = larges[0]; for (i in 1 .. rilmt) ans -= larges[i] ans += (rilmt.toLong() + 1 + 2 * (nobps.toLong() - 1)) * rilmt.toLong() / 2 // add final adjustment for pairs of current roughs to cube root of range... var ri = 0 while (true) { // break when reaches cube root of counting range... val p = roughs[++ri].toLong(); val q = lmt / p val ei = smalls[half(divide(q, p))] - nobps if (ei <= ri) break // break here when no more pairs! for (ori in ri + 1 .. ei) ans += smalls[half(divide(q, roughs[ori].toLong()))].toLong() ans -= (ei - ri).toLong() * (nobps.toLong() + ri.toLong() - 1) } return ans + 1 // add one for only even prime of two! } fun main() { val strt = System.currentTimeMillis() for (i in 0 .. 9) { val arg = Math.pow(10.toDouble(), i.toDouble()).toLong() println("π(10$i) = ${countPrimes(arg)}") } val stop = System.currentTimeMillis() println("This took ${stop - strt} milliseconds.") }</syntaxhighlight> The above code enjoys quite a large gain in speed of about a further ten times (and increasing with range) over the immediately preceding version for larger "non-trivial" ranges (since there is an appreciable environment overhead in initialization and JIT compilation) due to not using recursion at all and the greatly reduced computational complexity of O(n(3/4)/((log n)2)) instead of the almost-linear-for-large-counting-ranges O(n/((log n)2)) for the previous two versions, although the previous two versions differ in performance by a constant factor due to the overheads of recursion and division; for instance, this version can calculate the number of primes to 1e11 in about 82 milliseconds. This version of prime counting function might be considered to be reasonably useful for counting primes up to a 1e16 in about two minutes as long as the computer used has the required free memory of about 800 Megabytes. This Kotlin version is about twice as slow as the Nim version from which it was translated for large ranges where the initialization overhead is not significant due to being run under the Java Virtual Machine (JVM) environment and JIT compiled. =={{header\|Mathematica}}/{{header\|Wolfram Language}}== Line 1,650 ⟶ 2,581: 5761455 50847534</pre> =={{header\|Mojo}}== Currently, Mojo does not allow many forms of recursion so the simple recursive solutions are not possible; however, those are much slower than the solution by partial sieving anyway, as per the following code: {{trans\|Nim}} <syntaxhighlight lang="mojo">from time import (now) alias cLIMIT: UInt64 = 100_000_000_000 @always_inline fn mkMasks() -> DTypePointer[DType.uint8]: let rslt = DTypePointer[DType.uint8].alloc(8) for i in range(8): rslt.offset(i).store(1 << i) return rslt let masksp = mkMasks() fn intsqrt(n: UInt64) -> UInt64: if n < 4: if n < 1: return 0 else: return 1 var x: UInt64 = n; var qn: UInt64 = 0; var r: UInt64 = 0 while qn < 64 and (1 << qn) <= n: qn += 2 var q: UInt64 = 1 << qn while q > 1: if qn >= 64: q = 1 << (qn - 2); qn = 0 else: q >>= 2 let t: UInt64 = r + q r >>= 1 if x >= t: x -= t; r += q return r fn countPrimes(n: UInt64) -> Int64: if n < 3: if n < 2: return 0 else: return 1 let rtlmt: Int = intsqrt(n).to_int() # precision limits range to maybe 1e16! let mxndx = (rtlmt - 1) >> 1 @always_inline fn half(n: Int64) -> Int64 : return ((n - 1) // 2) @always_inline fn divide(nm: UInt64, d: UInt64) -> Int64: return ((nm * 1.0) / (d * 1.0)).to_int() let smalls = # current accumulated counts of odd primes 1 to sqrt range DTypePointer[DType.uint32].alloc(mxndx + 1) # initialized for no sieving whatsoever other than odds-only - partial sieved by 2: # 0 odd primes to 1; 1 odd prime to 3, etc.... for i in range(mxndx + 1): smalls.offset(i).store(i) let roughs = # current odd k-rough numbers up to sqrt of range; k = 2 DTypePointer[DType.uint32].alloc(mxndx + 1) # initialized to all odd positive numbers 1, 3, 5, ... sqrt range... for i in range(mxndx + 1): roughs.offset(i).store(i + i + 1) # array of current phi counts for above roughs... # these are not strictly `phi`'s since they also include the # count of base primes in order to match the above `smalls` definition! let larges = # starts as size of counts just as `roughs` so they align! DTypePointer[DType.uint64].alloc(mxndx + 1) # initialized for current roughs after accounting for even prime of two... for i in range(mxndx + 1): larges.offset(i).store((n // (i + i + 1) - 1) // 2) # cmpsts is a bit-packed boolean array representing # odd composite numbers from 1 up to rtlmt used for sieving... # initialized as "zeros" meaning all odd positives are potentially prime # note that this array starts at (and keeps) 1 to match the algorithm even # though 1 is not a prime, as 1 is important in computation of phi... let cmpsts = DTypePointer[DType.uint8].alloc((mxndx + 8) // 8) memset_zero(cmpsts, (mxndx + 8) // 8) # number of found base primes and current highest used rough index... var npc: Int = 0; var mxri: Int = mxndx for i in range(1, mxndx + 1): # start at index for 3; i will never reach mxndx... let sqri = (i + i) * (i + 1) # computation of square index! if sqri > mxndx: break # stop partial sieving due to square index limit! if (cmpsts.offset(i >> 3).load() & masksp.offset(i & 7).load()) != 0: continue # if not prime # culling the base prime from cmpsts means it will never be found again let cp = cmpsts.offset(i >> 3) cp.store(cp.load() \| masksp.offset(i & 7).load()) # cull base prime let bp = i + i + 1 # base prime from index! for c in range(sqri, mxndx + 1, bp): # SoE culling of all bp multiples... let cp = cmpsts.offset(c >> 3); cp.store(cp.load() \| masksp.offset(c & 7).load()) # partial sieving to current base prime is now completed! var ri: Int = 0 # to keep track of current used roughs index! for k in range(mxri + 1): # processing over current roughs size... # q is not necessarily a prime but may be a # product of primes not yet culled by partial sieving; # this is what saves operations compared to recursive Legendre: let q: UInt64 = roughs.offset(k).load().to_int(); let qi = q >> 1 # index of always odd q! # skip over values of `q` already culled in the last partial sieve: if (cmpsts.offset(qi >> 3).load() & masksp.offset(qi & 7).load()) != 0: continue # since `q` cannot be equal to bp due to cull of bp and above skip; let d: UInt64 = bp * q # `d` is odd product of some combination of odd primes! # the following computation is essential to the algorithm's speed: # see above description in the text for how this works: larges.offset(ri).store(larges.offset(k).load() - (larges.offset(smalls.offset(d >> 1).load().to_int() - npc).load() if d <= rtlmt else smalls.offset(half(divide(n, d))).load().to_int()) + npc) # eliminate rough values that have been culled in partial sieve: # note that `larges` and `roughs` indices relate to each other! roughs.offset(ri).store(q.to_int()); ri += 1 # update rough value; advance rough index var m = mxndx # adjust `smalls` counts for the newly culled odds... # this is faster than recounting over the `cmpsts` array for each loop... for k in range(((rtlmt // bp) - 1) \| 1, bp - 1, -2): # k always odd! # `c` is correction from current count to desired count... # `e` is end limit index no correction is necessary for current cull... let c = smalls.offset(k >> 1).load() - npc; let e = (k * bp) >> 1 while m >= e: let cp = smalls.offset(m) cp.store(cp.load() - c); m -= 1 # correct over range down to `e` mxri = ri - 1; npc += 1 # set next loop max roughs index; count base prime # now `smalls` is a LUT of odd prime accumulated counts for all odd primes; # `roughs` is exactly the "k-roughs" up to the sqrt of range with `k` the # index of the next prime above the quad root of the range; # `larges` is the partial prime counts for each of the `roughs` values... # note that `larges` values include the count of the odd base primes!!! # `cmpsts` are never used again! # the following does the top most "phi tree" calculation: var result: Int64 = larges.load().to_int() # the answer to here is all valid `phis` for i in range(1, mxri + 1): result -= larges.offset(i).load().to_int() # combined here by subtraction # compensate for the included odd base prime counts over subracted above: result += ((mxri + 1 + 2 * (npc - 1)) * mxri // 2) # This loop adds the counts due to the products of the `roughs` primes, # of which we only use two different ones at a time, as all the # combinations with lower primes than the cube root of the range have # already been computed and included with the previous major loop... # see text description above for how this works... for j in range(1, mxri + 1): # for all `roughs` (now prime) not including one: let p: UInt64 = roughs.offset(j).load().to_int() let m: UInt64 = (n // p) # `m` is the `p` quotient # so that the end limit `e` can be calculated based on `n`/(`p`^2) let e: Int = smalls.offset(half((m // p).to_int())).load().to_int() - npc # following break test equivalent to non-memoization/non-splitting optmization: if e <= j: break # stop at about `p` of cube root of range! for k in range(j + 1, e + 1): # for all `roughs` greater than `p` to end limit: result += smalls.offset(half(divide(m, roughs.offset(k).load().to_int()))).load().to_int() # compensate for all the extra base prime counts just added! result -= ((e - j) * (npc + j - 1)) result += 1 # include the count for the only even prime of two smalls.free(); roughs.free(); larges.free(); cmpsts.free() return result fn main(): var pow: Int = 1 for i in range(10): print('10^', i, '=', countPrimes(pow)) pow = 10 let start = now() let answr = countPrimes(cLIMIT) let elpsd = (now() - start) / 1000000 print("Found", answr, "primes up to", cLIMIT, "in", elpsd, "milliseconds.")</syntaxhighlight> {{out}} <pre>10^ 0 = 0 10^ 1 = 4 10^ 2 = 25 10^ 3 = 168 10^ 4 = 1229 10^ 5 = 9592 10^ 6 = 78498 10^ 7 = 664579 10^ 8 = 5761455 10^ 9 = 50847534 Found 4118054813 primes up to 100000000000 in 16.696860000000001 milliseconds.</pre> This is as run on an AMD 7840HS single-thread boosted to 5.1 GHz. It is over twice as slow as when run from the Nim code it is translated from, likely due to LLVM not handling this algorithm as well as the GCC compiler that did the final "back-end" compilation for the Nim code. =={{header\|Nim}}== Line 1,686 ⟶ 2,791: for i in 0..9: echo "π(10^$1) = $2".format(i, π(n)) n = 10</syntaxhighlight></syntaxhighlight> This is not quite as fast as the Nim version or other languages whose back end is C as the LLVM-based back ends don't compile to quite the same optimization level for this algorithm than does GCC. {{out}} Line 2,014 ⟶ 3,121: As counting range is increased above these trivial ranges, a better algorithm such as that of LMO will likely perform much better than this and use much less memory (to proportional to the cube root of the range), although at the cost of greater code complexity and more lines of code (about 500 LOC). The trade-off between algorithms of the Legendre type and those of the Meissel type is that the latter decreases the time complexity but at the cost of more time spent sieving; modern follow-on work to LMO produces algorithms which are able to tune the balance between Legendre-type and Meissel-type algorithm in trading off the execution time costs between the different parts of the given algorithm for the best in performance, with the latest in Kim Walisch's tuning of Xavier Gourdon's work being about five to ten times faster than LMO (plus includes multi-threading abilities). =={{header\|Pascal}}== <syntaxhighlight lang="pascal"> // Rosetta Code task "Legendre prime counting function". // Solution for Free Pascal (Lazarus) or Delphi. program LegendrePrimeCount; {$IFDEF FPC} // Free Pascal {$MODE Delphi} {$ELSE} // Delphi {$APPTYPE CONSOLE} {$ENDIF} // Optimization needs to be on if the program is to finish in a reasonable // length of time. See "Comments on Task" on the Rosetta Code website. {$DEFINE SIMPLE_OPTIMIZATION} uses SysUtils, Types; {------------------------------------------------------------------- Function to return an array of primes up to the passed-in limit. Uses a straightforward Eratosthenes sieve. TIntegerDynArray must be 0-based. To be compatible with Rosetta Code, the first prime 2 is at result[1], and result[0] is not used. } function FindPrimes( limit : integer) : Types.TIntegerDynArray; var deleted : array of boolean; j, k, p, resultSize : integer; begin if (limit < 2) then begin SetLength( result, 1); exit; end; SetLength( deleted, limit + 1); // 0..limit deleted[0] := true; for j := 1 to limit do deleted[j] := false; p := 2; while (pp <= limit) do begin j := 2p; while (j <= limit) do begin deleted[j] := true; inc( j, p); end; repeat inc(p) until (p > limit) or (not deleted[p]); end; resultSize := 0; for j := 0 to limit do if not deleted[j] then inc( resultSize); SetLength( result, resultSize); k := 0; for j := 0 to limit do begin if not deleted[j] then begin result[k] := j; inc(k); end; end; end; {----------------------------------------------------------------------------- Function to count primes up to the passed-in limit, by Legendre's method. Iterative, using a stack. Each item in the stack is a term phi(x,a) along with a sign. If the top item on the stack can be evaluated easily, it is popped off and its value is added to the result. Else the top item is replaced by two items according to the formual in the task description. } function CountPrimes( n : integer) : integer; type TPhiTerm = record IsNeg : boolean; x : integer; a : integer; end; const STACK_SIZE = 100; // 10 is enough for n = 10^9 var primes : Types.TIntegerDynArray; nrPrimes : integer; stack : array [0..STACK_SIZE - 1] of TPhiTerm; sp : integer; // stack pointer, points to first free entry tos : TPhiTerm; // top of stack begin primes := FindPrimes( Trunc( Sqrt( n + 0.5))); nrPrimes := Length( primes) - 1; // primes[0] is not used result := nrPrimes - 1; // initialize total // Push initial entry onto stack with stack[0] do begin IsNeg := false; x := n; a := nrPrimes; end; sp := 1; while sp > 0 do begin tos := stack[sp - 1]; {$IFDEF SIMPLE_OPTIMIZATION} // Using optimization described in "Comments on Task" if tos.x = 0 then begin // top of stack = 0 dec(sp); // pop top of stack, no change to result end else if (tos.a > 0) and (tos.x < primes[tos.a]) then begin // top of stack = 1 dec( sp); // pop top of stack, update result if tos.IsNeg then dec( result) else inc( result); end else if tos.a = 0 then begin {$ELSE} // Using only the task description, i.e. only phi(x,0) = x if tos.a = 0 then begin {$ENDIF} dec( sp); // pop top of stack, update result if tos.IsNeg then dec( result, tos.x) else inc( result, tos.x); end else begin // Replace top of stack by two items as in the task description, // namely phi(x, a - 1) and -phi(x div primes[a], a - 1) if (sp >= STACK_SIZE) then raise SysUtils.Exception.Create( 'Legendre phi stack overflow'); with stack[sp - 1] do begin IsNeg := tos.isNeg; x := tos.x; a := tos.a - 1; end; with stack[sp] do begin IsNeg := not tos.IsNeg; x := tos.x div primes[tos.a]; a := tos.a - 1; end; inc(sp); end; end; end; {----------------------------------------------------------- Main routine } var power, limit, count : integer; begin WriteLn( 'Limit Count'); limit := 1; for power := 0 to 9 do begin if power > 0 then limit := 10limit; count := CountPrimes( limit); WriteLn( SysUtils.Format( '10^%d %10d', [power, count])) end; end. </syntaxhighlight> {{out}} <pre> Limit Count 10^0 0 10^1 4 10^2 25 10^3 168 10^4 1229 10^5 9592 10^6 78498 10^7 664579 10^8 5761455 10^9 50847534 </pre> =={{header\|Perl}}== Line 2,127 ⟶ 3,397: </pre> <small>(It is about 4 times slower under pwa/p2js so output is limited to 10^8, unless you like staring at a blank screen for 52s)</small> === Non-recursive partial sieve === <!--<syntaxhighlight lang="phix">(phixonline)--> <span style="color: #008080;">with</span> <span style="color: #008080;">javascript_semantics</span> <span style="color: #7060A8;">requires</span><span style="color: #0000FF;">(</span><span style="color: #008000;">"1.0.2"</span><span style="color: #0000FF;">)</span> <span style="color: #000080;font-style:italic;">-- (for in, tagstart)</span> <span style="color: #008080;">function</span> <span style="color: #000000;">half</span><span style="color: #0000FF;">(</span><span style="color: #004080;">integer</span> <span style="color: #000000;">n</span><span style="color: #0000FF;">)</span> <span style="color: #008080;">return</span> <span style="color: #7060A8;">floor</span><span style="color: #0000FF;">((</span><span style="color: #000000;">n</span><span style="color: #0000FF;">-</span><span style="color: #000000;">1</span><span style="color: #0000FF;">)/</span><span style="color: #000000;">2</span><span style="color: #0000FF;">)+</span><span style="color: #000000;">1</span> <span style="color: #008080;">end</span> <span style="color: #008080;">function</span> <span style="color: #000080;font-style:italic;">// convenience convert to idx</span> <span style="color: #008080;">function</span> <span style="color: #000000;">count_primes</span><span style="color: #0000FF;">(</span><span style="color: #004080;">atom</span> <span style="color: #000000;">n</span><span style="color: #0000FF;">)</span> <span style="color: #000080;font-style:italic;">// non-recursive Legendre prime counting function for a range `n`... // has O(n^(3/4)/((log n)^2)) time complexity; O(n^(1/2)) space complexity.</span> <span style="color: #008080;">if</span> <span style="color: #000000;">n</span><span style="color: #0000FF;"><</span><span style="color: #000000;">3</span> <span style="color: #008080;">then</span> <span style="color: #008080;">return</span> <span style="color: #7060A8;">iff</span><span style="color: #0000FF;">(</span><span style="color: #000000;">n</span><span style="color: #0000FF;"><</span><span style="color: #000000;">2</span><span style="color: #0000FF;">?</span><span style="color: #000000;">0</span><span style="color: #0000FF;">:</span><span style="color: #000000;">1</span><span style="color: #0000FF;">)</span> <span style="color: #008080;">end</span> <span style="color: #008080;">if</span> <span style="color: #000080;font-style:italic;">// can't odd sieve for n less than 3!</span> <span style="color: #004080;">integer</span> <span style="color: #000000;">sqrtn</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">trunc</span><span style="color: #0000FF;">(</span><span style="color: #7060A8;">sqrt</span><span style="color: #0000FF;">(</span><span style="color: #000000;">n</span><span style="color: #0000FF;">)),</span> <span style="color: #000080;font-style:italic;">// (actual limit)</span> <span style="color: #000000;">mxndx</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">floor</span><span style="color: #0000FF;">((</span><span style="color: #000000;">sqrtn</span><span style="color: #0000FF;">-</span><span style="color: #000000;">1</span><span style="color: #0000FF;">)/</span><span style="color: #000000;">2</span><span style="color: #0000FF;">)</span> <span style="color: #000080;font-style:italic;">// odds-only limit -- -- smalls is the current accumulated counts of odd primes 1 to sqrt(n), initialized -- to odds-only sieving, ie {0,1,2,3,4...} meaning 0 odd primes to 1, 1 o.p to 3,... -- -- roughs is the current odd k-rough numbers up to sqrt of range; k = 2 -- initialized to all odd positive numbers 1, 3, 5, 7, 9, 11, ... sqrt(n) -- -- larges is an array of current phi counts for the above roughs... except they are -- not strictly `phi`'s since they also include primes, to match `smalls` above! -- initialized for current roughs after accounting for the even prime of two... -- -- composite is a flag array representing odd numbers 1..sqrtn, for sieving. -- initialized false, meaning all positive odd numbers are potentially prime -- note that this array starts at (and keeps) 1 to match the algorithm even -- though 1 is not actually a prime, as 1 is important in computation of phi... --</span> <span style="color: #004080;">sequence</span> <span style="color: #000000;">smalls</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">tagset</span><span style="color: #0000FF;">(</span><span style="color: #000000;">mxndx</span><span style="color: #0000FF;">,</span><span style="color: #000000;">0</span><span style="color: #0000FF;">),</span> <span style="color: #000000;">roughs</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">tagstart</span><span style="color: #0000FF;">(</span><span style="color: #000000;">1</span><span style="color: #0000FF;">,</span><span style="color: #000000;">mxndx</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span><span style="color: #0000FF;">,</span><span style="color: #000000;">2</span><span style="color: #0000FF;">),</span> <span style="color: #000000;">larges</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">sq_floor_div</span><span style="color: #0000FF;">(</span><span style="color: #7060A8;">sq_sub</span><span style="color: #0000FF;">(</span><span style="color: #7060A8;">sq_div</span><span style="color: #0000FF;">(</span><span style="color: #000000;">n</span><span style="color: #0000FF;">,</span><span style="color: #000000;">roughs</span><span style="color: #0000FF;">),</span><span style="color: #000000;">1</span><span style="color: #0000FF;">),</span><span style="color: #000000;">2</span><span style="color: #0000FF;">),</span> <span style="color: #000000;">composite</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">repeat</span><span style="color: #0000FF;">(</span><span style="color: #004600;">false</span><span style="color: #0000FF;">,</span><span style="color: #000000;">mxndx</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span><span style="color: #0000FF;">)</span> <span style="color: #004080;">integer</span> <span style="color: #000000;">bp</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">3</span><span style="color: #0000FF;">,</span> <span style="color: #000080;font-style:italic;">// 'current' base prime</span> <span style="color: #000000;">nbp</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">0</span><span style="color: #0000FF;">,</span> <span style="color: #000080;font-style:italic;">// number of base primes found </span> <span style="color: #000000;">mxri</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">mxndx</span><span style="color: #0000FF;">,</span> <span style="color: #000080;font-style:italic;">// current highest used rough index</span> <span style="color: #000000;">i</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">2</span><span style="color: #0000FF;">,</span> <span style="color: #000000;">sqri</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">4</span> <span style="color: #000080;font-style:italic;">// index and square (index-1) limit // partial sieve loop, adjusting larges/smalls, compressing larges/roughs...</span> <span style="color: #008080;">while</span> <span style="color: #000000;">sqri</span><span style="color: #0000FF;"><=</span><span style="color: #000000;">mxndx</span> <span style="color: #008080;">do</span> <span style="color: #000080;font-style:italic;">// partial sieve to square index limit</span> <span style="color: #008080;">if</span> <span style="color: #008080;">not</span> <span style="color: #000000;">composite</span><span style="color: #0000FF;">[</span><span style="color: #000000;">i</span><span style="color: #0000FF;">]</span> <span style="color: #008080;">then</span> <span style="color: #000080;font-style:italic;">// cull from composite so they will never be found again</span> <span style="color: #000000;">composite</span><span style="color: #0000FF;">[</span><span style="color: #000000;">i</span><span style="color: #0000FF;">]</span> <span style="color: #0000FF;">=</span> <span style="color: #004600;">true</span> <span style="color: #000080;font-style:italic;">// cull bp and multiples</span> <span style="color: #008080;">for</span> <span style="color: #000000;">c</span><span style="color: #0000FF;">=</span><span style="color: #000000;">sqri</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span> <span style="color: #008080;">to</span> <span style="color: #000000;">mxndx</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span> <span style="color: #008080;">by</span> <span style="color: #000000;">bp</span> <span style="color: #008080;">do</span> <span style="color: #000000;">composite</span><span style="color: #0000FF;">[</span><span style="color: #000000;">c</span><span style="color: #0000FF;">]</span> <span style="color: #0000FF;">=</span> <span style="color: #004600;">true</span> <span style="color: #008080;">end</span> <span style="color: #008080;">for</span> <span style="color: #000080;font-style:italic;">// partial sieving to current base prime is now completed! // now adjust `larges` for latest partial sieve pass...</span> <span style="color: #004080;">integer</span> <span style="color: #000000;">ori</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">0</span> <span style="color: #000080;font-style:italic;">// compress input rough index(k) to output one</span> <span style="color: #008080;">for</span> <span style="color: #000000;">k</span><span style="color: #0000FF;">,</span><span style="color: #000000;">q</span> <span style="color: #008080;">in</span> <span style="color: #000000;">roughs</span> <span style="color: #008080;">to</span> <span style="color: #000000;">mxri</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span> <span style="color: #008080;">do</span> <span style="color: #000080;font-style:italic;">// q is not necessarily prime but may be a product of primes not yet // culled by partial sieving (saves ops cmprd to recursive Legendre) // skip over values of `q` already culled in the last partial sieve:</span> <span style="color: #004080;">integer</span> <span style="color: #000000;">qi</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">floor</span><span style="color: #0000FF;">(</span><span style="color: #000000;">q</span><span style="color: #0000FF;">/</span><span style="color: #000000;">2</span><span style="color: #0000FF;">)+</span><span style="color: #000000;">1</span><span style="color: #0000FF;">;</span> <span style="color: #000080;font-style:italic;">// index of always odd q!</span> <span style="color: #008080;">if</span> <span style="color: #008080;">not</span> <span style="color: #000000;">composite</span><span style="color: #0000FF;">[</span><span style="color: #000000;">qi</span><span style="color: #0000FF;">]</span> <span style="color: #008080;">then</span> <span style="color: #000080;font-style:italic;">// since `q` cannot be equal to bp due to cull of bp and above skip;</span> <span style="color: #004080;">atom</span> <span style="color: #000000;">d</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">bp</span><span style="color: #0000FF;"></span><span style="color: #000000;">q</span><span style="color: #0000FF;">,</span> <span style="color: #000080;font-style:italic;">// `d` is odd product of some combination of odd primes! // the following computation is essential to the algorithm's speed, // see the Nim entry for the full details of how this works</span> <span style="color: #000000;">dadj</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">iff</span><span style="color: #0000FF;">(</span><span style="color: #000000;">d</span><span style="color: #0000FF;"><=</span><span style="color: #000000;">sqrtn</span> <span style="color: #0000FF;">?</span> <span style="color: #000000;">larges</span><span style="color: #0000FF;">[</span><span style="color: #000000;">smalls</span><span style="color: #0000FF;">[</span><span style="color: #000000;">half</span><span style="color: #0000FF;">(</span><span style="color: #000000;">d</span><span style="color: #0000FF;">)]-</span><span style="color: #000000;">nbp</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span><span style="color: #0000FF;">]</span> <span style="color: #0000FF;">:</span> <span style="color: #000000;">smalls</span><span style="color: #0000FF;">[</span><span style="color: #000000;">half</span><span style="color: #0000FF;">(</span><span style="color: #7060A8;">floor</span><span style="color: #0000FF;">(</span><span style="color: #000000;">n</span><span style="color: #0000FF;">/</span><span style="color: #000000;">d</span><span style="color: #0000FF;">))])</span> <span style="color: #000000;">ori</span> <span style="color: #0000FF;">+=</span> <span style="color: #000000;">1</span> <span style="color: #000000;">larges</span><span style="color: #0000FF;">[</span><span style="color: #000000;">ori</span><span style="color: #0000FF;">]</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">larges</span><span style="color: #0000FF;">[</span><span style="color: #000000;">k</span><span style="color: #0000FF;">]-</span><span style="color: #000000;">dadj</span><span style="color: #0000FF;">+</span><span style="color: #000000;">nbp</span> <span style="color: #000080;font-style:italic;">// base primes count over subtracted! // eliminate rough values that have been culled in partial sieve: // note that `larges` and `roughs` indices relate to each other!</span> <span style="color: #000000;">roughs</span><span style="color: #0000FF;">[</span><span style="color: #000000;">ori</span><span style="color: #0000FF;">]</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">q</span> <span style="color: #008080;">end</span> <span style="color: #008080;">if</span> <span style="color: #008080;">end</span> <span style="color: #008080;">for</span> <span style="color: #004080;">integer</span> <span style="color: #000000;">m</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">mxndx</span> <span style="color: #000080;font-style:italic;">// and adjust `smalls` for latest partial sieve pass... // this is faster than recounting over the `composite` array for each loop...</span> <span style="color: #008080;">for</span> <span style="color: #000000;">k</span><span style="color: #0000FF;">=(</span><span style="color: #000000;">sqrtn</span><span style="color: #0000FF;">/</span><span style="color: #000000;">bp</span><span style="color: #0000FF;">-</span><span style="color: #000000;">1</span><span style="color: #0000FF;">)\|\|</span><span style="color: #000000;">1</span> <span style="color: #008080;">to</span> <span style="color: #000000;">bp</span> <span style="color: #008080;">by</span> <span style="color: #0000FF;">-</span><span style="color: #000000;">2</span> <span style="color: #008080;">do</span> <span style="color: #000080;font-style:italic;">// k always odd! // `c` is correction from current count to desired count... // `e` is end limit index no correction is necessary for current cull...</span> <span style="color: #004080;">integer</span> <span style="color: #000000;">c</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">smalls</span><span style="color: #0000FF;">[</span><span style="color: #000000;">half</span><span style="color: #0000FF;">(</span><span style="color: #000000;">k</span><span style="color: #0000FF;">)]-</span><span style="color: #000000;">nbp</span><span style="color: #0000FF;">,</span> <span style="color: #000000;">e</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">floor</span><span style="color: #0000FF;">((</span><span style="color: #000000;">k</span><span style="color: #0000FF;"></span><span style="color: #000000;">bp</span><span style="color: #0000FF;">)/</span><span style="color: #000000;">2</span><span style="color: #0000FF;">)</span> <span style="color: #008080;">while</span> <span style="color: #000000;">m</span><span style="color: #0000FF;">>=</span><span style="color: #000000;">e</span> <span style="color: #008080;">do</span> <span style="color: #000080;font-style:italic;">-- smalls[m+1] -= c -- (grr, js! [I have a plan, working on it])</span> <span style="color: #000000;">m</span> <span style="color: #0000FF;">+=</span> <span style="color: #000000;">1</span> <span style="color: #000000;">smalls</span><span style="color: #0000FF;">[</span><span style="color: #000000;">m</span><span style="color: #0000FF;">]</span> <span style="color: #0000FF;">-=</span> <span style="color: #000000;">c</span> <span style="color: #000080;font-style:italic;">-- m -= 1</span> <span style="color: #000000;">m</span> <span style="color: #0000FF;">-=</span> <span style="color: #000000;">2</span> <span style="color: #008080;">end</span> <span style="color: #008080;">while</span> <span style="color: #008080;">end</span> <span style="color: #008080;">for</span> <span style="color: #000000;">nbp</span> <span style="color: #0000FF;">+=</span> <span style="color: #000000;">1</span> <span style="color: #000080;font-style:italic;">// increase number of found base primes</span> <span style="color: #000000;">mxri</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">ori</span><span style="color: #0000FF;">-</span><span style="color: #000000;">1</span> <span style="color: #000080;font-style:italic;">// advance rough index for later</span> <span style="color: #008080;">end</span> <span style="color: #008080;">if</span> <span style="color: #000000;">bp</span> <span style="color: #0000FF;">+=</span> <span style="color: #000000;">2</span> <span style="color: #000000;">sqri</span> <span style="color: #0000FF;">=</span> <span style="color: #0000FF;">(</span><span style="color: #000000;">i</span><span style="color: #0000FF;">+</span><span style="color: #000000;">i</span><span style="color: #0000FF;">)(</span><span style="color: #000000;">i</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span><span style="color: #0000FF;">)</span> <span style="color: #000000;">i</span> <span style="color: #0000FF;">+=</span> <span style="color: #000000;">1</span> <span style="color: #008080;">end</span> <span style="color: #008080;">while</span> <span style="color: #000080;font-style:italic;">// now `smalls` is a LUT of odd prime accumulated counts for all odd primes; // `roughs` is exactly the "k-roughs" up to the sqrt of range with `k` (erm, // mxri?) the index of the next prime above the quad root of the range; // `larges` is the partial prime counts for each of the `roughs` values... // note that `larges` values include the count of the odd base primes!!! // - and `composite` is never used again! // the following does the top-most "phi tree" calculation: // the answer to here is all valid `phis`, combined here by subtraction, // + compensate for included odd base prime counts over subracted above:</span> <span style="color: #004080;">atom</span> <span style="color: #000000;">result</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">larges</span><span style="color: #0000FF;">[</span><span style="color: #000000;">1</span><span style="color: #0000FF;">]</span> <span style="color: #0000FF;">-</span> <span style="color: #7060A8;">sum</span><span style="color: #0000FF;">(</span><span style="color: #000000;">larges</span><span style="color: #0000FF;">[</span><span style="color: #000000;">2</span><span style="color: #0000FF;">..</span><span style="color: #000000;">mxri</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span><span style="color: #0000FF;">])</span> <span style="color: #0000FF;">+</span> <span style="color: #7060A8;">trunc</span><span style="color: #0000FF;">((</span><span style="color: #000000;">mxri</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span> <span style="color: #0000FF;">+</span> <span style="color: #000000;">2</span><span style="color: #0000FF;">(</span><span style="color: #000000;">nbp</span><span style="color: #0000FF;">-</span><span style="color: #000000;">1</span><span style="color: #0000FF;">))</span><span style="color: #000000;">mxri</span><span style="color: #0000FF;">/</span><span style="color: #000000;">2</span><span style="color: #0000FF;">)</span> <span style="color: #0000FF;">+</span> <span style="color: #000000;">1</span> <span style="color: #000080;font-style:italic;">// include the only even prime, ie 2 // This loop adds the counts due to the products of the `roughs` primes, // of which we only use two different ones at a time, as all the // combinations with lower primes than the cube root of the range have // already been computed and included with the previous major loop... // see text description in the Nim entry for how this works...</span> <span style="color: #008080;">for</span> <span style="color: #000000;">ri</span><span style="color: #0000FF;">,</span><span style="color: #000000;">p</span> <span style="color: #008080;">in</span> <span style="color: #000000;">roughs</span> <span style="color: #008080;">from</span> <span style="color: #000000;">2</span> <span style="color: #008080;">do</span> <span style="color: #000080;font-style:italic;">// for all `roughs` (now prime) bar '1':</span> <span style="color: #004080;">atom</span> <span style="color: #000000;">m</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">trunc</span><span style="color: #0000FF;">(</span><span style="color: #000000;">n</span><span style="color: #0000FF;">/</span><span style="color: #000000;">p</span><span style="color: #0000FF;">),</span> <span style="color: #000080;font-style:italic;">// `m` is the `p` quotient // so that the end limit `e` can be calculated based on `n`/(`p`^2)</span> <span style="color: #000000;">e</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">smalls</span><span style="color: #0000FF;">[</span><span style="color: #000000;">half</span><span style="color: #0000FF;">(</span><span style="color: #7060A8;">floor</span><span style="color: #0000FF;">(</span><span style="color: #000000;">m</span><span style="color: #0000FF;">/</span><span style="color: #000000;">p</span><span style="color: #0000FF;">))+</span><span style="color: #000000;">1</span><span style="color: #0000FF;">]-</span><span style="color: #000000;">nbp</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span> <span style="color: #000080;font-style:italic;">// the following test is equivalent to non-splitting optmization:</span> <span style="color: #008080;">if</span> <span style="color: #000000;">e</span><span style="color: #0000FF;"><=</span><span style="color: #000000;">ri</span> <span style="color: #008080;">then</span> <span style="color: #008080;">exit</span> <span style="color: #008080;">end</span> <span style="color: #008080;">if</span> <span style="color: #000080;font-style:italic;">// quit when no more pairs! - aka stop // at about `p` of cube root of range!</span> <span style="color: #008080;">for</span> <span style="color: #000000;">k</span><span style="color: #0000FF;">=</span><span style="color: #000000;">ri</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span> <span style="color: #008080;">to</span> <span style="color: #000000;">e</span> <span style="color: #008080;">do</span> <span style="color: #000080;font-style:italic;">// for all `roughs` greater than `p` to limit:</span> <span style="color: #000000;">result</span> <span style="color: #0000FF;">+=</span> <span style="color: #000000;">smalls</span><span style="color: #0000FF;">[</span><span style="color: #000000;">half</span><span style="color: #0000FF;">(</span><span style="color: #7060A8;">floor</span><span style="color: #0000FF;">(</span><span style="color: #000000;">m</span><span style="color: #0000FF;">/</span><span style="color: #000000;">roughs</span><span style="color: #0000FF;">[</span><span style="color: #000000;">k</span><span style="color: #0000FF;">]))];</span> <span style="color: #008080;">end</span> <span style="color: #008080;">for</span> <span style="color: #000080;font-style:italic;">// compensate for all the extra base prime counts just added!</span> <span style="color: #000000;">result</span> <span style="color: #0000FF;">-=</span> <span style="color: #0000FF;">(</span><span style="color: #000000;">e</span><span style="color: #0000FF;">-</span><span style="color: #000000;">ri</span><span style="color: #0000FF;">)(</span><span style="color: #000000;">nbp</span><span style="color: #0000FF;">+</span><span style="color: #000000;">ri</span><span style="color: #0000FF;">-</span><span style="color: #000000;">2</span><span style="color: #0000FF;">)</span> <span style="color: #008080;">end</span> <span style="color: #008080;">for</span> <span style="color: #008080;">return</span> <span style="color: #000000;">result</span> <span style="color: #008080;">end</span> <span style="color: #008080;">function</span> <span style="color: #004080;">atom</span> <span style="color: #000000;">t</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">time</span><span style="color: #0000FF;">()</span> <span style="color: #008080;">constant</span> <span style="color: #000000;">expected</span> <span style="color: #0000FF;">=</span> <span style="color: #0000FF;">{</span><span style="color: #000000;">0</span><span style="color: #0000FF;">,</span><span style="color: #000000;">4</span><span style="color: #0000FF;">,</span><span style="color: #000000;">25</span><span style="color: #0000FF;">,</span><span style="color: #000000;">168</span><span style="color: #0000FF;">,</span><span style="color: #000000;">1229</span><span style="color: #0000FF;">,</span><span style="color: #000000;">9592</span><span style="color: #0000FF;">,</span><span style="color: #000000;">78498</span><span style="color: #0000FF;">,</span><span style="color: #000000;">664579</span><span style="color: #0000FF;">,</span><span style="color: #000000;">5761455</span><span style="color: #0000FF;">,</span> <span style="color: #000000;">50847534</span><span style="color: #0000FF;">,</span><span style="color: #000000;">455052511</span><span style="color: #0000FF;">,</span><span style="color: #000000;">4118054813</span><span style="color: #0000FF;">,</span><span style="color: #000000;">37607912018</span><span style="color: #0000FF;">,</span> <span style="color: #000000;">346065536839</span><span style="color: #0000FF;">,</span><span style="color: #000000;">3204941750802</span><span style="color: #0000FF;">}</span> <span style="color: #008080;">for</span> <span style="color: #000000;">i</span><span style="color: #0000FF;">=</span><span style="color: #000000;">0</span> <span style="color: #008080;">to</span> <span style="color: #7060A8;">iff</span><span style="color: #0000FF;">(</span><span style="color: #7060A8;">platform</span><span style="color: #0000FF;">()=</span><span style="color: #004600;">JS</span><span style="color: #0000FF;">?</span><span style="color: #000000;">11</span><span style="color: #0000FF;">:</span><span style="color: #000000;">14</span><span style="color: #0000FF;">)</span> <span style="color: #008080;">do</span> <span style="color: #000080;font-style:italic;">-- (sp: keep js under 2s)</span> <span style="color: #004080;">atom</span> <span style="color: #000000;">c</span> <span style="color: #0000FF;">=</span> <span style="color: #000000;">count_primes</span><span style="color: #0000FF;">(</span><span style="color: #7060A8;">power</span><span style="color: #0000FF;">(</span><span style="color: #000000;">10</span><span style="color: #0000FF;">,</span><span style="color: #000000;">i</span><span style="color: #0000FF;">))</span> <span style="color: #7060A8;">assert</span><span style="color: #0000FF;">(</span><span style="color: #000000;">c</span><span style="color: #0000FF;">==</span><span style="color: #000000;">expected</span><span style="color: #0000FF;">[</span><span style="color: #000000;">i</span><span style="color: #0000FF;">+</span><span style="color: #000000;">1</span><span style="color: #0000FF;">])</span> <span style="color: #004080;">string</span> <span style="color: #000000;">e</span> <span style="color: #0000FF;">=</span> <span style="color: #7060A8;">elapsed</span><span style="color: #0000FF;">(</span><span style="color: #7060A8;">time</span><span style="color: #0000FF;">()-</span><span style="color: #000000;">t</span><span style="color: #0000FF;">,</span><span style="color: #000000;">0.1</span><span style="color: #0000FF;">,</span><span style="color: #008000;">" (%s)"</span><span style="color: #0000FF;">)</span> <span style="color: #7060A8;">printf</span><span style="color: #0000FF;">(</span><span style="color: #000000;">1</span><span style="color: #0000FF;">,</span><span style="color: #008000;">"10^%d = %d%s\n"</span><span style="color: #0000FF;">,{</span><span style="color: #000000;">i</span><span style="color: #0000FF;">,</span><span style="color: #000000;">c</span><span style="color: #0000FF;">,</span><span style="color: #000000;">e</span><span style="color: #0000FF;">})</span> <span style="color: #008080;">end</span> <span style="color: #008080;">for</span> <span style="color: #7060A8;">printf</span><span style="color: #0000FF;">(</span><span style="color: #000000;">1</span><span style="color: #0000FF;">,</span><span style="color: #008000;">"\nTook %s\n"</span><span style="color: #0000FF;">,</span><span style="color: #7060A8;">elapsed</span><span style="color: #0000FF;">(</span><span style="color: #7060A8;">time</span><span style="color: #0000FF;">()-</span><span style="color: #000000;">t</span><span style="color: #0000FF;">))</span> <!--</syntaxhighlight>--> {{out}} <pre> 10^0 = 0 10^1 = 4 10^2 = 25 10^3 = 168 10^4 = 1229 10^5 = 9592 10^6 = 78498 10^7 = 664579 10^8 = 5761455 10^9 = 50847534 10^10 = 455052511 (0.3s) 10^11 = 4118054813 (1.7s) 10^12 = 37607912018 (7.9s) 10^13 = 346065536839 (40.8s) 10^14 = 3204941750802 (3 minutes and 44s) Took 3 minutes and 44s </pre> About 15 times slower than Julia on the same box (gulp, earmarked for further investigation in 2.0.0).<br> [At the last minute, I nicked the idea of using a simple bool array instead of those bit-fields from Julia.]<br> A copy of this code [up to 1e9] has also found it's way into tests\t68forin.exw =={{header\|Picat}}== Line 2,265 ⟶ 3,698: </pre> =={{header\|Ruby}}== {{trans\|Wren}} <syntaxhighlight lang="ruby">require 'prime' def pi(n) @pr = Prime.each(Integer.sqrt(n)).to_a a = @pr.size case n when 0,1 then 0 when 2 then 1 else phi(n,a) + a - 1 end end def phi(x,a) case a when 0 then x when 1 then x-(x>>1) else pa = @pr[a-1] return 1 if x <= pa phi(x, a-1)- phi(x/pa, a-1) end end (0..9).each {\|n\| puts "10E#{n} #{pi(10n)}" } </syntaxhighlight> {{out}} <pre>10E0 0 10E1 4 10E2 25 10E3 168 10E4 1229 10E5 9592 10E6 78498 10E7 664579 10E8 5761455 10E9 50847534 </pre> =={{header\|Sidef}}== <syntaxhighlight lang="ruby">func legendre_phi(x, a) is cached { Line 2,465 ⟶ 3,937: [inline] fn half(n ~~int~~u64) ~~int~~i64 { return i64((n - 1) >>> 1) } // convenience function! [inline] // floating point divide faster than integer divide! fn divide(nm u64, d u64) ~~int~~u64 { return ~~int~~u64(f64(nm) / f64(d)) } [direct_array_access] fn count_primes_to(n u64) i64 { if n < u64(39) { return if n < i64(2) { i64(0) } else { i64((n + 1) / 2) } } rtlmt := ~~int~~u64(sqrt(f64(n))) mxndx := i64((rtlmt - 1) / 2) arrlen := int(mxndx + 1) mut smalls := []u32{ len: arrlen, cap: arrlen, init: u32(it) } mut roughs := []u32{ len: arrlen, cap: arrlen, init: u32(it + it + 1) } mut larges := []i64{ len: arrlen, cap: arrlen, init: i64(((n / u64(it + it + 1) - 1) / 2)) } cullbuflen := int((mxndx + 8) / 8) mut cullbuf := []u8{len: cullbuflen, cap: cullbuflen, init: u8(0)} mut nbps := i64(0) // do partial sieving for each odd base prime to quad root... mut rilmt := arrlen // number of roughs start with full size! for i := i64(1); ; i++ { // start with 3; breaks when partial sieving done... sqri := (i + i) (i + 1) if sqri > mxndx { break } // breaks here! if (cullbuf[i >>> 3] & masks[i & 7]) != u8(0) { continue } // not prime! cullbuf[i >>> 3] \|= masks[i & 7] // cull bp rep! bp := u64(i + i + 1) // partial sieve by bp... for c := sqri; c < arrlen; c += i64(bp) { cullbuf[c >>> 3] \|= masks[c & 7] } mut nri := 0 // transfer from `ori` to `nri` indexes: for ori in 0 .. rilmt { // update `roughs` and `larges` for partial sieve... qr := ~~int(~~roughs[ori]) pirci := qi64(r >>> 1) // skip recently culled in last partial sieve... if (cullbuf[pirci >>> 3] & masks[pirci & 7]) != u8(0) { continue } d := qu64(r) * u64(bp) larges[nri] = larges[ori] - (if d <= rtlmt { larges[~~int~~i64(smalls[d >>> 1]) - nbps] } else { i64(smalls[half(divide(n, ~~u64(~~d)))]) }) + ~~i64(~~nbps) // adjust for over subtraction of base primes! roughs[nri] = ~~u32(q)~~r // compress for culled `larges` and `roughs`! nri++ // advance output `roughs` index! } Line 2,508 ⟶ 3,980: mut si := mxndx // update `smalls` for partial sieve... for pm := ((rtlmt / bp) - 1) \| 1; pm >= bp; pm -= 2 { c := smalls[pm >>> 1] e := (pm * bp) >>> 1 for ; si >= e; si-- { smalls[si] -= (c - u32(nbps)) } } Line 2,525 ⟶ 3,997: p := u64(roughs[ri]) m := n / p ei := int(smalls[half(~~int~~u64(m / p))]) - nbps if ei <= ri { break } // break out when only multiple equal to `p` ans -= i64((ei - ri) * (nbps + ri - 1)) // adjust for over addition below! Line 2,555 ⟶ 4,027: This took 2 milliseconds.</pre> The above code is about as fast as the same algorithm in the fastest of languages such as C/C++/Nim due to the greatly reduced computational complexity of O(n(3/4)/((log n)2)); it can compute the number of primes to 1e11 in about 22 milliseconds on the same machine as shown where it is run on an Intel i5-6500 (3.6 GHz single-thread boosted). The above code can ~~find~~compute the number of primes to ~~a trillion (1e12)~~1e16 in about a ~~hundred milliseconds~~minute, ~~but~~although ~~has~~there is a ~~segmentation~~precision/accuracy ~~fault~~problem for ~~values~~counting ~~much~~ranges ~~larger~~above ~~than~~about ~~that~~9e15 ~~for~~due ~~unknown reasons, as~~to the ~~code~~speed-up ~~has~~optimization ~~been~~of ~~translated~~using ~~reasonably~~floating ~~faithfully~~point ~~from~~division ~~Nim~~operations ~~and~~(precise ~~Crystal, perhaps due~~only to ~~limitations~~53-bits, inwhich ~~the~~is ~~size~~about ofthis ~~objects that the default garbage collection can handle~~limit). =={{header\|Wren}}== Line 2,563 ⟶ 4,035: To sieve a billion numbers and then count the primes up to 10^k would take about 53 seconds in Wren so, as expected, the Legendre method represents a considerable speed up. <syntaxhighlight lang="~~ecmascript~~wren">import "./math" for Int var pi = Fn.new { \|n\| Line 2,607 ⟶ 4,079: The memoized version requires a cache of around 6.5 million map entries, which at 8 bytes each (all numbers are 64 bit floats in Wren) for both the key and the value, equates in round figures to memory usage of 104 MB on top of that needed for the prime sieve. The following version strips out memoization and, whilst somewhat slower at 5.4 seconds, may be preferred in a constrained memory environment. <syntaxhighlight lang="~~ecmascript~~wren">import "./math" for Int var pi = Fn.new { \|n\| Line 2,638 ⟶ 4,110: {{trans\|Vlang}} This non-memoized, non-recursive version is far quicker than the first two versions, running in about 114 milliseconds. Nowhere near as quick as V, of course, but acceptable for Wren which is interpreted and only has one built-in numeric type, a 64 bit float. <syntaxhighlight lang="~~ecmascript~~wren">import "./math" for Int var masks = [1, 2, 4, 8, 16, 32, 64, 128] Line 2,645 ⟶ 4,117: var countPrimes = Fn.new { \|n\| if (n < 39) return (n < 2) ? 0 : ((n + 1)/2).floor var rtlmt = n.sqrt.floor var mxndx = Int.quo(rtlmt - 1, 2) Line 2,678 ⟶ 4,150: var nri = 0 for (ori in 0...rilmt) { var qr = roughs[ori] var pirci = qr >> 1 if ((cullbuf[pirci >> 3] & masks[pirci & 7]) != 0) continue var d = qr * bp var t = (d <= rtlmt) ? larges[smalls[d >> 1] - nbps] : smalls[half.call(Int.quo(n, d))] larges[nri] = larges[ori] - t + nbps roughs[nri] = qr nri = nri + 1 }