diff options
author | Michael I. Bushnell <mib@gnu.org> | 1994-08-30 21:14:11 +0000 |
---|---|---|
committer | Michael I. Bushnell <mib@gnu.org> | 1994-08-30 21:14:11 +0000 |
commit | 02fcc25495b92d66f94cfce341daeed59de670a1 (patch) | |
tree | 0947213d442add66cf0c65f3308a31037972ba57 | |
parent | ce43e3758068cfe34ab2b50b595fe43146664ac4 (diff) |
Formerly primes.c.~11~
-rw-r--r-- | proc/primes.c | 211 |
1 files changed, 92 insertions, 119 deletions
diff --git a/proc/primes.c b/proc/primes.c index 8ba433d6..7284f244 100644 --- a/proc/primes.c +++ b/proc/primes.c @@ -16,143 +16,116 @@ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */ #include <stdlib.h> +#include <limits.h> #include <string.h> #include <assert.h> +#define BITS_PER_UNSIGNED (8 * sizeof (unsigned)) +#define SQRT_INT_MAX (1 << (BITS_PER_UNSIGNED / 2)) + /* Return the next prime greater than or equal to N. */ int -nextprime (int n) +nextprime (unsigned n) { - static int *q; - static int k = 2; - static int l = 2; - int p; - int *m; - int i, j; - - /* See the comment at the end for an explanation of the algorithm - used. */ - - if (!q) + /* Among other things, We guarantee that, for all i (0 <= i < primes_len), + primes[i] is a prime, + next_multiple[i] is a multiple of primes[i], + next_multiple[i] > primes[primes_len - 1], + next_multiple[i] is not a multiple of two unless primes[i] == 2, and + next_multiple[i] is the smallest such value. */ + static unsigned *primes, *next_multiple; + static int primes_len; + static int primes_size; + static unsigned next_sieve; /* always even */ + unsigned max_prime; + + if (! primes) { - /* Init */ - q = malloc (sizeof (int) * 2); - q[0] = 2; - q[1] = 3; + primes_size = 128; + primes = (unsigned *) malloc (primes_size * sizeof (*primes)); + next_multiple = (unsigned *) malloc (primes_size + * sizeof (*next_multiple)); + + primes[0] = 2; next_multiple[0] = 6; + primes[1] = 3; next_multiple[1] = 9; + primes[2] = 5; next_multiple[2] = 15; + primes_len = 3; + + next_sieve = primes[primes_len - 1] + 1; } - if (n <= q[0]) - return q[0]; + if (n <= primes[0]) + return primes[0]; - while (n > q[l - 1]) + while (n > (max_prime = primes[primes_len - 1])) { - /* Grow */ + /* primes doesn't contain any prime large enough. Sieve from + max_prime + 1 to 2 * max_prime, looking for more primes. */ + unsigned start = next_sieve; + unsigned end = start + max_prime + 1; + char *sieve = (char *) alloca ((end - start) * sizeof (*sieve)); + int i; - /* Alloc */ - p = q[l-1] * q[l-1]; - m = calloc (p, sizeof (int)); - assert (m); + assert (sieve); - /* Sieve */ - for (i = 0; i < l; i++) - for (j = q[i] * 2; j < p; j += q[i]) - m[j] = 1; + bzero (sieve, (end - start) * sizeof (*sieve)); - /* Copy */ - for (i = q[l-1] + 1; i < p; i++) + /* ANSI C doesn't define what this means. Fuck you. */ + sieve -= start; + + /* Set sieve[i] for all composites i, start <= i < end. + Ignore multiples of 2. */ + for (i = 1; i < primes_len; i++) { - if (l == k) - { - q = realloc (q, k * sizeof (int) * 2); - assert (q); - k *= 2; - } - if (!m[i]) - q[l++] = i; + unsigned twice_prime = 2 * primes[i]; + unsigned multiple; + + for (multiple = next_multiple[i]; + multiple < end; + multiple += twice_prime) + sieve[multiple] = 1; + next_multiple[i] = multiple; } - free (m); + for (i = start + 1; i < end; i += 2) + if (! sieve[i]) + { + if (primes_len >= primes_size) + { + primes_size *= 2; + primes = (int *) realloc (primes, + primes_size * sizeof (*primes)); + next_multiple + = (int *) realloc (next_multiple, + primes_size * sizeof (*next_multiple)); + } + primes[primes_len] = i; + if (i >= SQRT_INT_MAX) + next_multiple[primes_len] = INT_MAX; + else + next_multiple[primes_len] = i * i; + primes_len++; + } + + next_sieve = end; } - - /* Search */ - i = 0; - j = l - 1; - p = j / 2; - while (q[p - 1] >= n || q[p] < n) - { - if (n > q[p]) - i = p + 1; - else - j = p - 1; - p = ((j - i) / 2) + i; - } - - return q[p]; + /* Now we have at least one prime >= n. Find the smallest such. */ + { + int bottom = 0; + int top = primes_len; + + while (bottom < top) + { + int mid = (bottom + top) / 2; + + if (primes[mid] < n) + bottom = mid + 1; + else + top = mid; + } + + return primes[top]; + } } -/* [This code originally contained the comment "You are not expected -to understand this" (on the theory that every Unix-like system should -have such a comment somewhere, and now I have to find somewhere else -to put it). I then offered this function as a challenge to Jim -Blandy (jimb@totoro.bio.indiana.edu). At that time only the six -comments in the function and the description at the top were present. -Jim produced the following brilliant explanation. - - -mib] - - -The static variable q points to a sorted array of the first l natural -prime numbers. k is the number of elements which have been allocated -to q, l <= k; we occasionally double k and realloc q accordingly to -maintain this invariant. - -The table is initialized to contain a few primes (lines 26, 27, -34-40). Subsequent code assumes the table isn't empty. - -When passed a number n, we grow q until it contains a prime >= n -(lines 45--70), do a binary search in q to find the least prime >= n -(lines 72--84), and return that. - -We grow q using a "sieve of Eratosthenes" procedure. Let p be the -largest prime we've yet found, q[l-1]. We allocate a boolean array m -of p^2 elements, and initialize all its elements to false. (Upon -completion, m[j] will be false iff j is a prime.) For each number -q[i] in q, we set all m[j] to true, where j is a multiple of q[i], and -j is a valid index in m. Once this is done, since every number j (p < -j < p^2) is either prime, or has a prime factor not greater than p, -m[j] will be false iff j is prime. We scan m for false elements, and -add their indices to q. - -As an optimization, we take advantage of the fact that 2 is the first -prime. But essentially, the code works as described above. - -Why is m's size chosen as it is? Note that the sieve only guarantees -to mark multiples of the numbers in q. Given that q contains all the -prime numbers from 2 to p, we can safely sieve for prime numbers -between 2 and p^2, because any composite number in that range must -have a prime factor not greater than its square root, and thus not -greater than p; q already contains all such primes. I suppose we -could trust the sieve a bit farther ahead, but I'm not sure we could -go very far at all. - - -Possible bug: if there is no prime j such that p < j <= p^2, then the -growth loop will add no primes to q, and thus never exit. Is there -any guarantee that there will be such a j? I thought that people had -found proofs that the average density of primes was logarithmic in -their size, or something like that, but no guarantees. Perhaps there -is no bug, and this is the part I am not expected to understand; oh, -well. - - -[I don't know if this is a bug or not. The proofs of the density of -primes only deal with average long-term density, and there might be -stretches where prims thin out to the point that this algorithm fails. -However, it can only compute primes up to maxint (because ints are -used as indexes into the array M in the seive step). It's certainly -the case that no such thinning out happens before 2^32, so we're safe. -And since this function is only used to size process tables, I don't -think it will ever get that far even. -mib] - -*/ |