summaryrefslogtreecommitdiff
path: root/proc/primes.c
diff options
context:
space:
mode:
authorMichael I. Bushnell <mib@gnu.org>1994-08-30 21:14:11 +0000
committerMichael I. Bushnell <mib@gnu.org>1994-08-30 21:14:11 +0000
commit02fcc25495b92d66f94cfce341daeed59de670a1 (patch)
tree0947213d442add66cf0c65f3308a31037972ba57 /proc/primes.c
parentce43e3758068cfe34ab2b50b595fe43146664ac4 (diff)
Formerly primes.c.~11~
Diffstat (limited to 'proc/primes.c')
-rw-r--r--proc/primes.c211
1 files changed, 92 insertions, 119 deletions
diff --git a/proc/primes.c b/proc/primes.c
index 8ba433d6..7284f244 100644
--- a/proc/primes.c
+++ b/proc/primes.c
@@ -16,143 +16,116 @@
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */
#include <stdlib.h>
+#include <limits.h>
#include <string.h>
#include <assert.h>
+#define BITS_PER_UNSIGNED (8 * sizeof (unsigned))
+#define SQRT_INT_MAX (1 << (BITS_PER_UNSIGNED / 2))
+
/* Return the next prime greater than or equal to N. */
int
-nextprime (int n)
+nextprime (unsigned n)
{
- static int *q;
- static int k = 2;
- static int l = 2;
- int p;
- int *m;
- int i, j;
-
- /* See the comment at the end for an explanation of the algorithm
- used. */
-
- if (!q)
+ /* Among other things, We guarantee that, for all i (0 <= i < primes_len),
+ primes[i] is a prime,
+ next_multiple[i] is a multiple of primes[i],
+ next_multiple[i] > primes[primes_len - 1],
+ next_multiple[i] is not a multiple of two unless primes[i] == 2, and
+ next_multiple[i] is the smallest such value. */
+ static unsigned *primes, *next_multiple;
+ static int primes_len;
+ static int primes_size;
+ static unsigned next_sieve; /* always even */
+ unsigned max_prime;
+
+ if (! primes)
{
- /* Init */
- q = malloc (sizeof (int) * 2);
- q[0] = 2;
- q[1] = 3;
+ primes_size = 128;
+ primes = (unsigned *) malloc (primes_size * sizeof (*primes));
+ next_multiple = (unsigned *) malloc (primes_size
+ * sizeof (*next_multiple));
+
+ primes[0] = 2; next_multiple[0] = 6;
+ primes[1] = 3; next_multiple[1] = 9;
+ primes[2] = 5; next_multiple[2] = 15;
+ primes_len = 3;
+
+ next_sieve = primes[primes_len - 1] + 1;
}
- if (n <= q[0])
- return q[0];
+ if (n <= primes[0])
+ return primes[0];
- while (n > q[l - 1])
+ while (n > (max_prime = primes[primes_len - 1]))
{
- /* Grow */
+ /* primes doesn't contain any prime large enough. Sieve from
+ max_prime + 1 to 2 * max_prime, looking for more primes. */
+ unsigned start = next_sieve;
+ unsigned end = start + max_prime + 1;
+ char *sieve = (char *) alloca ((end - start) * sizeof (*sieve));
+ int i;
- /* Alloc */
- p = q[l-1] * q[l-1];
- m = calloc (p, sizeof (int));
- assert (m);
+ assert (sieve);
- /* Sieve */
- for (i = 0; i < l; i++)
- for (j = q[i] * 2; j < p; j += q[i])
- m[j] = 1;
+ bzero (sieve, (end - start) * sizeof (*sieve));
- /* Copy */
- for (i = q[l-1] + 1; i < p; i++)
+ /* ANSI C doesn't define what this means. Fuck you. */
+ sieve -= start;
+
+ /* Set sieve[i] for all composites i, start <= i < end.
+ Ignore multiples of 2. */
+ for (i = 1; i < primes_len; i++)
{
- if (l == k)
- {
- q = realloc (q, k * sizeof (int) * 2);
- assert (q);
- k *= 2;
- }
- if (!m[i])
- q[l++] = i;
+ unsigned twice_prime = 2 * primes[i];
+ unsigned multiple;
+
+ for (multiple = next_multiple[i];
+ multiple < end;
+ multiple += twice_prime)
+ sieve[multiple] = 1;
+ next_multiple[i] = multiple;
}
- free (m);
+ for (i = start + 1; i < end; i += 2)
+ if (! sieve[i])
+ {
+ if (primes_len >= primes_size)
+ {
+ primes_size *= 2;
+ primes = (int *) realloc (primes,
+ primes_size * sizeof (*primes));
+ next_multiple
+ = (int *) realloc (next_multiple,
+ primes_size * sizeof (*next_multiple));
+ }
+ primes[primes_len] = i;
+ if (i >= SQRT_INT_MAX)
+ next_multiple[primes_len] = INT_MAX;
+ else
+ next_multiple[primes_len] = i * i;
+ primes_len++;
+ }
+
+ next_sieve = end;
}
-
- /* Search */
- i = 0;
- j = l - 1;
- p = j / 2;
- while (q[p - 1] >= n || q[p] < n)
- {
- if (n > q[p])
- i = p + 1;
- else
- j = p - 1;
- p = ((j - i) / 2) + i;
- }
-
- return q[p];
+ /* Now we have at least one prime >= n. Find the smallest such. */
+ {
+ int bottom = 0;
+ int top = primes_len;
+
+ while (bottom < top)
+ {
+ int mid = (bottom + top) / 2;
+
+ if (primes[mid] < n)
+ bottom = mid + 1;
+ else
+ top = mid;
+ }
+
+ return primes[top];
+ }
}
-/* [This code originally contained the comment "You are not expected
-to understand this" (on the theory that every Unix-like system should
-have such a comment somewhere, and now I have to find somewhere else
-to put it). I then offered this function as a challenge to Jim
-Blandy (jimb@totoro.bio.indiana.edu). At that time only the six
-comments in the function and the description at the top were present.
-Jim produced the following brilliant explanation.
-
- -mib]
-
-
-The static variable q points to a sorted array of the first l natural
-prime numbers. k is the number of elements which have been allocated
-to q, l <= k; we occasionally double k and realloc q accordingly to
-maintain this invariant.
-
-The table is initialized to contain a few primes (lines 26, 27,
-34-40). Subsequent code assumes the table isn't empty.
-
-When passed a number n, we grow q until it contains a prime >= n
-(lines 45--70), do a binary search in q to find the least prime >= n
-(lines 72--84), and return that.
-
-We grow q using a "sieve of Eratosthenes" procedure. Let p be the
-largest prime we've yet found, q[l-1]. We allocate a boolean array m
-of p^2 elements, and initialize all its elements to false. (Upon
-completion, m[j] will be false iff j is a prime.) For each number
-q[i] in q, we set all m[j] to true, where j is a multiple of q[i], and
-j is a valid index in m. Once this is done, since every number j (p <
-j < p^2) is either prime, or has a prime factor not greater than p,
-m[j] will be false iff j is prime. We scan m for false elements, and
-add their indices to q.
-
-As an optimization, we take advantage of the fact that 2 is the first
-prime. But essentially, the code works as described above.
-
-Why is m's size chosen as it is? Note that the sieve only guarantees
-to mark multiples of the numbers in q. Given that q contains all the
-prime numbers from 2 to p, we can safely sieve for prime numbers
-between 2 and p^2, because any composite number in that range must
-have a prime factor not greater than its square root, and thus not
-greater than p; q already contains all such primes. I suppose we
-could trust the sieve a bit farther ahead, but I'm not sure we could
-go very far at all.
-
-
-Possible bug: if there is no prime j such that p < j <= p^2, then the
-growth loop will add no primes to q, and thus never exit. Is there
-any guarantee that there will be such a j? I thought that people had
-found proofs that the average density of primes was logarithmic in
-their size, or something like that, but no guarantees. Perhaps there
-is no bug, and this is the part I am not expected to understand; oh,
-well.
-
-
-[I don't know if this is a bug or not. The proofs of the density of
-primes only deal with average long-term density, and there might be
-stretches where prims thin out to the point that this algorithm fails.
-However, it can only compute primes up to maxint (because ints are
-used as indexes into the array M in the seive step). It's certainly
-the case that no such thinning out happens before 2^32, so we're safe.
-And since this function is only used to size process tables, I don't
-think it will ever get that far even. -mib]
-
-*/