# Chapter 11 : Sieve of Eratosthenes

In [1]:
# Sieve of Eratosthenes
def sieve(n):
    """Run the Sieve of Eratosthenes up to and including n.

    Args:
        n: upper bound (inclusive) of the range to classify.

    Returns:
        A list ``is_prime`` of length ``n + 1`` in which ``is_prime[k]`` is
        True exactly when k is prime. For ``n < 0`` the list is empty.
    """
    is_prime = [True] * (n + 1)
    # 0 and 1 are not prime; the slice form also works when the list has
    # fewer than two entries (n < 1), where direct indexing would fail.
    is_prime[:2] = [False] * min(2, len(is_prime))

    i = 2
    while i * i <= n:
        if is_prime[i]:
            # i is prime: mark every later multiple as composite.
            # Multiples below i * i were already marked by smaller primes.
            for k in range(i * i, n + 1, i):
                is_prime[k] = False
        i += 1
    return is_prime

In [2]:
# Collect every index that the sieve flags as prime.
primes = [number for number, is_prime in enumerate(sieve(20)) if is_prime]
print(primes)

[2, 3, 5, 7, 11, 13, 17, 19]


연산의 복잡도는 다음과 같다.

$$ \frac n2 + \frac n3 + \frac n5 + \cdots = \sum_{p_j \le \sqrt{n}} \frac n {p_j} = n \cdot \sum_{p_j \le \sqrt{n}} \frac 1 {p_j} $$

$\sqrt{n}$ 이하 소수들의 역수의 합 $\sum \frac{1}{p_j}$ 은 $O(\log \log n)$ 이므로 총 복잡도는 $O(n\log \log n)$이다.

## 11.1. Factorization

숫자를 나누는 최소 소수를 찾아보자.

In [3]:
# Preparing the array F for factorization.

def arrayF(n):
    """Build the smallest-prime-factor table used for factorization.

    Returns a list ``table`` of length ``n + 1`` where ``table[k]`` is the
    smallest prime dividing k when k is composite, and 0 otherwise
    (k is prime, or k < 2).
    """
    table = [0] * (n + 1)
    base = 2
    while base * base <= n:
        # An entry still at 0 here means no smaller prime divides base.
        if table[base] == 0:
            for multiple in range(base * base, n + 1, base):
                # Keep the first (smallest) prime recorded for a multiple.
                if table[multiple] == 0:
                    table[multiple] = base
        base += 1
    return table

In [10]:
F = arrayF(36)
F

[0,
 0,
 0,
 0,
 2,
 0,
 2,
 0,
 2,
 3,
 2,
 0,
 2,
 0,
 2,
 3,
 2,
 0,
 2,
 0,
 2,
 3,
 2,
 0,
 2,
 5,
 2,
 3,
 2,
 0,
 2,
 0,
 2,
 3,
 2,
 5,
 2]

In [11]:
# Factorization of x

def factorization(x, F):
    """Decompose x into prime factors using a smallest-prime-factor table.

    Args:
        x: the integer to factorize; ``F[x]`` must be a valid lookup.
        F: lookup such that ``F[k]`` is a prime factor of k when k is
            composite and 0 otherwise, e.g. the list returned by arrayF.

    Returns:
        The list of factors in the order they were divided out. If
        ``F[x]`` is 0 from the start (x is prime, or x < 2 with an arrayF
        table) the result is ``[x]``.
    """
    primeFactors = []
    while F[x] > 0:
        primeFactors.append(F[x])
        # Exact integer division: true division would round through a
        # float and give a wrong quotient for very large x.
        x //= F[x]
    # Whatever remains has no recorded factor, so it is the last factor.
    primeFactors.append(x)
    return primeFactors

In [12]:
factorization(36, F)

[2, 2, 3, 3]

# CountNonDivisible

You are given an array A consisting of N integers.

For each number A[i] such that 0 ≤ i < N, we want to count the number of elements of the array that are not the divisors of A[i]. We say that these elements are non-divisors.

For example, consider integer N = 5 and array A such that:

    A[0] = 3
    A[1] = 1
    A[2] = 2
    A[3] = 3
    A[4] = 6

For the following elements:

* A[0] = 3, the non-divisors are: 2, 6,
* A[1] = 1, the non-divisors are: 3, 2, 3, 6,
* A[2] = 2, the non-divisors are: 3, 3, 6,
* A[3] = 3, the non-divisors are: 2, 6,
* A[4] = 6, there aren't any non-divisors.

Write a function:

    def solution(A)

that, given an array A consisting of N integers, returns a sequence of integers representing the amount of non-divisors.

Result array should be returned as an array of integers.

For example, given:

    A[0] = 3
    A[1] = 1
    A[2] = 2
    A[3] = 3
    A[4] = 6
the function should return [2, 4, 3, 2, 0], as explained above.

Write an efficient algorithm for the following assumptions:

* N is an integer within the range [1..50,000];
* each element of array A is an integer within the range [1..2 * N].

In [13]:
A = [3,1,2,3,6]

초딩 풀이 간다

In [24]:
def solution(A):
    """Count, for each element of A, the other elements that do not divide it.

    Brute force: every ordered pair of positions is checked, so the running
    time is quadratic in ``len(A)``.
    """
    ans = []
    for idx, value in enumerate(A):
        non_divisors = sum(
            1
            for other_idx, candidate in enumerate(A)
            if other_idx != idx and value % candidate != 0
        )
        ans.append(non_divisors)
    return ans

In [25]:
solution(A)

[2, 4, 3, 2, 0]

https://app.codility.com/demo/results/trainingUYVK59-9Z8/

55점 $O(N^2)$

In [57]:
M = max(A) + 1
unique_values = set(A)
d = {}
for a in unique_values:
    # Keep the distinct values of A that are not divisors of a.
    # NOTE(review): divisors() must already exist in the session; here it
    # is only visible as a helper nested inside a later solution().
    d[a] = unique_values.difference(divisors(a))

In [58]:
d

{1: {2, 3, 6}, 2: {3, 6}, 3: {2, 6}, 6: set()}

In [56]:
from collections import Counter
# Map each distinct value of A to the number of times it occurs.
c = Counter(A)
c

Counter({3: 2, 1: 1, 2: 1, 6: 1})

In [62]:
# For each distinct value, add up the occurrence counts of its non-divisors.
sol = {}
for key, item in d.items():
    sol[key] = sum(c[j] for j in item)

sol

{1: 4, 2: 3, 3: 2, 6: 0}

In [14]:
A

[3, 1, 2, 3, 6]

In [65]:
def solution(A):
    """Count, for each element of A, the elements that do not divide it.

    Each distinct value is processed once: its divisors are enumerated by
    trial division, the occurrences of those divisors in A are summed, and
    the remainder of ``len(A)`` is the number of non-divisors.

    Args:
        A: list of positive integers.

    Returns:
        A list aligned with A holding the non-divisor count of each element.
        An empty input yields an empty list.
    """
    from collections import Counter

    def divisors(n):
        """Return the set of all positive divisors of n."""
        found = set()
        i = 1
        while i * i <= n:
            if n % i == 0:
                # Divisors come in pairs (i, n // i); the set collapses the
                # pair into one entry when n is a perfect square.
                found.add(i)
                found.add(n // i)
            i += 1
        return found

    total = len(A)
    occurrences = Counter(A)

    # A Counter returns 0 for absent keys, so divisors that never occur in A
    # contribute nothing to the sum.
    non_divisors = {
        value: total - sum(occurrences[div] for div in divisors(value))
        for value in occurrences
    }
    return [non_divisors[a] for a in A]

https://app.codility.com/demo/results/trainingGVSGFP-6BN/

66점

In [68]:
A

[3, 1, 2, 3, 6]

In [88]:
def solution(A):
    """Count non-divisors of each element of A with an occurrence table.

    The table has ``2 * len(A) + 1`` slots, so every element must be usable
    as an index into it. The table is printed before the answers are
    computed.
    """
    import math

    n = len(A)
    cnt = [0] * (2 * n + 1)
    for value in A:
        cnt[value] += 1
    print(cnt)

    ans = []
    for value in A:
        limit = math.floor(math.sqrt(value))
        divisor_hits = 0
        for small in range(1, limit + 1):
            quotient, remainder = divmod(value, small)
            if remainder:
                continue
            divisor_hits += cnt[small]
            # Add the paired divisor unless it is the square root itself.
            if quotient != small:
                divisor_hits += cnt[quotient]
        ans.append(n - divisor_hits)
    return ans

In [89]:
solution(A)

[0, 1, 1, 2, 0, 0, 1, 0, 0, 0, 0]


[2, 4, 3, 2, 0]

https://app.codility.com/demo/results/training4UCAMG-949/

77점...

In [90]:
def solution(A):
    """Count non-divisors of each element of A with an occurrence table.

    Divisors are found by trial division using integer arithmetic only.
    The table has ``2 * len(A) + 1`` slots, so every element must be usable
    as an index into it.
    """
    import math

    n = len(A)
    cnt = [0] * (2 * n + 1)
    for value in A:
        cnt[value] += 1

    ans = []
    for value in A:
        matched = 0
        candidate = 1
        # Below the square root every divisor has a distinct partner.
        while candidate * candidate < value:
            if value % candidate == 0:
                matched += cnt[candidate]
                matched += cnt[value // candidate]
            candidate += 1
        # An exact square root is its own partner and is counted once.
        if candidate * candidate == value:
            matched += cnt[candidate]
        ans.append(n - matched)
    return ans

In [91]:
solution(A)

[0, 1, 1, 2, 0, 0, 1, 0, 0, 0, 0]


[2, 4, 3, 2, 0]

https://app.codility.com/demo/results/trainingCBZW86-7ZH/

77점... 오히려 위보다 더 오래 걸린다

In [93]:
from collections import Counter
# Map each distinct value of A to the number of times it occurs.
c = Counter(A)
c

Counter({3: 2, 1: 1, 2: 1, 6: 1})

In [97]:
def solution(A):
    """Count non-divisors of each element of A with an occurrence table.

    Occurrences are tallied with a Counter and copied into a list of
    ``2 * len(A) + 1`` slots, so every element must be usable as an index
    into it.
    """
    import math
    from collections import Counter

    n = len(A)
    cnt = [0] * (2 * n + 1)
    for value, times in Counter(A).items():
        cnt[value] = times

    def divisor_occurrences(value):
        """Sum the occurrences in A of every divisor of value."""
        found = 0
        for small in range(1, math.floor(math.sqrt(value)) + 1):
            if value % small:
                continue
            found += cnt[small]
            partner = value // small
            if partner != small:
                found += cnt[partner]
        return found

    return [n - divisor_occurrences(value) for value in A]

In [96]:
solution(A)

[2, 4, 3, 2, 0]

이것도 77점

In [100]:
def solution(A):
    """Count non-divisors of each element of A, computing each value once.

    An occurrence table of ``2 * len(A) + 1`` slots is built first, so every
    element must be usable as an index into it. The divisor total of a value
    is cached so repeated elements are not recomputed.
    """
    import math

    n = len(A)
    cnt = [0] * (2 * n + 1)
    for value in A:
        cnt[value] += 1

    # value -> summed occurrences of its divisors, filled on first sight.
    divisor_total = {}

    ans = []
    for value in A:
        if value not in divisor_total:
            running = 0
            for small in range(1, math.floor(math.sqrt(value)) + 1):
                if value % small != 0:
                    continue
                running += cnt[small]
                if small * small != value:
                    running += cnt[value // small]
            divisor_total[value] = running
        ans.append(n - divisor_total[value])
    return ans

In [99]:
solution(A)

[2, 4, 3, 2, 0]

https://app.codility.com/demo/results/trainingM345EC-EW5/

100점 $O(N \log N)$

# CountSemiprimes

A prime is a positive integer X that has exactly two distinct divisors: 1 and X. The first few prime integers are 2, 3, 5, 7, 11 and 13.

A semiprime is a natural number that is the product of two (not necessarily distinct) prime numbers. The first few semiprimes are 4, 6, 9, 10, 14, 15, 21, 22, 25, 26.

You are given two non-empty arrays P and Q, each consisting of M integers. These arrays represent queries about the number of semiprimes within specified ranges.

Query K requires you to find the number of semiprimes within the range (P[K], Q[K]), where 1 ≤ P[K] ≤ Q[K] ≤ N.

For example, consider an integer N = 26 and arrays P, Q such that:

    P[0] = 1    Q[0] = 26
    P[1] = 4    Q[1] = 10
    P[2] = 16   Q[2] = 20
The number of semiprimes within each of these ranges is as follows:

* (1, 26) is 10,
* (4, 10) is 4,
* (16, 20) is 0.

Write a function:

    def solution(N, P, Q)

that, given an integer N and two non-empty arrays P and Q consisting of M integers, returns an array consisting of M elements specifying the consecutive answers to all the queries.

For example, given an integer N = 26 and arrays P, Q such that:

    P[0] = 1    Q[0] = 26
    P[1] = 4    Q[1] = 10
    P[2] = 16   Q[2] = 20
    
the function should return the values [10, 4, 0], as explained above.

Write an efficient algorithm for the following assumptions:

* N is an integer within the range [1..50,000];
* M is an integer within the range [1..30,000];
* each element of arrays P, Q is an integer within the range [1..N];
* P[i] ≤ Q[i].

In [60]:
P = [1,4,16]
Q = [26,10,20]

In [61]:
m = min(P)
M = max(Q)

In [62]:
F = arrayF(M + 1)
d = {}
for i in range(m, M + 1):
    # Flag i when its factorization has exactly two entries.
    d[i] = len(factorization(i, F)) == 2

In [63]:
def solution(N, P, Q):
    """Count the semiprimes inside each query range [P[k], Q[k]].

    Every number from ``min(P)`` to N is classified once; each query then
    scans its own range, so the cost grows with the total length of the
    queried ranges.
    """
    lowest = min(P)
    F = arrayF(N + 1)

    # number -> True when its factorization has exactly two entries.
    is_semiprime = {}
    for number in range(lowest, N + 1):
        is_semiprime[number] = len(factorization(number, F)) == 2

    ans = []
    for k, start in enumerate(P):
        stop = Q[k]
        ans.append(
            sum(1 for number in range(start, stop + 1) if is_semiprime[number])
        )
    return ans

In [65]:
solution(26,P,Q)

[10, 4, 0]

https://app.codility.com/demo/results/trainingVAA433-3JK/

66점

In [66]:
def solution(N, P, Q):
    """Count the semiprimes inside each query range [P[k], Q[k]].

    A smallest-prime-factor table classifies every number once, a prefix-sum
    array turns the classification into cumulative counts, and each query is
    then answered with one subtraction.

    Args:
        N: upper bound of the values that may be queried.
        P: lower bounds of the queries (each at least 1).
        Q: upper bounds of the queries, aligned with P.

    Returns:
        A list with the number of semiprimes in [P[k], Q[k]] for every k.
        Empty query lists yield an empty list.
    """

    def smallest_prime_factors(n):
        """Return a table with the smallest prime factor of each composite k <= n (0 otherwise)."""
        table = [0] * (n + 1)
        i = 2
        while i * i <= n:
            if table[i] == 0:
                for k in range(i * i, n + 1, i):
                    if table[k] == 0:
                        table[k] = i
            i += 1
        return table

    # Cover N and also the largest bound actually queried, so a query that
    # slightly exceeds N is still answered instead of failing on the table.
    limit = max(N, max(Q, default=0))
    F = smallest_prime_factors(limit)

    # prefix[k] = number of semiprimes in 1..k.
    prefix = [0] * (limit + 1)
    for value in range(2, limit + 1):
        p = F[value]
        # value is a semiprime when it is composite (p != 0) and the cofactor
        # left after dividing out its smallest prime is itself prime.
        is_semiprime = p != 0 and F[value // p] == 0
        prefix[value] = prefix[value - 1] + (1 if is_semiprime else 0)

    return [prefix[high] - prefix[low - 1] for low, high in zip(P, Q)]

In [67]:
solution(28, P,Q)

[0, 0, 0, 0, 1, 1, 2, 2, 2, 3, 4, 4, 4, 4, 5, 6, 6, 6, 6, 6, 6, 7, 8, 8, 8, 9, 10, 10, 10, 10, 10]


[10, 4, 0]

https://app.codility.com/demo/results/training54S88P-G7T/

100점 $O(N \log \log N + M)$