## Arora-Ge Attack on LWE Demonstration

### 0. Dependencies and Directories

In [1]:
# Set root directory
import os

# Raw string literal: in an ordinary literal "\C" and "\A" are invalid escape
# sequences, which newer Python versions warn about at compile time.
# NOTE(review): this is a machine-specific absolute path -- adjust it to the
# location of your own checkout before running the notebook.
ROOT_DIR = r"D:\Coding\CZ4010\Applied-Cryptography-Project"
os.chdir(ROOT_DIR)

In [2]:
import numpy as np
from math import comb
from pprint import pprint

from LWE_PKC import LWE_Encrypt, LWE_Decrypt
from utils import ascii_to_binary_list, binary_list_to_ascii

### 1. Testing out the Cryptosystem

We will encrypt a binary encoded message.

In [3]:
# Encode message with binary bits
# ascii_to_binary_list is imported from the project's utils module; the cell
# output shows its result printed as a flat list of 0/1 values.
message_ascii = "My username is RahulG1309."
message_binary = ascii_to_binary_list(message_ascii)

# Show the plaintext next to its bit encoding
print(f"Message: {message_ascii}")
print(f"\nEncoded: {message_binary}")

Message: My username is RahulG1309.

Encoded: [0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0]


In [4]:
# LWE Parameters
# n, q and max_error are forwarded unchanged to LWE_Decrypt below.
# NOTE(review): presumably n is the secret length and q the modulus -- confirm
# against the LWE_PKC module.
n = 10
q = 9377
max_error = 1

# If we have sufficient samples we can recover the secret.
# m is passed to LWE_Decrypt as list_size.
m = 500

# Initialize PKC with parameters
lwe_d = LWE_Decrypt(n=n, q=q, max_error=max_error, list_size=m)

In [5]:
# Public Keys
# get_public_keys() is unpacked into four values; note that q and max_error
# are rebound here to whatever the object returns.
A_list, T_list, q, max_error = lwe_d.get_public_keys()

# Pretty-print both public arrays
print("A_list:")
pprint(A_list)

print("\nT_list:")
pprint(T_list)

A_list:
array([[4851, 5436, 6800, ..., 6227,  547, 4864],
       [3637, 6079, 7541, ..., 6107, 3884,  770],
       [7749, 1269, 4726, ..., 6340, 5638, 8528],
       ...,
       [7256, 6210,  966, ..., 4150,  267, 5202],
       [8771,  641, 4783, ..., 4444, 8705, 7559],
       [3342, 5475, 5505, ..., 2377, 6434,  704]])

T_list:
array([5690, 3734, 3005,  651, 9303, 5730, 8784, 8821,  317, 2599, 3306,
       3886, 1157, 9359, 1635,  352, 6256, 6453, 8987, 2623, 7849, 4900,
       6185, 1276, 8884, 5059, 7609, 1385, 8801, 5883, 6269, 5913, 4274,
       1394, 2109, 2778, 1091, 5800, 2150, 7542, 5241, 2963, 3075,  648,
       5129, 2102, 3833, 5244, 5102, 8066, 5348, 7680, 7500, 5247,  715,
       5845, 1700,  238, 4379, 7622, 4638, 4251, 6747, 2398, 3038, 2619,
       2472, 7474, 4576, 1042, 6383, 7810, 8450, 1422, 5859, 7361, 2781,
       7374,  964,  370, 5309,   95, 5884, 6449, 8396, 6833, 6559, 1890,
       6621, 7731, 1078, 8613, 1003, 6533, 5028, 3603, 5930, 8903, 7841,
       8760, 

In [6]:
# Encrypt Message
# The encryptor is constructed from the public values only.
lwe_e = LWE_Encrypt(A_list, T_list, q, max_error)
# encrypt_message returns two values for the bit list; both are later handed
# to lwe_d.decrypt_message.
A_new, T_send = lwe_e.encrypt_message(message_binary)

# Wrap in np.array so pprint shows an abbreviated array repr
print("A_new:")
pprint(np.array(A_new))

print("\nT_send:")
pprint(np.array(T_send))

A_new:
array([[8367, 1574, 8373, ..., 8160,   84, 3435],
       [1558, 6009, 3294, ..., 5937, 2112,  757],
       [6970, 3781, 4980, ..., 3266, 5011, 6740],
       ...,
       [8877, 1123, 3488, ..., 4636, 6551, 7614],
       [1394, 2081, 8765, ..., 3795, 7052, 3311],
       [9243, 4173, 7464, ..., 3258,  711, 3614]], dtype=int32)

T_send:
array([2998,  856, 4387, 5015, 4792, 6703, 7568, 1334, 1786, 1798,  778,
       7135, 4815, 1129, 3605, 9127, 6315, 8419, 5878, 5632, 5517, 7349,
       4957, 2028, 2842,  398, 1608, 5084, 6249, 7482,  577, 3736,  650,
       5844,  945, 6179, 8995, 4604, 7603, 3004, 4107, 7808, 1994, 8909,
        987, 2117, 4569, 9240, 4016, 6514, 5744, 5025, 5343, 9256, 2330,
       4650, 7426,  311, 8149, 7612, 7578, 3253, 1899, 5902,  494, 2595,
       7222, 2593, 1679, 7011, 6440, 8743, 6781,  712, 7805, 7441, 8411,
       6002, 5752, 5046, 7225, 4484, 7131,  970, 3495,  865, 7924, 7845,
       7883, 5082, 5495, 2490, 8468, 8933, 7706, 5482,   98,  522,  191,
 

In [7]:
# Decrypt Message
# Recover the bit list with the private-key holder, then decode it to text.
decrypted_message_binary = lwe_d.decrypt_message(A_new, T_send)
decrypted_message_ascii = binary_list_to_ascii(decrypted_message_binary)
print(f"Decrypted Message: {decrypted_message_binary}")
print(f"\nDecoded: {decrypted_message_ascii}")

# Sanity check: the round trip must reproduce the original plaintext, so a
# failed decryption is caught here instead of relying on reading the output.
assert decrypted_message_ascii == message_ascii, "Decryption did not reproduce the original message"

Decrypted Message: [0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0]

Decoded: My username is RahulG1309.


### 2. Arora-Ge Algebraic Attack

In LWE, the errors are drawn from a finite set. This makes it possible to
attack LWE and recover the secret key from the public samples alone.
Arora and Ge (Princeton) proposed an attack in 2011 that exploits this property,
using algebraic methods to recover the secret.

<b>References,</b>
<br> `https://users.cs.duke.edu/~rongge/LPSN.pdf`
<br> `https://eprint.iacr.org/2014/1018.pdf`
<br> `https://people.csail.mit.edu/vinodv/CS294/lecture2.pdf`

Suppose the error distribution is truncated and takes values in the set $E = \{-T, \dots, -1, 0, 1, \dots, T\}$, so that $|E| = 2T + 1$, where $T = \text{max\_error}$.

We can recover the secret `s` from `A_list` and `b_list` if we have enough LWE samples <A, b>.

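Precisely, we require $m \geq \binom{n + |E|}{|E|} - 1$ LWE samples to solve the system of polynomials by linearization: each non-constant monomial of degree at most $|E|$ in the $n$ secret variables becomes one unknown of the linear system.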

In [8]:
# Set root directory
import os

# Raw string literal: in an ordinary literal "\C" and "\A" are invalid escape
# sequences, which newer Python versions warn about at compile time.
# NOTE(review): this is a machine-specific absolute path -- adjust it to the
# location of your own checkout before running the notebook.
ROOT_DIR = r"D:\Coding\CZ4010\Applied-Cryptography-Project"
os.chdir(ROOT_DIR)

In [9]:
import numpy as np
from math import comb
from pprint import pprint

from LWE_PKC import LWE_Encrypt, LWE_Decrypt
from utils import ascii_to_binary_list, binary_list_to_ascii

from itertools import product
from collections import defaultdict
from sympy import symbols, Matrix, GF, init_printing
from sympy.polys.matrices import DomainMatrix

In [10]:
# LWE Parameters
n = 10
q = 9377
max_error = 1

# If we have sufficient samples we can recover the secret.
# E is the size of the error set {-max_error, ..., max_error}; the linearized
# system has one unknown per non-constant monomial of degree <= E in n
# variables, i.e. comb(n+E, E) - 1 unknowns, so we request exactly that many
# samples. (A previous hard-coded `m = 300` was dead code: it was overwritten
# here before ever being used.)
E = 2*max_error + 1
m = comb(n+E, E) - 1

# Initialize PKC with parameters
lwe_d = LWE_Decrypt(n=n, q=q, max_error=max_error, list_size=m)

In [11]:
# The secret is randomly initialized in the class
# get_public_keys() is unpacked into four values; q and max_error are rebound
# here. lwe_d.secret is read only to display the ground truth that the attack
# is later compared against.
A_list, b_list, q, max_error = lwe_d.get_public_keys()
print(f"Randomly Initalized Secret: {lwe_d.secret}")

Randomly Initalized Secret: [3986, 681, 8889, 1999, 2878, 4885, 493, 52, 3658, 1668]


In [12]:
# Report the error-set size and how many samples are available versus the
# comb(n+E, E) - 1 needed; the ">=" is only printed text, it is not evaluated.
print(f"Cardinality of error set: {E}")
print(f"Number of LWE samples: {len(A_list)} >= {comb(n+E, E)-1}")

Cardinality of error set: 3
Number of LWE samples: 285 >= 285


In [13]:
# Define the secret vector
secret_vector = symbols(f'x1:{n+1}')
secret_vector

(x1, x2, x3, x4, x5, x6, x7, x8, x9, x10)

In [14]:
# Construct the polynomials for each LWE instance <A, b>
#
# For every sample we build  P(x) = prod_{e in error_set} (b - <A, x> - e)  over Zq.
# For a genuine sample b = <A, s> + e' with e' in error_set, the factor with
# e = e' is zero at x = s, so the secret is a common root of all polynomials.
polynomials_over_Zq = []
error_set = list(range(-max_error, max_error+1))

# The polynomial ring Zq[x1, ..., xn] is the same for every sample: build it once
polynomial_ring = GF(q)[secret_vector]

for A, b in zip(A_list, b_list):
    # Multiply each variable by its corresponding weight
    weighted_polynomial = sum(w * var for w, var in zip(A, secret_vector))

    # Construct the weighted polynomial (this is the AT*s term in the equation).
    # It does not depend on the error value e, so it is built once per sample
    # rather than once per (sample, error) pair.
    weighted_secret_polynomial_over_Zq = polynomial_ring(weighted_polynomial)

    # Initialize the running product to the identity polynomial of the ring
    polynomial_over_Zq = polynomial_ring(1)

    for e in error_set:
        # Complete the term (b - AT*s - e)
        term = b - weighted_secret_polynomial_over_Zq - e

        # Accumulate the product
        polynomial_over_Zq = polynomial_over_Zq * term

    polynomials_over_Zq.append(polynomial_over_Zq)

# Sanity check
assert len(polynomials_over_Zq) == len(A_list)

Now that we have the polynomials, let us solve them by linearization.

In [15]:
def generate_tuples(n, d):
    """
    Helper function that determines all tuples that represent the monomials in the polynomials constructed from an LWE sample.

    Each tuple holds the exponents of the n variables of one monomial; every
    tuple of non-negative integers of length n whose entries sum to at most d
    is returned, in lexicographic order (last entry varying fastest).

    The tuples are enumerated directly instead of filtering the full Cartesian
    product, so the work is proportional to the comb(n + d, d) results rather
    than to (d + 1) ** n candidates.

    Args:
        n: Number of variables (length of each tuple); must be >= 0.
        d: Maximum total degree. A negative d yields an empty list.

    Returns:
        A list of exponent tuples.

    Raises:
        ValueError: If n is negative.
    """
    if n < 0:
        raise ValueError("n must be non-negative")
    if d < 0:
        # No exponent tuple can have a negative total degree
        return []

    def _extend(prefix, variables_left, degree_left):
        # Depth-first enumeration: pick the next exponent, then recurse with
        # the remaining degree budget. Ascending exponents keep the output in
        # lexicographic order.
        if variables_left == 0:
            yield prefix
            return
        for exponent in range(degree_left + 1):
            yield from _extend(prefix + (exponent,), variables_left - 1, degree_left - exponent)

    return list(_extend((), n, d))

In [16]:
# One {exponent tuple -> coefficient} mapping per sample polynomial
coefficients_dicts = []
tuples = generate_tuples(n, E)

for polynomial in polynomials_over_Zq:
    # Start with an explicit zero for every monomial of degree <= E
    coefficients_dict = defaultdict(int, dict.fromkeys(tuples, 0))

    # Overwrite the entries that actually occur in the polynomial.
    # NOTE: coefficients are converted from field elements to plain ints here.
    coefficients_dict.update(
        (monomial, int(value)) for monomial, value in polynomial.terms()
    )

    coefficients_dicts.append(coefficients_dict)

In [17]:
# Degree-1 monomials x1, ..., xn go first (as unit exponent vectors), so the
# secret occupies the first n positions of the solution.
row_order = [
    tuple(1 if position == index else 0 for position in range(n))
    for index in range(n)
]

# The constant term is held back so that it can be placed at the very end
seen = set(row_order)
constant_term_key = (0,) * n
candidates = generate_tuples(n, E)

# All remaining non-constant monomials follow in generation order
row_order.extend(
    key for key in candidates
    if not (key in seen or key == constant_term_key)
)

# Constant term last
row_order.append(constant_term_key)

# Sanity check
assert len(row_order) == len(candidates)

In [18]:
# Build the linear system: one row per sample polynomial.
# Every key except the last in row_order is an unknown (a column of the
# matrix); the last key is the constant term, which moves to the right-hand
# side with its sign flipped.
unknown_keys = row_order[:-1]
constant_key = row_order[-1]

coefficient_matrix = [
    [coeff_dict[key] for key in unknown_keys]
    for coeff_dict in coefficients_dicts
]

rhs = [-coeff_dict[constant_key] for coeff_dict in coefficients_dicts]

Let us take a look at the matrices before solving them over the Zq domain.

In [19]:
# Solving linear system using DomainMatrix
# Dedicated names are used for the matrices so that the sample count `m` and
# the loop variable `b` from earlier cells are not silently rebound to Matrix
# objects.
lhs_matrix = Matrix(coefficient_matrix)
rhs_vector = Matrix(rhs)

# Convert matrices to finite field of order q (q is prime):
K = GF(q, symmetric=False)
dm = DomainMatrix.from_Matrix(lhs_matrix).convert_to(K)
bm = DomainMatrix.from_Matrix(rhs_vector).convert_to(K)

# Print shape of system of equations
print(dm.shape)
print(bm.shape)

# Solve and convert back to an ordinary Matrix:
solution_vector = dm.lu_solve(bm).to_Matrix()

(285, 285)
(285, 1)


In [20]:
# Show the true secret next to the attack result. The first n entries of the
# solution correspond to the degree-1 monomials x1..xn, because row_order
# places those keys first.
print(f"Randomly Initalized Secret:\t\t{lwe_d.secret}")
print(f"Secret obtained from Arora-Ge Attack:\t{solution_vector[:n]}")

Randomly Initalized Secret:		[3986, 681, 8889, 1999, 2878, 4885, 493, 52, 3658, 1668]
Secret obtained from Arora-Ge Attack:	[3986, 681, 8889, 1999, 2878, 4885, 493, 52, 3658, 1668]


In [21]:
# Compare the true secret with the first n entries of the solution using ==
# and print the result of that comparison.
print(f"Did we correctly determine the secret? \n{lwe_d.secret == solution_vector[:n]}")

Did we correctly determine the secret? 
True


The attack works well for `n <= 12` and `max_error = 1 or 2`. In practice, keep the number of samples `m <= 1000`; beyond that it takes a VERY long time to run and will most likely run out of memory too.


### Thank you!
