In [1]:
pip install -r ../../requirements.txt

You should consider upgrading via the '/usr/local/bin/python3 -m pip install --upgrade pip' command.[0m
Note: you may need to restart the kernel to use updated packages.


In [2]:
import ezkl
import torch
from torch import nn
import json
import os
import time
import scipy
import numpy as np
import matplotlib.pyplot as plt
import statistics
import math

In [3]:
# Run core.py inside this notebook's namespace (-i).
# presumably this is where the verifier_*/prover_* helpers called below come from — confirm against core.py
%run -i ../../zkstats/core.py

In [4]:
# init path
# 'shared/' holds the artifacts exchanged between both parties; 'prover/' holds
# files that stay on the prover side.
os.makedirs('shared', exist_ok=True)
os.makedirs('prover', exist_ok=True)

# Model definitions and their compiled forms.
verifier_model_path = 'shared/verifier.onnx'
prover_model_path = 'prover/prover.onnx'
verifier_compiled_model_path = 'shared/verifier.compiled'
prover_compiled_model_path = 'prover/prover.compiled'

# Keys, proof, settings and SRS.
pk_path = 'shared/test.pk'
vk_path = 'shared/test.vk'
proof_path = 'shared/test.pf'
settings_path = 'shared/settings.json'
srs_path = 'shared/kzg.srs'

witness_path = 'prover/witness.json'
# this is private to prover since it contains actual data
comb_data_path = 'prover/comb_data.json'

=======================  ZK-STATS FLOW =======================

Here, given data1 and data2, suppose a person requests mean(median(data1), median(data2)). We show that the code is composable enough to support this. Alternatively, the person could simply request median(data1) and median(data2) separately and then compute the mean on their own.

In [41]:
data_path1 = os.path.join('data1.json')
data_path2 = os.path.join('data2.json')
dummy_data_path1 = os.path.join('shared/dummy_data1.json')
dummy_data_path2 = os.path.join('shared/dummy_data2.json')

# Load the two real datasets. Each file is read inside a `with` block so the
# handle is closed as soon as the JSON has been parsed.
with open(data_path1, "r") as f_raw_input1:
    data1 = json.load(f_raw_input1)["input_data"][0]
data_tensor1 = torch.reshape(torch.tensor(data1),(1, len(data1), 1))
with open(data_path2, "r") as f_raw_input2:
    data2 = json.load(f_raw_input2)["input_data"][0]
data_tensor2 = torch.reshape(torch.tensor(data2),(1, len(data2), 1))

# Random dummy datasets with the same lengths as the real ones. They are
# written under shared/; closing the files explicitly guarantees the contents
# are flushed to disk before anything else reads them.
dummy_data1 = np.round(np.random.uniform(1,10,len(data1)),1)
with open(dummy_data_path1, 'w') as f_dummy1:
    json.dump({"input_data":[dummy_data1.tolist()]}, f_dummy1)
dummy_data2 = np.round(np.random.uniform(1,10,len(data2)),1)
with open(dummy_data_path2, 'w') as f_dummy2:
    json.dump({"input_data":[dummy_data2.tolist()]}, f_dummy2)


# Median of each dummy dataset plus the two sorted elements at indices
# len//2 - 1 and len//2, which are passed to median() as lower/upper.
dummy_sorted1 = np.sort(dummy_data1)
dummy_mid1 = len(dummy_data1) // 2
dummy_theory_output_median1 = torch.tensor(np.median(dummy_data1))
dummy_lower_to_median1 = torch.tensor(dummy_sorted1[dummy_mid1 - 1])
dummy_upper_to_median1 = torch.tensor(dummy_sorted1[dummy_mid1])

dummy_sorted2 = np.sort(dummy_data2)
dummy_mid2 = len(dummy_data2) // 2
dummy_theory_output_median2 = torch.tensor(np.median(dummy_data2))
dummy_lower_to_median2 = torch.tensor(dummy_sorted2[dummy_mid2 - 1])
dummy_upper_to_median2 = torch.tensor(dummy_sorted2[dummy_mid2])

print('median1: ', dummy_theory_output_median1)
print('median2: ', dummy_theory_output_median2)
# Mean of the two dummy medians: the value the composed computation should output.
dummy_theory_output_mean = torch.mean(torch.tensor([dummy_theory_output_median1, dummy_theory_output_median2]))
print("theory mean output: ", dummy_theory_output_mean)

median1:  tensor(5.6500, dtype=torch.float64)
median2:  tensor(5.5500, dtype=torch.float64)
theory mean output:  tensor(5.6000, dtype=torch.float64)


In [42]:
def median(X, median, lower, upper):
    """Check whether `median` is an acceptable median of the values in X.

    Values within 1% of each other are treated as equal. Two cases are handled:

    * Some element of X matches `median` (count_equal > 0): the claim is
      accepted when the number of elements below the median and the number
      of elements at-or-below it bracket the halfway point.
    * No element matches (count_equal == 0): `lower` and `upper` must both
      occur in X, exactly half_len elements must lie above `lower` and
      exactly half_len below `upper`, exactly half_len elements must lie
      below `median`, and `lower + upper` must equal `2 * median` within 2%.

    Args:
        X: data tensor; its length is read from X.size()[1].
        median: claimed median value.
        lower: claimed element just below the median (used when count_equal == 0).
        upper: claimed element just above the median (used when count_equal == 0).

    Returns:
        Tuple (boolean tensor saying whether the claim holds, median).

    NOTE(review): the 0.99 / 1.01 scaling appears to assume positive values;
    confirm that X and the claimed values are never negative.
    NOTE(review): the parameter `median` shadows this function's own name and
    the local `len` shadows the builtin inside this body.
    """
    # since within 1%, we regard as same value
    # Number of elements strictly below the 1% band around the claimed median.
    count_less = torch.sum((X < 0.99*median).double())
    # Number of elements inside the 1% band around the claimed median.
    count_equal = torch.sum((torch.abs(X-median)<=torch.abs(0.01*median)).double())
    # NOTE(review): torch.div/torch.floor are applied to this size value;
    # presumably that relies on sizes being tensors during ONNX tracing — confirm
    # whether this function is ever meant to run in eager mode.
    len = X.size()[1]
    half_len = torch.floor(torch.div(len, 2))
        
    # not support modulo yet
    # 2*(len/2 - floor(len/2)) is 1 for odd len and 0 for even len, i.e. len % 2.
    less_cons = count_less<half_len+2*(len/2 - torch.floor(len/2))
    more_cons = count_less+count_equal>half_len

    # For count_equal == 0
    # Both neighbours must be present in X (within the 1% band) ...
    lower_exist = torch.sum((torch.abs(X-lower)<=torch.abs(0.01*lower)).double())>0
    # ... with exactly half of the elements above `lower` ...
    lower_cons = torch.sum((X>1.01*lower).double())==half_len
    upper_exist = torch.sum((torch.abs(X-upper)<=torch.abs(0.01*upper)).double())>0
    # ... and exactly half of the elements below `upper`.
    upper_cons = torch.sum((X<0.99*upper).double())==half_len
    bound = count_less==half_len
    # 0.02 since 2*0.01
    # The claimed median must be the average of lower and upper, within tolerance.
    bound_avg = (torch.abs(lower+upper-2*median)<=torch.abs(0.02*median))

    median_in_cons = torch.logical_and(less_cons, more_cons)
    median_out_cons = torch.logical_and(torch.logical_and(bound, bound_avg), torch.logical_and(torch.logical_and(lower_cons, upper_cons), torch.logical_and(lower_exist, upper_exist)))
        
    # Pick the rule set depending on whether the median value itself occurs in X.
    return(torch.where(count_equal==0, median_out_cons, median_in_cons), median)


In [43]:
def mean(X, mean):
    """Check that `mean` matches the average of X within a 1% tolerance.

    With n = X.size()[1], the claim is accepted when
    |sum(X) - n * mean| <= |0.01 * n * mean|.

    Args:
        X: data tensor; the element count is read from X.size()[1].
        mean: claimed mean value.

    Returns:
        Tuple (boolean tensor saying whether the claim holds, mean).
    """
    n = X.size()[1]
    # Compare scaled sums rather than dividing, so no division is needed.
    deviation = torch.abs(torch.sum(X) - n * (mean))
    tolerance = torch.abs(0.01 * n * mean)
    return (deviation <= tolerance, mean)

In [44]:
print("dummy output: ", dummy_theory_output_mean)


# Verifier/ data consumer side: send desired calculation
class verifier_model(nn.Module):
    """Computation mean(median(X1), median(X2)), parameterised with dummy results.

    The claimed medians, their neighbouring elements and the claimed mean are
    stored as non-trainable parameters taken from the dummy datasets.
    """

    def __init__(self):
        super().__init__()
        # Register every claimed value as a frozen parameter, in a fixed order.
        claimed_values = {
            "median1": dummy_theory_output_median1,
            "lower1": dummy_lower_to_median1,
            "upper1": dummy_upper_to_median1,
            "median2": dummy_theory_output_median2,
            "lower2": dummy_lower_to_median2,
            "upper2": dummy_upper_to_median2,
            "mean": dummy_theory_output_mean,
        }
        for attr_name, value in claimed_values.items():
            setattr(self, attr_name, nn.Parameter(data = value, requires_grad = False))

    def forward(self,X1, X2):
        """Return (all three checks hold, claimed mean) for datasets X1 and X2."""
        median1_ok, claimed_median1 = median(X1, self.median1, self.lower1, self.upper1)
        median2_ok, claimed_median2 = median(X2, self.median2, self.lower2, self.upper2)
        # NOTE(review): the cell output echoes this construction, which looks like
        # a tracer warning; presumably torch.tensor(...) built from tensors is
        # recorded as a constant when traced. If so, torch.stack may be preferable,
        # but any change must be mirrored in the prover's model — confirm.
        medians = torch.tensor([claimed_median1, claimed_median2]).reshape(1,-1,1)
        mean_ok, output_mean = mean(medians, self.mean)
        all_ok = torch.logical_and(torch.logical_and(median1_ok, median2_ok), mean_ok)
        return (all_ok, output_mean)


# Hand the model class, its output path and the dummy data files to the helper.
verifier_define_calculation(
    verifier_model,
    verifier_model_path,
    [dummy_data_path1, dummy_data_path2],
)

dummy output:  tensor(5.6000, dtype=torch.float64)


  bool3, output_mean = mean(torch.tensor([median1, median2]).reshape(1,-1,1), self.mean)
  bool3, output_mean = mean(torch.tensor([median1, median2]).reshape(1,-1,1), self.mean)


In [45]:
# prover calculates settings, send to verifier

# Dataset 1: median plus the sorted elements at indices len//2 - 1 and len//2,
# which median() uses as the lower/upper neighbours.
sorted_data1 = np.sort(data1)
mid_index1 = len(data1) // 2
theory_output_median1 = torch.tensor(np.median(data1))
lower_to_median1 = torch.tensor(sorted_data1[mid_index1 - 1])
upper_to_median1 = torch.tensor(sorted_data1[mid_index1])

# Dataset 2: same quantities.
sorted_data2 = np.sort(data2)
mid_index2 = len(data2) // 2
theory_output_median2 = torch.tensor(np.median(data2))
lower_to_median2 = torch.tensor(sorted_data2[mid_index2 - 1])
upper_to_median2 = torch.tensor(sorted_data2[mid_index2])

print('median1: ', theory_output_median1)
print('median2: ', theory_output_median2)
# Final claimed result: the mean of the two medians.
both_medians = torch.tensor([theory_output_median1, theory_output_median2])
theory_output_mean = torch.mean(both_medians)
print("theory mean output: ", theory_output_mean)

class prover_model(nn.Module):
    """Computation mean(median(X1), median(X2)), parameterised with the real results.

    The claimed medians, their neighbouring elements and the claimed mean are
    stored as non-trainable parameters computed from the prover's datasets.
    """

    def __init__(self):
        super().__init__()
        # Register every claimed value as a frozen parameter, in a fixed order.
        claimed_values = {
            "median1": theory_output_median1,
            "lower1": lower_to_median1,
            "upper1": upper_to_median1,
            "median2": theory_output_median2,
            "lower2": lower_to_median2,
            "upper2": upper_to_median2,
            "mean": theory_output_mean,
        }
        for attr_name, value in claimed_values.items():
            setattr(self, attr_name, nn.Parameter(data = value, requires_grad = False))

    def forward(self,X1, X2):
        """Return (all three checks hold, claimed mean) for datasets X1 and X2."""
        median1_ok, claimed_median1 = median(X1, self.median1, self.lower1, self.upper1)
        median2_ok, claimed_median2 = median(X2, self.median2, self.lower2, self.upper2)
        # NOTE(review): the cell output echoes this construction, which looks like
        # a tracer warning; presumably torch.tensor(...) built from tensors is
        # recorded as a constant when traced. If so, torch.stack may be preferable,
        # but any change must be mirrored in the verifier's model — confirm.
        medians = torch.tensor([claimed_median1, claimed_median2]).reshape(1,-1,1)
        mean_ok, output_mean = mean(medians, self.mean)
        all_ok = torch.logical_and(torch.logical_and(median1_ok, median2_ok), mean_ok)
        return (all_ok, output_mean)


# Pass the real data files, the private combined-data path, the model class and
# the output locations to the settings helper.
prover_gen_settings(
    [data_path1, data_path2],
    comb_data_path,
    prover_model,
    prover_model_path,
    "default",
    "resources",
    settings_path,
)

median1:  tensor(49.5500, dtype=torch.float64)
median2:  tensor(49.1500, dtype=torch.float64)
theory mean output:  tensor(49.3500, dtype=torch.float64)


  bool3, output_mean = mean(torch.tensor([median1, median2]).reshape(1,-1,1), self.mean)
  bool3, output_mean = mean(torch.tensor([median1, median2]).reshape(1,-1,1), self.mean)


==== Generate & Calibrate Setting ====
scale:  default
setting:  {"run_args":{"tolerance":{"val":0.0,"scale":1.0},"input_scale":8,"param_scale":8,"scale_rebase_multiplier":10,"lookup_range":[-25518,25754],"logrows":16,"num_inner_cols":2,"variables":[["batch_size",1]],"input_visibility":{"Hashed":{"hash_is_public":true,"outlets":[]}},"output_visibility":"Public","param_visibility":"Private"},"num_rows":20992,"total_assignments":16092,"total_const_size":2432,"model_instance_shapes":[[1],[1]],"model_output_scales":[0,8],"model_input_scales":[8,8],"module_sizes":{"kzg":[],"poseidon":[20992,[2]],"elgamal":[0,[0]]},"required_lookups":["Abs",{"GreaterThan":{"a":0.0}},"KroneckerDelta"],"check_mode":"UNSAFE","version":"7.0.0","num_blinding_factors":null}


In [46]:
# All inputs to setup are public, so verifier and prover could both run it
# concurrently to obtain pk. It is written as a verifier call to emphasize that
# the verifier must compute its own vk to be sure of it.
verifier_setup(
    verifier_model_path,
    verifier_compiled_model_path,
    settings_path,
    vk_path,
    pk_path,
)

print("=======================================")
# Prover generates proof
print("Theory output: ", theory_output_mean)
prover_gen_proof(
    prover_model_path,
    comb_data_path,
    witness_path,
    prover_compiled_model_path,
    settings_path,
    proof_path,
    pk_path,
)

spawning module 0
spawning module 2


==== setting up ezkl ====


spawning module 0
spawning module 2


Time setup: 8.246044874191284 seconds
Theory output:  tensor(49.3500, dtype=torch.float64)
!@# compiled_model exists? True
!@# compiled_model exists? True
==== Generating Witness ====
witness boolean:  1.0
witness result 1 : 49.3515625
==== Generating Proof ====


spawning module 0
spawning module 2


proof:  {'instances': [[[3042937791208075219, 8157070662846698822, 3804781648660056856, 172406108020799675], [15295097400487804665, 12861486368330479023, 3350118022201779210, 343142782800691716], [12436184717236109307, 3962172157175319849, 7381016538464732718, 1011752739694698287], [10870267098303494893, 1752989342377741058, 8860763459400202009, 2635465469930673149]]], 'proof': '01e7dcbfee754c7a8aa11015a39fea458716285859a64bbe82744e9c384cedf2055ee78aba0581b2c9ea49dad8b251a891bba08f86dca25041dad49b0f1125b9006dac74377b41af9bf9bd320a8f3706d1f1cc8e8e770ec9f9df16c512f3bab727714cd3233b4aa0f8f20c703de91d8d8701965731dd87b19ca54323a0446b260ec0ad82c849e47a2f6676b4937cf5701852069209218cef637d4ec26f4d20051a831485652c170280aa120f8c16ef4bf3dedfdf28a87562a70d6c2a3beb619613f993a49e827248670a1c74bb9511c156eeb390c0d0b2fdafa126743bcc5e1c10f30a905c18c5dfbb76f6ed230246e41a4cd59eda1c9ef94177b4ac4a29ddc61bcbaa8b9dc8c4fece9647fb4db53d194a4481ff026aa8ed6d1d0473a3a508521b2bd4455d82d65897732ed9acf6e784200685fa31

In [48]:
# Verifier verifies
# The helper receives only the proof file, the shared settings and the vk
# written during setup.
verifier_verify(proof_path, settings_path, vk_path)

num_inputs:  2
prf instances:  [[[3042937791208075219, 8157070662846698822, 3804781648660056856, 172406108020799675], [15295097400487804665, 12861486368330479023, 3350118022201779210, 343142782800691716], [12436184717236109307, 3962172157175319849, 7381016538464732718, 1011752739694698287], [10870267098303494893, 1752989342377741058, 8860763459400202009, 2635465469930673149]]]
proof boolean:  1.0
proof result 1 : 49.3515625
verified
