In [1]:
import json
from pprint import pprint
import sys
from pathlib import Path

sys.path.append(str(Path('..').resolve()))
import utils

# Load the per-program records. The file is parsed as JSON despite its
# ".dict" extension. Decode explicitly as UTF-8 instead of relying on the
# platform's default encoding: the stored responses contain non-ASCII
# characters (e.g. "≤", "Θ"), which a non-UTF-8 default would fail on or
# silently mis-decode.
with open("java_programs.dict", "r", encoding="utf-8") as f:
    java_programs = json.load(f)

# Input sizes under study. NOTE: these are ints, whereas the per-size records
# are looked up with string keys ("2", "4", ...) in the cells of this notebook.
SIZES = {2, 4, 8, 16, 30}

# Name of the program whose records this notebook inspects.
PROGRAM_NAME = "QuickSort"

In [2]:
# Show the stored record for input size 2 (string key "2"): its reference
# 'assertions', its 'constants' declarations and the raw 'response' text.
pprint(java_programs[PROGRAM_NAME]["2"])

{'assertions': '(assert  ( <=  in0 in1))',
 'constants': '(declare-const in0 Int)\n(declare-const in1 Int)',
 'response': 'Worst-case time complexity: O(n^2)\n'
             '\n'
             'Reason: The algorithm always selects the last element as pivot '
             '(Lomuto partition). If the input is already sorted '
             '(nondecreasing) or reverse-sorted (nonincreasing), the pivot '
             'ends up as an extreme (max or min) and each partition reduces '
             'the problem by only one element, yielding one-sided recursion '
             'and Θ(n^2) comparisons/swaps overall.\n'
             '\n'
             'For input size n = 2, one sufficient constraint to realize the '
             'worst-case pattern (already sorted, so pivot is always the '
             'maximum) is in0 ≤ in1.\n'
             '\n'
             'Answer:\n'
             '(set-logic QF_LIA)\n'
             '(declare-fun in0 () Int)\n'
             '(declare-fun in1 () Int)\n'
            

In [3]:
# Compare the reference constraint for size 2 with the constraint contained in
# the stored response. The generated assertions are taken to be the text that
# follows the declaration of in1 and precedes the "(check-sat)" command.
# Assumes in1 is the last constant declared in the response - TODO confirm.
case = java_programs[PROGRAM_NAME]["2"]
last_decl = "(declare-fun in1 () Int)\n"
_, found, smt_tail = case["response"].partition(last_decl)
if not found:
    # A missing declaration used to surface as a bare IndexError; report
    # which marker was expected so a malformed response is easy to diagnose.
    raise ValueError(f"response for size 2 does not contain {last_decl!r}")

utils.check_logical_equivalence(
    original_assertions=case["assertions"],
    # Cut at "(check-sat)" whether or not a newline follows it, so the command
    # can never leak into the assertions handed to the checker.
    generated_assertions=smt_tail.partition("(check-sat)")[0],
    constants=case["constants"],
)

{'result': True}

In [4]:
# Show the stored record for input size 4 (string key "4"): its reference
# 'assertions', its 'constants' declarations and the raw 'response' text.
pprint(java_programs[PROGRAM_NAME]["4"])

{'assertions': '(assert (and (and (and (and (and  ( <=  in0 in3)  ( <=  in1 '
               'in3))  ( <=  in2 in3))  ( <=  in0 in2))  ( <=  in1 in2))  ( '
               '<=  in0 in1)))',
 'constants': '(declare-const in0 Int)\n'
              '(declare-const in2 Int)\n'
              '(declare-const in1 Int)\n'
              '(declare-const in3 Int)',
 'response': '- Worst-case time complexity: O(n^2). This happens because the '
             'pivot is always chosen as the last element (Lomuto partition). '
             'If the input array is already sorted (strictly increasing) or '
             'strictly decreasing, each partition produces one subarray of '
             'size n−1 and the other of size 0, leading to quadratic time.\n'
             '\n'
             '- SMT2 constraint for n=4 that forces this worst case (array '
             'strictly increasing or strictly decreasing so the pivot is '
             'always an extreme):\n'
             '\n'
             'Answer:\n'
   

In [5]:
# Compare the reference constraint for size 4 with the constraint contained in
# the stored response. The generated assertions are taken to be the text that
# follows the declaration of in3 and precedes the "(check-sat)" command.
# Assumes in3 is the last constant declared in the response - TODO confirm.
case = java_programs[PROGRAM_NAME]["4"]
last_decl = "(declare-fun in3 () Int)\n"
_, found, smt_tail = case["response"].partition(last_decl)
if not found:
    # A missing declaration used to surface as a bare IndexError; report
    # which marker was expected so a malformed response is easy to diagnose.
    raise ValueError(f"response for size 4 does not contain {last_decl!r}")

utils.check_logical_equivalence(
    original_assertions=case["assertions"],
    # Cut at "(check-sat)" whether or not a newline follows it, so the command
    # can never leak into the assertions handed to the checker.
    generated_assertions=smt_tail.partition("(check-sat)")[0],
    constants=case["constants"],
)

{'result': False, 'reason': 'A does not imply B'}

In [6]:
# Show the stored record for input size 8 (string key "8").
pprint(java_programs[PROGRAM_NAME]["8"])

{'assertions': '(assert (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and  ( <=  in0 in7)  ( <=  in1 in7))  ( <=  '
               'in2 in7))  ( <=  in3 in7))  ( <=  in4 in7))  ( <=  in5 in7))  '
               '( <=  in6 in7))  ( <=  in0 in6))  ( <=  in1 in6))  ( <=  in2 '
               'in6))  ( <=  in3 in6))  ( <=  in4 in6))  ( <=  in5 in6))  ( '
               '<=  in0 in5))  ( <=  in1 in5))  ( <=  in2 in5))  ( <=  in3 '
               'in5))  ( <=  in4 in5))  ( <=  in0 in4))  ( <=  in1 in4))  ( '
               '<=  in2 in4))  ( <=  in3 in4))  ( <=  in0 in3))  ( <=  in1 '
               'in3))  ( <=  in2 in3))  ( <=  in0 in2))  ( <=  in1 in2))  ( '
               '<=  in0 in1)))',
 'constants': '(declare-const in6 Int)\n'
              '(declare-const in5 Int)\n'
              '(declare-const in7 Int)\n'
              '(declare-const in0 Int)\n'
              '

In [7]:
# Compare the reference constraint for size 8 with the constraint contained in
# the stored response. The generated assertions are taken to be the text that
# follows the declaration of in7 and precedes the "(check-sat)" command.
# Assumes in7 is the last constant declared in the response - TODO confirm.
case = java_programs[PROGRAM_NAME]["8"]
last_decl = "(declare-fun in7 () Int)\n"
_, found, smt_tail = case["response"].partition(last_decl)
if not found:
    # A missing declaration used to surface as a bare IndexError; report
    # which marker was expected so a malformed response is easy to diagnose.
    raise ValueError(f"response for size 8 does not contain {last_decl!r}")

utils.check_logical_equivalence(
    original_assertions=case["assertions"],
    # Cut at "(check-sat)" whether or not a newline follows it, so the command
    # can never leak into the assertions handed to the checker.
    generated_assertions=smt_tail.partition("(check-sat)")[0],
    constants=case["constants"],
)

{'result': False, 'reason': 'A does not imply B'}

In [8]:
# Show the stored record for input size 16 (string key "16").
pprint(java_programs[PROGRAM_NAME]["16"])

{'assertions': '(assert (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and  ( '
               '<=  in0 in15)  ( <=  in1 in15))  ( <=  in2 in15))  ( <=  in3 '
               'in15))  ( <=  in4 in15))  ( <=  in5 in15))  ( <=  in6 in15))  '
               '( <=  in7 in15))  ( <=  in8 in15))  ( <

In [9]:
# Compare the reference constraint for size 16 with the constraint contained
# in the stored response. The generated assertions are taken to be the text
# that follows the declaration of in15 and precedes the "(check-sat)" command.
# Assumes in15 is the last constant declared in the response - TODO confirm.
case = java_programs[PROGRAM_NAME]["16"]
last_decl = "(declare-fun in15 () Int)\n"
_, found, smt_tail = case["response"].partition(last_decl)
if not found:
    # A missing declaration used to surface as a bare IndexError; report
    # which marker was expected so a malformed response is easy to diagnose.
    raise ValueError(f"response for size 16 does not contain {last_decl!r}")

utils.check_logical_equivalence(
    original_assertions=case["assertions"],
    # Cut at "(check-sat)" whether or not a newline follows it, so the command
    # can never leak into the assertions handed to the checker.
    generated_assertions=smt_tail.partition("(check-sat)")[0],
    constants=case["constants"],
)

{'result': False, 'reason': 'B does not imply A'}

In [10]:
# Show the stored record for input size 30 (string key "30").
pprint(java_programs[PROGRAM_NAME]["30"])

{'assertions': '(assert (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and (and (and (and '
               '(and (and (and (and (and (and (and (and (and 

In [11]:
# Compare the reference constraint for size 30 with the constraint contained
# in the stored response. The generated assertions are taken to be the text
# that follows the declaration of in29 and precedes the "(check-sat)" command.
# Assumes in29 is the last constant declared in the response - TODO confirm.
case = java_programs[PROGRAM_NAME]["30"]
last_decl = "(declare-fun in29 () Int)\n"
_, found, smt_tail = case["response"].partition(last_decl)
if not found:
    # A missing declaration used to surface as a bare IndexError; report
    # which marker was expected so a malformed response is easy to diagnose.
    raise ValueError(f"response for size 30 does not contain {last_decl!r}")

utils.check_logical_equivalence(
    original_assertions=case["assertions"],
    # Cut at "(check-sat)" whether or not a newline follows it, so the command
    # can never leak into the assertions handed to the checker.
    generated_assertions=smt_tail.partition("(check-sat)")[0],
    constants=case["constants"],
)


{'result': False, 'reason': 'B does not imply A'}