In [12]:
# Binary Search
# Runtime: 72 ms, faster than 21.71%
# https://www.cnblogs.com/grandyang/p/5533305.html
from typing import List

class Solution:
    def intersect(self, nums1: List[int], nums2: List[int]) -> List[int]:
        """Return the multiset intersection of ``nums1`` and ``nums2``.

        Each value appears in the result as many times as it occurs in both
        inputs. The result follows the order of the shorter input (``nums1``
        when both have the same length).

        The longer input is copied and sorted, then every element of the
        shorter input is looked up in that copy with a binary search. Neither
        input list is modified.

        Args:
            nums1: First list of integers.
            nums2: Second list of integers.

        Returns:
            A new list holding the common elements, duplicates included.
        """
        def binarySearch(A: List[int], target: int) -> int:
            """Return an index of ``target`` in sorted ``A``, or -1 if absent."""
            lo, hi = 0, len(A)  # search the half-open range [lo, hi)
            while lo < hi:
                mid = (lo + hi) // 2
                if A[mid] == target:  # found
                    return mid
                elif A[mid] > target:
                    hi = mid
                else:
                    lo = mid + 1
            return -1

        # A is the longer input (nums2 on ties), B the shorter one.
        A, B = (nums1, nums2) if len(nums1) > len(nums2) else (nums2, nums1)
        # Work on a sorted copy so the caller's list is neither reordered
        # nor shrunk by the deletions below.
        A = sorted(A)
        # Traverse B and binary-search each element in A; collect the hits.
        res = []
        for b in B:
            idx = binarySearch(A, b)
            if idx != -1:
                res.append(b)
                # Remove the matched element so it cannot be matched twice,
                # e.g. nums1 = [3,1,2], nums2 = [1,1] must yield [1].
                del A[idx]
        return res

Follow up:
* What if the given array is already sorted? How would you optimize your algorithm?
* What if nums1's size is small compared to nums2's size? Which algorithm is better?
* What if elements of nums2 are stored on disk, and the memory is limited such that you cannot load all elements into the memory at once?
  1. If only nums2 cannot fit in memory, put all elements of nums1 into a HashMap, read chunks of array that fit into the memory, and record the intersections. (aka. map-side join)
  1. Store the two arrays in a distributed system (whether self-designed or not), then use the *MapReduce* technique to solve the problem;
  1. Process the arrays by *chunk*, where each chunk fits in memory, and deal with one chunk of data at a time;
  1. Process the arrays by *streaming*, checking elements as they arrive.
  1. The two arrays need to be sorted first (e.g. using external sort or sort-merge join) before processing by chunk or by streaming.

In [9]:
Solution().intersect(nums1 = [4,9,5], nums2 = [9,4,9,8,4])

[4, 9]

In [10]:
Solution().intersect(nums1 = [1,2,2,1], nums2 = [2,2])

[2, 2]

In [11]:
Solution().intersect(nums1 = [3,1,2], nums2 = [1,1])

[1]