Problem Statement.

Given two sentences words1, words2 (each represented as an array of strings), and a list of similar word pairs pairs, determine if two sentences are similar.

For example, words1 = ["great", "acting", "skills"] and words2 = ["fine", "drama", "talent"] are similar, if the similar word pairs are pairs = [["great", "good"], ["fine", "good"], ["acting","drama"], ["skills","talent"]].

Note that the similarity relation is transitive. For example, if "great" and "good" are similar, and "fine" and "good" are similar, then "great" and "fine" are similar.

Similarity is also symmetric. For example, "great" and "fine" being similar is the same as "fine" and "great" being similar.

Also, a word is always similar with itself. For example, the sentences words1 = ["great"], words2 = ["great"], pairs = [] are similar, even though there are no specified similar word pairs.

Finally, sentences can only be similar if they have the same number of words. So a sentence like words1 = ["great"] can never be similar to words2 = ["doubleplus","good"].

Note:

    The length of words1 and words2 will not exceed 1000.
    The length of pairs will not exceed 2000.
    The length of each pairs[i] will be 2.
    The length of each words[i] and pairs[i][j] will be in the range [1, 20].

# BFS - O(W * P) runtime, O(P) space, where W is length of words1 & words2 and P is the length of pairs

In [3]:
from typing import List
from collections import deque, defaultdict

class Solution:
    """Sentence Similarity II via BFS labelling of connected components."""

    def areSentencesSimilarTwo(self, words1: List[str], words2: List[str], pairs: List[List[str]]) -> bool:
        """Return True if words1 and words2 are similar position by position.

        Two words are similar when they are equal or when they are linked,
        directly or transitively, through the entries of ``pairs``.

        Args:
            words1: First sentence as a list of words.
            words2: Second sentence as a list of words.
            pairs: Two-element lists; each one declares its words similar.

        Returns:
            False when the sentences differ in length or some aligned pair of
            words is not similar; True otherwise.

        Each word in ``pairs`` is labelled once with its component, so every
        aligned pair is answered by dict lookups instead of a scan over all
        components (expected time roughly O(W + P)).
        """
        if len(words1) != len(words2):
            return False

        # Undirected adjacency sets: similarity is symmetric.
        neighbours = defaultdict(set)
        for left, right in pairs:
            neighbours[left].add(right)
            neighbours[right].add(left)

        # Maps each word to a label shared by everything reachable from it.
        # The first word discovered in a component serves as that label.
        component = {}
        for start in neighbours:
            if start in component:
                continue
            component[start] = start
            queue = deque([start])
            while queue:
                word = queue.popleft()
                for nxt in neighbours[word]:
                    if nxt not in component:
                        component[nxt] = start
                        queue.append(nxt)

        for w1, w2 in zip(words1, words2):
            if w1 == w2:
                # A word is always similar to itself, even if absent from pairs.
                continue
            label = component.get(w1)
            # A word that never appears in pairs has no label and can only
            # match itself, which was handled above.
            if label is None or label != component.get(w2):
                return False

        return True

# Slower but simpler (runs a fresh DFS for every word pair) - O(W * P) runtime, O(P) space, where W is length of words1 & words2 and P is the length of pairs

In [5]:
from typing import List

class Solution:
    """Sentence Similarity II via an independent DFS for each word pair."""

    def areSentencesSimilarTwo(self, words1: List[str], words2: List[str], pairs: List[List[str]]) -> bool:
        """Return True if words1 and words2 are similar position by position.

        Args:
            words1: First sentence as a list of words.
            words2: Second sentence as a list of words.
            pairs: Two-element lists; each one declares its words similar.

        Returns:
            False when the sentences differ in length or when some word of
            words1 cannot reach its counterpart in words2 through ``pairs``;
            True otherwise.
        """
        # Imported locally: only typing.List is imported alongside this class,
        # so the bare module name `collections` would otherwise be undefined.
        from collections import defaultdict

        if len(words1) != len(words2):
            return False

        # Undirected adjacency lists: similarity is symmetric.
        graph = defaultdict(list)
        for left, right in pairs:
            graph[left].append(right)
            graph[right].append(left)

        for w1, w2 in zip(words1, words2):
            # Depth-first search from w1, stopping as soon as w2 is popped.
            # Starting with w1 on the stack makes equal words match at once.
            stack, seen = [w1], {w1}
            while stack:
                word = stack.pop()
                if word == w2:
                    break
                for nei in graph[word]:
                    if nei not in seen:
                        seen.add(nei)
                        stack.append(nei)
            else:
                # The loop ended without `break`: w2 is unreachable from w1.
                return False
        return True

In [4]:
# Smoke test using the example from the problem statement; the recorded
# output for this call is True.
instance = Solution()
instance.areSentencesSimilarTwo(
    words1=["great", "acting", "skills"],
    words2=["fine", "drama", "talent"],
    pairs=[
        ["great", "good"],
        ["fine", "good"],
        ["acting", "drama"],
        ["skills", "talent"],
    ],
)

True