# Su Doku

<blockquote>
<p>Su Doku (Japanese meaning <i>number place</i>) is the name given to a popular puzzle concept. Its origin is unclear, but credit must be attributed to Leonhard Euler who invented a similar, and much more difficult, puzzle idea called Latin Squares. The objective of Su Doku puzzles, however, is to replace the blanks (or zeros) in a 9 by 9 grid in such a way that each row, column, and 3 by 3 box contains each of the digits 1 to 9. Below is an example of a typical starting puzzle grid and its solution grid.</p>
<div style="text-align:center;">
<table border="0" cellpadding="0" cellspacing="0" align="center"><tr><td>
<table cellpadding="5" cellspacing="0" border="1"><tr><td style="font-family:'courier new';font-size:14pt;">0 0 3<br />9 0 0<br />0 0 1</td>
<td style="font-family:'courier new';font-size:14pt;">0 2 0<br />3 0 5<br />8 0 6</td>
<td style="font-family:'courier new';font-size:14pt;">6 0 0<br />0 0 1<br />4 0 0</td>
</tr><tr><td style="font-family:'courier new';font-size:14pt;">0 0 8<br />7 0 0<br />0 0 6</td>
<td style="font-family:'courier new';font-size:14pt;">1 0 2<br />0 0 0<br />7 0 8</td>
<td style="font-family:'courier new';font-size:14pt;">9 0 0<br />0 0 8<br />2 0 0</td>
</tr><tr><td style="font-family:'courier new';font-size:14pt;">0 0 2<br />8 0 0<br />0 0 5</td>
<td style="font-family:'courier new';font-size:14pt;">6 0 9<br />2 0 3<br />0 1 0</td>
<td style="font-family:'courier new';font-size:14pt;">5 0 0<br />0 0 9<br />3 0 0</td>
</tr></table></td>
<td width="50"><br /></td>
<td>
<table cellpadding="5" cellspacing="0" border="1"><tr><td style="font-family:'courier new';font-size:14pt;">4 8 3<br />9 6 7<br />2 5 1</td>
<td style="font-family:'courier new';font-size:14pt;">9 2 1<br />3 4 5<br />8 7 6</td>
<td style="font-family:'courier new';font-size:14pt;">6 5 7<br />8 2 1<br />4 9 3</td>
</tr><tr><td style="font-family:'courier new';font-size:14pt;">5 4 8<br />7 2 9<br />1 3 6</td>
<td style="font-family:'courier new';font-size:14pt;">1 3 2<br />5 6 4<br />7 9 8</td>
<td style="font-family:'courier new';font-size:14pt;">9 7 6<br />1 3 8<br />2 4 5</td>
</tr><tr><td style="font-family:'courier new';font-size:14pt;">3 7 2<br />8 1 4<br />6 9 5</td>
<td style="font-family:'courier new';font-size:14pt;">6 8 9<br />2 5 3<br />4 1 7</td>
<td style="font-family:'courier new';font-size:14pt;">5 1 4<br />7 6 9<br />3 8 2</td>
</tr></table></td>
</tr></table></div>
<p>A well constructed Su Doku puzzle has a unique solution and can be solved by logic, although it may be necessary to employ "guess and test" methods in order to eliminate options (there is much contested opinion over this). The complexity of the search determines the difficulty of the puzzle; the example above is considered <i>easy</i> because it can be solved by straightforward direct deduction.</p>
<p>The 6K text file, <a href="./p096_sudoku.txt">sudoku.txt</a> (right click and 'Save Link/Target As...'), contains fifty different Su Doku puzzles ranging in difficulty, but all with unique solutions (the first puzzle in the file is the example above).</p>
<p>By solving all fifty puzzles find the sum of the 3-digit numbers found in the top left corner of each solution grid; for example, 483 is the 3-digit number found in the top left corner of the solution grid above.</p>
</blockquote>

## Module Code

In [1]:
module Sudoku

# Set to `true` to make the solving strategies print a trace of what they do.
# Left non-`const` so it can still be rebound after the module is loaded
# (e.g. `@eval Sudoku debug = true`).
debug = false

# The nine symbols a cell may hold. Grids store digits as `Char`s, not integers.
# Declared `const` because it is never reassigned; a non-constant global is
# untyped, which penalises every function that reads it.
const A = Set('1':'9')

"""
    readgrid(io)

Read one puzzle from `io`: a header line followed by nine lines of at least nine
characters each.

Characters 6–7 of the header are parsed as the puzzle number. Every character that
is a member of `A` is stored in the grid; any other character leaves the cell
`missing`.

Returns `(id, G)` where `G` is a 9×9 `Array{Union{Missing, Char}}`, or `nothing`
when the header line is empty.
"""
function readgrid(io)
  header = readline(io)
  isempty(header) && return nothing
  id = parse(Int, header[6:7])
  G = Array{Union{Missing, Char}}(missing, 9, 9)
  for i in 1:9
    line = readline(io)
    for j in 1:9
      ch = line[j]
      if ch ∈ A
        G[i, j] = ch
      end
    end
  end
  return (id, G)
end

"""
    progress(G::Array{Union{Missing, Char},2})

Count the cells of `G` that hold a member of `A`.
"""
function progress(G::Array{Union{Missing, Char},2})
  return count(in(A), G)
end

"""
    progress(C::Array{Set{Char},2})

Return 81 minus the total number of candidates left in `C`.

A 9×9 grid with exactly one candidate per cell scores 0; every extra candidate
lowers the score by one, so the value rises as candidates are eliminated.
"""
function progress(C::Array{Set{Char},2})
  remaining = sum(length, C)
  return 81 - remaining
end

"""
    printgrid(G)

Print `G` to standard output as nine rows of space-separated cells, with `|`
between each group of three columns and a dashed rule after rows 3 and 6,
followed by a `progress: N` line and two blank lines.
"""
function printgrid(G)
  for i in 1:9
    # One string per group of three columns, e.g. "4 8 3".
    bands = [join((G[i, j] for j in b:b+2), " ") for b in (1, 4, 7)]
    println(join(bands, " | "))
    i ∈ (3, 6) && println("------+-------+------")
  end
  println("progress: $(progress(G))\n\n")
end

"""
    displaygrid(G)

Render `G` as an HTML table and hand it to `display` with MIME type `text/html`.

Each cell shows its value, or a non-breaking space when the value is `missing`.
Cell borders are 2px on the edges of each 3×3 box and 0.5px elsewhere.
"""
function displaygrid(G)
  # Styling shared by every cell; the four borders are appended per cell.
  shared = string(
    "width: 1.5em !important;",
    "height: 1.5em !important;",
    "text-align: center !important;",
    "vertical-align: middle !important;",
    "font-size: 150%;",
    "font-weight: bold;",
  )
  out = IOBuffer()
  print(out, "<table><tbody>")
  for i in 1:9
    print(out, """<tr style="background: none !important;">""")
    for j in 1:9
      top = i ∈ [1, 4, 7] ? "border-top: 2px solid !important;" : "border-top: 0.5px solid !important;"
      right = j ∈ [3, 6, 9] ? "border-right: 2px solid !important;" : "border-right: 0.5px solid !important;"
      bottom = i ∈ [3, 6, 9] ? "border-bottom: 2px solid !important;" : "border-bottom: 0.5px solid !important;"
      left = j ∈ [1, 4, 7] ? "border-left: 2px solid !important;" : "border-left: 0.5px solid !important;"
      value = G[i, j]
      print(out, """<td style="$shared$top$right$bottom$left">""")
      print(out, ismissing(value) ? "&nbsp;" : string(value))
      print(out, "</td>")
    end
    print(out, "</tr>")
  end
  print(out, "</tbody></table>")
  display("text/html", String(take!(out)))
end

# setfrom(B) = Set(B) ∩ A

# Accessors for grids of known values. Indexing with `:` or a range copies, so
# each of these returns a fresh array rather than a window onto `G`.

"Return a copy of row `i` of `G`."
function row(G::Array{Union{Missing, Char},2}, i)
  return G[i, :]
end

"Return a copy of column `j` of `G`."
function col(G::Array{Union{Missing, Char},2}, j)
  return G[:, j]
end

"Return a copy of 3×3 box number `k`; boxes are numbered left to right, top to bottom."
function box(G::Array{Union{Missing, Char},2}, k)
  r0 = (k - 1) ÷ 3 * 3   # rows above the box
  c0 = (k - 1) % 3 * 3   # columns left of the box
  return G[r0+1:r0+3, c0+1:c0+3]
end

"Return a copy of the 3×3 box that contains cell `(i, j)`."
function box(G::Array{Union{Missing, Char},2}, i, j)
  r0 = (i - 1) ÷ 3 * 3
  c0 = (j - 1) ÷ 3 * 3
  return G[r0+1:r0+3, c0+1:c0+3]
end

# Accessors for candidate grids. These return views, so assigning into the
# result (or mutating a set obtained from it) changes `C` itself.

"Return a view of row `k` of `C`."
function row(C::Array{Set{Char},2}, k)
  return @view C[k, :]
end

"Return a view of column `k` of `C`."
function col(C::Array{Set{Char},2}, k)
  return @view C[:, k]
end

"Return a view of 3×3 box number `k`; boxes are numbered left to right, top to bottom."
function box(C::Array{Set{Char},2}, k)
  r0 = (k - 1) ÷ 3 * 3   # rows above the box
  c0 = (k - 1) % 3 * 3   # columns left of the box
  return @view C[r0+1:r0+3, c0+1:c0+3]
end

"Return a view of the 3×3 box that contains cell `(i, j)`."
function box(C::Array{Set{Char},2}, i, j)
  r0 = (i - 1) ÷ 3 * 3
  c0 = (j - 1) ÷ 3 * 3
  return @view C[r0+1:r0+3, c0+1:c0+3]
end

"""
    boxid(i, j)

Return the number (1–9, counted left to right, top to bottom) of the 3×3 box
containing cell `(i, j)`.
"""
function boxid(i, j)
  band = div(i - 1, 3)    # 0, 1 or 2: which horizontal band of boxes
  stack = div(j - 1, 3)   # 0, 1 or 2: which vertical stack of boxes
  return band * 3 + stack + 1
end

"""
    candidates(G, i, j)

Return the set of symbols cell `(i, j)` may hold: the cell's own value as a
one-element set when it is filled in, otherwise every member of `A` that does
not already appear in the cell's row, column or box.
"""
function candidates(G, i, j)
  known = G[i, j]
  ismissing(known) || return Set([known])
  return setdiff(A, row(G, i), col(G, j), box(G, i, j))
end

"""
    candidates(G)

Return the 9×9 array of candidate sets for every cell of `G`.
"""
candidates(G) = [candidates(G, r, c) for r in 1:9, c in 1:9]

"""
    isvalid(G::Array{Union{Missing, Char},2})

Return `true` when every row, column and box of `G` contains exactly the
symbols in `A`; a grid with any `missing` cell is therefore not valid.
"""
function isvalid(G::Array{Union{Missing, Char},2})
  for k in 1:9
    for unit in (row(G, k), col(G, k), box(G, k))
      issetequal(A, Set(unit)) || return false
    end
  end
  return true
end

"Return `true` when every cell of `C` has exactly one candidate."
function iscomplete(C::Array{Set{Char},2})
  return !any(c -> length(c) != 1, C)
end

"""
    isvalid(C::Array{Set{Char},2})

Return `true` when, in every row, column and box of `C`, the union of the
candidate sets equals `A` — i.e. no symbol has been eliminated from a whole unit.
"""
function isvalid(C::Array{Set{Char},2})
  for k in 1:9
    for unit in (row(C, k), col(C, k), box(C, k))
      issetequal(A, union(unit...)) || return false
    end
  end
  return true
end

"Return `true` when `C` is both complete and valid."
function issolved(C::Array{Set{Char},2})
  return iscomplete(C) ? isvalid(C) : false
end

"""
    printcandidates(C)

Print the candidate grid to standard output between two 72-dash rules: one line
per row, cells separated by tabs, each cell shown as its candidates in sorted
order with no separator.
"""
function printcandidates(C::Array{Set{Char},2})
  rule = '-'^72
  println(rule)
  for i in axes(C, 1)
    cells = (join(sort!(collect(C[i, j]))) for j in axes(C, 2))
    println(join(cells, "\t"))
  end
  println(rule)
end

"""
    displaygrid(C::Array{Set{Char},2}; caption="")

Render the candidate grid as an HTML table and hand it to `display` with MIME
type `text/html`.

A cell with more than one candidate is drawn as a nested 3×3 table with one slot
per digit `1`–`9`, showing the digit where it is still a candidate and a
non-breaking space where it is not. Any other cell shows its first (normally
only) candidate in large bold type. A non-empty `caption` becomes the table's
`<caption>`.
"""
function displaygrid(C::Array{Set{Char},2}; caption="")
  out = IOBuffer()
  print(out, """<table style="margin-top: 2em; margin-bottom: 2em;">""")
  length(caption) > 0 && print(out, """<caption style="font-size: 200%;">$caption</caption>""")
  print(out, "<tbody>")

  # Styling shared by every outer cell; borders and font are appended per cell.
  sizing = string(
    "width: 68px;",
    "height: 68px;",
    "text-align: center !important;",
    "padding: 0 !important;",
  )

  for i in 1:9
    print(out, """<tr style="background: none !important; padding: 0 !important;">""")
    for j in 1:9
      edges = string(
        i ∈ [1, 4, 7] ? "border-top: 2px solid !important;" : "border-top: 0.5px solid !important;",
        j ∈ [3, 6, 9] ? "border-right: 2px solid !important;" : "border-right: 0.5px solid !important;",
        i ∈ [3, 6, 9] ? "border-bottom: 2px solid !important;" : "border-bottom: 0.5px solid !important;",
        j ∈ [1, 4, 7] ? "border-left: 2px solid !important;" : "border-left: 0.5px solid !important;",
      )
      cell = C[i, j]

      if length(cell) > 1
        print(out, """<td style="$sizing$edges">""")
        print(out, """<table style="margin: 0 !important; font-size: 0.67rem; width: 100%; height: 100%;"><tbody>""")
        # Lay the nine digits out three per row: open a row before digits
        # 1, 4, 7 and close it after digits 3, 6, 9.
        for (n, digit) in enumerate('1':'9')
          n % 3 == 1 && print(out, """<tr style="background: none !important; padding: 0 !important;">""")
          print(out, """<td style="width: 33.3%; height: 33.3%; text-align: center;">""")
          print(out, digit ∈ cell ? "$digit" : "&nbsp;")
          print(out, "</td>")
          n % 3 == 0 && print(out, "</tr>")
        end
        print(out, "</tbody></table>")
        print(out, "</td>")
      else
        style = string(sizing, edges, "font-size: 250%;", "font-weight: bold;")
        print(out, """<td style="$style">""")
        print(out, string(collect(cell)[1]))
        print(out, "</td>")
      end
    end
    print(out, "</tr>")
  end
  print(out, "</tbody></table>")
  display("text/html", String(take!(out)))
end

"""
    nakedsingles!(C)

For every cell of `C` that has at most one candidate, remove that candidate from
every other cell in the same row, column and box (cells whose candidate set
equals it are left alone).

Mutates `C` in place and returns `true` when `progress(C)` increased. Asserts
that `C` is still valid afterwards. Prints a trace when `debug` is true.
"""
function nakedsingles!(C)
  debug && println("\nIn nakedsingles!()")
  before = progress(C)
  for i in 1:9, j in 1:9
    fixed = C[i, j]
    if length(fixed) <= 1
      for unit in (row(C, i), col(C, j), box(C, i, j))
        for peer in unit
          # The unit includes the cell itself; the equality test skips it.
          issetequal(peer, fixed) || setdiff!(peer, fixed)
        end
      end
      debug && println()
    end
  end
  @assert isvalid(C) "puzzle in invalid state"
  after = progress(C)
  improved = before < after
  debug && improved && println("naked singles: $before ↦ $after")
  return improved
end

"""
    hiddensingles!(C)

In every row, column and box of `C`, find each symbol that is a candidate in
exactly one cell and reduce that cell to the symbol alone.

Mutates `C` in place and returns `true` when `progress(C)` increased. Asserts
that `C` is valid on entry and on exit. Prints a trace when `debug` is true.
"""
function hiddensingles!(C)
  debug && println("\nIn hiddensingles!()")
  @assert isvalid(C) "puzzle in invalid state"
  before = progress(C)
  for k in 1:9
    for unit in (row(C, k), col(C, k), box(C, k))
      # symbol => number of cells in this unit that still list it
      tally = Dict([d => 0 for d in A])
      for cell in unit
        for d in cell
          tally[d] += 1
        end
      end
      lonely = Set(keys(filter(p -> p.second == 1, tally)))
      for d in lonely, ij in eachindex(unit)
        if d ∈ unit[ij]
          unit[ij] = Set([d])
        end
      end
    end
  end
  @assert isvalid(C) "puzzle in invalid state"
  after = progress(C)
  improved = before < after
  debug && improved && println("hidden singles: $before ↦ $after")
  return improved
end

"""
    nakedpairs!(C)

In every row, column and box of `C`, find two-candidate sets that occur in
exactly two cells and remove those two candidates from every other cell of the
unit. After each unit, `nakedsingles!` is run if any progress has been made
since the start of the call.

Mutates `C` in place and returns `true` when `progress(C)` increased. Asserts
that `C` is valid on entry and on exit. Prints a trace when `debug` is true.
"""
function nakedpairs!(C)
  debug && println("\nIn nakedpairs!()")
  @assert isvalid(C) "puzzle in invalid state"
  before = progress(C)
  for k in 1:9, X in [row(C, k), col(C, k), box(C, k)]
    # two-candidate set => how many cells of this unit hold exactly that set
    tally = Dict()
    for cell in X
      length(cell) == 2 || continue
      tally[cell] = get(tally, cell, 0) + 1
    end
    for (pair, n) in tally
      n == 2 || continue
      debug && println("naked pair: $pair")
      for cell in X
        issetequal(cell, pair) || setdiff!(cell, pair)
      end
    end
    before < progress(C) && nakedsingles!(C)
  end
  @assert isvalid(C) "puzzle in invalid state"
  after = progress(C)
  improved = before < after
  debug && improved && println("naked pairs: $before ↦ $after")
  return improved
end

# Hidden pairs: in every row, column and box, look for two digits that each
# occur in exactly two cells of the unit — the same two cells — and reduce those
# cells to just that pair.
# Mutates `C` in place; returns `true` when `progress(C)` increased.
# Asserts that `C` is valid on entry and on exit; prints a detailed trace when
# `debug` is true.
function hiddenpairs!(C)
  debug && println("\nIn hiddenpairs!()")
  @assert isvalid(C) "puzzle in invalid state"
  debug && printcandidates(C)
  before = progress(C)
  for k in 1:9, X in [row(C, k), col(C, k), box(C, k)]
    debug && println((k=k, X=X))
    # D1: digit => number of cells in this unit that still list it as a candidate.
    D1 = Dict([e => 0 for e ∈ A])
    for s in X, e in s
      D1[e] += 1
    end
    debug && println("D1: $D1")
    # D2: for each digit that occurs exactly twice, the set of indices (into X)
    # of the cells containing it. The `k` in the comprehension and in the loop
    # below is a new loop-local variable (a digit), not the unit number `k` of
    # the enclosing loop.
    D2 = Dict([k => Set() for k in keys(filter(p -> isequal(p.second, 2), D1))])
    for k in keys(D2), ij in eachindex(X)
      k ∈ X[ij] && push!(D2[k], ij)
    end
    debug && println("D2: $D2")
    # Pair up digits whose two locations coincide; `k1 < k2` keeps each
    # unordered pair of digits once.
    for (pair, locations) in [Set([k1, k2]) => s1 for (k1, s1) in D2, (k2, s2) in D2 if k1 < k2 && issetequal(s1, s2)]
      debug && println("hidden pair: $pair {$(summary(pair))} => $locations")
      for ij in locations
        debug && println("replacing $(X[ij]) with $pair")
        # Each cell must get its own copy: without copy() both cells would hold
        # the very same Set object, and a later in-place elimination on one
        # would silently change the other.
        X[ij] = copy(pair)
        debug && printcandidates(C)
      end
    end
  end
  @assert isvalid(C) "puzzle in invalid state"
  after = progress(C)
  debug && before < after && println("hidden pairs: $before ↦ $after")
  before < after
end

"""
    lcpointing!(C)

Locked candidates, pointing: for each box and each symbol still open in it, if
every cell of the box that lists the symbol lies in a single row (or column) of
the box, remove the symbol from the cells of that grid row (or column) outside
the box. Cells consisting of just that symbol are left alone.

Mutates `C` in place and returns `true` when `progress(C)` increased. Asserts
that `C` is valid afterwards.
"""
function lcpointing!(C)
  before = progress(C)
  for k in 1:9
    X = box(C, k)
    unsolved = [x for x in X if length(x) > 1]
    isempty(unsolved) && continue
    rowoffset = (k - 1) ÷ 3 * 3   # grid rows above this box
    coloffset = (k - 1) % 3 * 3   # grid columns left of this box
    for d in union(unsolved...)
      # Positions inside the box (1:3 × 1:3) where `d` is still a candidate.
      hits = [(r, c) for r in 1:3, c in 1:3 if d ∈ X[r, c]]
      rowsused = unique(first.(hits))
      colsused = unique(last.(hits))
      if length(rowsused) == 1
        i = rowsused[1] + rowoffset
        for j in 1:9
          if boxid(i, j) != k && !issetequal(C[i, j], Set([d]))
            setdiff!(C[i, j], Set([d]))
          end
        end
      end
      if length(colsused) == 1
        j = colsused[1] + coloffset
        for i in 1:9
          if boxid(i, j) != k && !issetequal(C[i, j], Set([d]))
            setdiff!(C[i, j], Set([d]))
          end
        end
      end
    end
  end
  @assert isvalid(C) "puzzle in invalid state"
  after = progress(C)
  improved = before < after
  debug && improved && println("locked candidates (pointing): $before ↦ $after")
  return improved
end

"""
    lcclaiming!(C)

Locked candidates, claiming: for each row (then each column) and each symbol
still open in it, if every cell of the line that lists the symbol lies in a
single box, remove the symbol from the multi-candidate cells of that box that
are not on the line.

Mutates `C` in place and returns `true` when `progress(C)` increased. Validity
of `C` is asserted after every single removal and once more at the end. Prints
a trace when `debug` is true.
"""
function lcclaiming!(C)
  before = progress(C)
  for k in 1:9
    # --- row k ---
    line = row(C, k)
    pending = [x for x in line if length(x) > 1]
    if !isempty(pending)
      for d in union(pending...)
        homes = unique(boxid(k, j) for j in 1:9 if d ∈ line[j])
        length(homes) == 1 || continue
        b = homes[1]
        debug && println("\nlocked candidate (claiming) $d in row $k, box $b")
        r0 = (b - 1) ÷ 3 * 3
        c0 = (b - 1) % 3 * 3
        for r in r0+1:r0+3, c in c0+1:c0+3
          # Leave solved cells and the claiming row itself untouched.
          (length(C[r, c]) == 1 || r == k) && continue
          setdiff!(C[r, c], Set([d]))
          @assert isvalid(C) "puzzle in invalid state(row)"
        end
      end
    end

    # --- column k ---
    line = col(C, k)
    pending = [x for x in line if length(x) > 1]
    if !isempty(pending)
      for d in union(pending...)
        homes = unique(boxid(i, k) for i in 1:9 if d ∈ line[i])
        length(homes) == 1 || continue
        b = homes[1]
        debug && println("locked candidate (claiming) $d in col $k, box $b")
        r0 = (b - 1) ÷ 3 * 3
        c0 = (b - 1) % 3 * 3
        for r in r0+1:r0+3, c in c0+1:c0+3
          # Leave solved cells and the claiming column itself untouched.
          (length(C[r, c]) == 1 || c == k) && continue
          setdiff!(C[r, c], Set([d]))
          @assert isvalid(C) "puzzle in invalid state (column)"
        end
      end
    end
  end
  @assert isvalid(C) "puzzle in invalid state"
  after = progress(C)
  improved = before < after
  debug && improved && println("locked candidates (claiming): $before ↦ $after")
  return improved
end

"""
    solvepuzzle(G)

Try to solve grid `G` by repeatedly applying the elimination strategies
(`nakedsingles!`, `hiddensingles!`, `hiddenpairs!`, `lcpointing!`,
`lcclaiming!`) until the puzzle is solved or a full pass makes no progress.

Returns a 3-tuple `(solved, grid, rest)`:
- `solved`: whether the puzzle was solved;
- `grid`: a 9×9 array holding each cell's symbol where exactly one candidate is
  left and `missing` elsewhere;
- `rest`: `nothing` when solved, otherwise the remaining candidate grid.
"""
function solvepuzzle(G)
  C = candidates(G)
  while !issolved(C)
    # Every strategy runs on every pass; the array literal evaluates them in
    # order. `nakedpairs!` is deliberately not part of the rotation.
    moved = [
      nakedsingles!(C),
      hiddensingles!(C),
      hiddenpairs!(C),
      lcpointing!(C),
      lcclaiming!(C),
    ]
    any(moved) || break
  end
  solved = issolved(C)
  grid = map(x -> length(x) == 1 ? first(x) : missing, C)
  return (solved, grid, solved ? nothing : C)
end

end

Main.Sudoku

## Using the Module

In [2]:
# Read the fifty puzzles, remember each grid by its number, and report the ones
# the strategy-based solver cannot finish.
puzzles = Vector{Any}(nothing, 50)
# The do-block form closes the file even if a puzzle fails to parse or solve.
open("p096_sudoku.txt") do puzzlefile
    for p in 1:50
        entry = Sudoku.readgrid(puzzlefile)
        # readgrid returns `nothing` on an empty header line (e.g. end of file).
        entry === nothing && break
        n, g = entry
        puzzles[n] = copy(g)
        a, b = Sudoku.solvepuzzle(g)
        a || println("\n$n not solved")
    end
end


7 not solved


In [3]:
# Puzzle 7 is the one reported as "not solved" above; run the solver on it again
# to see where it gets stuck.
G = puzzles[7]
# a: solved flag, b: grid of settled cells, c: remaining candidate grid
# (solvepuzzle returns `nothing` for c when the puzzle is solved).
a, b, c = Sudoku.solvepuzzle(G)
Sudoku.displaygrid(c, caption="Grid 7")

0,1,2,3,4,5,6,7,8
1 7,4,3,9,8,67,2,5,1 67
1,,,,,,,,
,,,,,,,,
7,,,,,,,,
,,,,,,,,
,,6,,,,,,
7,,,,,,,,
1,,,,,,,,
,,6,,,,,,
7,,,,,,,,

0,1,2
1.0,,
,,
7.0,,

0,1,2
,,
,,6.0
7.0,,

0,1,2
1.0,,
,,6.0
7.0,,

0,1,2
,,
,,
7.0,8.0,9.0

0,1,2
1.0,,
,,
7.0,8.0,9.0

0,1,2
1.0,,3.0
,,
,8.0,

0,1,2
,,3.0
,,
,8.0,

0,1,2
1.0,,
,,
7.0,8.0,

0,1,2
,,
,5.0,
7.0,8.0,

0,1,2
,,
,5.0,
7.0,8.0,

0,1,2
,,3.0
,,
7.0,,

0,1,2
,,3.0
,,6.0
,,

0,1,2
,,
,,6.0
,8.0,

0,1,2
,,
,5.0,6.0
,8.0,

0,1,2
,2,
,5,6.0
,8,

0,1,2
1.0,,3.0
,,
,,

0,1,2
1.0,,3.0
,5.0,
,,

0,1,2
1.0,,
,5.0,6.0
,8.0,

0,1,2
1.0,2.0,
,,6.0
,8.0,

0,1,2
,,
,5.0,
7.0,,

0,1,2
,2.0,
,5.0,
7.0,,

0,1,2
1.0,,
,5.0,
7.0,,

0,1,2
1.0,,
4.0,5.0,
,,9.0

0,1,2
,2.0,
4.0,,
,,

0,1,2
1.0,2.0,
,,
,,9.0

0,1,2
,,
,5.0,6.0
7.0,8.0,

0,1,2
,,
,5.0,
7.0,,

0,1,2
,,
,5.0,6.0
,8.0,

0,1,2
,,
,,6.0
,8.0,

0,1,2
1.0,,
,,6.0
7.0,,9.0

0,1,2
1.0,,
4.0,,6.0
,,

0,1,2
,,3.0
,,6.0
7.0,,

0,1,2
,,3
4.0,,6
,,9

0,1,2
,,3.0
4.0,,6.0
,,

0,1,2
,,
,,6.0
,,9.0

0,1,2
1.0,,
,,
7.0,,

0,1,2
,,
,,6.0
7.0,,9.0

0,1,2
1.0,,
,,6.0
7.0,,9.0

0,1,2
1.0,,
,,
7.0,,

0,1,2
1.0,,
4.0,,6.0
,,

0,1,2
,2.0,3.0
,,6.0
7.0,,

0,1,2
,,3
4.0,,6
,8.0,9

0,1,2
,2.0,3.0
4.0,,6.0
,8.0,

0,1,2
,2.0,
,,6.0
,,

0,1,2
,2.0,
,,6.0
,,


It is fun to try to write a program that solves these puzzles the way humans do, but I suspect the easiest approach is simple backtracking.