diff --git a/asset/sass/chapter.scss b/asset/sass/chapter.scss index 167c84967..f436fb328 100644 --- a/asset/sass/chapter.scss +++ b/asset/sass/chapter.scss @@ -99,9 +99,13 @@ article.chapter { .design-note { background: hsl(80, 30%, 96%); - code, pre { + code, .codehilite { background: hsl(80, 20%, 93%); } + + .codehilite { + margin: -12px 0 -12px -12px; + } } } diff --git a/asset/style.scss b/asset/style.scss index a2f4ae435..b73e807f2 100644 --- a/asset/style.scss +++ b/asset/style.scss @@ -357,7 +357,7 @@ aside { padding: 1px 2px; } - pre { + .codehilite { padding: 6px; margin: -12px 0; } diff --git a/book/scanning.md b/book/scanning.md index 9e8101644..ac5a05191 100644 --- a/book/scanning.md +++ b/book/scanning.md @@ -1,461 +1,437 @@ ^title Scanning ^part A Tree-Walk Interpreter in Java

+**TODO: explain snippet notation in introduction**

-**TODO: context lines aren't correct. showing content from later or earlier snippets.**

+**TODO: consider reorganizing the headers and subheaders**

----

+The first step in any compiler or interpreter is scanning. The scanner takes in the raw source code as a series of characters and groups them into meaningful chunks -- the "words" and "punctuation" that make up the language's artificial grammar.

-- first step of lang is scanning -- also great first chapter because pretty easy -- by end of chapter, be able to take any string of lox code and chunk into - tokens to later feed into parser

+This is a good starting point for us too because the code isn't very hard -- pretty much a switch statement with delusions of grandeur. It will let us get warmed up before we tackle some of the more interesting material later.

+By the end of this chapter, we'll have a full-featured, fast scanner that can handle any string of Lox source code and produce the tokens that we'll feed into the parser in the next chapter.

+## The Interpreter Framework

+Since this is our first real chapter, before we get to actually scanning some code, we need to tie together the basic application framework for our interpreter, jlox.

+Because everything starts with a class in Java, we'll begin like so:

^code lox-class

-- doesn't do much -- still, makes you get your project set up and figure out ide and stuff -- also explains notation here for code snippets -- note file name this should go in

+Stick that in a text file, and go get your IDE and Makefile or whatever set up. I'll be right here when you're ready. Good? OK, let's keep going.

-- lox is scripting lang -- two ways to run code -- if give jlox path to file -- loads and runs it

+Lox is a scripting language, which means it executes directly from source. There are actually two ways you can run some code. If you start jlox from the command line and give it a path to a file, it reads it and executes it:

^code run-file

-- other way is "interactive prompt" -- lets user incrementally build up program one line at time -- if run jlox with no arg, enters this mode

+If you like a closer emotional connection to your interpreter, you can also run it interactively. If you fire up jlox without any arguments, it drops you into a prompt where you can enter and execute code one line at a time.

-- reads line of input, executes it and loops -- (ctrl-c exits) -- called "repl" -- lisp history -- both use:

+^code prompt

+To escape that infinite loop in jlox, hit Control-C or yank the plug out of your machine if you have anger management problems.
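For reference, here's a minimal sketch of what that `prompt` snippet expands to, pieced together from the `runPrompt()` method in the Lox.java portion of this diff (the `hadError` reset gets added later in the chapter):

```java
private static void runPrompt() throws IOException {
  InputStreamReader input = new InputStreamReader(System.in);
  BufferedReader reader = new BufferedReader(input);

  for (;;) {
    // Show a prompt, read one line, and run it. Forever.
    System.out.print("> ");
    run(reader.readLine());
  }
}
```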
+
+Both the prompt and the file runner are thin wrappers around this core function:

^code run

-- eventually, this will plumb through parser and interpreter -- for now, just prints tokens so we can see what scanner produces

+It's not super useful yet since we haven't written the interpreter, but baby steps, you know? Right now, we'll just have it print out the tokens our forthcoming scanner spits out so that we can see if we're making progress. Feel free to run this periodically as you work your way through the chapter to see how it does.

+### Error handling

+While we're setting things up, another key piece of infrastructure is *error handling*. Textbooks sometimes gloss over this because it's more an engineering concern than a formal computer science-y problem. But if you care about making a language that's actually *usable*, then how your interpreter handles errors is a vital concern.

+The tools your language provides for dealing with errors make up a large portion of your language's user interface. When a user's code is working, they aren't thinking about your language at all -- their headspace is all about *their program*. It's only when things go sideways that they focus on your beautiful language and its implementation.

-### error handling

-- another key part of interpreter is how it manages errors -- often left out of textbooks, but vital when comes to real impl -- users need help them most when program isn't doing what they want -- error handling pervasive part of job -- sooner start, the better -- confess: pretty simple here, though

+When that happens, it's up to us to give the user all of the information they need to understand what went wrong and guide them tactfully back to where they are trying to go. Doing that well means thinking about error handling all through the implementation of our interpreter, starting now.

-- put in framework now and use it later

+Having said all that, for *this* interpreter, what we'll build is pretty bare bones. I'd love to talk about interactive debuggers, static analyzers, and other fun stuff, but there's only so much time.

+For now, we'll start with:

^code lox-error

-- tells user error occurred on given line -- telling user that error occurred not very useful -- need to tell them where -- if get error trying to add num to bool, not helpful to say "some + somewhere - in prog is bad, good luck finding it!" -- better would be line, column and length -- best would allow multiple source locations since some errors involved multiple - points in code

+This tells users some syntax error occurred on a given line. This is really the bare minimum to be able to claim you even *have* error reporting. Imagine you accidentally leave a dangling comma in some function call and the interpreter prints out:

+```
+Error: Unexpected "," somewhere in your program. Good luck finding it!
+```

+So we at least need to point them to the right line. Even better would be the beginning and end column so they know where in the line to look. Even better than *that* is to *show* the user the offending line, like:

-- just line to keep book simpler

-- reason defining in lox class is because of hadError

+```text
+Error: Unexpected "," in argument list.
+
+    15 | function(first, second,);
+                               ^-- Here.
+```

+I'd love to implement something like that in this book, but the honest truth is that it's a lot of grungy string munging code. Very useful for users, but not super fun to read in a book and not very technically interesting. So we'll stick with just a line number.
In your interpreters, please do kick it up a notch.

+The primary reason we're sticking this error reporting function in the main Lox class is because of that `hadError` field. It's defined here:

^code had-error (1 before)

-- when error occurs while loading script, want to set exit code -- nice to be good command line citizen -- [yes static is hacky]

+If a syntax error occurs when running a script, we want to exit with a non-zero exit code like a good command line citizen should:

^code exit-code (1 before, 1 after)

-- also generally code to separate error *reporting* code from error *generating* - code -- scanner detects error, but not really its job to know how best to present it - to user -- in prod language, should pass in some kind of ErrorReporter interface to - scanner -- abstract how error displayed -- can print to stderr, show popup on screen, add errors to ide's error log, etc. -- to keep simple, don't have actual abstraction here, but do at least split it - out some - -- shell is in place -- once have scanner class with scanTokens() working, can start using -- before get to that, talk about tokens

+We also need to reset it in the prompt. If the user makes a mistake, they should be able to keep going:

+^code reset-had-error (1 before, 1 after)

+The other reason I pulled the error reporting out here instead of stuffing it into the scanner and other phases where the error occurs is to remind you that it's a good engineering practice to separate the code that *generates* the errors from the code that *reports* them.

+The various phases of the front end will detect errors, but it's not really their job to know how to present that to a user. In a full-featured language implementation, you will likely have multiple ways errors can get displayed: on stderr, in an IDE's error window, logged to a file, etc. You don't want that code jammed in your parser.

+Ideally, we would have an actual abstraction, some kind of "ErrorReporter" interface that gets passed to the scanner and parser so that we can swap out different reporting strategies. For our simple interpreter here, I didn't do that, but I did at least separate out the code for error reporting.

+And with that, our basic shell is in place. Once we have a Scanner class with some `scanTokens()` method, we can start running it. Before we get to that, let's talk about these mysterious "tokens" and the prizes they may or may not be redeemed for.

## Tokens and Lexemes

-- what is token? -- smallest sequence of chars that is meaningful -- in `name = "lox";` "name", "=", `"lox"` and `;` all meaningful -- `na` is not, neither is `ox"`. -- scanner's just is to go through string of chars, find meaningful units -- each is called lexeme -- lexeme just raw sequence of chars - -- in process of recognizing lexemes, also figure out other useful stuff - -### token type - -- if lexeme is a word, like `while` can also recognize that it's keyword `while` -- since keywords affect grammar of language, parser will often need logic like, - "if next token is `while` then ..." -- technically, is redundant with lexeme -- could compare strings -- but very slow and kind of ugly -- so at point when we recognize lexeme, which also store which *type* of token - it represents -- which keyword, punctuation, operator, or literal -- simple enum

+Here's a line of Lox code:

+```lox
+var language = "lox";
+```

+Here, `var` is the keyword for declaring a variable. That three-character sequence *means* something.
If we yank, say, `gua` out of the middle of `language`, those three characters don't mean anything on their own.

+That's what lexical analysis is really about. Our job is to scan through the list of characters and group them together into the smallest possible sequences that still have a well-defined meaning. Each of these is called a **lexeme**.

+In that line of code, the lexemes are:

+```
+var
+language
+=
+"lox"
+;
+```

+**TODO: illustrate**

+The lexemes are just the raw substrings of the source code. However, in the process of recognizing those and drawing boundaries between each one, we also stumble upon some other useful information. Things like:

+### Lexeme type

+If the lexeme is an identifier whose name matches one of the language's reserved words, like `while` or `if`, we can recognize that now. Since keywords are part of the grammatical structure of the language, the parser often has logic like, "If the next token is `while`, then parse a while statement."

+Technically, the parser can determine that right from the lexeme by comparing the strings. But that's slow and kind of ugly. Instead, at the point that we recognize a lexeme, we'll also remember which *kind* of lexeme it represents. We'll have a different type for each keyword, operator, bit of punctuation, and literal value.

+It's a simple enum:

^code token-type

-### literal

+### Literal value

+Some lexemes represent literal values -- numbers and strings and the like.
+Since the scanner has to walk each character in the literal to correctly identify it, it can also convert it to its actual runtime value as used by the interpreter later.

+For example, after the scanner walks over the characters `123` in a number literal, we can convert them to the actual numeric value 123.

+### Location information

+Back when I was on my soapbox about error handling, we saw that we need to tell users *where* errors occurred. We have to keep track of that information through every phase of the interpreter, starting here.

+In our simple interpreter, we just track which line the token appears on, but more sophisticated implementations would track the column and length too.

-- some lexemes for literals -- at point that scanner detects literal, can also produce runtime value -- if lexeme is number `123` can convert to actual number value 123

+We take all of this and wrap it up in a class:

^code token-class

-- java really verbose for dumb data object, but that's it

+And *that's* what a **token** is -- a bundle containing the raw lexeme along with the other things the scanner knows about it.
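For the curious, the `token-class` snippet is little more than a bag of those fields. This sketch mirrors the Token.java changes later in this diff:

```java
class Token {
  final TokenType type;    // Which kind of lexeme this is.
  final String lexeme;     // The raw substring of source code.
  final Object literal;    // The runtime value, for literals.
  final int line;          // Where the token appears, for error reporting.

  Token(TokenType type, String lexeme, Object literal, int line) {
    this.type = type;
    this.lexeme = lexeme;
    this.literal = literal;
    this.line = line;
  }
}
```

Java is pretty verbose for a dumb data object like this, but that's all there is to it.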
## Regular Languages and Expressions

-- now know what we need to produce, let's produce it -- core of scanner is loop -- starting at beginning of source, figure out what lexeme first char is part of -- consume as many chars as belong to that lexeme -- produce token -- repeat with rest of string -- when whole string is done, done scanning - -- process of matching chars might seem familiar -- if ever used regular expression, might consider using regex to do it -- ex: if source is `breakfast = "croissant";`, first lexeme is `breakfast` - identifier -- could use regex like `[a-zA-Z_][a-zA-Z_0-9]*` to match it -- captures underlying rule that identifier start with letter or underscore - followed by zero or more letters, underscores or digits -- you have deep insight here - -- rules that determine what chars are allowed in each kind of lexeme are called - "lexical grammar" -- in lox, as in most languages, rules are simple enough to fit within - restriction called "regular language" -- lot of interesting theory here about what makes language regular, how it - ties to fsms -- most other pl books cover well, not getting into here -- same "regular" in "regular" expression -- you *can* make a scanner that uses regexs to match lexemes -- could use java's regex lib -- also tools like lex/flex that will take whole file of regex rules and - generate scanner - -- want to understand how they work -- hand-build scanner for our language's rules -- basic scan loop - -## The Scanner - -- let's sketch out class

+Now that we know what we're trying to produce, let's, well, produce it. The core of the scanner is a loop. Starting at the beginning of the source code, it figures out what lexeme the first character belongs to. Then it consumes any following characters that belong to that same lexeme.

+When it hits the end of that lexeme, it emits a token. Then it loops back and does it again, starting from the very next character in the source code. It keeps doing that, eating characters and occasionally, uh, excreting tokens, until it runs out of characters.

+**TODO: illustrate**

+That first step inside the loop -- looking at the first couple of characters to figure out which kind of lexeme they *match* -- might sound familiar. If you know regular expressions, you might consider defining a regex for each kind of lexeme and using those to match characters. For example, Lox has the same identifier rules as C, and the regex `[a-zA-Z_][a-zA-Z_0-9]*` matches one.

+If you did think of regular expressions by now, your intuition is a deep one. The rules that determine how characters are associated with different lexemes for a language are called its **lexical grammar**. In Lox, as in most languages, the rules of that grammar are simple enough to fit within a restricted class called a **[regular language][]**. That's the same "regular" as in regular expressions.

+[regular language]: https://en.wikipedia.org/wiki/Regular_language

+You really *can* recognize all of the different lexemes for Lox using
+regexes if you want to, and there's a pile of interesting theory underlying why that is and what that means. For
+jlox, we could even use Java's regex library for our scanner. Or we could break
+out a tool like [Lex][] or [Flex][] to take all of the regular expressions for
+Lox's lexical grammar and spit out an entire scanner for us.
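To make that concrete, here's a quick sketch of matching a single Lox identifier with Java's built-in regex library -- purely an illustration of the idea, not how our scanner will work:

```java
import java.util.regex.Matcher;
import java.util.regex.Pattern;

class RegexDemo {
  public static void main(String[] args) {
    Pattern identifier = Pattern.compile("[a-zA-Z_][a-zA-Z_0-9]*");
    Matcher matcher = identifier.matcher("language = \"lox\";");

    // lookingAt() anchors the match at the start of the input.
    if (matcher.lookingAt()) {
      System.out.println(matcher.group()); // Prints "language".
    }
  }
}
```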
+
+
+
+[lex]: http://dinosaur.compilertools.net/lex/
+[flex]: https://github.com/westes/flex

+But our goal is to understand how a scanner works inside, so we won't be
+outsourcing that task. We're all about hand-crafted goods here.

+## A Scanner for Lox

+Without further ado, let's make ourselves a scanner.

^code scanner-class

-- (seems like creating awful lot of files. early chapters do lot of framework - gets better later)
+

-- like said, scanner walks string -- finds range of chars that map to lexeme -- when hits end, creates token -- loop until reach end -- then done -- core looks like:

+We store the raw source code as a simple string, and we have an empty list that we will fill with tokens as we generate them. The aforementioned loop that does that looks like this:

^code scan-tokens

-- eat way through string emitting tokens as we go -- when done, add special eof token to end of list -- not strictly needed, but makes parser little cleaner -- few fields to keep track of where we are

+It works its way through the source code until it runs out of characters. When it's done, it adds one final special "end of file" token to the end. That isn't strictly needed, but it will make our parser a little cleaner.

+This loop depends on a couple of fields to keep track of where in the source code we are:

^code scan-state (1 before, 2 after)

-- current index of next char to consume in string -- tokenStart beginning of next token -- since later tokens will be more than one char long, need to remember beginning -- when produce token, will be substring from start to current -- line is current line number

+The `start` and `current` fields are indexes into the string -- the first character in the current lexeme being scanned, and the character we're currently considering. The other field tracks the line that contains `current`. We'll keep that updated as we go so we can produce tokens that know what line they occur on.

-- little helper fn

+Then we have one little helper function:

^code is-at-end

-## Recognizing Lexemes

+### Recognizing lexemes

+Each turn of the loop, we scan the next token. This is the real heart of the scanner. We'll start simple. Imagine if every lexeme was only a single character long. To implement that, you can just consume the next character and pick a token type for it.

-- finally get to real heart of scanner -- start simple -- imagine all tokens only single character -- how implement? -- easy, just consume next char -- based on what it is, produce token of right type -- lox does have few single-char tokens, so let's do those

+This works fine for several of Lox's real lexemes, so let's start there:

^code scan-token

-- uses couple of helper fns

+Again, we need a couple of helper methods:

^code advance-and-add-token

-- advance adds next char to current lexeme and returns it -- can call even when don't know what lexeme is yet, do know it's going to be - some lexeme

+The `advance()` method adds the next character to the lexeme we're currently building and then returns it. We can call this even before we know what kind of lexeme we're building since we know the character is going into *some* lexeme.

-- addtoken grabs current lexeme and line info and adds new token to end of list -- also have one for literal we'll use later

+If `advance()` is the input, then `addToken()` is the output. It grabs the text of the current lexeme and creates a new token for it. Later, we'll use the other overloaded version here to handle tokens with literal values.
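If you'd like to see those two helpers spelled out, here's a sketch consistent with the Scanner.java changes elsewhere in this diff, which build each lexeme with `source.substring(start, current)`:

```java
private char advance() {
  current++;
  return source.charAt(current - 1);
}

private void addToken(TokenType type) {
  addToken(type, null);
}

private void addToken(TokenType type, Object literal) {
  // The lexeme is the raw text between start and current.
  String text = source.substring(start, current);
  tokens.add(new Token(type, text, literal, line));
}
```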
-### invalid tokens

+### Lexical errors

-- before fill in rest of language, what happens if next character doesn't - match any lexeme? -- lox doesn't use `@` -- what if user types that in -- add little error handling

+Before we get too far in, let's take a moment to think about errors at the lexical level. Lox doesn't use the `@` character. What happens if a user throws a source file containing that at our interpreter? Right now, it just gets silently discarded. That ain't right.

+Let's fix that:

^code char-error (1 before, 1 after)

-- note still called advance(), so still consume char and move on -- important so don't get stuck in infinite loop -- note also don't stop scanning after this -- even though error occurred, want to keep going -- source file may have more than one error -- if possible, should find them all in one go -- no fun if user gets one error, fixes, then another appears and so on -- so strategy is to report error and try to keep truckin' -- won't actually *execute* code though -- if any compile error occurs, no running -- just want to find as many compile errors as we can -- would be better here to consume multiple unrecognized chars in one go so - don't shotgun errors if user has pile of bad chars

+Note that the erroneous character was still consumed by the call to `advance()`. That's important so that we don't get stuck in an infinite loop.

+Note also that we keep scanning. There may be other errors later in the program. It gives our users a better experience if we can detect as many of those as possible in one go. It's no fun if they see one tiny error and fix it, only to have the next error appear, and so on. Syntax error whack-a-mole is a drag.

+Even though we keep scanning, though, we won't try to *execute* this code. As soon as the first error is hit, `hadError` gets set so we know not to try to run it.

-### operators

-- ok, get back to filling in grammar -- have punctuation and single-char operators - -- not all operators -- what about `!`? -- it's a single char token too, right? -- not if followed by `=` -- if `!` char appears by itself, should be `!` token -- but if very next char is `!=`, then should be `!=` token -- likewise `<`, `>`, and `=` -- all can be followed by `=` - -- for those, need to check next char too

+### Operators

+We have single-character lexemes covered, but that doesn't cover all of Lox's operators. What about `!`? It's a single character, right? Sometimes, yes, but not if it's followed by a `=`. In that case, it should be a `!=` lexeme. Likewise, `<`, `>`, and `=` can all be followed by `=`.

+For those, we need to look at the second character:

^code two-char-tokens (1 before, 2 after)

-- uses helper fn

+Those use this new method:

^code match

-### maximal munch

-- our language doesn't have '--', but if it did, how would handle: a---b -- could be valid, if scanner broke it up like: a --b -- or even a - - b -- but means when scanner is looking at first two `--`, would have to know what - grammar context it is in to know where to split up -- do scanners do that? -- no: adds way too much entanglement -- basically destroys separation between scanner and parser -- instead, simple rule, called "maximal munch" -- scanner always eats as many characters as it can when forming current token -- so above is scanned as `a -- - b` even though that causes later parse error -- simple is better

+It's like a conditional `advance()`.
It only consumes the current character if it's what we're looking for.

-### comments and whitespace

+### Comments and whitespace

-- missing one operator, `/` -- little trickier because of `//`

+We're still missing one operator, `/`. That one needs a little special handling because we use `//` to begin a comment.

-^code slash

+^code slash (1 before, 2 after)

-- same general idea, after match one `/` if next char is `/`, need to handle - it differently -- comment consumes any char to end of line

+This is roughly similar to the other two-character operators. However, when we match a second `/`, then we know we're in a comment. At that point, we keep consuming characters until we hit the end of the line.

-^code comment

+This is our general strategy for handling longer lexemes. Once we've detected the beginning of a lexeme, we shunt off to some code specific to that kind of lexeme that keeps eating characters until it sees the end.

+We've got another helper:

^code peek

-- sort of like advance, but doesn't consume -- **lookahead** -- only looks at current unconsumed char, so *1* char lookahead -- important to keep this number small, affects perf of scanner -- grammar of language defines how small it can be -- if not *constant* adds lot of complexity to grammar

+It's sort of like `advance()`, but doesn't consume the character. This is called **lookahead**. Since it only looks at the current unconsumed character, we have *one character of lookahead*. The smaller this number is, generally, the faster our scanner will run. The lexical grammar dictates how much lookahead we need. Fortunately, most languages in wide use are designed to be scanned with one or two characters of lookahead.

-- don't want to use match() because want to handle newline later to keep track - of line -- note, don't emit token -- comments consumed, but not turned into token -- just discard -- no addToken() call -- that way rest of pipeline doesn't have to worry about them -- brings to other thing can discard, whitespace:

+After we consume all of the characters in the comment, we don't call `addToken()`. The lexeme just gets discarded the next time we loop around and start a new one. This is deliberate. Comments, by design, aren't interpreted by the language. By discarding them now, we simplify the parser since it won't have to worry about them.

+Newlines and other whitespace are also ignored, and now is a good time to do that:

^code whitespace (1 before, 3 after)

-- just line comments, spaces and other whitespace are consumed -- (remember, already advanced c) -- but emit no tokens -- newline char little special -- also discarded, but increment line -- that's all that's needed to keep track of what line we're on

+For spaces and tabs, we simply go back to the beginning of the scan loop. That will start a new lexeme after the whitespace character. For newlines, we do the same thing, but we also increment the line counter. (This is why we used `peek()` to find the newline after a comment instead of `match()`. We want that newline to get here and update `line`.)

-- code more free-form now -- can correctly scan

+Our scanner is starting to feel more real now. It can handle fairly free-form code like:

```lox
// this is a comment
-(()){} // grouping stuff
-!*+-/=<> // operators
+(( )){} // grouping stuff
+!*+-/=<> <= == // operators
```

-- making progress!
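To spell out what the scanner does with that sample, here are the tokens the operator line should produce, assuming the obvious names in our `TokenType` enum. Note how `match()` turns `<=` and `==` into single two-character tokens while both comments vanish entirely:

```text
BANG STAR PLUS MINUS SLASH EQUAL LESS GREATER LESS_EQUAL EQUAL_EQUAL
```

After the last real token, the list gets capped off with `EOF`.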
-
### String literals

-- if can handle tokens like `!=` that are two chars, ready to tackle longer - ones like number and string literals -- start with strings -- string token always starts with `"`, so begin there

+Now that we know how to handle multiple-character lexemes, we can add support for literals. We'll do strings first, since they always begin with a specific character, `"`:

^code string-start (1 before, 2 after)

-- calls:

+That calls:

^code string

-- like two-char operators, consume additional characters after first -- but here, do it in a loop until we hit closing `"` -- also need to safely handle hitting the end of the source without finding the - closing quote -- report unterminated string error

+Like with comments, we keep consuming characters until we hit the `"` that ends the string. We also need to gracefully handle running out of input before the string is closed and report an error for that.

-- otherwise, produce actual string literal value by stripping off quotes -- store that in token -- lox has no string escape sequences -- if did, would handle them here so literal had real chars

+For no particular reason, Lox supports multi-line strings. There are pros and cons to that, but prohibiting them was a little more complex than allowing them, so I left them in. This does mean we also need to update `line` when we hit a newline inside a string.

-- note allow multiline strings -- need to update line when newline appears in string too -- could make this an error but most langs seem to end up supporting

+Finally, the last interesting bit is that when we create the token, we also produce the actual *value* of the string literal that will be used later by the interpreter. Here, that conversion just requires a `substring()` to strip off the quotes. That's because we don't support escape sequences in Lox. If we did, we'd process those here.

### Number literals

-- lox has one number type, but both int and floating point literals -- int is series of digits -- floating point is series of digits, followed by `.` and more digits -- unlike some other langs, don't allow leading or trailing dots -- just

+All numbers in Lox are floating point at runtime, but it supports both integer and decimal literals. That means a number literal is a series of digits optionally followed by a `.` and one or more digits:

```lox
1234
12.34
```

+We don't allow a leading or trailing decimal point, so these are both invalid:

+```lox
+.1234
+1234.
+```

+We could easily support the former, but I left it out to keep things simple. The latter gets weird if we ever want to allow methods on numbers like `123.sqrt()`.

-- don't want cases for every digit in switch, so stuff in default

+To recognize the beginning of a number lexeme, we look for any digit. It's kind of tedious to add cases for every decimal digit, so we'll stuff it in the default instead:

^code digit-start (1 before, 1 after)

-- little helper

-- (not use `Character.isDigit()` has stuff like devangari)

+This relies on:

^code is-digit

-- like string, goes to separate fun to scan rest of number

+Once we know we are in a number, we branch to a separate method to consume the rest of the literal, like we do with strings:

^code number

-- scan sequential digits -- when run out of digits, look for fractional part -- only allow it if there is digit after dot -- (could allow trailing dot, but little weird in language with `.` method syntax.
don't currently allow methods on number literals like `123.abs()`, but wouldn't want to rule out.) -- need two chars of lookahead

+It consumes as many digits as it finds for the integer part of the literal.

+Then it looks for a fractional part, which is a decimal point (`.`) followed by at least one digit. This requires another character of lookahead since we don't want to consume the `.` until we're sure there is a digit *after* it. So we'll add:

^code peek-next

-- then use Java to convert number to string -- could do this ourselves -- common interview question -- but kind of silly

+If we have a fractional part, again, we consume as many digits as we can find.

+Finally, we convert the lexeme to its numeric value. Our interpreter will use Java's `double` type to represent numbers, so we produce a value of that type. We're using Java's own parsing method to convert the lexeme to a real Java double. We could implement this ourselves, but really, unless you're trying to cram for an upcoming programming interview, it's not worth our time.

-- last literals are boolean and null, but handle those as keywords, which - gets us too...

+The remaining literals are Booleans and `nil`, but we'll handle those as keywords, which gets us to...

### Identifiers and keywords

-- almost everything -- in beginning was word, but for us its at the end

-- might think we could handle reserved words like we handle multi-char operators like `<=` -- like:

+Our scanner is almost done. The only things left in the lexical grammar to implement are identifiers and their close cousins, the reserved words. You might think we could match keywords like we handle multiple-character operators like `<=`. Something like:

```java
case 'o':
@@ -465,63 +441,156 @@ case 'o':
    break;
```

-- consider if user types in 'orchid' -- [fortran aside] -- remember maximal munch!

+But now consider if a user names a variable `orchid`. We don't want the scanner to see the first two letters `or` and immediately emit an `or` keyword token. This gets us to an important principle in lexical grammars called **maximal munch**. When two lexical grammar rules can both match a chunk of code the scanner is looking at, *the longest one wins*.

+That rule states that if we match `orchid` as an identifier and `or` as a keyword, the former wins. It's also why we tacitly assume above that `<=` should be scanned as a single `<=` token and not `<` followed by `=`.

+This means we can't easily detect a reserved word until we've reached the end of what might instead be an identifier. After all, a reserved word *is* an identifier, it's just one that has been claimed by the language for its own use. That's where the term **"reserved word"** comes from.

+Instead, we'll assume any lexeme starting with a letter or underscore is an identifier:

**TODO: make sure context lines look right here**

^code identifier-start (3 before, 3 after)

-- like number, put in default so don't need cases for every char that can start identifier -- calls

+That calls:

^code identifier

-- both of those use these obvious helpers

+Those use these helpers:

^code is-alpha

-- to handle keywords, after finish identifier, see if lexeme matches any of - known set of reserved words -- [if use flex to generate lexer, rolls keywords into main fsm.
advanced hand-written lexers still sometimes use fsm for this since perf critical] -- each keyword has its own token type -- makes parser simpler -- so need to associate keywords with token types -- use a map +Now identifiers are working. To handle keywords, we just see if the identifier's lexeme is one of the reserved words. If so, we'll use a token type specific to that keyword. (That will make parsing easier later.) We'll define this set of reserved words in a map: ^code keyword-map -- static since immutable global property of lox language -- [may be first time ever used static block in java] - -- then when scanning ident, see if keyword +Then, after we scan an identifier, we check to see if it matches one of these keywords: ^code keyword-type (2 before, 1 after) -- after scanning ident, look up lexeme in map -- if found, use that type -- otherwise, must be ident - -## challenges - -- challenge - - many langs use newlines as statement separator - - have to handle case where newline occurs in place that should not end - statement - - explain how js, ruby, python, go, and lua handle that - - which do you prefer? - - python's lexer isn't regular, why not? - - aside from separating tokens, spaces aren't used for much. it does - come into play in CoffeeScript, Ruby, and C preprocessor. where? - - scanner discards whitespace and comments - - not meaningful to lang, so don't need - - some scanners keep them - - why? +If so, we use that keyword's token type. Otherwise, it's a regular user-defined identifier. + +And with that, we now have a complete scanner for the entire Lox lexical grammar. Fire up the REPL and type some valid and invalid code in. Does it produce the tokens you expect? Try to come up with some interesting edge cases and see if it handles them as it should. + +
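For example, assuming you give Token a simple `toString()` that prints the type, lexeme, and literal (the exact format is up to you), a quick session might look like this:

```text
> var beverage = "espresso";
VAR var null
IDENTIFIER beverage null
EQUAL = null
STRING "espresso" espresso
SEMICOLON ; null
EOF  null
```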
+
+## Challenges

+1. The lexical grammars of Python and Haskell are not *regular*. What does that
+   mean, and why aren't they?

+1. Aside from separating tokens -- distinguishing `print foo` from
+   `printfoo` -- spaces aren't used for much in most languages. However, they
+   do affect how code is parsed in CoffeeScript, Ruby, and the C preprocessor.
+   Where and what effect do they have in each language?

+1. Our scanner here, like most, discards comments and whitespace since those
+   aren't needed by the parser. Why might you want to write a scanner that does
+   *not* discard those? What would it be useful for?

+1. Add support to Lox's scanner for C-style `/* ... */` block comments. Make
+   sure to handle newlines in them. Consider allowing them to nest. Is adding
+   support for nesting more work than you expected? Why?
+
+ +
+
+## Design Note: Implicit Semicolons

+Programmers today are spoiled for choice in languages and have gotten picky about the look and feel of their language's syntax. They want their language to look clean and modern. One bit of syntactic lichen that almost every new language eliminates (and some ancient ones like BASIC never had) is `;` as an explicit statement separator.

+Instead, they treat a newline as a statement separator where it makes sense to do so. The "where it makes sense" part is the interesting bit. While *most* statements are on their own line, sometimes you need to spread a single statement across a couple of lines. Those embedded newlines should not be treated as separators.

+Most of the obvious cases are easy to detect, but there are a handful of nasty cases you run into:

+* A return value on the next line:

    :::js
    return
    "value"

  Is "value" the value being returned, or do we have a return statement with no value followed by an expression statement containing a string literal?

+* A parenthesized expression on the next line:

    :::js
    func
    (parenthesized)

  Is this a call to `func(parenthesized)`, or two expression statements, one for `func` and one for a parenthesized expression?

+* A `-` on the next line:

    :::js
    first
    -second

  Is this `first - second` -- an infix subtraction -- or two expression statements, one for `first` and one to negate `second`?

+In all of these, either treating the newline as a separator or not would produce valid code, but possibly not the code the user wants. Across languages, there is an unsettling variety in the rules they use to decide which newlines are separators. Here are a few:

+* [Lua][] completely ignores newlines, but carefully controls its grammar such that no separator between statements is needed at all in most cases. This is perfectly valid:

    :::lua
    a = 1 b = 2

  It avoids the `return` problem above by requiring a `return` statement to be the very last statement in a block. If there is a value after `return` before the keyword `end`, it *must* be for the return. For the other two cases, Lua allows an explicit `;` and expects users to use that. In practice, that almost never happens because there's no point in a parenthesized or unary negation expression statement.

+* [Go][] handles it in the scanner. If a newline appears following one of a handful of token types that are known to potentially end a statement, the newline is treated like a semicolon. The Go team provides a canonical code formatter, [gofmt][], and the ecosystem is fervent about its use, which ensures that idiomatic styled code works well with this simple rule.

+* [Python][] treats all newlines as significant unless an explicit backslash is used at the end of a line to continue it to the next line. Also, newlines anywhere inside a pair of brackets (`()`, `[]`, or `{}`) are ignored. Idiomatic style strongly prefers the latter.

  This rule works well for Python because it is a strongly statement-oriented language. In particular, Python's grammar disallows a statement ever appearing inside an expression. This is also true of C, but not true of many other languages which have a "lambda" or function literal syntax.

  For example, in JavaScript, you can have:

    :::js
    console.log(function() {
      statementInAnExpression();
    });

  Python would need a different set of rules for implicitly joining lines if you could get back *into* a statement where newlines should become meaningful while still nested inside brackets.
+
+
+* JavaScript's "[automatic semicolon insertion][asi]" rules are the outliers. Where other languages assume most newlines *are* meaningful and there are just a few in multi-line statements that should be ignored, JS assumes the opposite. It treats all of your newlines as meaningless whitespace unless that generates a parse error. If it does, it goes back and figures out the minimal set of newlines to turn into semicolons to get to something grammatically valid.

  This design note would turn into a design essay if I went into complete detail about how that even works, much less all the various ways that it's a bad idea. It's a mess. JavaScript is the only language I know where many style guides demand explicit semicolons after every statement even though the language theoretically lets you elide them.

+[lua]: https://www.lua.org/pil/1.1.html
+[go]: https://golang.org/ref/spec#Semicolons
+[gofmt]: https://golang.org/cmd/gofmt/
+[python]: https://docs.python.org/3.5/reference/lexical_analysis.html#implicit-line-joining
+[asi]: https://www.ecma-international.org/ecma-262/5.1/#sec-7.9

+If you're designing a new language, you almost surely *should* avoid an explicit statement separator. Programmers are creatures of fashion like other humans, and semicolons are as passé as ALL CAPS KEYWORDS. Just make sure you pick a set of rules that make sense for your language's particular grammar and idioms. And, uh, don't do what JavaScript did.
+
\ No newline at end of file diff --git a/java/com/craftinginterpreters/lox/Lox.java b/java/com/craftinginterpreters/lox/Lox.java index 84b100eb7..47502eb3b 100644 --- a/java/com/craftinginterpreters/lox/Lox.java +++ b/java/com/craftinginterpreters/lox/Lox.java @@ -27,7 +27,7 @@ public static void main(String[] args) throws IOException { } else if (args.length == 1) { runFile(args[0]); } else { - repl(); + runPrompt(); } } //> run-file @@ -44,17 +44,23 @@ private static void runFile(String path) throws IOException { //< Evaluating Expressions not-yet } //< run-file -//> repl - private static void repl() throws IOException { +//> prompt + private static void runPrompt() throws IOException { InputStreamReader input = new InputStreamReader(System.in); BufferedReader reader = new BufferedReader(input); - for (;;) { + for (;;) { // [repl] System.out.print("> "); run(reader.readLine()); +//> reset-had-error + hadError = false; +//< reset-had-error +//> Evaluating Expressions not-yet + hadRuntimeError = false; +//< Evaluating Expressions not-yet } } -//< repl +//< prompt //> run private static void run(String source) { Scanner scanner = new Scanner(source); diff --git a/java/com/craftinginterpreters/lox/Scanner.java b/java/com/craftinginterpreters/lox/Scanner.java index 68649583a..2ca0ef53d 100644 --- a/java/com/craftinginterpreters/lox/Scanner.java +++ b/java/com/craftinginterpreters/lox/Scanner.java @@ -8,7 +8,7 @@ import static com.craftinginterpreters.lox.TokenType.*; -class Scanner { +class Scanner { // [files] //> keyword-map private static final Map keywords; @@ -78,7 +78,8 @@ private void scanToken() { //> slash case '/': if (match('/')) { - comment(); + // A comment goes until the end of the line. + while (peek() != '\n' && !isAtEnd()) advance(); } else { addToken(SLASH); } @@ -122,12 +123,6 @@ private void scanToken() { } } //< scan-token -//> comment - private void comment() { - // A comment goes until the end of the line. - while (peek() != '\n' && !isAtEnd()) advance(); - } -//< comment //> identifier private void identifier() { while (isAlphaNumeric(peek())) advance(); @@ -157,9 +152,8 @@ private void number() { while (isDigit(peek())) advance(); } - double value = Double.parseDouble( - source.substring(start, current)); - addToken(NUMBER, value); + addToken(NUMBER, + Double.parseDouble(source.substring(start, current))); } //< number //> string @@ -218,7 +212,7 @@ private boolean isAlphaNumeric(char c) { //> is-digit private boolean isDigit(char c) { return c >= '0' && c <= '9'; - } + } // [is-digit] //< is-digit //> is-at-end private boolean isAtEnd() { diff --git a/java/com/craftinginterpreters/lox/Token.java b/java/com/craftinginterpreters/lox/Token.java index ac6188c0d..dad6ecca4 100644 --- a/java/com/craftinginterpreters/lox/Token.java +++ b/java/com/craftinginterpreters/lox/Token.java @@ -5,7 +5,7 @@ class Token { final TokenType type; final String lexeme; final Object literal; - final int line; + final int line; // [location] Token(TokenType type, String lexeme, Object literal, int line) { this.type = type; diff --git a/note/chapter/parsing-expressions.md b/note/chapter/parsing-expressions.md index 09055de7e..cd4293174 100644 --- a/note/chapter/parsing-expressions.md +++ b/note/chapter/parsing-expressions.md @@ -38,3 +38,11 @@ https://www.cs.cmu.edu/~pattis/misc/ebnf.pdf - is an empty source file a valid program? - write the bnf for a language you know. if the language is complex, just do an interesting subset. what parts are hard? 
+
+--
+
+error recovery:
+
+The tricky part, of course, is that the first error may *cause* later **cascaded errors**. For example, if they accidentally started a string with `'` instead of `"`, then the rest of the string literal will likely cause a number of bogus syntax errors when the scanner and parser try to treat it like code.
+
+There is an art, called **error recovery**, to getting back to a good state after an error is found, minimizing the number of later spurious errors. We'll talk more about it during parsing. diff --git a/note/log.txt b/note/log.txt index 54f736622..8f9d5a644 100644 --- a/note/log.txt +++ b/note/log.txt @@ -1,3 +1,9 @@ +2017/01/01 - 772 words design note for scanner, aside markers in code +2016/12/31 - 1081 words first draft scanner, mostly done +2016/12/30 - 1085 words first draft scanner +2016/12/29 - 722 words first draft scanner +2016/12/28 - 561 words first draft scanner +2016/12/27 - 1127 words first draft scanner 2016/12/26 - finish outlining and splitting, reallow multiline strings 2016/12/25 - fix some bugs in chapter splitting, make multiline strings and error 2016/12/24 - slice up more scanning code into snippets diff --git a/site/contents.html b/site/contents.html index f389c81fe..f1c5a1f61 100644 --- a/site/contents.html +++ b/site/contents.html @@ -118,7 +118,6 @@

[site/contents.html hunks: regenerated table-of-contents markup. The "1. Scanning" chapter entry drops its "(coming soon!)" label, and a "Design Note: Implicit Semicolons" entry is added under its section list.]
diff --git a/site/scanning.html index bd29dfa69..ce3cced9e 100644 --- a/site/scanning.html +++ b/site/scanning.html @@ -23,7 +23,14 @@ @@ -48,7 +55,14 @@ @@ -66,9 +80,9 @@
[site/scanning.html hunks: regenerated navigation links and section table of contents for the Scanning chapter page.]