From 172ba42001003bce79708141923ba6100cc7d4f2 Mon Sep 17 00:00:00 2001
From: Alex Kyllo
Date: Sun, 12 Jan 2020 20:20:48 -0800
Subject: [PATCH 001/122] Add support for MSSQL's SELECT TOP N syntax (#150)

Add support for MSSQL SELECT TOP (N) [PERCENT] [WITH TIES] syntax.
---
 src/ast/mod.rs           |  2 +-
 src/ast/query.rs         | 33 +++++++++++++++++++++++++------
 src/dialect/keywords.rs  |  3 ++-
 src/parser.rs            | 31 ++++++++++++++++++++++++++++-
 src/tokenizer.rs         | 23 ++++++++++++++++++++++
 tests/sqlparser_mssql.rs | 42 ++++++++++++++++++++++++++++++++++++++++
 tests/sqlparser_mysql.rs |  2 +-
 7 files changed, 126 insertions(+), 10 deletions(-)

diff --git a/src/ast/mod.rs b/src/ast/mod.rs
index eaf99b31b..2f723f012 100644
--- a/src/ast/mod.rs
+++ b/src/ast/mod.rs
@@ -27,7 +27,7 @@ pub use self::ddl::{
pub use self::operator::{BinaryOperator, UnaryOperator};
pub use self::query::{
    Cte, Fetch, Join, JoinConstraint, JoinOperator, OrderByExpr, Query, Select, SelectItem,
-   SetExpr, SetOperator, TableAlias, TableFactor, TableWithJoins, Values,
+   SetExpr, SetOperator, TableAlias, TableFactor, TableWithJoins, Top, Values,
};
pub use self::value::{DateTimeField, Value};

diff --git a/src/ast/query.rs b/src/ast/query.rs
index 656f7f14b..a5eea141f 100644
--- a/src/ast/query.rs
+++ b/src/ast/query.rs
@@ -114,6 +114,8 @@
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct Select {
    pub distinct: bool,
+   /// MSSQL syntax: `TOP (<N>) [ PERCENT ] [ WITH TIES ]`
+   pub top: Option<Top>,
    /// projection expressions
    pub projection: Vec<SelectItem>,
    /// FROM
@@ -128,12 +130,11 @@

impl fmt::Display for Select {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
-       write!(
-           f,
-           "SELECT{} {}",
-           if self.distinct { " DISTINCT" } else { "" },
-           display_comma_separated(&self.projection)
-       )?;
+       write!(f, "SELECT{}", if self.distinct { " DISTINCT" } else { "" })?;
+       if let Some(ref top) = self.top {
+           write!(f, " {}", top)?;
+       }
+       write!(f, " {}", display_comma_separated(&self.projection))?;
        if !self.from.is_empty() {
            write!(f, " FROM {}", display_comma_separated(&self.from))?;
        }
@@ -408,6 +409,26 @@ impl fmt::Display for Fetch {
    }
}

+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
+pub struct Top {
+    /// SQL semantic equivalent of LIMIT but with same structure as FETCH.
+    pub with_ties: bool,
+    pub percent: bool,
+    pub quantity: Option<Expr>,
+}
+
+impl fmt::Display for Top {
+    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
+        let extension = if self.with_ties { " WITH TIES" } else { "" };
+        if let Some(ref quantity) = self.quantity {
+            let percent = if self.percent { " PERCENT" } else { "" };
+            write!(f, "TOP ({}){}{}", quantity, percent, extension)
+        } else {
+            write!(f, "TOP{}", extension)
+        }
+    }
+}
+
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct Values(pub Vec<Vec<Expr>>);
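[Illustration, not part of the patch: how the new `Top` node serializes, assuming
it is compiled against this crate's `sqlparser::ast` exports. The helper name
`top_to_sql` and the literal values are hypothetical; at this point in the
history `Value::Number` wraps the digits as a plain `String`.]

    use sqlparser::ast::{Expr, Top, Value};

    fn top_to_sql() {
        let top = Top {
            with_ties: false,
            percent: true,
            quantity: Some(Expr::Value(Value::Number("5".to_string()))),
        };
        // A quantity is always re-serialized in the parenthesized form:
        assert_eq!(top.to_string(), "TOP (5) PERCENT");
        // Without a quantity only the optional suffix remains:
        let bare = Top { with_ties: true, percent: false, quantity: None };
        assert_eq!(bare.to_string(), "TOP WITH TIES");
    }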
diff --git a/src/dialect/keywords.rs b/src/dialect/keywords.rs
index c083c0692..9795f2af3 100644
--- a/src/dialect/keywords.rs
+++ b/src/dialect/keywords.rs
@@ -374,6 +374,7 @@ define_keywords!(
    TIMEZONE_HOUR,
    TIMEZONE_MINUTE,
    TO,
+   TOP,
    TRAILING,
    TRANSACTION,
    TRANSLATE,
@@ -426,7 +427,7 @@ define_keywords!(
/// can be parsed unambiguously without looking ahead.
pub const RESERVED_FOR_TABLE_ALIAS: &[&str] = &[
    // Reserved as both a table and a column alias:
-   WITH, SELECT, WHERE, GROUP, HAVING, ORDER, LIMIT, OFFSET, FETCH, UNION, EXCEPT, INTERSECT,
+   WITH, SELECT, WHERE, GROUP, HAVING, ORDER, TOP, LIMIT, OFFSET, FETCH, UNION, EXCEPT, INTERSECT,
    // Reserved only as a table alias in the `FROM`/`JOIN` clauses:
    ON, JOIN, INNER, CROSS, FULL, LEFT, RIGHT, NATURAL, USING,
    // for MSSQL-specific OUTER APPLY (seems reserved in most dialects)

diff --git a/src/parser.rs b/src/parser.rs
index cbdcaba09..c9e32ed3b 100644
--- a/src/parser.rs
+++ b/src/parser.rs
@@ -783,7 +783,6 @@ impl Parser {
    }

    /// Bail out if the current token is not one of the expected keywords, or consume it if it is
-   #[must_use]
    pub fn expect_one_of_keywords(
        &mut self,
        keywords: &[&'static str],
@@ -1561,6 +1560,13 @@ impl Parser {
        if all && distinct {
            return parser_err!("Cannot specify both ALL and DISTINCT in SELECT");
        }
+
+       let top = if self.parse_keyword("TOP") {
+           Some(self.parse_top()?)
+       } else {
+           None
+       };
+
        let projection = self.parse_comma_separated(Parser::parse_select_item)?;

        // Note that for keywords to be properly handled here, they need to be
@@ -1594,6 +1600,7 @@ impl Parser {

        Ok(Select {
            distinct,
+           top,
            projection,
            from,
            selection,
@@ -1940,6 +1947,28 @@ impl Parser {
        Ok(OrderByExpr { expr, asc })
    }

+   /// Parse a TOP clause, MSSQL equivalent of LIMIT,
+   /// that follows after SELECT [DISTINCT].
+   pub fn parse_top(&mut self) -> Result<Top, ParserError> {
+       let quantity = if self.consume_token(&Token::LParen) {
+           let quantity = self.parse_expr()?;
+           self.expect_token(&Token::RParen)?;
+           Some(quantity)
+       } else {
+           Some(Expr::Value(self.parse_number_value()?))
+       };
+
+       let percent = self.parse_keyword("PERCENT");
+
+       let with_ties = self.parse_keywords(vec!["WITH", "TIES"]);
+
+       Ok(Top {
+           with_ties,
+           percent,
+           quantity,
+       })
+   }
+
    /// Parse a LIMIT clause
    pub fn parse_limit(&mut self) -> Result<Option<Expr>, ParserError> {
        if self.parse_keyword("ALL") {

diff --git a/src/tokenizer.rs b/src/tokenizer.rs
index 62d534895..96c9535ea 100644
--- a/src/tokenizer.rs
+++ b/src/tokenizer.rs
@@ -522,6 +522,7 @@ fn peeking_take_while(
#[cfg(test)]
mod tests {
    use super::super::dialect::GenericDialect;
+   use super::super::dialect::MsSqlDialect;
    use super::*;

    #[test]
@@ -782,6 +783,28 @@ mod tests {
        compare(expected, tokens);
    }

+   #[test]
+   fn tokenize_mssql_top() {
+       let sql = "SELECT TOP 5 [bar] FROM foo";
+       let dialect = MsSqlDialect {};
+       let mut tokenizer = Tokenizer::new(&dialect, sql);
+       let tokens = tokenizer.tokenize().unwrap();
+       let expected = vec![
+           Token::make_keyword("SELECT"),
+           Token::Whitespace(Whitespace::Space),
+           Token::make_keyword("TOP"),
+           Token::Whitespace(Whitespace::Space),
+           Token::Number(String::from("5")),
+           Token::Whitespace(Whitespace::Space),
+           Token::make_word("bar", Some('[')),
+           Token::Whitespace(Whitespace::Space),
+           Token::make_keyword("FROM"),
+           Token::Whitespace(Whitespace::Space),
+           Token::make_word("foo", None),
+       ];
+       compare(expected, tokens);
+   }
+
    fn compare(expected: Vec<Token>, actual: Vec<Token>) {
        //println!("------------------------------");
        //println!("tokens = {:?}", actual);

diff --git a/tests/sqlparser_mssql.rs b/tests/sqlparser_mssql.rs
index b5170e208..2774d43ef 100644
--- a/tests/sqlparser_mssql.rs
+++ b/tests/sqlparser_mssql.rs
@@ -68,6 +68,48 @@ fn parse_mssql_apply_join() {
    );
}

+#[test]
+fn parse_mssql_top_paren() {
+    let sql = "SELECT TOP (5) * FROM foo";
+    let select = ms_and_generic().verified_only_select(sql);
+    let top = select.top.unwrap();
+    assert_eq!(Some(Expr::Value(number("5"))), top.quantity);
+    assert!(!top.percent);
+}
+
+#[test]
+fn parse_mssql_top_percent() {
+    let sql = "SELECT TOP (5) PERCENT * FROM foo";
+    let select = ms_and_generic().verified_only_select(sql);
+    let top = select.top.unwrap();
+    assert_eq!(Some(Expr::Value(number("5"))), top.quantity);
+    assert!(top.percent);
+}
+
+#[test]
+fn parse_mssql_top_with_ties() {
+    let sql = "SELECT TOP (5) WITH TIES * FROM foo";
+    let select = ms_and_generic().verified_only_select(sql);
+    let top = select.top.unwrap();
+    assert_eq!(Some(Expr::Value(number("5"))), top.quantity);
+    assert!(top.with_ties);
+}
+
+#[test]
+fn parse_mssql_top_percent_with_ties() {
+    let sql = "SELECT TOP (10) PERCENT WITH TIES * FROM foo";
+    let select = ms_and_generic().verified_only_select(sql);
+    let top = select.top.unwrap();
+    assert_eq!(Some(Expr::Value(number("10"))), top.quantity);
+    assert!(top.percent);
+}
+
+#[test]
+fn parse_mssql_top() {
+    let sql = "SELECT TOP 5 bar, baz FROM foo";
+    let _ = ms_and_generic().one_statement_parses_to(sql, "SELECT TOP (5) bar, baz FROM foo");
+}
+
fn ms() -> TestedDialects {
    TestedDialects {
        dialects: vec![Box::new(MsSqlDialect {})],

diff --git a/tests/sqlparser_mysql.rs b/tests/sqlparser_mysql.rs
index ce9d0053b..cc6433322 100644
--- a/tests/sqlparser_mysql.rs
+++ b/tests/sqlparser_mysql.rs
@@ -77,7 +77,7 @@ fn parse_show_columns() {
        Statement::ShowColumns {
            extended: false,
            full: false,
-           table_name: table_name.clone(),
+           table_name: table_name,
            filter: Some(ShowStatementFilter::Where(
                mysql_and_generic().verified_expr("1 = 2")
            )),
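[An end-to-end sketch of the normalization the tests above rely on — hedged,
since the exact `Parser::parse_sql` signature has varied across releases (it is
assumed here to take an owned `String`):]

    use sqlparser::dialect::MsSqlDialect;
    use sqlparser::parser::Parser;

    fn normalize_top() {
        let sql = "SELECT TOP 5 bar, baz FROM foo".to_string();
        let stmts = Parser::parse_sql(&MsSqlDialect {}, sql).unwrap();
        // `TOP 5` and `TOP (5)` produce the same AST; serialization
        // always emits the parenthesized variant.
        assert_eq!(stmts[0].to_string(), "SELECT TOP (5) bar, baz FROM foo");
    }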
From 3255fd3ea8b5f8e9c63c1825fdcd2fc1fb30cc22 Mon Sep 17 00:00:00 2001
From: Eyal Leshem
Date: Sat, 4 Apr 2020 23:21:36 +0300
Subject: [PATCH 002/122] Add support for table_name inside parentheses

---
 src/parser.rs             | 15 +++++----------
 tests/sqlparser_common.rs | 38 ++++++++++++++++++++++++++++++--------
 2 files changed, 35 insertions(+), 18 deletions(-)

diff --git a/src/parser.rs b/src/parser.rs
index c9e32ed3b..e988f9c09 100644
--- a/src/parser.rs
+++ b/src/parser.rs
@@ -1771,6 +1771,7 @@ impl Parser {
    // ^ ^ ^ ^
    // | | | |
    // | | | |
+   // | | | |
    // | | | (4) belongs to a SetExpr::Query inside the subquery
    // | | (3) starts a derived table (subquery)
    // | (2) starts a nested join

            // Ignore the error and back up to where we were before.
            // Either we'll be able to parse a valid nested join, or
            // we won't, and we'll return that error instead.
+           //
+           // Even the SQL spec prohibits derived tables and bare
+           // tables from appearing alone in parentheses, we allowed it
+           // as some Db's allowed that (snowflake as example)
            self.index = index;
            let table_and_joins = self.parse_table_and_joins()?;
-           match table_and_joins.relation {
-               TableFactor::NestedJoin { .. } => (),
-               _ => {
-                   if table_and_joins.joins.is_empty() {
-                       // The SQL spec prohibits derived tables and bare
-                       // tables from appearing alone in parentheses.
-                       self.expected("joined table", self.peek_token())?
- } - } - } self.expect_token(&Token::RParen)?; Ok(TableFactor::NestedJoin(Box::new(table_and_joins))) } diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs index 71b11f3b7..939673dcd 100644 --- a/tests/sqlparser_common.rs +++ b/tests/sqlparser_common.rs @@ -1806,11 +1806,19 @@ fn parse_join_nesting() { vec![join(nest!(nest!(nest!(table("b"), table("c")))))] ); - let res = parse_sql_statements("SELECT * FROM (a NATURAL JOIN (b))"); - assert_eq!( - ParserError::ParserError("Expected joined table, found: )".to_string()), - res.unwrap_err() - ); + // Parenthesized table names are non-standard, but supported in Snowflake SQL + let sql = "SELECT * FROM (a NATURAL JOIN (b))"; + let select = verified_only_select(sql); + let from = only(select.from); + + assert_eq!(from.relation, nest!(table("a"), nest!(table("b")))); + + // Double parentheses around table names are non-standard, but supported in Snowflake SQL + let sql = "SELECT * FROM (a NATURAL JOIN ((b)))"; + let select = verified_only_select(sql); + let from = only(select.from); + + assert_eq!(from.relation, nest!(table("a"), nest!(nest!(table("b"))))); } #[test] @@ -1953,10 +1961,24 @@ fn parse_derived_tables() { })) ); - let res = parse_sql_statements("SELECT * FROM ((SELECT 1) AS t)"); + // Nesting a subquery in parentheses is non-standard, but supported in Snowflake SQL + let sql = "SELECT * FROM ((SELECT 1) AS t)"; + let select = verified_only_select(sql); + let from = only(select.from); + assert_eq!( - ParserError::ParserError("Expected joined table, found: )".to_string()), - res.unwrap_err() + from.relation, + TableFactor::NestedJoin(Box::new(TableWithJoins { + relation: TableFactor::Derived { + lateral: false, + subquery: Box::new(verified_query("SELECT 1")), + alias: Some(TableAlias { + name: "t".into(), + columns: vec![], + }) + }, + joins: Vec::new(), + })) ); } From 4ce0eb11aee27f2fd8ae4c31fe982a8f0efca8c1 Mon Sep 17 00:00:00 2001 From: Nickolay Ponomarev Date: Tue, 14 Apr 2020 16:56:16 +0300 Subject: [PATCH 003/122] Fix a new clippy lint (`.nth(0)`) to unbreak CI "iter.next() is equivalent to iter.nth(0), as they both consume the next element, but is more readable." 
https://rust-lang.github.io/rust-clippy/master/index.html#iter_nth_zero --- examples/cli.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/cli.rs b/examples/cli.rs index 77a0b5014..d0ba9a578 100644 --- a/examples/cli.rs +++ b/examples/cli.rs @@ -40,7 +40,7 @@ fn main() { println!("Parsing from file '{}' using {:?}", &filename, dialect); let contents = fs::read_to_string(&filename) .unwrap_or_else(|_| panic!("Unable to read the file {}", &filename)); - let without_bom = if contents.chars().nth(0).unwrap() as u64 != 0xfeff { + let without_bom = if contents.chars().next().unwrap() as u64 != 0xfeff { contents.as_str() } else { let mut chars = contents.chars(); From dcc624c56128c3d6cba24812cf0747195308309a Mon Sep 17 00:00:00 2001 From: Nickolay Ponomarev Date: Tue, 14 Apr 2020 19:03:39 +0300 Subject: [PATCH 004/122] Make CI handle missing rustfmt in the nightly --- .travis.yml | 20 ++++++++++++++------ 1 file changed, 14 insertions(+), 6 deletions(-) diff --git a/.travis.yml b/.travis.yml index e90fe8400..425a48ef5 100644 --- a/.travis.yml +++ b/.travis.yml @@ -23,6 +23,16 @@ rust: - stable before_script: + # Travis installs rust with a non-default "minimal" profile, and advises us + # to add clippy manually: + - rustup component add clippy + # Unfortunately, this method often breaks on the nightly channel, where the + # most recent build might not have all the optional components. + # We explicitly specify `--profile default` to obtain the most recent nightly + # that has rustfmt (we don't care if it's a week old, as we need it only for + # an experimental flag): + - rustup toolchain install nightly --profile default + - pip install 'travis-cargo<0.2' --user && export PATH=$HOME/.local/bin:$PATH - export PATH=$HOME/.cargo/bin:$PATH # `cargo install` fails if the specified binary is already installed, and @@ -33,13 +43,9 @@ before_script: # rebuilds from scratch, ignoring the cache entirely. # # [0]: https://github.com/rust-lang/cargo/issues/2082 - - cargo install cargo-update || echo "cargo-update already installed" - - cargo install cargo-travis || echo "cargo-travis already installed" + - cargo install cargo-update || echo "cargo-update already installed" # for `cargo install-update` + - cargo install cargo-travis || echo "cargo-travis already installed" # for `cargo coveralls` - cargo install-update -a # updates cargo-travis, if the cached version is outdated - - rustup component add clippy - # The license_template_path setting we use to verify copyright headers is - # only available on the nightly rustfmt. - - rustup toolchain install nightly && rustup component add --toolchain nightly rustfmt script: # Clippy must be run first, as its lints are only triggered during @@ -50,6 +56,8 @@ script: - travis-cargo build - travis-cargo test - travis-cargo test -- all-features + # The license_template_path setting we use to verify copyright headers is + # only available on the nightly rustfmt. 
  - cargo +nightly fmt -- --check --config-path <(echo 'license_template_path = "HEADER"')

after_success:

From baacc956ea26ddb7b8dea4cb9ccd9aac5532e171 Mon Sep 17 00:00:00 2001
From: Alex Dukhno
Date: Sun, 19 Apr 2020 13:07:00 +0300
Subject: [PATCH 005/122] derive default for GenericDialect

---
 src/dialect/generic.rs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/dialect/generic.rs b/src/dialect/generic.rs
index 50054069e..104d3a9a3 100644
--- a/src/dialect/generic.rs
+++ b/src/dialect/generic.rs
@@ -12,8 +12,8 @@

use crate::dialect::Dialect;

-#[derive(Debug)]
-pub struct GenericDialect {}
+#[derive(Debug, Default)]
+pub struct GenericDialect;

impl Dialect for GenericDialect {
    fn is_identifier_start(&self, ch: char) -> bool {

From 05a29212ffbf0704a620dfef1b850089d2efa1ab Mon Sep 17 00:00:00 2001
From: Nickolay Ponomarev
Date: Mon, 20 Apr 2020 04:07:21 +0300
Subject: [PATCH 006/122] Update comments (follow-up to PR #155)

https://github.com/andygrove/sqlparser-rs/pull/155
---
 src/ast/query.rs |  9 +++++----
 src/parser.rs    | 26 +++++++++++---------------
 2 files changed, 16 insertions(+), 19 deletions(-)

diff --git a/src/ast/query.rs b/src/ast/query.rs
index a5eea141f..3588257e7 100644
--- a/src/ast/query.rs
+++ b/src/ast/query.rs
@@ -225,10 +225,11 @@ pub enum TableFactor {
        subquery: Box<Query>,
        alias: Option<TableAlias>,
    },
-   /// Represents a parenthesized join expression, such as
-   /// `(foo <JOIN> bar [ <JOIN> baz ... ])`.
-   /// The inner `TableWithJoins` can have no joins only if its
-   /// `relation` is itself a `TableFactor::NestedJoin`.
+   /// Represents a parenthesized table factor. The SQL spec only allows a
+   /// join expression (`(foo <JOIN> bar [ <JOIN> baz ... ])`) to be nested,
+   /// possibly several times, but the parser also accepts the non-standard
+   /// nesting of bare tables (`table_with_joins.joins.is_empty()`), so the
+   /// name `NestedJoin` is a bit of a misnomer.
    NestedJoin(Box<TableWithJoins>),
}
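[A hedged sketch of the non-standard nesting described in the new doc comment,
assuming the crate's public `Parser::parse_sql` entry point; the function name
`bare_table_in_parens` is illustrative:]

    use sqlparser::ast::{SetExpr, Statement, TableFactor};
    use sqlparser::dialect::GenericDialect;
    use sqlparser::parser::Parser;

    fn bare_table_in_parens() {
        // Standard SQL would reject the parenthesized bare table `(b)`;
        // Snowflake (and, since #155, this parser) accepts it.
        let sql = "SELECT * FROM (a NATURAL JOIN (b))".to_string();
        let stmts = Parser::parse_sql(&GenericDialect {}, sql).unwrap();
        if let Statement::Query(q) = &stmts[0] {
            if let SetExpr::Select(s) = &q.body {
                // The outer parentheses become a `TableFactor::NestedJoin`;
                // the inner `(b)` is a nested join with an empty `joins` list.
                assert!(matches!(s.from[0].relation, TableFactor::NestedJoin(_)));
            }
        }
    }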
diff --git a/src/parser.rs b/src/parser.rs
index e988f9c09..cdaf8989d 100644
--- a/src/parser.rs
+++ b/src/parser.rs
@@ -1771,7 +1771,6 @@ impl Parser {
    // ^ ^ ^ ^
    // | | | |
    // | | | |
-   // | | | |
    // | | | (4) belongs to a SetExpr::Query inside the subquery
    // | | (3) starts a derived table (subquery)
    // | (2) starts a nested join

            // case (3), and the next token would be `NATURAL`.
            Ok(table_factor) => Ok(table_factor),
            Err(_) => {
-               // The '(' we've recently consumed does not start a derived
-               // table. For valid input this can happen either when the
-               // token following the paren can't start a query (e.g. `foo`
-               // in `FROM (foo NATURAL JOIN bar)`, or when the '(' we've
-               // consumed is followed by another '(' that starts a
-               // derived table, like (3), or another nested join (2).
-               //
-               // Ignore the error and back up to where we were before.
-               // Either we'll be able to parse a valid nested join, or
-               // we won't, and we'll return that error instead.
-               //
-               // Even the SQL spec prohibits derived tables and bare
-               // tables from appearing alone in parentheses, we allowed it
-               // as some Db's allowed that (snowflake as example)
+               // A parsing error from `parse_derived_table_factor` indicates that
+               // the '(' we've recently consumed does not start a derived table
+               // (cases 1, 2, or 4). Ignore the error and back up to where we
+               // were before - right after the opening '('.
                self.index = index;
+
+               // Inside the parentheses we expect to find a table factor
+               // followed by some joins or another level of nesting.
                let table_and_joins = self.parse_table_and_joins()?;
                self.expect_token(&Token::RParen)?;
+
+               // The SQL spec prohibits derived and bare tables from appearing
+               // alone in parentheses. We don't enforce this as some databases
+               // (e.g. Snowflake) allow such syntax.
+
                Ok(TableFactor::NestedJoin(Box::new(table_and_joins)))
            }

From c0b0b5924d4d06359e3419b75fab03e7704a7edd Mon Sep 17 00:00:00 2001
From: Matt Jibson
Date: Mon, 13 Apr 2020 17:59:10 -0600
Subject: [PATCH 007/122] Add support for OFFSET with the ROWS keyword

MySQL doesn't support the ROWS part of OFFSET. Teach the parser to
remember which variant it saw, including just ROW.
---
 src/ast/mod.rs            |  4 +--
 src/ast/query.rs          | 35 ++++++++++++++++++--
 src/parser.rs             | 12 +++++--
 tests/sqlparser_common.rs | 70 +++++++++++++++++++++++++++++----------
 4 files changed, 96 insertions(+), 25 deletions(-)

diff --git a/src/ast/mod.rs b/src/ast/mod.rs
index 2f723f012..3ace38c02 100644
--- a/src/ast/mod.rs
+++ b/src/ast/mod.rs
@@ -26,8 +26,8 @@ pub use self::ddl::{
};
pub use self::operator::{BinaryOperator, UnaryOperator};
pub use self::query::{
-   Cte, Fetch, Join, JoinConstraint, JoinOperator, OrderByExpr, Query, Select, SelectItem,
-   SetExpr, SetOperator, TableAlias, TableFactor, TableWithJoins, Top, Values,
+   Cte, Fetch, Join, JoinConstraint, JoinOperator, Offset, OffsetRows, OrderByExpr, Query, Select,
+   SelectItem, SetExpr, SetOperator, TableAlias, TableFactor, TableWithJoins, Top, Values,
};
pub use self::value::{DateTimeField, Value};

diff --git a/src/ast/query.rs b/src/ast/query.rs
index 3588257e7..433421985 100644
--- a/src/ast/query.rs
+++ b/src/ast/query.rs
@@ -24,8 +24,8 @@ pub struct Query {
    pub order_by: Vec<OrderByExpr>,
    /// `LIMIT { <N> | ALL }`
    pub limit: Option<Expr>,
-   /// `OFFSET <N> { ROW | ROWS }`
-   pub offset: Option<Expr>,
+   /// `OFFSET <N> [ { ROW | ROWS } ]`
+   pub offset: Option<Offset>,
    /// `FETCH { FIRST | NEXT } <N> [ PERCENT ] { ROW | ROWS } | { ONLY | WITH TIES }`
    pub fetch: Option<Fetch>,
}
@@ -43,7 +43,7 @@ impl fmt::Display for Query {
            write!(f, " LIMIT {}", limit)?;
        }
        if let Some(ref offset) = self.offset {
-           write!(f, " OFFSET {} ROWS", offset)?;
+           write!(f, " {}", offset)?;
        }
        if let Some(ref fetch) = self.fetch {
            write!(f, " {}", fetch)?;
        }
@@ -391,6 +391,35 @@ impl fmt::Display for OrderByExpr {
    }
}

+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
+pub struct Offset {
+    pub value: Expr,
+    pub rows: OffsetRows,
+}
+
+impl fmt::Display for Offset {
+    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
+        write!(f, "OFFSET {}{}", self.value, self.rows)
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
+pub enum OffsetRows {
+    None,
+    Row,
+    Rows,
+}
+
+impl fmt::Display for OffsetRows {
+    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
+        match self {
+            OffsetRows::None => Ok(()),
+            OffsetRows::Row => write!(f, " ROW"),
+            OffsetRows::Rows => write!(f, " ROWS"),
+        }
+    }
+}
+
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct Fetch {
    pub with_ties: bool,

diff --git a/src/parser.rs b/src/parser.rs
index cdaf8989d..3b61ad112 100644
--- a/src/parser.rs
+++ b/src/parser.rs
@@ -1970,10 +1970,16 @@ impl Parser {
    }

    /// Parse an OFFSET clause
-   pub fn parse_offset(&mut self) -> Result<Expr, ParserError> {
+   pub fn parse_offset(&mut self) -> Result<Offset, ParserError> {
        let value = Expr::Value(self.parse_number_value()?);
-       self.expect_one_of_keywords(&["ROW", "ROWS"])?;
-       Ok(value)
+       let rows = if self.parse_keyword("ROW") {
+           OffsetRows::Row
+       } else if self.parse_keyword("ROWS") {
+           OffsetRows::Rows
+       } else {
+           OffsetRows::None
+       };
+       Ok(Offset { value, rows })
    }

    /// Parse a FETCH clause
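[Illustration, not part of the patch: the three `OffsetRows` variants and the
SQL each one prints, using only the AST types added above; the values are
hypothetical:]

    use sqlparser::ast::{Expr, Offset, OffsetRows, Value};

    fn offset_variants() {
        let two = || Expr::Value(Value::Number("2".to_string()));
        // MySQL-style, no trailing keyword:
        assert_eq!(Offset { value: two(), rows: OffsetRows::None }.to_string(), "OFFSET 2");
        // The standard ROW/ROWS spellings survive a round trip unchanged:
        assert_eq!(Offset { value: two(), rows: OffsetRows::Row }.to_string(), "OFFSET 2 ROW");
        assert_eq!(Offset { value: two(), rows: OffsetRows::Rows }.to_string(), "OFFSET 2 ROWS");
    }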
diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs
index 939673dcd..fe4013fac 100644
--- a/tests/sqlparser_common.rs
+++ b/tests/sqlparser_common.rs
@@ -2265,34 +2265,52 @@ fn parse_invalid_subquery_without_parens() {

#[test]
fn parse_offset() {
+   let expect = Some(Offset {
+       value: Expr::Value(number("2")),
+       rows: OffsetRows::Rows,
+   });
    let ast = verified_query("SELECT foo FROM bar OFFSET 2 ROWS");
-   assert_eq!(ast.offset, Some(Expr::Value(number("2"))));
+   assert_eq!(ast.offset, expect);
    let ast = verified_query("SELECT foo FROM bar WHERE foo = 4 OFFSET 2 ROWS");
-   assert_eq!(ast.offset, Some(Expr::Value(number("2"))));
+   assert_eq!(ast.offset, expect);
    let ast = verified_query("SELECT foo FROM bar ORDER BY baz OFFSET 2 ROWS");
-   assert_eq!(ast.offset, Some(Expr::Value(number("2"))));
+   assert_eq!(ast.offset, expect);
    let ast = verified_query("SELECT foo FROM bar WHERE foo = 4 ORDER BY baz OFFSET 2 ROWS");
-   assert_eq!(ast.offset, Some(Expr::Value(number("2"))));
+   assert_eq!(ast.offset, expect);
    let ast = verified_query("SELECT foo FROM (SELECT * FROM bar OFFSET 2 ROWS) OFFSET 2 ROWS");
-   assert_eq!(ast.offset, Some(Expr::Value(number("2"))));
+   assert_eq!(ast.offset, expect);
    match ast.body {
        SetExpr::Select(s) => match only(s.from).relation {
            TableFactor::Derived { subquery, .. } => {
-               assert_eq!(subquery.offset, Some(Expr::Value(number("2"))));
+               assert_eq!(subquery.offset, expect);
            }
            _ => panic!("Test broke"),
        },
        _ => panic!("Test broke"),
    }
    let ast = verified_query("SELECT 'foo' OFFSET 0 ROWS");
-   assert_eq!(ast.offset, Some(Expr::Value(number("0"))));
-}
-
-#[test]
-fn parse_singular_row_offset() {
-   one_statement_parses_to(
-       "SELECT foo FROM bar OFFSET 1 ROW",
-       "SELECT foo FROM bar OFFSET 1 ROWS",
+   assert_eq!(
+       ast.offset,
+       Some(Offset {
+           value: Expr::Value(number("0")),
+           rows: OffsetRows::Rows,
+       })
+   );
+   let ast = verified_query("SELECT 'foo' OFFSET 1 ROW");
+   assert_eq!(
+       ast.offset,
+       Some(Offset {
+           value: Expr::Value(number("1")),
+           rows: OffsetRows::Row,
+       })
+   );
+   let ast = verified_query("SELECT 'foo' OFFSET 1");
+   assert_eq!(
+       ast.offset,
+       Some(Offset {
+           value: Expr::Value(number("1")),
+           rows: OffsetRows::None,
+       })
    );
}
@@ -2343,7 +2361,13 @@ fn parse_fetch() {
    let ast = verified_query(
        "SELECT foo FROM bar WHERE foo = 4 ORDER BY baz OFFSET 2 ROWS FETCH FIRST 2 ROWS ONLY",
    );
-   assert_eq!(ast.offset, Some(Expr::Value(number("2"))));
+   assert_eq!(
+       ast.offset,
+       Some(Offset {
+           value: Expr::Value(number("2")),
+           rows: OffsetRows::Rows,
+       })
+   );
    assert_eq!(ast.fetch, fetch_first_two_rows_only);
    let ast = verified_query(
        "SELECT foo FROM (SELECT * FROM bar FETCH FIRST 2 ROWS ONLY) FETCH FIRST 2 ROWS ONLY",
@@ -2359,12 +2383,24 @@ fn parse_fetch() {
        _ => panic!("Test broke"),
    }
    let ast = verified_query("SELECT foo FROM (SELECT * FROM bar OFFSET 2 ROWS FETCH FIRST 2 ROWS ONLY) OFFSET 2 ROWS FETCH FIRST 2 ROWS ONLY");
-   assert_eq!(ast.offset, Some(Expr::Value(number("2"))));
+   assert_eq!(
+       ast.offset,
+       Some(Offset {
+           value: Expr::Value(number("2")),
+           rows: OffsetRows::Rows,
+       })
+   );
    assert_eq!(ast.fetch, fetch_first_two_rows_only);
    match ast.body {
        SetExpr::Select(s) => match only(s.from).relation {
            TableFactor::Derived { subquery, .. } => {
-               assert_eq!(subquery.offset, Some(Expr::Value(number("2"))));
+               assert_eq!(
+                   subquery.offset,
+                   Some(Offset {
+                       value: Expr::Value(number("2")),
+                       rows: OffsetRows::Rows,
+                   })
+               );
                assert_eq!(subquery.fetch, fetch_first_two_rows_only);
            }
            _ => panic!("Test broke"),
From 06865113d74fe39451f0a4cee3c18f5675392e48 Mon Sep 17 00:00:00 2001
From: Nickolay Ponomarev
Date: Mon, 20 Apr 2020 05:43:57 +0300
Subject: [PATCH 008/122] Update comments (follow-up to PR #158)

---
 src/ast/query.rs | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/ast/query.rs b/src/ast/query.rs
index 433421985..a26ba2655 100644
--- a/src/ast/query.rs
+++ b/src/ast/query.rs
@@ -403,8 +403,10 @@ impl fmt::Display for Offset {
    }
}

+/// Stores the keyword after `OFFSET <number>`
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub enum OffsetRows {
+   /// Omitting ROW/ROWS is non-standard MySQL quirk.
    None,
    Row,
    Rows,

From 5aacc5ebcd5c1345cc7f2597ddfdfc5a926312e6 Mon Sep 17 00:00:00 2001
From: Alex Dukhno <5074607+alex-dukhno@users.noreply.github.com>
Date: Tue, 21 Apr 2020 16:28:02 +0300
Subject: [PATCH 009/122] Implement CREATE TABLE IF NOT EXISTS (#163)

A non-standard feature supported at least by Postgres
https://www.postgresql.org/docs/12/sql-createtable.html
---
 src/ast/mod.rs              |  5 +++-
 src/parser.rs               |  3 +++
 tests/sqlparser_common.rs   |  3 +++
 tests/sqlparser_postgres.rs | 52 +++++++++++++++++++++++++++++++++++++
 4 files changed, 62 insertions(+), 1 deletion(-)

diff --git a/src/ast/mod.rs b/src/ast/mod.rs
index 3ace38c02..98637e697 100644
--- a/src/ast/mod.rs
+++ b/src/ast/mod.rs
@@ -471,6 +471,7 @@ pub enum Statement {
        columns: Vec<ColumnDef>,
        constraints: Vec<TableConstraint>,
        with_options: Vec<SqlOption>,
+       if_not_exists: bool,
        external: bool,
        file_format: Option<FileFormat>,
        location: Option<String>,
@@ -623,14 +624,16 @@ impl fmt::Display for Statement {
                columns,
                constraints,
                with_options,
+               if_not_exists,
                external,
                file_format,
                location,
            } => {
                write!(
                    f,
-                   "CREATE {}TABLE {} ({}",
+                   "CREATE {}TABLE {}{} ({}",
                    if *external { "EXTERNAL " } else { "" },
+                   if *if_not_exists { "IF NOT EXISTS " } else { "" },
                    name,
                    display_comma_separated(columns)
                )?;

diff --git a/src/parser.rs b/src/parser.rs
index 3b61ad112..0939b7e39 100644
--- a/src/parser.rs
+++ b/src/parser.rs
@@ -880,6 +880,7 @@ impl Parser {
            columns,
            constraints,
            with_options: vec![],
+           if_not_exists: false,
            external: true,
            file_format: Some(file_format),
            location: Some(location),
@@ -932,6 +933,7 @@ impl Parser {
    }

    pub fn parse_create_table(&mut self) -> Result<Statement, ParserError> {
+       let if_not_exists = self.parse_keywords(vec!["IF", "NOT", "EXISTS"]);
        let table_name = self.parse_object_name()?;
        // parse optional column list (schema)
        let (columns, constraints) = self.parse_columns()?;
@@ -942,6 +944,7 @@ impl Parser {
            columns,
            constraints,
            with_options,
+           if_not_exists,
            external: false,
            file_format: None,
            location: None,

diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs
index fe4013fac..c62fc86d7 100644
--- a/tests/sqlparser_common.rs
+++ b/tests/sqlparser_common.rs
@@ -909,6 +909,7 @@ fn parse_create_table() {
            columns,
            constraints,
            with_options,
+           if_not_exists: false,
            external: false,
            file_format: None,
            location: None,
@@ -1045,6 +1046,7 @@ fn parse_create_external_table() {
            columns,
            constraints,
            with_options,
+           if_not_exists,
            external,
            file_format,
            location,
@@ -1086,6 +1088,7 @@ fn parse_create_external_table() {

            assert_eq!("/tmp/example.csv", location.unwrap());
            assert_eq!(with_options, vec![]);
+           assert!(!if_not_exists);
        }
        _ => unreachable!(),
    }

diff --git a/tests/sqlparser_postgres.rs b/tests/sqlparser_postgres.rs
index a903ced64..bd467dc74 100644
--- a/tests/sqlparser_postgres.rs
+++ b/tests/sqlparser_postgres.rs
@@ -39,6 +39,7 @@ fn parse_create_table_with_defaults() {
            columns,
            constraints,
            with_options,
+           if_not_exists: false,
            external: false,
            file_format: None,
            location: None,
@@ -225,6 +226,57 @@ fn parse_create_table_with_inherit() {
    pg().verified_stmt(sql);
}

+#[test]
+fn parse_create_table_if_not_exists() {
+    let sql = "CREATE TABLE IF NOT EXISTS uk_cities ()";
+    let ast =
+        pg_and_generic().one_statement_parses_to(sql, "CREATE TABLE IF NOT EXISTS uk_cities ()");
+    match ast {
+        Statement::CreateTable {
+            name,
+            columns: _columns,
+            constraints,
+            with_options,
+            if_not_exists: true,
+            external: false,
+            file_format: None,
+            location: None,
+        } => {
+            assert_eq!("uk_cities", name.to_string());
+            assert!(constraints.is_empty());
+            assert_eq!(with_options, vec![]);
+        }
+        _ => unreachable!(),
+    }
+}
+
+#[test]
+fn parse_bad_if_not_exists() {
+    let res = pg().parse_sql_statements("CREATE TABLE NOT EXISTS uk_cities ()");
+    assert_eq!(
+        ParserError::ParserError("Expected end of statement, found: EXISTS".to_string()),
+        res.unwrap_err()
+    );
+
+    let res = pg().parse_sql_statements("CREATE TABLE IF EXISTS uk_cities ()");
+    assert_eq!(
+        ParserError::ParserError("Expected end of statement, found: EXISTS".to_string()),
+        res.unwrap_err()
+    );
+
+    let res = pg().parse_sql_statements("CREATE TABLE IF uk_cities ()");
+    assert_eq!(
+        ParserError::ParserError("Expected end of statement, found: uk_cities".to_string()),
+        res.unwrap_err()
+    );
+
+    let res = pg().parse_sql_statements("CREATE TABLE IF NOT uk_cities ()");
+    assert_eq!(
+        ParserError::ParserError("Expected end of statement, found: NOT".to_string()),
+        res.unwrap_err()
+    );
+}
+
#[test]
fn parse_copy_example() {
    let sql = r#"COPY public.actor (actor_id, first_name, last_name, last_update, value) FROM stdin;
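[A hedged usage sketch of the new flag, again assuming `Parser::parse_sql`
takes an owned `String` in this era; the column list is an arbitrary example:]

    use sqlparser::ast::Statement;
    use sqlparser::dialect::PostgreSqlDialect;
    use sqlparser::parser::Parser;

    fn if_not_exists_flag() {
        let sql = "CREATE TABLE IF NOT EXISTS uk_cities (name VARCHAR(100))".to_string();
        let stmts = Parser::parse_sql(&PostgreSqlDialect {}, sql).unwrap();
        match &stmts[0] {
            // The three keywords are consumed as a unit by `parse_keywords`,
            // which is why `IF EXISTS` or `IF NOT` alone still fail to parse.
            Statement::CreateTable { if_not_exists, .. } => assert!(*if_not_exists),
            _ => unreachable!(),
        }
    }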
From 40853fe4120dca02f01cdc873b7b10ecd21d8ea6 Mon Sep 17 00:00:00 2001
From: Nickolay Ponomarev
Date: Sun, 10 May 2020 21:06:11 +0300
Subject: [PATCH 010/122] Fix a recently implemented clippy lint

https://rust-lang.github.io/rust-clippy/master/index.html#single_component_path_imports
"Import with single component use path such as `use cratename;` is not
necessary, and thus should be removed."
---
 examples/cli.rs | 2 --
 1 file changed, 2 deletions(-)

diff --git a/examples/cli.rs b/examples/cli.rs
index d0ba9a578..917629e43 100644
--- a/examples/cli.rs
+++ b/examples/cli.rs
@@ -12,8 +12,6 @@

#![warn(clippy::all)]

-use simple_logger;
-
///! A small command-line app to run the parser.
/// Run with `cargo run --example cli`
use std::fs;
From 327e6cd9f1751e65461e867ea5c58f185d1a5f19 Mon Sep 17 00:00:00 2001
From: Nickolay Ponomarev
Date: Sun, 10 May 2020 21:21:01 +0300
Subject: [PATCH 011/122] Report an error for unterminated string literals

...updated the TODOs regarding single-quoted literals parsing while at it.
---
 src/parser.rs             | 10 +++++++++
 src/tokenizer.rs          | 47 ++++++++++++++++++++++++++++++---------
 tests/sqlparser_common.rs |  2 +-
 3 files changed, 48 insertions(+), 11 deletions(-)

diff --git a/src/parser.rs b/src/parser.rs
index 0939b7e39..7c6a401d5 100644
--- a/src/parser.rs
+++ b/src/parser.rs
@@ -1324,6 +1324,16 @@ impl Parser {
            }
            // MSSQL supports single-quoted strings as aliases for columns
            // We accept them as table aliases too, although MSSQL does not.
+           //
+           // Note, that this conflicts with an obscure rule from the SQL
+           // standard, which we don't implement:
+           // https://crate.io/docs/sql-99/en/latest/chapters/07.html#character-string-literal-s
+           // "[Obscure Rule] SQL allows you to break a long <character
+           // string literal> up into two or more smaller <character string
+           // literal>s, split by a <separator> that includes a newline
+           // character. When it sees such a <literal>, your DBMS will
+           // ignore the <separator> and treat the multiple strings as
+           // a single <literal>."
            Some(Token::SingleQuotedString(ref s)) => Ok(Some(Ident::with_quote('\'', s.clone()))),
            not_an_ident => {
                if after_as {

diff --git a/src/tokenizer.rs b/src/tokenizer.rs
index 96c9535ea..86452a445 100644
--- a/src/tokenizer.rs
+++ b/src/tokenizer.rs
@@ -278,7 +278,7 @@ impl<'a> Tokenizer<'a> {
                match chars.peek() {
                    Some('\'') => {
                        // N'...' - a <national string literal>
-                       let s = self.tokenize_single_quoted_string(chars);
+                       let s = self.tokenize_single_quoted_string(chars)?;
                        Ok(Some(Token::NationalStringLiteral(s)))
                    }
                    _ => {
@@ -295,7 +295,7 @@ impl<'a> Tokenizer<'a> {
                match chars.peek() {
                    Some('\'') => {
                        // X'...' - a <hex string literal>
-                       let s = self.tokenize_single_quoted_string(chars);
+                       let s = self.tokenize_single_quoted_string(chars)?;
                        Ok(Some(Token::HexStringLiteral(s)))
                    }
                    _ => {
@@ -313,7 +313,7 @@ impl<'a> Tokenizer<'a> {
            }
            // string
            '\'' => {
-               let s = self.tokenize_single_quoted_string(chars);
+               let s = self.tokenize_single_quoted_string(chars)?;
                Ok(Some(Token::SingleQuotedString(s)))
            }
            // delimited (quoted) identifier
@@ -431,11 +431,10 @@ impl<'a> Tokenizer<'a> {
    }

    /// Read a single quoted string, starting with the opening quote.
-   fn tokenize_single_quoted_string(&self, chars: &mut Peekable<Chars<'_>>) -> String {
-       //TODO: handle escaped quotes in string
-       //TODO: handle newlines in string
-       //TODO: handle EOF before terminating quote
-       //TODO: handle 'string' 'string continuation'
+   fn tokenize_single_quoted_string(
+       &self,
+       chars: &mut Peekable<Chars<'_>>,
+   ) -> Result<String, TokenizerError> {
        let mut s = String::new();
        chars.next(); // consume the opening quote
        while let Some(&ch) = chars.peek() {

                        s.push('\'');
                        chars.next();
                    } else {
-                       break;
+                       return Ok(s);
                    }
                }
                _ => {

            }
        }
-       s
+       Err(TokenizerError(format!(
+           "Unterminated string literal at Line: {}, Col: {}",
+           self.line, self.col
+       )))
    }

    fn tokenize_multiline_comment(
@@ -640,6 +642,31 @@ mod tests {
        compare(expected, tokens);
    }

+   #[test]
+   fn tokenize_newline_in_string_literal() {
+       let sql = String::from("'foo\r\nbar\nbaz'");
+
+       let dialect = GenericDialect {};
+       let mut tokenizer = Tokenizer::new(&dialect, &sql);
+       let tokens = tokenizer.tokenize().unwrap();
+       let expected = vec![Token::SingleQuotedString("foo\r\nbar\nbaz".to_string())];
+       compare(expected, tokens);
+   }
+
+   #[test]
+   fn tokenize_unterminated_string_literal() {
+       let sql = String::from("select 'foo");
+
+       let dialect = GenericDialect {};
+       let mut tokenizer = Tokenizer::new(&dialect, &sql);
+       assert_eq!(
+           tokenizer.tokenize(),
+           Err(TokenizerError(
+               "Unterminated string literal at Line: 1, Col: 8".to_string()
+           ))
+       );
+   }
+
    #[test]
    fn tokenize_invalid_string_cols() {
        let sql = String::from("\n\nSELECT * FROM table\tمصطفىh");

diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs
index c62fc86d7..41ceeae54 100644
--- a/tests/sqlparser_common.rs
+++ b/tests/sqlparser_common.rs
@@ -1031,7 +1031,7 @@ fn parse_create_external_table() {
        name VARCHAR(100) NOT NULL,\
        lat DOUBLE NULL,\
        lng DOUBLE)\
-       STORED AS TEXTFILE LOCATION '/tmp/example.csv";
+       STORED AS TEXTFILE LOCATION '/tmp/example.csv'";
    let ast =
one_statement_parses_to( sql, "CREATE EXTERNAL TABLE uk_cities (\ From 7d60bfd8660056b696c387ca97d42797c585edb2 Mon Sep 17 00:00:00 2001 From: Nickolay Ponomarev Date: Sun, 10 May 2020 21:43:40 +0300 Subject: [PATCH 012/122] Update CHANGELOG.md --- CHANGELOG.md | 15 +++++++++++++-- 1 file changed, 13 insertions(+), 2 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 23b2fdde1..d552e942f 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -6,10 +6,21 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/), Given that the parser produces a typed AST, any changes to the AST will technically be breaking and thus will result in a `0.(N+1)` version. We document changes that break via addition as "Added". ## [Unreleased] -Nothing here yet! Check https://github.com/andygrove/sqlparser-rs/commits/master for undocumented changes. +Check https://github.com/andygrove/sqlparser-rs/commits/master for undocumented changes. +### Changed +- Change `Ident` (previously a simple `String`) to store the parsed (unquoted) `value` of the identifier and the `quote_style` separately (#143) - thanks @apparebit! +- Support Snowflake's `FROM (table_name)` (#155) - thanks @eyalleshem! + +### Added +- Support MSSQL `TOP () [ PERCENT ] [ WITH TIES ]` (#150) - thanks @alexkyllo! +- Support MySQL `LIMIT row_count OFFSET offset` (not followed by `ROW` or `ROWS`) and remember which variant was parsed (#158) - thanks @mjibson! +- Support PostgreSQL `CREATE TABLE IF NOT EXISTS table_name` (#163) - thanks @alex-dukhno! + +### Fixed +- Report an error for unterminated string literals (#165) -## [0.5.0] - 2019-10-10 +## [0.5.0] - 2019-10-10 ### Changed - Replace the `Value::Long(u64)` and `Value::Double(f64)` variants with `Value::Number(String)` to avoid losing precision when parsing decimal literals (#130) - thanks @benesch! From 8406a938d5a1c61722fe730ba8d7a3190bedd687 Mon Sep 17 00:00:00 2001 From: Nickolay Ponomarev Date: Tue, 26 May 2020 21:33:10 +0300 Subject: [PATCH 013/122] Port the changes made to travis configuration in #159 to GitHub workflows This should fix the build failures due to unavailable components, e.g. error: component 'rustfmt' for target 'x86_64-unknown-linux-gnu' is unavailable for download for channel nightly Sometimes not all components are available in any given nightly. 
---
 .github/workflows/rust.yml | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/.github/workflows/rust.yml b/.github/workflows/rust.yml
index 0f2507b23..06db11ebf 100644
--- a/.github/workflows/rust.yml
+++ b/.github/workflows/rust.yml
@@ -4,14 +4,13 @@ on: [push]

jobs:
  build:
-
    runs-on: ubuntu-latest

    steps:
    - uses: actions/checkout@v1
    - name: Setup Rust
      run: |
-       rustup toolchain install nightly && rustup component add --toolchain nightly rustfmt
+       rustup toolchain install nightly --profile default
        rustup toolchain install stable
        rustup override set stable
      # Clippy must be run first, as its lints are only triggered during

From 5ad578e3e5c7831de3636d130beb3376d7c56f9d Mon Sep 17 00:00:00 2001
From: mashuai
Date: Fri, 15 May 2020 21:55:25 +0800
Subject: [PATCH 014/122] add create index and drop index support

---
 src/ast/mod.rs            | 33 +++++++++++++++++++++++++++++++
 src/dialect/keywords.rs   |  3 ++-
 src/parser.rs             | 27 +++++++++++++++++++++++--
 tests/sqlparser_common.rs | 38 ++++++++++++++++++++++++++++++++++++++
 4 files changed, 98 insertions(+), 3 deletions(-)

diff --git a/src/ast/mod.rs b/src/ast/mod.rs
index 98637e697..e7ae0c731 100644
--- a/src/ast/mod.rs
+++ b/src/ast/mod.rs
@@ -476,6 +476,15 @@ pub enum Statement {
        file_format: Option<FileFormat>,
        location: Option<String>,
    },
+   /// CREATE INDEX
+   CreateIndex {
+       /// index name
+       name: ObjectName,
+       table_name: ObjectName,
+       columns: Vec<Ident>,
+       unique: bool,
+       if_not_exists: bool,
+   },
    /// ALTER TABLE
    AlterTable {
        /// Table name
@@ -655,6 +664,28 @@ impl fmt::Display for Statement {
                }
                Ok(())
            }
+           Statement::CreateIndex {
+               name,
+               table_name,
+               columns,
+               unique,
+               if_not_exists,
+           } => {
+               write!(
+                   f,
+                   "CREATE{}INDEX{}{} ON {}({}",
+                   if *unique { " UNIQUE " } else { " " },
+                   if *if_not_exists {
+                       " IF NOT EXISTS "
+                   } else {
+                       " "
+                   },
+                   name,
+                   table_name,
+                   display_separated(columns, ",")
+               )?;
+               write!(f, ");")
+           }
            Statement::AlterTable { name, operation } => {
                write!(f, "ALTER TABLE {} {}", name, operation)
            }
@@ -819,6 +850,7 @@ impl FromStr for FileFormat {
pub enum ObjectType {
    Table,
    View,
+   Index,
}

impl fmt::Display for ObjectType {
@@ -826,6 +858,7 @@ impl fmt::Display for ObjectType {
        f.write_str(match self {
            ObjectType::Table => "TABLE",
            ObjectType::View => "VIEW",
+           ObjectType::Index => "INDEX",
        })
    }
}

diff --git a/src/dialect/keywords.rs b/src/dialect/keywords.rs
index 9795f2af3..bf33f29c9 100644
--- a/src/dialect/keywords.rs
+++ b/src/dialect/keywords.rs
@@ -420,7 +420,8 @@ define_keywords!(
    WORK,
    YEAR,
    ZONE,
-   END_EXEC = "END-EXEC"
+   END_EXEC = "END-EXEC",
+   INDEX
);

diff --git a/src/parser.rs b/src/parser.rs
index 7c6a401d5..a7cb3ce4a 100644
--- a/src/parser.rs
+++ b/src/parser.rs
@@ -855,13 +855,17 @@ impl Parser {
    pub fn parse_create(&mut self) -> Result<Statement, ParserError> {
        if self.parse_keyword("TABLE") {
            self.parse_create_table()
+       } else if self.parse_keyword("INDEX") {
+           self.parse_create_index(false)
+       } else if self.parse_keywords(vec!["UNIQUE", "INDEX"]) {
+           self.parse_create_index(true)
        } else if self.parse_keyword("MATERIALIZED") || self.parse_keyword("VIEW") {
            self.prev_token();
            self.parse_create_view()
        } else if self.parse_keyword("EXTERNAL") {
            self.parse_create_external_table()
        } else {
-           self.expected("TABLE or VIEW after CREATE", self.peek_token())
+           self.expected("TABLE, VIEW or INDEX after CREATE", self.peek_token())
        }
    }
@@ -912,8 +916,10 @@ impl Parser {
            ObjectType::Table
        } else if self.parse_keyword("VIEW") {
            ObjectType::View
+       } else if self.parse_keyword("INDEX") {
+           ObjectType::Index
        } else {
-           return self.expected("TABLE or VIEW after DROP", self.peek_token());
+           return self.expected("TABLE, VIEW or INDEX after DROP", self.peek_token());
        };
        // Many dialects support the non standard `IF EXISTS` clause and allow
        // specifying multiple objects to delete in a single statement
@@ -932,6 +938,23 @@ impl Parser {
        })
    }

+   pub fn parse_create_index(&mut self, unique: bool) -> Result<Statement, ParserError> {
+       let if_not_exists = self.parse_keywords(vec!["IF", "NOT", "EXISTS"]);
+       let index_name = self.parse_object_name()?;
+       self.expect_keyword("ON")?;
+       let table_name = self.parse_object_name()?;
+       self.expect_token(&Token::LParen)?;
+       let columns = self.parse_comma_separated(Parser::parse_identifier)?;
+       self.expect_token(&Token::RParen)?;
+       Ok(Statement::CreateIndex {
+           name: index_name,
+           table_name,
+           columns,
+           unique,
+           if_not_exists,
+       })
+   }
+
    pub fn parse_create_table(&mut self) -> Result<Statement, ParserError> {
        let if_not_exists = self.parse_keywords(vec!["IF", "NOT", "EXISTS"]);
        let table_name = self.parse_object_name()?;

diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs
index 41ceeae54..147ebcd6a 100644
--- a/tests/sqlparser_common.rs
+++ b/tests/sqlparser_common.rs
@@ -2631,6 +2631,44 @@ fn ensure_multiple_dialects_are_tested() {
    let _ = parse_sql_statements("SELECT @foo");
}

+#[test]
+fn parse_create_index() {
+    let sql = "CREATE UNIQUE INDEX IF NOT EXISTS idx_name ON test(name,age);";
+    let ident_vec = vec![Ident::new("name"), Ident::new("age")];
+    match verified_stmt(sql) {
+        Statement::CreateIndex {
+            name,
+            table_name,
+            columns,
+            unique,
+            if_not_exists,
+        } => {
+            assert_eq!("idx_name", name.to_string());
+            assert_eq!("test", table_name.to_string());
+            assert_eq!(ident_vec, columns);
+            assert_eq!(true, unique);
+            assert_eq!(true, if_not_exists)
+        }
+        _ => unreachable!(),
+    }
+}
+
+#[test]
+fn parse_drop_index() {
+    let sql = "DROP INDEX idx_a";
+    match verified_stmt(sql) {
+        Statement::Drop {
+            names, object_type, ..
+        } => {
+            assert_eq!(
+                vec!["idx_a"],
+                names.iter().map(ToString::to_string).collect::<Vec<_>>()
+            );
+            assert_eq!(ObjectType::Index, object_type);
+        }
+        _ => unreachable!(),
+    }
+}
+
fn parse_sql_statements(sql: &str) -> Result<Vec<Statement>, ParserError> {
    all_dialects().parse_sql_statements(sql)
}
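[An illustrative sketch, not part of the patch, of how the new statement
surfaces in the AST, assuming the same `Parser::parse_sql` entry point as in
the earlier notes:]

    use sqlparser::ast::Statement;
    use sqlparser::dialect::GenericDialect;
    use sqlparser::parser::Parser;

    fn create_index_fields() {
        let sql = "CREATE UNIQUE INDEX IF NOT EXISTS idx_name ON test(name,age);".to_string();
        let stmts = Parser::parse_sql(&GenericDialect {}, sql).unwrap();
        match &stmts[0] {
            Statement::CreateIndex { unique, if_not_exists, columns, .. } => {
                // Both optional modifiers are captured as plain flags:
                assert!(*unique && *if_not_exists);
                assert_eq!(columns.len(), 2);
            }
            _ => unreachable!(),
        }
    }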
From 320d2f2d0515cc604978736ce00181ec49695eb4 Mon Sep 17 00:00:00 2001
From: Nickolay Ponomarev
Date: Wed, 27 May 2020 05:04:22 +0300
Subject: [PATCH 015/122] Update CHANGELOG.md and fix a last-minute review nit

---
 CHANGELOG.md            | 1 +
 src/dialect/keywords.rs | 4 ++--
 src/parser.rs           | 4 +---
 3 files changed, 4 insertions(+), 5 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index d552e942f..c65a68615 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -13,6 +13,7 @@ Check https://github.com/andygrove/sqlparser-rs/commits/master for undocumented
- Support Snowflake's `FROM (table_name)` (#155) - thanks @eyalleshem!

### Added
+- Support basic forms of `CREATE INDEX` and `DROP INDEX` (#167) - thanks @mashuai!
- Support MSSQL `TOP (<N>) [ PERCENT ] [ WITH TIES ]` (#150) - thanks @alexkyllo!
- Support MySQL `LIMIT row_count OFFSET offset` (not followed by `ROW` or `ROWS`) and remember which variant was parsed (#158) - thanks @mjibson!
- Support PostgreSQL `CREATE TABLE IF NOT EXISTS table_name` (#163) - thanks @alex-dukhno!
diff --git a/src/dialect/keywords.rs b/src/dialect/keywords.rs
index bf33f29c9..7ab86de2e 100644
--- a/src/dialect/keywords.rs
+++ b/src/dialect/keywords.rs
@@ -200,6 +200,7 @@ define_keywords!(
    IDENTITY,
    IF,
    IN,
+   INDEX,
    INDICATOR,
    INNER,
    INOUT,
@@ -420,8 +421,7 @@ define_keywords!(
    WORK,
    YEAR,
    ZONE,
-   END_EXEC = "END-EXEC",
-   INDEX
+   END_EXEC = "END-EXEC"
);

diff --git a/src/parser.rs b/src/parser.rs
index a7cb3ce4a..dc8e6b7ea 100644
--- a/src/parser.rs
+++ b/src/parser.rs
@@ -943,9 +943,7 @@ impl Parser {
        let index_name = self.parse_object_name()?;
        self.expect_keyword("ON")?;
        let table_name = self.parse_object_name()?;
-       self.expect_token(&Token::LParen)?;
-       let columns = self.parse_comma_separated(Parser::parse_identifier)?;
-       self.expect_token(&Token::RParen)?;
+       let columns = self.parse_parenthesized_column_list(Mandatory)?;
        Ok(Statement::CreateIndex {
            name: index_name,
            table_name,

From 98f97d09db13501fcbfa852dd5d67417568271f4 Mon Sep 17 00:00:00 2001
From: Christoph Müller
Date: Wed, 27 May 2020 17:24:23 +0200
Subject: [PATCH 016/122] Add support for "on delete cascade" column option (#170)

Specifically, `FOREIGN KEY REFERENCES <foreign_table> (<referred_columns>)`
can now be followed by `ON DELETE <referential_action>` and/or by
`ON UPDATE <referential_action>`.
---
 src/ast/ddl.rs            | 53 +++++++++++++++++++++++++++++++-------
 src/ast/mod.rs            |  3 ++-
 src/dialect/keywords.rs   |  1 +
 src/parser.rs             | 36 +++++++++++++++++++++++++-
 tests/sqlparser_common.rs | 49 ++++++++++++++++++++++++++++++++++--
 5 files changed, 131 insertions(+), 11 deletions(-)

diff --git a/src/ast/ddl.rs b/src/ast/ddl.rs
index 7333ad287..776927669 100644
--- a/src/ast/ddl.rs
+++ b/src/ast/ddl.rs
@@ -155,10 +155,15 @@ pub enum ColumnOption {
        is_primary: bool,
    },
    /// A referential integrity constraint (`[FOREIGN KEY REFERENCES
-   /// <foreign_table> (<referred_columns>)`).
+   /// <foreign_table> (<referred_columns>)
+   /// { [ON DELETE <referential_action>] [ON UPDATE <referential_action>] |
+   ///   [ON UPDATE <referential_action>] [ON DELETE <referential_action>]
+   /// }`).
    ForeignKey {
        foreign_table: ObjectName,
        referred_columns: Vec<Ident>,
+       on_delete: Option<ReferentialAction>,
+       on_update: Option<ReferentialAction>,
    },
    // `CHECK (<expr>)`
    Check(Expr),
@@ -177,12 +182,21 @@ impl fmt::Display for ColumnOption {
            ForeignKey {
                foreign_table,
                referred_columns,
-           } => write!(
-               f,
-               "REFERENCES {} ({})",
-               foreign_table,
-               display_comma_separated(referred_columns)
-           ),
+               on_delete,
+               on_update,
+           } => {
+               write!(f, "REFERENCES {}", foreign_table)?;
+               if !referred_columns.is_empty() {
+                   write!(f, " ({})", display_comma_separated(referred_columns))?;
+               }
+               if let Some(action) = on_delete {
+                   write!(f, " ON DELETE {}", action)?;
+               }
+               if let Some(action) = on_update {
+                   write!(f, " ON UPDATE {}", action)?;
+               }
+               Ok(())
+           }
            Check(expr) => write!(f, "CHECK ({})", expr),
        }
    }
@@ -200,3 +214,28 @@ fn display_constraint_name<'a>(name: &'a Option<Ident>) -> impl fmt::Display + 'a {
    }
    ConstraintName(name)
}

+/// `<referential_action> =
+/// { RESTRICT | CASCADE | SET NULL | NO ACTION | SET DEFAULT }`
+///
+/// Used in foreign key constraints in `ON UPDATE` and `ON DELETE` options.
+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
+pub enum ReferentialAction {
+    Restrict,
+    Cascade,
+    SetNull,
+    NoAction,
+    SetDefault,
+}
+
+impl fmt::Display for ReferentialAction {
+    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
+        f.write_str(match self {
+            ReferentialAction::Restrict => "RESTRICT",
+            ReferentialAction::Cascade => "CASCADE",
+            ReferentialAction::SetNull => "SET NULL",
+            ReferentialAction::NoAction => "NO ACTION",
+            ReferentialAction::SetDefault => "SET DEFAULT",
+        })
+    }
+}
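[For illustration only: the `Display` impl above maps each variant back to its
exact keyword spelling, so the round-trip is loss-free. A quick sketch, assumed
to run inside the crate:]

    use sqlparser::ast::ReferentialAction;

    fn referential_action_sql() {
        // Each variant serializes to the keyword sequence the parser consumed:
        assert_eq!(ReferentialAction::SetNull.to_string(), "SET NULL");
        assert_eq!(ReferentialAction::NoAction.to_string(), "NO ACTION");
        assert_eq!(ReferentialAction::Cascade.to_string(), "CASCADE");
    }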
diff --git a/src/ast/mod.rs b/src/ast/mod.rs
index e7ae0c731..bc5c5dafc 100644
--- a/src/ast/mod.rs
+++ b/src/ast/mod.rs
@@ -22,7 +22,8 @@ use std::fmt;

pub use self::data_type::DataType;
pub use self::ddl::{
-   AlterTableOperation, ColumnDef, ColumnOption, ColumnOptionDef, TableConstraint,
+   AlterTableOperation, ColumnDef, ColumnOption, ColumnOptionDef, ReferentialAction,
+   TableConstraint,
};
pub use self::operator::{BinaryOperator, UnaryOperator};

diff --git a/src/dialect/keywords.rs b/src/dialect/keywords.rs
index 7ab86de2e..4f39904b6 100644
--- a/src/dialect/keywords.rs
+++ b/src/dialect/keywords.rs
@@ -51,6 +51,7 @@ macro_rules! define_keywords {

define_keywords!(
    ABS,
+   ACTION,
    ADD,
    ASC,
    ALL,

diff --git a/src/parser.rs b/src/parser.rs
index dc8e6b7ea..5741167de 100644
--- a/src/parser.rs
+++ b/src/parser.rs
@@ -1038,10 +1038,25 @@ impl Parser {
            ColumnOption::Unique { is_primary: false }
        } else if self.parse_keyword("REFERENCES") {
            let foreign_table = self.parse_object_name()?;
-           let referred_columns = self.parse_parenthesized_column_list(Mandatory)?;
+           // PostgreSQL allows omitting the column list and
+           // uses the primary key column of the foreign table by default
+           let referred_columns = self.parse_parenthesized_column_list(Optional)?;
+           let mut on_delete = None;
+           let mut on_update = None;
+           loop {
+               if on_delete.is_none() && self.parse_keywords(vec!["ON", "DELETE"]) {
+                   on_delete = Some(self.parse_referential_action()?);
+               } else if on_update.is_none() && self.parse_keywords(vec!["ON", "UPDATE"]) {
+                   on_update = Some(self.parse_referential_action()?);
+               } else {
+                   break;
+               }
+           }
            ColumnOption::ForeignKey {
                foreign_table,
                referred_columns,
+               on_delete,
+               on_update,
            }
        } else if self.parse_keyword("CHECK") {
            self.expect_token(&Token::LParen)?;
@@ -1055,6 +1070,25 @@ impl Parser {
        Ok(ColumnOptionDef { name, option })
    }

+   pub fn parse_referential_action(&mut self) -> Result<ReferentialAction, ParserError> {
+       if self.parse_keyword("RESTRICT") {
+           Ok(ReferentialAction::Restrict)
+       } else if self.parse_keyword("CASCADE") {
+           Ok(ReferentialAction::Cascade)
+       } else if self.parse_keywords(vec!["SET", "NULL"]) {
+           Ok(ReferentialAction::SetNull)
+       } else if self.parse_keywords(vec!["NO", "ACTION"]) {
+           Ok(ReferentialAction::NoAction)
+       } else if self.parse_keywords(vec!["SET", "DEFAULT"]) {
+           Ok(ReferentialAction::SetDefault)
+       } else {
+           self.expected(
+               "one of RESTRICT, CASCADE, SET NULL, NO ACTION or SET DEFAULT",
+               self.peek_token(),
+           )
+       }
+   }
+
    pub fn parse_optional_table_constraint(
        &mut self,
    ) -> Result<Option<TableConstraint>, ParserError> {

diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs
index 147ebcd6a..47d7db053 100644
--- a/tests/sqlparser_common.rs
+++ b/tests/sqlparser_common.rs
@@ -893,7 +893,9 @@ fn parse_create_table() {
        lat DOUBLE NULL,\
        lng DOUBLE,
        constrained INT NULL CONSTRAINT pkey PRIMARY KEY NOT NULL UNIQUE CHECK (constrained > 0),
-       ref INT REFERENCES othertable (a, b))";
+       ref INT REFERENCES othertable (a, b),\
+       ref2 INT references othertable2 on delete cascade on update no
action\ + )"; let ast = one_statement_parses_to( sql, "CREATE TABLE uk_cities (\ @@ -901,7 +903,8 @@ fn parse_create_table() { lat double NULL, \ lng double, \ constrained int NULL CONSTRAINT pkey PRIMARY KEY NOT NULL UNIQUE CHECK (constrained > 0), \ - ref int REFERENCES othertable (a, b))", + ref int REFERENCES othertable (a, b), \ + ref2 int REFERENCES othertable2 ON DELETE CASCADE ON UPDATE NO ACTION)", ); match ast { Statement::CreateTable { @@ -978,8 +981,24 @@ fn parse_create_table() { option: ColumnOption::ForeignKey { foreign_table: ObjectName(vec!["othertable".into()]), referred_columns: vec!["a".into(), "b".into(),], + on_delete: None, + on_update: None, } }] + }, + ColumnDef { + name: "ref2".into(), + data_type: DataType::Int, + collation: None, + options: vec![ColumnOptionDef { + name: None, + option: ColumnOption::ForeignKey { + foreign_table: ObjectName(vec!["othertable2".into()]), + referred_columns: vec![], + on_delete: Some(ReferentialAction::Cascade), + on_update: Some(ReferentialAction::NoAction), + } + },] } ] ); @@ -996,6 +1015,32 @@ fn parse_create_table() { .contains("Expected column option, found: GARBAGE")); } +#[test] +fn parse_create_table_with_multiple_on_delete_fails() { + parse_sql_statements( + "\ + create table X (\ + y_id int references Y (id) \ + on delete cascade on update cascade on delete no action\ + )", + ) + .expect_err("should have failed"); +} + +#[test] +fn parse_create_table_with_on_delete_on_update_2in_any_order() -> Result<(), ParserError> { + let sql = |options: &str| -> String { + format!("create table X (y_id int references Y (id) {})", options) + }; + + parse_sql_statements(&sql("on update cascade on delete no action"))?; + parse_sql_statements(&sql("on delete cascade on update cascade"))?; + parse_sql_statements(&sql("on update no action"))?; + parse_sql_statements(&sql("on delete restrict"))?; + + Ok(()) +} + #[test] fn parse_create_table_with_options() { let sql = "CREATE TABLE t (c int) WITH (foo = 'bar', a = 123)"; From 8d5eaf95b30c9a6ac76970ba37aa2c207daf0ca5 Mon Sep 17 00:00:00 2001 From: Nickolay Ponomarev Date: Wed, 27 May 2020 19:41:31 +0300 Subject: [PATCH 017/122] Update CHANGELOG --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index c65a68615..81705b536 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -14,6 +14,7 @@ Check https://github.com/andygrove/sqlparser-rs/commits/master for undocumented ### Added - Support basic forms of `CREATE INDEX` and `DROP INDEX` (#167) - thanks @mashuai! +- Support `ON { UPDATE | DELETE } { RESTRICT | CASCADE | SET NULL | NO ACTION | SET DEFAULT }` in `FOREIGN KEY` constraints (#170) - thanks @c7hm4r! - Support MSSQL `TOP () [ PERCENT ] [ WITH TIES ]` (#150) - thanks @alexkyllo! - Support MySQL `LIMIT row_count OFFSET offset` (not followed by `ROW` or `ROWS`) and remember which variant was parsed (#158) - thanks @mjibson! - Support PostgreSQL `CREATE TABLE IF NOT EXISTS table_name` (#163) - thanks @alex-dukhno! From a2f4996bdd0ee67a00ba9a39046eb378ccc58b9a Mon Sep 17 00:00:00 2001 From: Nickolay Ponomarev Date: Tue, 26 May 2020 21:09:58 +0300 Subject: [PATCH 018/122] Update README to point to SQL:2016, instead of 2011 This was discussed in #125, but we forgot to update the README at the time. --- README.md | 12 +++++------- 1 file changed, 5 insertions(+), 7 deletions(-) diff --git a/README.md b/README.md index 7677f7983..1ff329c26 100644 --- a/README.md +++ b/README.md @@ -47,10 +47,8 @@ published regularly since. 
Most revisions have added significant new features to the language, and as a result no database claims to support the full breadth of features. This parser currently supports most of the SQL-92 syntax, plus some syntax from newer versions that have been explicitly requested, plus some MSSQL- -and PostgreSQL-specific syntax. Whenever possible, the [online SQL:2011 -grammar][sql-2011-grammar] is used to guide what syntax to accept. (We will -happily accept changes that conform to the SQL:2016 syntax as well, but that -edition's grammar is not yet available online.) +and PostgreSQL-specific syntax. Whenever possible, the [online SQL:2016 +grammar][sql-2016-grammar] is used to guide what syntax to accept. Unfortunately, stating anything more specific about compliance is difficult. There is no publicly available test suite that can assess compliance @@ -105,8 +103,8 @@ If you are unable to submit a patch, feel free to file an issue instead. Please try to include: * some representative examples of the syntax you wish to support or fix; - * the relevant bits of the [SQL grammar][sql-2011-grammar], if the syntax is - part of SQL:2011; and + * the relevant bits of the [SQL grammar][sql-2016-grammar], if the syntax is + part of SQL:2016; and * links to documentation for the feature for a few of the most popular databases that support it. @@ -123,5 +121,5 @@ resources. [DataFusion]: https://github.com/apache/arrow/tree/master/rust/datafusion [LocustDB]: https://github.com/cswinter/LocustDB [Pratt Parser]: https://tdop.github.io/ -[sql-2011-grammar]: https://jakewheat.github.io/sql-overview/sql-2011-foundation-grammar.html +[sql-2016-grammar]: https://jakewheat.github.io/sql-overview/sql-2016-foundation-grammar.html [sql-standard]: https://en.wikipedia.org/wiki/ISO/IEC_9075 \ No newline at end of file From 1cf9e5ecefc11bfc92dd66060f075c1270b21d30 Mon Sep 17 00:00:00 2001 From: Nickolay Ponomarev Date: Tue, 26 May 2020 21:14:13 +0300 Subject: [PATCH 019/122] Update README: we support bits and pieces from other dialects too --- README.md | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/README.md b/README.md index 1ff329c26..3b277a96b 100644 --- a/README.md +++ b/README.md @@ -46,9 +46,9 @@ SQL was first standardized in 1987, and revisions of the standard have been published regularly since. Most revisions have added significant new features to the language, and as a result no database claims to support the full breadth of features. This parser currently supports most of the SQL-92 syntax, plus some -syntax from newer versions that have been explicitly requested, plus some MSSQL- -and PostgreSQL-specific syntax. Whenever possible, the [online SQL:2016 -grammar][sql-2016-grammar] is used to guide what syntax to accept. +syntax from newer versions that have been explicitly requested, plus some MSSQL, +PostgreSQL, and other dialect-specific syntax. Whenever possible, the [online +SQL:2016 grammar][sql-2016-grammar] is used to guide what syntax to accept. Unfortunately, stating anything more specific about compliance is difficult. 
There is no publicly available test suite that can assess compliance From 91f769e46028c22e3d2f9dc17022d341df759b01 Mon Sep 17 00:00:00 2001 From: Alex Dukhno Date: Thu, 28 May 2020 19:50:16 +0300 Subject: [PATCH 020/122] added create and drop schema --- src/ast/mod.rs | 5 +++++ src/dialect/keywords.rs | 1 + src/parser.rs | 16 ++++++++++++++-- tests/sqlparser_common.rs | 22 ++++++++++++++++++++++ 4 files changed, 42 insertions(+), 2 deletions(-) diff --git a/src/ast/mod.rs b/src/ast/mod.rs index bc5c5dafc..a867abcf9 100644 --- a/src/ast/mod.rs +++ b/src/ast/mod.rs @@ -535,6 +535,8 @@ pub enum Statement { Commit { chain: bool }, /// `ROLLBACK [ TRANSACTION | WORK ] [ AND [ NO ] CHAIN ]` Rollback { chain: bool }, + /// CREATE SCHEMA + CreateSchema { schema_name: ObjectName }, } impl fmt::Display for Statement { @@ -754,6 +756,7 @@ impl fmt::Display for Statement { Statement::Rollback { chain } => { write!(f, "ROLLBACK{}", if *chain { " AND CHAIN" } else { "" },) } + Statement::CreateSchema { schema_name } => write!(f, "CREATE SCHEMA {}", schema_name), } } } @@ -852,6 +855,7 @@ pub enum ObjectType { Table, View, Index, + Schema, } impl fmt::Display for ObjectType { @@ -860,6 +864,7 @@ impl fmt::Display for ObjectType { ObjectType::Table => "TABLE", ObjectType::View => "VIEW", ObjectType::Index => "INDEX", + ObjectType::Schema => "SCHEMA", }) } } diff --git a/src/dialect/keywords.rs b/src/dialect/keywords.rs index 4f39904b6..b8f8817f5 100644 --- a/src/dialect/keywords.rs +++ b/src/dialect/keywords.rs @@ -330,6 +330,7 @@ define_keywords!( ROW_NUMBER, ROWS, SAVEPOINT, + SCHEMA, SCOPE, SCROLL, SEARCH, diff --git a/src/parser.rs b/src/parser.rs index 5741167de..d235eb169 100644 --- a/src/parser.rs +++ b/src/parser.rs @@ -864,11 +864,21 @@ impl Parser { self.parse_create_view() } else if self.parse_keyword("EXTERNAL") { self.parse_create_external_table() + } else if self.parse_keyword("SCHEMA") { + self.parse_create_schema() } else { - self.expected("TABLE, VIEW or INDEX after CREATE", self.peek_token()) + self.expected( + "TABLE, VIEW, INDEX or SCHEMA after CREATE", + self.peek_token(), + ) } } + pub fn parse_create_schema(&mut self) -> Result { + let schema_name = self.parse_object_name()?; + Ok(Statement::CreateSchema { schema_name }) + } + pub fn parse_create_external_table(&mut self) -> Result { self.expect_keyword("TABLE")?; let table_name = self.parse_object_name()?; @@ -918,8 +928,10 @@ impl Parser { ObjectType::View } else if self.parse_keyword("INDEX") { ObjectType::Index + } else if self.parse_keyword("SCHEMA") { + ObjectType::Schema } else { - return self.expected("TABLE, VIEW or INDEX after DROP", self.peek_token()); + return self.expected("TABLE, VIEW, INDEX or SCHEMA after DROP", self.peek_token()); }; // Many dialects support the non standard `IF EXISTS` clause and allow // specifying multiple objects to delete in a single statement diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs index 47d7db053..7272e35ac 100644 --- a/tests/sqlparser_common.rs +++ b/tests/sqlparser_common.rs @@ -1027,6 +1027,28 @@ fn parse_create_table_with_multiple_on_delete_fails() { .expect_err("should have failed"); } +#[test] +fn parse_create_schema() { + let sql = "CREATE SCHEMA X"; + + match verified_stmt(sql) { + Statement::CreateSchema { schema_name } => { + assert_eq!(schema_name.to_string(), "X".to_owned()) + } + _ => unreachable!(), + } +} + +#[test] +fn parse_drop_schema() { + let sql = "DROP SCHEMA X"; + + match verified_stmt(sql) { + Statement::Drop { object_type, .. 
} => assert_eq!(object_type, ObjectType::Schema), + _ => unreachable!(), + } +} + #[test] fn parse_create_table_with_on_delete_on_update_2in_any_order() -> Result<(), ParserError> { let sql = |options: &str| -> String { From 418b9631ce9c24cf9bb26cf7dd9e42edd29de985 Mon Sep 17 00:00:00 2001 From: QP Hou Date: Sat, 30 May 2020 07:05:15 -0700 Subject: [PATCH 021/122] add nulls first/last support to order by expression (#176) Following `` from the standard https://jakewheat.github.io/sql-overview/sql-2016-foundation-grammar.html#_10_10_sort_specification_list --- CHANGELOG.md | 6 ++++-- src/ast/query.rs | 18 ++++++++++++++---- src/dialect/keywords.rs | 2 ++ src/parser.rs | 15 ++++++++++++++- tests/sqlparser_common.rs | 31 ++++++++++++++++++++++++++++++- 5 files changed, 64 insertions(+), 8 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 81705b536..d39c76cdb 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -13,11 +13,13 @@ Check https://github.com/andygrove/sqlparser-rs/commits/master for undocumented - Support Snowflake's `FROM (table_name)` (#155) - thanks @eyalleshem! ### Added -- Support basic forms of `CREATE INDEX` and `DROP INDEX` (#167) - thanks @mashuai! -- Support `ON { UPDATE | DELETE } { RESTRICT | CASCADE | SET NULL | NO ACTION | SET DEFAULT }` in `FOREIGN KEY` constraints (#170) - thanks @c7hm4r! - Support MSSQL `TOP () [ PERCENT ] [ WITH TIES ]` (#150) - thanks @alexkyllo! - Support MySQL `LIMIT row_count OFFSET offset` (not followed by `ROW` or `ROWS`) and remember which variant was parsed (#158) - thanks @mjibson! - Support PostgreSQL `CREATE TABLE IF NOT EXISTS table_name` (#163) - thanks @alex-dukhno! +- Support basic forms of `CREATE INDEX` and `DROP INDEX` (#167) - thanks @mashuai! +- Support `ON { UPDATE | DELETE } { RESTRICT | CASCADE | SET NULL | NO ACTION | SET DEFAULT }` in `FOREIGN KEY` constraints (#170) - thanks @c7hm4r! +- Support basic forms of `CREATE SCHEMA` and `DROP SCHEMA` (#173) - thanks @alex-dukhno! +- Support `NULLS FIRST`/`LAST` in `ORDER BY` expressions (#176) - thanks @houqp! 
### Fixed - Report an error for unterminated string literals (#165) diff --git a/src/ast/query.rs b/src/ast/query.rs index a26ba2655..a5918f1a3 100644 --- a/src/ast/query.rs +++ b/src/ast/query.rs @@ -374,20 +374,30 @@ pub enum JoinConstraint { Natural, } -/// SQL ORDER BY expression +/// An `ORDER BY` expression #[derive(Debug, Clone, PartialEq, Eq, Hash)] pub struct OrderByExpr { pub expr: Expr, + /// Optional `ASC` or `DESC` pub asc: Option, + /// Optional `NULLS FIRST` or `NULLS LAST` + pub nulls_first: Option, } impl fmt::Display for OrderByExpr { fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + write!(f, "{}", self.expr)?; match self.asc { - Some(true) => write!(f, "{} ASC", self.expr), - Some(false) => write!(f, "{} DESC", self.expr), - None => write!(f, "{}", self.expr), + Some(true) => write!(f, " ASC")?, + Some(false) => write!(f, " DESC")?, + None => (), } + match self.nulls_first { + Some(true) => write!(f, " NULLS FIRST")?, + Some(false) => write!(f, " NULLS LAST")?, + None => (), + } + Ok(()) } } diff --git a/src/dialect/keywords.rs b/src/dialect/keywords.rs index b8f8817f5..a01871c6e 100644 --- a/src/dialect/keywords.rs +++ b/src/dialect/keywords.rs @@ -220,6 +220,7 @@ define_keywords!( LAG, LANGUAGE, LARGE, + LAST, LAST_VALUE, LATERAL, LEAD, @@ -262,6 +263,7 @@ define_keywords!( NTILE, NULL, NULLIF, + NULLS, NUMERIC, OBJECT, OCTET_LENGTH, diff --git a/src/parser.rs b/src/parser.rs index d235eb169..608ac4736 100644 --- a/src/parser.rs +++ b/src/parser.rs @@ -2015,7 +2015,20 @@ impl Parser { } else { None }; - Ok(OrderByExpr { expr, asc }) + + let nulls_first = if self.parse_keywords(vec!["NULLS", "FIRST"]) { + Some(true) + } else if self.parse_keywords(vec!["NULLS", "LAST"]) { + Some(false) + } else { + None + }; + + Ok(OrderByExpr { + expr, + asc, + nulls_first, + }) } /// Parse a TOP clause, MSSQL equivalent of LIMIT, diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs index 7272e35ac..c87fcf3a2 100644 --- a/tests/sqlparser_common.rs +++ b/tests/sqlparser_common.rs @@ -746,14 +746,17 @@ fn parse_select_order_by() { OrderByExpr { expr: Expr::Identifier(Ident::new("lname")), asc: Some(true), + nulls_first: None, }, OrderByExpr { expr: Expr::Identifier(Ident::new("fname")), asc: Some(false), + nulls_first: None, }, OrderByExpr { expr: Expr::Identifier(Ident::new("id")), asc: None, + nulls_first: None, }, ], select.order_by @@ -775,10 +778,35 @@ fn parse_select_order_by_limit() { OrderByExpr { expr: Expr::Identifier(Ident::new("lname")), asc: Some(true), + nulls_first: None, }, OrderByExpr { expr: Expr::Identifier(Ident::new("fname")), asc: Some(false), + nulls_first: None, + }, + ], + select.order_by + ); + assert_eq!(Some(Expr::Value(number("2"))), select.limit); +} + +#[test] +fn parse_select_order_by_nulls_order() { + let sql = "SELECT id, fname, lname FROM customer WHERE id < 5 \ + ORDER BY lname ASC NULLS FIRST, fname DESC NULLS LAST LIMIT 2"; + let select = verified_query(sql); + assert_eq!( + vec![ + OrderByExpr { + expr: Expr::Identifier(Ident::new("lname")), + asc: Some(true), + nulls_first: Some(true), + }, + OrderByExpr { + expr: Expr::Identifier(Ident::new("fname")), + asc: Some(false), + nulls_first: Some(false), }, ], select.order_by @@ -1251,7 +1279,8 @@ fn parse_window_functions() { partition_by: vec![], order_by: vec![OrderByExpr { expr: Expr::Identifier(Ident::new("dt")), - asc: Some(false) + asc: Some(false), + nulls_first: None, }], window_frame: None, }), From 5f3c1bda0133348a0b60f18c88a0d48b9400dcfe Mon Sep 17 00:00:00 2001 From: 
Max Countryman Date: Sat, 30 May 2020 08:50:17 -0700 Subject: [PATCH 022/122] Provide LISTAGG implementation (#174) This patch provides an initial implemenation of LISTAGG[1]. Notably this implemenation deviates from ANSI SQL by allowing both WITHIN GROUP and the delimiter to be optional. We do so because Redshift SQL works this way and this approach is ultimately more flexible. Fixes #169. [1] https://modern-sql.com/feature/listagg --- CHANGELOG.md | 1 + src/ast/mod.rs | 74 ++++++++++++++++++++++++++++++++ src/dialect/keywords.rs | 3 ++ src/parser.rs | 88 +++++++++++++++++++++++++++++++++------ tests/sqlparser_common.rs | 58 ++++++++++++++++++++++++-- 5 files changed, 207 insertions(+), 17 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index d39c76cdb..60c25da18 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -20,6 +20,7 @@ Check https://github.com/andygrove/sqlparser-rs/commits/master for undocumented - Support `ON { UPDATE | DELETE } { RESTRICT | CASCADE | SET NULL | NO ACTION | SET DEFAULT }` in `FOREIGN KEY` constraints (#170) - thanks @c7hm4r! - Support basic forms of `CREATE SCHEMA` and `DROP SCHEMA` (#173) - thanks @alex-dukhno! - Support `NULLS FIRST`/`LAST` in `ORDER BY` expressions (#176) - thanks @houqp! +- Support `LISTAGG()` (#174) - thanks @maxcountryman! ### Fixed - Report an error for unterminated string literals (#165) diff --git a/src/ast/mod.rs b/src/ast/mod.rs index a867abcf9..2dbf42b29 100644 --- a/src/ast/mod.rs +++ b/src/ast/mod.rs @@ -224,6 +224,8 @@ pub enum Expr { /// A parenthesized subquery `(SELECT ...)`, used in expression like /// `SELECT (subquery) AS x` or `WHERE (subquery) = x` Subquery(Box), + /// The `LISTAGG` function `SELECT LISTAGG(...) WITHIN GROUP (ORDER BY ...)` + ListAgg(ListAgg), } impl fmt::Display for Expr { @@ -299,6 +301,7 @@ impl fmt::Display for Expr { } Expr::Exists(s) => write!(f, "EXISTS ({})", s), Expr::Subquery(s) => write!(f, "({})", s), + Expr::ListAgg(listagg) => write!(f, "{}", listagg), } } } @@ -850,6 +853,77 @@ impl FromStr for FileFormat { } } +/// A `LISTAGG` invocation `LISTAGG( [ DISTINCT ] [, ] [ON OVERFLOW ] ) ) +/// [ WITHIN GROUP (ORDER BY [, ...] 
) ]` +#[derive(Debug, Clone, PartialEq, Eq, Hash)] +pub struct ListAgg { + pub distinct: bool, + pub expr: Box, + pub separator: Option>, + pub on_overflow: Option, + pub within_group: Vec, +} + +impl fmt::Display for ListAgg { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + write!( + f, + "LISTAGG({}{}", + if self.distinct { "DISTINCT " } else { "" }, + self.expr + )?; + if let Some(separator) = &self.separator { + write!(f, ", {}", separator)?; + } + if let Some(on_overflow) = &self.on_overflow { + write!(f, "{}", on_overflow)?; + } + write!(f, ")")?; + if !self.within_group.is_empty() { + write!( + f, + " WITHIN GROUP (ORDER BY {})", + display_comma_separated(&self.within_group) + )?; + } + Ok(()) + } +} + +/// The `ON OVERFLOW` clause of a LISTAGG invocation +#[derive(Debug, Clone, PartialEq, Eq, Hash)] +pub enum ListAggOnOverflow { + /// `ON OVERFLOW ERROR` + Error, + + /// `ON OVERFLOW TRUNCATE [ ] WITH[OUT] COUNT` + Truncate { + filler: Option>, + with_count: bool, + }, +} + +impl fmt::Display for ListAggOnOverflow { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + write!(f, " ON OVERFLOW")?; + match self { + ListAggOnOverflow::Error => write!(f, " ERROR"), + ListAggOnOverflow::Truncate { filler, with_count } => { + write!(f, " TRUNCATE")?; + if let Some(filler) = filler { + write!(f, " {}", filler)?; + } + if *with_count { + write!(f, " WITH")?; + } else { + write!(f, " WITHOUT")?; + } + write!(f, " COUNT") + } + } + } +} + #[derive(Debug, Clone, PartialEq, Eq, Hash)] pub enum ObjectType { Table, diff --git a/src/dialect/keywords.rs b/src/dialect/keywords.rs index a01871c6e..ee59a1c92 100644 --- a/src/dialect/keywords.rs +++ b/src/dialect/keywords.rs @@ -161,6 +161,7 @@ define_keywords!( END_FRAME, END_PARTITION, EQUALS, + ERROR, ESCAPE, EVERY, EXCEPT, @@ -230,6 +231,7 @@ define_keywords!( LIKE, LIKE_REGEX, LIMIT, + LISTAGG, LN, LOCAL, LOCALTIME, @@ -279,6 +281,7 @@ define_keywords!( OUT, OUTER, OVER, + OVERFLOW, OVERLAPS, OVERLAY, PARAMETER, diff --git a/src/parser.rs b/src/parser.rs index 608ac4736..c0345736f 100644 --- a/src/parser.rs +++ b/src/parser.rs @@ -191,6 +191,7 @@ impl Parser { "EXISTS" => self.parse_exists_expr(), "EXTRACT" => self.parse_extract_expr(), "INTERVAL" => self.parse_literal_interval(), + "LISTAGG" => self.parse_listagg_expr(), "NOT" => Ok(Expr::UnaryOp { op: UnaryOperator::Not, expr: Box::new(self.parse_subexpr(Self::UNARY_NOT_PREC)?), @@ -272,14 +273,7 @@ impl Parser { pub fn parse_function(&mut self, name: ObjectName) -> Result { self.expect_token(&Token::LParen)?; - let all = self.parse_keyword("ALL"); - let distinct = self.parse_keyword("DISTINCT"); - if all && distinct { - return parser_err!(format!( - "Cannot specify both ALL and DISTINCT in function: {}", - name.to_string(), - )); - } + let distinct = self.parse_all_or_distinct()?; let args = self.parse_optional_args()?; let over = if self.parse_keyword("OVER") { // TBD: support window names (`OVER mywin`) in place of inline specification @@ -423,6 +417,66 @@ impl Parser { }) } + /// Parse a SQL LISTAGG expression, e.g. `LISTAGG(...) WITHIN GROUP (ORDER BY ...)`. + pub fn parse_listagg_expr(&mut self) -> Result { + self.expect_token(&Token::LParen)?; + let distinct = self.parse_all_or_distinct()?; + let expr = Box::new(self.parse_expr()?); + // While ANSI SQL would would require the separator, Redshift makes this optional. Here we + // choose to make the separator optional as this provides the more general implementation. 
+ let separator = if self.consume_token(&Token::Comma) { + Some(Box::new(self.parse_expr()?)) + } else { + None + }; + let on_overflow = if self.parse_keywords(vec!["ON", "OVERFLOW"]) { + if self.parse_keyword("ERROR") { + Some(ListAggOnOverflow::Error) + } else { + self.expect_keyword("TRUNCATE")?; + let filler = match self.peek_token() { + Some(Token::Word(kw)) if kw.keyword == "WITH" || kw.keyword == "WITHOUT" => { + None + } + Some(Token::SingleQuotedString(_)) + | Some(Token::NationalStringLiteral(_)) + | Some(Token::HexStringLiteral(_)) => Some(Box::new(self.parse_expr()?)), + _ => self.expected( + "either filler, WITH, or WITHOUT in LISTAGG", + self.peek_token(), + )?, + }; + let with_count = self.parse_keyword("WITH"); + if !with_count && !self.parse_keyword("WITHOUT") { + self.expected("either WITH or WITHOUT in LISTAGG", self.peek_token())?; + } + self.expect_keyword("COUNT")?; + Some(ListAggOnOverflow::Truncate { filler, with_count }) + } + } else { + None + }; + self.expect_token(&Token::RParen)?; + // Once again ANSI SQL requires WITHIN GROUP, but Redshift does not. Again we choose the + // more general implementation. + let within_group = if self.parse_keywords(vec!["WITHIN", "GROUP"]) { + self.expect_token(&Token::LParen)?; + self.expect_keywords(&["ORDER", "BY"])?; + let order_by_expr = self.parse_comma_separated(Parser::parse_order_by_expr)?; + self.expect_token(&Token::RParen)?; + order_by_expr + } else { + vec![] + }; + Ok(Expr::ListAgg(ListAgg { + distinct, + expr, + separator, + on_overflow, + within_group, + })) + } + // This function parses date/time fields for both the EXTRACT function-like // operator and interval qualifiers. EXTRACT supports a wider set of // date/time fields than interval qualifiers, so this function may need to @@ -851,6 +905,18 @@ impl Parser { Ok(values) } + /// Parse either `ALL` or `DISTINCT`. Returns `true` if `DISTINCT` is parsed and results in a + /// `ParserError` if both `ALL` and `DISTINCT` are fround. + pub fn parse_all_or_distinct(&mut self) -> Result { + let all = self.parse_keyword("ALL"); + let distinct = self.parse_keyword("DISTINCT"); + if all && distinct { + return parser_err!("Cannot specify both ALL and DISTINCT".to_string()); + } else { + Ok(distinct) + } + } + /// Parse a SQL CREATE statement pub fn parse_create(&mut self) -> Result { if self.parse_keyword("TABLE") { @@ -1635,11 +1701,7 @@ impl Parser { /// Parse a restricted `SELECT` statement (no CTEs / `UNION` / `ORDER BY`), /// assuming the initial `SELECT` was already consumed pub fn parse_select(&mut self) -> Result { - let all = self.parse_keyword("ALL"); - let distinct = self.parse_keyword("DISTINCT"); - if all && distinct { - return parser_err!("Cannot specify both ALL and DISTINCT in SELECT"); - } + let distinct = self.parse_all_or_distinct()?; let top = if self.parse_keyword("TOP") { Some(self.parse_top()?) 
diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs index c87fcf3a2..257b48230 100644 --- a/tests/sqlparser_common.rs +++ b/tests/sqlparser_common.rs @@ -244,7 +244,7 @@ fn parse_select_all() { fn parse_select_all_distinct() { let result = parse_sql_statements("SELECT ALL DISTINCT name FROM customer"); assert_eq!( - ParserError::ParserError("Cannot specify both ALL and DISTINCT in SELECT".to_string()), + ParserError::ParserError("Cannot specify both ALL and DISTINCT".to_string()), result.unwrap_err(), ); } @@ -357,9 +357,7 @@ fn parse_select_count_distinct() { let sql = "SELECT COUNT(ALL DISTINCT + x) FROM customer"; let res = parse_sql_statements(sql); assert_eq!( - ParserError::ParserError( - "Cannot specify both ALL and DISTINCT in function: COUNT".to_string() - ), + ParserError::ParserError("Cannot specify both ALL and DISTINCT".to_string()), res.unwrap_err() ); } @@ -914,6 +912,58 @@ fn parse_extract() { ); } +#[test] +fn parse_listagg() { + let sql = "SELECT LISTAGG(DISTINCT dateid, ', ' ON OVERFLOW TRUNCATE '%' WITHOUT COUNT) \ + WITHIN GROUP (ORDER BY id, username)"; + let select = verified_only_select(sql); + + verified_stmt("SELECT LISTAGG(sellerid) WITHIN GROUP (ORDER BY dateid)"); + verified_stmt("SELECT LISTAGG(dateid)"); + verified_stmt("SELECT LISTAGG(DISTINCT dateid)"); + verified_stmt("SELECT LISTAGG(dateid ON OVERFLOW ERROR)"); + verified_stmt("SELECT LISTAGG(dateid ON OVERFLOW TRUNCATE N'...' WITH COUNT)"); + verified_stmt("SELECT LISTAGG(dateid ON OVERFLOW TRUNCATE X'deadbeef' WITH COUNT)"); + + let expr = Box::new(Expr::Identifier(Ident::new("dateid"))); + let on_overflow = Some(ListAggOnOverflow::Truncate { + filler: Some(Box::new(Expr::Value(Value::SingleQuotedString( + "%".to_string(), + )))), + with_count: false, + }); + let within_group = vec![ + OrderByExpr { + expr: Expr::Identifier(Ident { + value: "id".to_string(), + quote_style: None, + }), + asc: None, + nulls_first: None, + }, + OrderByExpr { + expr: Expr::Identifier(Ident { + value: "username".to_string(), + quote_style: None, + }), + asc: None, + nulls_first: None, + }, + ]; + assert_eq!( + &Expr::ListAgg(ListAgg { + distinct: true, + expr, + separator: Some(Box::new(Expr::Value(Value::SingleQuotedString( + ", ".to_string() + )))), + on_overflow, + within_group + }), + expr_from_projection(only(&select.projection)) + ); +} + #[test] fn parse_create_table() { let sql = "CREATE TABLE uk_cities (\ From 00dc490f72aed72a4c92d367280197a1f0a98a9d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Dani=C3=ABl=20Heres?= Date: Tue, 2 Jun 2020 20:24:30 +0200 Subject: [PATCH 023/122] Support the string concat operator (#178) The selected precedence is based on BigQuery documentation, where it is equal to `*` and `/`: https://cloud.google.com/bigquery/docs/reference/standard-sql/operators --- src/ast/operator.rs | 2 ++ src/parser.rs | 3 ++- src/tokenizer.rs | 33 +++++++++++++++++++++++++++++++++ tests/sqlparser_common.rs | 15 +++++++++++++++ 4 files changed, 52 insertions(+), 1 deletion(-) diff --git a/src/ast/operator.rs b/src/ast/operator.rs index f2970482c..2d75c46fa 100644 --- a/src/ast/operator.rs +++ b/src/ast/operator.rs @@ -38,6 +38,7 @@ pub enum BinaryOperator { Multiply, Divide, Modulus, + StringConcat, Gt, Lt, GtEq, @@ -58,6 +59,7 @@ impl fmt::Display for BinaryOperator { BinaryOperator::Multiply => "*", BinaryOperator::Divide => "/", BinaryOperator::Modulus => "%", + BinaryOperator::StringConcat => "||", BinaryOperator::Gt => ">", BinaryOperator::Lt => "<", BinaryOperator::GtEq => ">=", diff --git 
a/src/parser.rs b/src/parser.rs index c0345736f..00dd24948 100644 --- a/src/parser.rs +++ b/src/parser.rs @@ -577,6 +577,7 @@ impl Parser { Token::Minus => Some(BinaryOperator::Minus), Token::Mult => Some(BinaryOperator::Multiply), Token::Mod => Some(BinaryOperator::Modulus), + Token::StringConcat => Some(BinaryOperator::StringConcat), Token::Div => Some(BinaryOperator::Divide), Token::Word(ref k) => match k.keyword.as_ref() { "AND" => Some(BinaryOperator::And), @@ -708,7 +709,7 @@ impl Parser { Ok(20) } Token::Plus | Token::Minus => Ok(Self::PLUS_MINUS_PREC), - Token::Mult | Token::Div | Token::Mod => Ok(40), + Token::Mult | Token::Div | Token::Mod | Token::StringConcat => Ok(40), Token::DoubleColon => Ok(50), _ => Ok(0), } diff --git a/src/tokenizer.rs b/src/tokenizer.rs index 86452a445..f3504ffb6 100644 --- a/src/tokenizer.rs +++ b/src/tokenizer.rs @@ -64,6 +64,8 @@ pub enum Token { Div, /// Modulo Operator `%` Mod, + /// String concatenation `||` + StringConcat, /// Left parenthesis `(` LParen, /// Right parenthesis `)` @@ -111,6 +113,7 @@ impl fmt::Display for Token { Token::Minus => f.write_str("-"), Token::Mult => f.write_str("*"), Token::Div => f.write_str("/"), + Token::StringConcat => f.write_str("||"), Token::Mod => f.write_str("%"), Token::LParen => f.write_str("("), Token::RParen => f.write_str(")"), @@ -374,6 +377,16 @@ impl<'a> Tokenizer<'a> { '+' => self.consume_and_return(chars, Token::Plus), '*' => self.consume_and_return(chars, Token::Mult), '%' => self.consume_and_return(chars, Token::Mod), + '|' => { + chars.next(); // consume the '|' + match chars.peek() { + Some('|') => self.consume_and_return(chars, Token::StringConcat), + _ => Err(TokenizerError(format!( + "Expecting to see `||`. Bitwise or operator `|` is not supported. \nError at Line: {}, Col: {}", + self.line, self.col + ))), + } + } '=' => self.consume_and_return(chars, Token::Eq), '.' => self.consume_and_return(chars, Token::Period), '!' 
=> { @@ -562,6 +575,26 @@ mod tests { compare(expected, tokens); } + #[test] + fn tokenize_string_string_concat() { + let sql = String::from("SELECT 'a' || 'b'"); + let dialect = GenericDialect {}; + let mut tokenizer = Tokenizer::new(&dialect, &sql); + let tokens = tokenizer.tokenize().unwrap(); + + let expected = vec![ + Token::make_keyword("SELECT"), + Token::Whitespace(Whitespace::Space), + Token::SingleQuotedString(String::from("a")), + Token::Whitespace(Whitespace::Space), + Token::StringConcat, + Token::Whitespace(Whitespace::Space), + Token::SingleQuotedString(String::from("b")), + ]; + + compare(expected, tokens); + } + #[test] fn tokenize_simple_select() { let sql = String::from("SELECT * FROM customer WHERE id = 1 LIMIT 5"); diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs index 257b48230..34f8c589a 100644 --- a/tests/sqlparser_common.rs +++ b/tests/sqlparser_common.rs @@ -665,6 +665,21 @@ fn parse_in_subquery() { ); } +#[test] +fn parse_string_agg() { + let sql = "SELECT a || b"; + + let select = verified_only_select(sql); + assert_eq!( + SelectItem::UnnamedExpr(Expr::BinaryOp { + left: Box::new(Expr::Identifier(Ident::new("a"))), + op: BinaryOperator::StringConcat, + right: Box::new(Expr::Identifier(Ident::new("b"))), + }), + select.projection[0] + ); +} + #[test] fn parse_between() { fn chk(negated: bool) { From b4699bd4a737a0b5daac3b8fc08169d84ea68d99 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Dani=C3=ABl=20Heres?= Date: Wed, 3 Jun 2020 18:02:05 +0200 Subject: [PATCH 024/122] Support bitwise and, or, xor (#181) Operator precedence is coming from: https://cloud.google.com/bigquery/docs/reference/standard-sql/operators --- src/ast/operator.rs | 6 ++++++ src/parser.rs | 6 ++++++ src/tokenizer.rs | 38 +++++++++++++++++++++++++++++++++----- tests/sqlparser_common.rs | 21 +++++++++++++++++++++ 4 files changed, 66 insertions(+), 5 deletions(-) diff --git a/src/ast/operator.rs b/src/ast/operator.rs index 2d75c46fa..c9f5eb2e9 100644 --- a/src/ast/operator.rs +++ b/src/ast/operator.rs @@ -49,6 +49,9 @@ pub enum BinaryOperator { Or, Like, NotLike, + BitwiseOr, + BitwiseAnd, + BitwiseXor, } impl fmt::Display for BinaryOperator { @@ -70,6 +73,9 @@ impl fmt::Display for BinaryOperator { BinaryOperator::Or => "OR", BinaryOperator::Like => "LIKE", BinaryOperator::NotLike => "NOT LIKE", + BinaryOperator::BitwiseOr => "|", + BinaryOperator::BitwiseAnd => "&", + BinaryOperator::BitwiseXor => "^", }) } } diff --git a/src/parser.rs b/src/parser.rs index 00dd24948..0a50d2d75 100644 --- a/src/parser.rs +++ b/src/parser.rs @@ -578,6 +578,9 @@ impl Parser { Token::Mult => Some(BinaryOperator::Multiply), Token::Mod => Some(BinaryOperator::Modulus), Token::StringConcat => Some(BinaryOperator::StringConcat), + Token::Pipe => Some(BinaryOperator::BitwiseOr), + Token::Caret => Some(BinaryOperator::BitwiseXor), + Token::Ampersand => Some(BinaryOperator::BitwiseAnd), Token::Div => Some(BinaryOperator::Divide), Token::Word(ref k) => match k.keyword.as_ref() { "AND" => Some(BinaryOperator::And), @@ -708,6 +711,9 @@ impl Parser { Token::Eq | Token::Lt | Token::LtEq | Token::Neq | Token::Gt | Token::GtEq => { Ok(20) } + Token::Pipe => Ok(21), + Token::Caret => Ok(22), + Token::Ampersand => Ok(23), Token::Plus | Token::Minus => Ok(Self::PLUS_MINUS_PREC), Token::Mult | Token::Div | Token::Mod | Token::StringConcat => Ok(40), Token::DoubleColon => Ok(50), diff --git a/src/tokenizer.rs b/src/tokenizer.rs index f3504ffb6..06c52c2c5 100644 --- a/src/tokenizer.rs +++ b/src/tokenizer.rs @@ -84,8 +84,12 
@@ pub enum Token { LBracket, /// Right bracket `]` RBracket, - /// Ampersand & + /// Ampersand `&` Ampersand, + /// Pipe `|` + Pipe, + /// Caret `^` + Caret, /// Left brace `{` LBrace, /// Right brace `}` @@ -125,6 +129,8 @@ impl fmt::Display for Token { Token::LBracket => f.write_str("["), Token::RBracket => f.write_str("]"), Token::Ampersand => f.write_str("&"), + Token::Caret => f.write_str("^"), + Token::Pipe => f.write_str("|"), Token::LBrace => f.write_str("{"), Token::RBrace => f.write_str("}"), } @@ -381,10 +387,8 @@ impl<'a> Tokenizer<'a> { chars.next(); // consume the '|' match chars.peek() { Some('|') => self.consume_and_return(chars, Token::StringConcat), - _ => Err(TokenizerError(format!( - "Expecting to see `||`. Bitwise or operator `|` is not supported. \nError at Line: {}, Col: {}", - self.line, self.col - ))), + // Bitshift '|' operator + _ => Ok(Some(Token::Pipe)), } } '=' => self.consume_and_return(chars, Token::Eq), @@ -426,6 +430,7 @@ impl<'a> Tokenizer<'a> { '[' => self.consume_and_return(chars, Token::LBracket), ']' => self.consume_and_return(chars, Token::RBracket), '&' => self.consume_and_return(chars, Token::Ampersand), + '^' => self.consume_and_return(chars, Token::Caret), '{' => self.consume_and_return(chars, Token::LBrace), '}' => self.consume_and_return(chars, Token::RBrace), other => self.consume_and_return(chars, Token::Char(other)), @@ -594,6 +599,29 @@ mod tests { compare(expected, tokens); } + #[test] + fn tokenize_bitwise_op() { + let sql = String::from("SELECT one | two ^ three"); + let dialect = GenericDialect {}; + let mut tokenizer = Tokenizer::new(&dialect, &sql); + let tokens = tokenizer.tokenize().unwrap(); + + let expected = vec![ + Token::make_keyword("SELECT"), + Token::Whitespace(Whitespace::Space), + Token::make_word("one", None), + Token::Whitespace(Whitespace::Space), + Token::Pipe, + Token::Whitespace(Whitespace::Space), + Token::make_word("two", None), + Token::Whitespace(Whitespace::Space), + Token::Caret, + Token::Whitespace(Whitespace::Space), + Token::make_word("three", None), + ]; + + compare(expected, tokens); + } #[test] fn tokenize_simple_select() { diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs index 34f8c589a..1e1c54e10 100644 --- a/tests/sqlparser_common.rs +++ b/tests/sqlparser_common.rs @@ -680,6 +680,27 @@ fn parse_string_agg() { ); } +#[test] +fn parse_bitwise_ops() { + let bitwise_ops = &[ + ("^", BinaryOperator::BitwiseXor), + ("|", BinaryOperator::BitwiseOr), + ("&", BinaryOperator::BitwiseAnd), + ]; + + for (str_op, op) in bitwise_ops { + let select = verified_only_select(&format!("SELECT a {} b", &str_op)); + assert_eq!( + SelectItem::UnnamedExpr(Expr::BinaryOp { + left: Box::new(Expr::Identifier(Ident::new("a"))), + op: op.clone(), + right: Box::new(Expr::Identifier(Ident::new("b"))), + }), + select.projection[0] + ); + } +} + #[test] fn parse_between() { fn chk(negated: bool) { From d32df527e68dd76d857f47ea051a3ec22138469b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Dani=C3=ABl=20Heres?= Date: Wed, 3 Jun 2020 22:31:41 +0200 Subject: [PATCH 025/122] Accept &str in `Parse::parse_sql` (#182) It is more generic to accept a `&str` than a `String` in an API, and avoids having to convert a string to a `String` when not needed, avoiding a copy. 
--- README.md | 4 ++-- examples/cli.rs | 2 +- examples/parse_select.rs | 2 +- src/lib.rs | 2 +- src/parser.rs | 2 +- src/test_utils.rs | 4 ++-- 6 files changed, 8 insertions(+), 8 deletions(-) diff --git a/README.md b/README.md index 3b277a96b..24674d911 100644 --- a/README.md +++ b/README.md @@ -29,7 +29,7 @@ let sql = "SELECT a, b, 123, myfunc(b) \ let dialect = GenericDialect {}; // or AnsiDialect, or your own dialect ... -let ast = Parser::parse_sql(&dialect, sql.to_string()).unwrap(); +let ast = Parser::parse_sql(&dialect, sql).unwrap(); println!("AST: {:?}", ast); ``` @@ -122,4 +122,4 @@ resources. [LocustDB]: https://github.com/cswinter/LocustDB [Pratt Parser]: https://tdop.github.io/ [sql-2016-grammar]: https://jakewheat.github.io/sql-overview/sql-2016-foundation-grammar.html -[sql-standard]: https://en.wikipedia.org/wiki/ISO/IEC_9075 \ No newline at end of file +[sql-standard]: https://en.wikipedia.org/wiki/ISO/IEC_9075 diff --git a/examples/cli.rs b/examples/cli.rs index 917629e43..2b0822584 100644 --- a/examples/cli.rs +++ b/examples/cli.rs @@ -45,7 +45,7 @@ fn main() { chars.next(); chars.as_str() }; - let parse_result = Parser::parse_sql(&*dialect, without_bom.to_owned()); + let parse_result = Parser::parse_sql(&*dialect, without_bom); match parse_result { Ok(statements) => { println!( diff --git a/examples/parse_select.rs b/examples/parse_select.rs index 539d91652..e7aa16307 100644 --- a/examples/parse_select.rs +++ b/examples/parse_select.rs @@ -23,7 +23,7 @@ fn main() { let dialect = GenericDialect {}; - let ast = Parser::parse_sql(&dialect, sql.to_string()).unwrap(); + let ast = Parser::parse_sql(&dialect, sql).unwrap(); println!("AST: {:?}", ast); } diff --git a/src/lib.rs b/src/lib.rs index 156e20eb8..d25b24997 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -28,7 +28,7 @@ //! WHERE a > b AND b < 100 \ //! ORDER BY a DESC, b"; //! -//! let ast = Parser::parse_sql(&dialect, sql.to_string()).unwrap(); +//! let ast = Parser::parse_sql(&dialect, sql).unwrap(); //! //! println!("AST: {:?}", ast); //! 
``` diff --git a/src/parser.rs b/src/parser.rs index 0a50d2d75..9a22f4d19 100644 --- a/src/parser.rs +++ b/src/parser.rs @@ -82,7 +82,7 @@ impl Parser { } /// Parse a SQL statement and produce an Abstract Syntax Tree (AST) - pub fn parse_sql(dialect: &dyn Dialect, sql: String) -> Result, ParserError> { + pub fn parse_sql(dialect: &dyn Dialect, sql: &str) -> Result, ParserError> { let mut tokenizer = Tokenizer::new(dialect, &sql); let tokens = tokenizer.tokenize()?; let mut parser = Parser::new(tokens); diff --git a/src/test_utils.rs b/src/test_utils.rs index d36eeb044..4d4d35616 100644 --- a/src/test_utils.rs +++ b/src/test_utils.rs @@ -58,9 +58,9 @@ impl TestedDialects { } pub fn parse_sql_statements(&self, sql: &str) -> Result, ParserError> { - self.one_of_identical_results(|dialect| Parser::parse_sql(dialect, sql.to_string())) + self.one_of_identical_results(|dialect| Parser::parse_sql(dialect, &sql)) // To fail the `ensure_multiple_dialects_are_tested` test: - // Parser::parse_sql(&**self.dialects.first().unwrap(), sql.to_string()) + // Parser::parse_sql(&**self.dialects.first().unwrap(), sql) } /// Ensures that `sql` parses as a single statement, optionally checking From 6e6fae73a0aa368ae7a452855ae5fcca2b5cbc3e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Dani=C3=ABl=20Heres?= Date: Sun, 7 Jun 2020 15:46:55 +0200 Subject: [PATCH 026/122] Add benchmarks using cargo bench / criterion (#190) --- docs/benchmarking.md | 6 +++ sqlparser_bench/Cargo.toml | 17 +++++++++ sqlparser_bench/benches/sqlparser_bench.rs | 43 ++++++++++++++++++++++ sqlparser_bench/src/lib.rs | 7 ++++ 4 files changed, 73 insertions(+) create mode 100644 docs/benchmarking.md create mode 100644 sqlparser_bench/Cargo.toml create mode 100644 sqlparser_bench/benches/sqlparser_bench.rs create mode 100644 sqlparser_bench/src/lib.rs diff --git a/docs/benchmarking.md b/docs/benchmarking.md new file mode 100644 index 000000000..feae53c84 --- /dev/null +++ b/docs/benchmarking.md @@ -0,0 +1,6 @@ +# Benchmarking + +Run `cargo bench` in the project `sqlparser_bench` execute the queries. +It will report results using the `criterion` library to perform the benchmarking. + +The bench project lives in another crate, to avoid the negative impact on building the `sqlparser` crate. diff --git a/sqlparser_bench/Cargo.toml b/sqlparser_bench/Cargo.toml new file mode 100644 index 000000000..43ea11913 --- /dev/null +++ b/sqlparser_bench/Cargo.toml @@ -0,0 +1,17 @@ +[package] +name = "sqlparser_bench" +version = "0.1.0" +authors = ["Dandandan "] +edition = "2018" + +# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html + +[dependencies] +sqlparser = { path = "../", version = "0.5.1-alpha-0" } + +[dev-dependencies] +criterion = {version = "0.3"} + +[[bench]] +name = "sqlparser_bench" +harness = false diff --git a/sqlparser_bench/benches/sqlparser_bench.rs b/sqlparser_bench/benches/sqlparser_bench.rs new file mode 100644 index 000000000..5293c0f50 --- /dev/null +++ b/sqlparser_bench/benches/sqlparser_bench.rs @@ -0,0 +1,43 @@ +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+// See the License for the specific language governing permissions and +// limitations under the License. + +use criterion::{criterion_group, criterion_main, Criterion}; +use sqlparser::dialect::GenericDialect; +use sqlparser::parser::Parser; + +fn basic_queries(c: &mut Criterion) { + let mut group = c.benchmark_group("sqlparser-rs parsing benchmark"); + let dialect = GenericDialect {}; + + let string = "SELECT * FROM table WHERE 1 = 1"; + group.bench_function("sqlparser::select", |b| { + b.iter(|| Parser::parse_sql(&dialect, string)); + }); + + let with_query = " + WITH derived AS ( + SELECT MAX(a) AS max_a, + COUNT(b) AS b_num, + user_id + FROM TABLE + GROUP BY user_id + ) + SELECT * FROM table + LEFT JOIN derived USING (user_id) + "; + group.bench_function("sqlparser::with_select", |b| { + b.iter(|| Parser::parse_sql(&dialect, with_query)); + }); +} + +criterion_group!(benches, basic_queries); +criterion_main!(benches); diff --git a/sqlparser_bench/src/lib.rs b/sqlparser_bench/src/lib.rs new file mode 100644 index 000000000..31e1bb209 --- /dev/null +++ b/sqlparser_bench/src/lib.rs @@ -0,0 +1,7 @@ +#[cfg(test)] +mod tests { + #[test] + fn it_works() { + assert_eq!(2 + 2, 4); + } +} From af54eb02b25c418504264d0bd23e66d19712ff4b Mon Sep 17 00:00:00 2001 From: Max Countryman Date: Sun, 7 Jun 2020 10:15:31 -0700 Subject: [PATCH 027/122] Rework github actions, add code coverage (#186) This reworks our GitHub Actions workflow to include code coverage via tarpaulin. Fixes #164. --- .github/workflows/rust.yml | 79 +++++++++++++++++++++++++++----------- 1 file changed, 57 insertions(+), 22 deletions(-) diff --git a/.github/workflows/rust.yml b/.github/workflows/rust.yml index 06db11ebf..a53e0babc 100644 --- a/.github/workflows/rust.yml +++ b/.github/workflows/rust.yml @@ -1,30 +1,65 @@ name: Rust -on: [push] +on: [push, pull_request] jobs: - build: + + codestyle: runs-on: ubuntu-latest + steps: + - name: Set up Rust + uses: hecrj/setup-rust-action@v1 + with: + components: rustfmt + # Note that `nightly` is required for `license_template_path`, as + # it's an unstable feature. + rust-version: nightly + - uses: actions/checkout@v2 + - run: cargo fmt -- --check --config-path <(echo 'license_template_path = "HEADER"') + + lint: + runs-on: ubuntu-latest + steps: + - name: Set up Rust + uses: hecrj/setup-rust-action@v1 + with: + components: clippy + - uses: actions/checkout@v2 + - run: cargo clippy --all-targets --all-features -- -D warnings + compile: + runs-on: ubuntu-latest + steps: + - name: Set up Rust + uses: hecrj/setup-rust-action@v1 + - uses: actions/checkout@master + - run: cargo check --all-targets --all-features + + test: + strategy: + matrix: + rust: [stable, beta, nightly] + runs-on: ubuntu-latest steps: - - uses: actions/checkout@v1 - name: Setup Rust - run: | - rustup toolchain install nightly --profile default - rustup toolchain install stable - rustup override set stable - # Clippy must be run first, as its lints are only triggered during - # compilation. Put another way: after a successful `cargo build`, `cargo - # clippy` is guaranteed to produce no results. This bug is known upstream: - # https://github.com/rust-lang/rust-clippy/issues/2604. 
-# - name: Clippy -# run: cargo clippy -- --all-targets --all-features -- -D warnings - - name: Check formatting - run: | - cargo +nightly fmt -- --check --config-path <(echo 'license_template_path = "HEADER"') - - name: Build - run: cargo build --verbose - - name: Run tests - run: cargo test --verbose - - name: Run tests for all features - run: cargo test --verbose -- all-features + uses: hecrj/setup-rust-action@v1 + with: + rust-version: ${{ matrix.rust }} + - name: Install Tarpaulin + uses: actions-rs/install@v0.1 + with: + crate: cargo-tarpaulin + version: 0.13.3 + use-tool-cache: true + - name: Checkout + uses: actions/checkout@v2 + - name: Test + run: cargo test --all-features + - name: Coverage + if: matrix.rust == 'stable' + run: cargo tarpaulin -o Lcov --output-dir ./coverage + - name: Coveralls + if: matrix.rust == 'stable' + uses: coverallsapp/github-action@master + with: + github-token: ${{ secrets.GITHUB_TOKEN }} From a42121de522941a82a2b89eb5ac662822964f151 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Dani=C3=ABl=20Heres?= Date: Sun, 7 Jun 2020 19:25:10 +0200 Subject: [PATCH 028/122] Use binary search to speed up matching keywords (#191) --- src/dialect/keywords.rs | 29 +++++++++++++++-------------- src/tokenizer.rs | 7 +++---- tests/sqlparser_common.rs | 9 +++++++++ 3 files changed, 27 insertions(+), 18 deletions(-) diff --git a/src/dialect/keywords.rs b/src/dialect/keywords.rs index ee59a1c92..bb4f678e0 100644 --- a/src/dialect/keywords.rs +++ b/src/dialect/keywords.rs @@ -49,11 +49,11 @@ macro_rules! define_keywords { } } +// The following keywords should be sorted to be able to match using binary search define_keywords!( ABS, ACTION, ADD, - ASC, ALL, ALLOCATE, ALTER, @@ -65,6 +65,7 @@ define_keywords!( ARRAY_AGG, ARRAY_MAX_CARDINALITY, AS, + ASC, ASENSITIVE, ASYMMETRIC, AT, @@ -93,9 +94,9 @@ define_keywords!( CEILING, CHAIN, CHAR, - CHAR_LENGTH, CHARACTER, CHARACTER_LENGTH, + CHAR_LENGTH, CHECK, CLOB, CLOSE, @@ -158,6 +159,7 @@ define_keywords!( ELEMENT, ELSE, END, + END_EXEC = "END-EXEC", END_FRAME, END_PARTITION, EQUALS, @@ -175,8 +177,8 @@ define_keywords!( FALSE, FETCH, FIELDS, - FIRST, FILTER, + FIRST, FIRST_VALUE, FLOAT, FLOOR, @@ -255,8 +257,8 @@ define_keywords!( NATURAL, NCHAR, NCLOB, - NEXT, NEW, + NEXT, NO, NONE, NORMALIZE, @@ -268,8 +270,8 @@ define_keywords!( NULLS, NUMERIC, OBJECT, - OCTET_LENGTH, OCCURRENCES_REGEX, + OCTET_LENGTH, OF, OFFSET, OLD, @@ -285,12 +287,12 @@ define_keywords!( OVERLAPS, OVERLAY, PARAMETER, - PARTITION, PARQUET, + PARTITION, PERCENT, - PERCENT_RANK, PERCENTILE_CONT, PERCENTILE_DISC, + PERCENT_RANK, PERIOD, PORTION, POSITION, @@ -332,8 +334,8 @@ define_keywords!( ROLLBACK, ROLLUP, ROW, - ROW_NUMBER, ROWS, + ROW_NUMBER, SAVEPOINT, SCHEMA, SCOPE, @@ -390,10 +392,10 @@ define_keywords!( TRANSLATION, TREAT, TRIGGER, - TRUNCATE, TRIM, TRIM_ARRAY, TRUE, + TRUNCATE, UESCAPE, UNBOUNDED, UNCOMMITTED, @@ -409,11 +411,11 @@ define_keywords!( VALUE, VALUES, VALUE_OF, - VAR_POP, - VAR_SAMP, VARBINARY, VARCHAR, VARYING, + VAR_POP, + VAR_SAMP, VERSIONING, VIEW, WHEN, @@ -424,11 +426,10 @@ define_keywords!( WITH, WITHIN, WITHOUT, - WRITE, WORK, + WRITE, YEAR, - ZONE, - END_EXEC = "END-EXEC" + ZONE ); /// These keywords can't be used as a table alias, so that `FROM table_name alias` diff --git a/src/tokenizer.rs b/src/tokenizer.rs index 06c52c2c5..910f73911 100644 --- a/src/tokenizer.rs +++ b/src/tokenizer.rs @@ -143,10 +143,9 @@ impl Token { } pub fn make_word(word: &str, quote_style: Option) -> Self { let word_uppercase = word.to_uppercase(); - 
//TODO: need to reintroduce FnvHashSet at some point .. iterating over keywords is - // not fast but I want the simplicity for now while I experiment with pluggable - // dialects - let is_keyword = quote_style == None && ALL_KEYWORDS.contains(&word_uppercase.as_str()); + //TODO: validate use of a hashset (e.g. FnvHashSet) compared to using binary search + let is_keyword = + quote_style == None && ALL_KEYWORDS.binary_search(&word_uppercase.as_str()).is_ok(); Token::Word(Word { value: word.to_string(), quote_style, diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs index 1e1c54e10..a63d3d49f 100644 --- a/tests/sqlparser_common.rs +++ b/tests/sqlparser_common.rs @@ -21,6 +21,7 @@ use matches::assert_matches; use sqlparser::ast::*; +use sqlparser::dialect::keywords::ALL_KEYWORDS; use sqlparser::parser::*; use sqlparser::test_utils::{all_dialects, expr_from_projection, number, only}; @@ -2851,6 +2852,14 @@ fn parse_drop_index() { } } +#[test] +fn keywords_sorted() { + // assert!(ALL_KEYWORDS.is_sorted()) + let mut copy = Vec::from(ALL_KEYWORDS); + copy.sort(); + assert!(copy == ALL_KEYWORDS) +} + fn parse_sql_statements(sql: &str) -> Result, ParserError> { all_dialects().parse_sql_statements(sql) } From 10b0b7f884dfe027514d135b2ff547cb82fa5ebe Mon Sep 17 00:00:00 2001 From: Nickolay Ponomarev Date: Sun, 7 Jun 2020 20:43:44 +0300 Subject: [PATCH 029/122] Update CHANGELOG (#192) Also remove a comment with a trailing space, which rustfmt doesn't like --- CHANGELOG.md | 3 +++ src/tokenizer.rs | 1 - 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 60c25da18..ab27d94e8 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -9,6 +9,7 @@ Given that the parser produces a typed AST, any changes to the AST will technica Check https://github.com/andygrove/sqlparser-rs/commits/master for undocumented changes. ### Changed +- **`Parser::parse_sql` now accepts a `&str` instead of `String` (#182)** - thanks @Dandandan! - Change `Ident` (previously a simple `String`) to store the parsed (unquoted) `value` of the identifier and the `quote_style` separately (#143) - thanks @apparebit! - Support Snowflake's `FROM (table_name)` (#155) - thanks @eyalleshem! @@ -21,6 +22,8 @@ Check https://github.com/andygrove/sqlparser-rs/commits/master for undocumented - Support basic forms of `CREATE SCHEMA` and `DROP SCHEMA` (#173) - thanks @alex-dukhno! - Support `NULLS FIRST`/`LAST` in `ORDER BY` expressions (#176) - thanks @houqp! - Support `LISTAGG()` (#174) - thanks @maxcountryman! +- Support the string concatentation operator `||` (#178) - thanks @Dandandan! +- Support bitwise AND (`&`), OR (`|`), XOR (`^`) (#181) - thanks @Dandandan! ### Fixed - Report an error for unterminated string literals (#165) diff --git a/src/tokenizer.rs b/src/tokenizer.rs index 910f73911..1f33dd5dc 100644 --- a/src/tokenizer.rs +++ b/src/tokenizer.rs @@ -143,7 +143,6 @@ impl Token { } pub fn make_word(word: &str, quote_style: Option) -> Self { let word_uppercase = word.to_uppercase(); - //TODO: validate use of a hashset (e.g. 
FnvHashSet) compared to using binary search let is_keyword = quote_style == None && ALL_KEYWORDS.binary_search(&word_uppercase.as_str()).is_ok(); Token::Word(Word { From d842f495db6936f64b2738178a431f0ebd6c4e07 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Dani=C3=ABl=20Heres?= Date: Wed, 10 Jun 2020 08:15:44 +0200 Subject: [PATCH 030/122] Add line and column number to TokenizerError (#194) Addresses https://github.com/andygrove/sqlparser-rs/issues/179 for tokenize errors --- src/parser.rs | 5 ++++- src/tokenizer.rs | 54 +++++++++++++++++++++++++++--------------------- 2 files changed, 34 insertions(+), 25 deletions(-) diff --git a/src/parser.rs b/src/parser.rs index 9a22f4d19..780334a9b 100644 --- a/src/parser.rs +++ b/src/parser.rs @@ -49,7 +49,10 @@ use IsLateral::*; impl From for ParserError { fn from(e: TokenizerError) -> Self { - ParserError::TokenizerError(format!("{:?}", e)) + ParserError::TokenizerError(format!( + "{} at Line: {}, Column {}", + e.message, e.line, e.col + )) } } diff --git a/src/tokenizer.rs b/src/tokenizer.rs index 1f33dd5dc..68ebfaf62 100644 --- a/src/tokenizer.rs +++ b/src/tokenizer.rs @@ -217,7 +217,11 @@ impl fmt::Display for Whitespace { /// Tokenizer error #[derive(Debug, PartialEq)] -pub struct TokenizerError(String); +pub struct TokenizerError { + pub message: String, + pub line: u64, + pub col: u64, +} /// SQL Tokenizer pub struct Tokenizer<'a> { @@ -331,10 +335,10 @@ impl<'a> Tokenizer<'a> { if chars.next() == Some(quote_end) { Ok(Some(Token::make_word(&s, Some(quote_start)))) } else { - Err(TokenizerError(format!( - "Expected close delimiter '{}' before EOF.", - quote_end - ))) + self.tokenizer_error( + format!("Expected close delimiter '{}' before EOF.", quote_end) + .as_str(), + ) } } // numbers @@ -395,10 +399,7 @@ impl<'a> Tokenizer<'a> { chars.next(); // consume match chars.peek() { Some('=') => self.consume_and_return(chars, Token::Neq), - _ => Err(TokenizerError(format!( - "Tokenizer Error at Line: {}, Col: {}", - self.line, self.col - ))), + _ => self.tokenizer_error("Expected to see '=' after '!' character"), } } '<' => { @@ -437,6 +438,14 @@ impl<'a> Tokenizer<'a> { } } + fn tokenizer_error(&self, message: &str) -> Result { + Err(TokenizerError { + message: message.to_string(), + col: self.col, + line: self.line, + }) + } + /// Tokenize an identifier or keyword, after the first char is already consumed. 
fn tokenize_word(&self, first_char: char, chars: &mut Peekable>) -> String { let mut s = first_char.to_string(); @@ -471,10 +480,7 @@ impl<'a> Tokenizer<'a> { } } } - Err(TokenizerError(format!( - "Unterminated string literal at Line: {}, Col: {}", - self.line, self.col - ))) + self.tokenizer_error("Unterminated string literal") } fn tokenize_multiline_comment( @@ -499,11 +505,7 @@ impl<'a> Tokenizer<'a> { s.push(ch); } } - None => { - break Err(TokenizerError( - "Unexpected EOF while in a multi-line comment".to_string(), - )); - } + None => break self.tokenizer_error("Unexpected EOF while in a multi-line comment"), } } } @@ -720,9 +722,11 @@ mod tests { let mut tokenizer = Tokenizer::new(&dialect, &sql); assert_eq!( tokenizer.tokenize(), - Err(TokenizerError( - "Unterminated string literal at Line: 1, Col: 8".to_string() - )) + Err(TokenizerError { + message: "Unterminated string literal".to_string(), + line: 1, + col: 8 + }) ); } @@ -843,9 +847,11 @@ mod tests { let mut tokenizer = Tokenizer::new(&dialect, &sql); assert_eq!( tokenizer.tokenize(), - Err(TokenizerError( - "Expected close delimiter '\"' before EOF.".to_string(), - )) + Err(TokenizerError { + message: "Expected close delimiter '\"' before EOF.".to_string(), + line: 1, + col: 1 + }) ); } From 846c52f4500a5b79d351f8f9e3166e2806508a55 Mon Sep 17 00:00:00 2001 From: Max Countryman Date: Tue, 9 Jun 2020 23:32:13 -0700 Subject: [PATCH 031/122] Allow omitting units after INTERVAL (#184) Alter INTERVAL to support postgres syntax This patch updates our INTERVAL implementation such that the Postgres and Redshfit variation of the syntax is supported: namely that 'leading field' is optional. Fixes #177. --- src/ast/value.rs | 16 +++++++--------- src/parser.rs | 17 +++++++++++++---- tests/sqlparser_common.rs | 29 ++++++++++++++++++++++++----- 3 files changed, 44 insertions(+), 18 deletions(-) diff --git a/src/ast/value.rs b/src/ast/value.rs index fe2870f95..fdcd238cd 100644 --- a/src/ast/value.rs +++ b/src/ast/value.rs @@ -37,7 +37,7 @@ pub enum Value { /// `TIMESTAMP '...'` literals Timestamp(String), /// INTERVAL literals, roughly in the following format: - /// `INTERVAL '' [ () ] + /// `INTERVAL '' [ [ () ] ] /// [ TO [ () ] ]`, /// e.g. `INTERVAL '123:45.67' MINUTE(3) TO SECOND(2)`. /// @@ -46,7 +46,7 @@ pub enum Value { /// so the user will have to reject intervals like `HOUR TO YEAR`. 
Interval { value: String, - leading_field: DateTimeField, + leading_field: Option, leading_precision: Option, last_field: Option, /// The seconds precision can be specified in SQL source as @@ -72,7 +72,7 @@ impl fmt::Display for Value { Value::Timestamp(v) => write!(f, "TIMESTAMP '{}'", escape_single_quote_string(v)), Value::Interval { value, - leading_field: DateTimeField::Second, + leading_field: Some(DateTimeField::Second), leading_precision: Some(leading_precision), last_field, fractional_seconds_precision: Some(fractional_seconds_precision), @@ -95,12 +95,10 @@ impl fmt::Display for Value { last_field, fractional_seconds_precision, } => { - write!( - f, - "INTERVAL '{}' {}", - escape_single_quote_string(value), - leading_field - )?; + write!(f, "INTERVAL '{}'", escape_single_quote_string(value))?; + if let Some(leading_field) = leading_field { + write!(f, " {}", leading_field)?; + } if let Some(leading_precision) = leading_precision { write!(f, " ({})", leading_precision)?; } diff --git a/src/parser.rs b/src/parser.rs index 780334a9b..7c136cc6e 100644 --- a/src/parser.rs +++ b/src/parser.rs @@ -526,12 +526,21 @@ impl Parser { // Following the string literal is a qualifier which indicates the units // of the duration specified in the string literal. // - // Note that PostgreSQL allows omitting the qualifier, but we currently - // require at least the leading field, in accordance with the ANSI spec. - let leading_field = self.parse_date_time_field()?; + // Note that PostgreSQL allows omitting the qualifier, so we provide + // this more general implemenation. + let leading_field = match self.peek_token() { + Some(Token::Word(kw)) + if ["YEAR", "MONTH", "DAY", "HOUR", "MINUTE", "SECOND"] + .iter() + .any(|d| kw.keyword == *d) => + { + Some(self.parse_date_time_field()?) + } + _ => None, + }; let (leading_precision, last_field, fsec_precision) = - if leading_field == DateTimeField::Second { + if leading_field == Some(DateTimeField::Second) { // SQL mandates special syntax for `SECOND TO SECOND` literals. 
// Instead of // `SECOND [()] TO SECOND[()]` diff --git a/tests/sqlparser_common.rs b/tests/sqlparser_common.rs index a63d3d49f..8ff6e7e9b 100644 --- a/tests/sqlparser_common.rs +++ b/tests/sqlparser_common.rs @@ -1459,7 +1459,7 @@ fn parse_literal_interval() { assert_eq!( &Expr::Value(Value::Interval { value: "1-1".into(), - leading_field: DateTimeField::Year, + leading_field: Some(DateTimeField::Year), leading_precision: None, last_field: Some(DateTimeField::Month), fractional_seconds_precision: None, @@ -1472,7 +1472,7 @@ fn parse_literal_interval() { assert_eq!( &Expr::Value(Value::Interval { value: "01:01.01".into(), - leading_field: DateTimeField::Minute, + leading_field: Some(DateTimeField::Minute), leading_precision: Some(5), last_field: Some(DateTimeField::Second), fractional_seconds_precision: Some(5), @@ -1485,7 +1485,7 @@ fn parse_literal_interval() { assert_eq!( &Expr::Value(Value::Interval { value: "1".into(), - leading_field: DateTimeField::Second, + leading_field: Some(DateTimeField::Second), leading_precision: Some(5), last_field: None, fractional_seconds_precision: Some(4), @@ -1498,7 +1498,7 @@ fn parse_literal_interval() { assert_eq!( &Expr::Value(Value::Interval { value: "10".into(), - leading_field: DateTimeField::Hour, + leading_field: Some(DateTimeField::Hour), leading_precision: None, last_field: None, fractional_seconds_precision: None, @@ -1511,7 +1511,7 @@ fn parse_literal_interval() { assert_eq!( &Expr::Value(Value::Interval { value: "10".into(), - leading_field: DateTimeField::Hour, + leading_field: Some(DateTimeField::Hour), leading_precision: Some(1), last_field: None, fractional_seconds_precision: None, @@ -1519,6 +1519,19 @@ fn parse_literal_interval() { expr_from_projection(only(&select.projection)), ); + let sql = "SELECT INTERVAL '1 DAY'"; + let select = verified_only_select(sql); + assert_eq!( + &Expr::Value(Value::Interval { + value: "1 DAY".into(), + leading_field: None, + leading_precision: None, + last_field: None, + fractional_seconds_precision: None, + }), + expr_from_projection(only(&select.projection)), + ); + let result = parse_sql_statements("SELECT INTERVAL '1' SECOND TO SECOND"); assert_eq!( ParserError::ParserError("Expected end of statement, found: SECOND".to_string()), @@ -1544,6 +1557,12 @@ fn parse_literal_interval() { verified_only_select("SELECT INTERVAL '1' HOUR TO MINUTE"); verified_only_select("SELECT INTERVAL '1' HOUR TO SECOND"); verified_only_select("SELECT INTERVAL '1' MINUTE TO SECOND"); + verified_only_select("SELECT INTERVAL '1 YEAR'"); + verified_only_select("SELECT INTERVAL '1 YEAR' AS one_year"); + one_statement_parses_to( + "SELECT INTERVAL '1 YEAR' one_year", + "SELECT INTERVAL '1 YEAR' AS one_year", + ); } #[test] From d9a7491d9a8f773d568b13c7b06d4f25a24e3892 Mon Sep 17 00:00:00 2001 From: Nickolay Ponomarev Date: Wed, 10 Jun 2020 09:33:31 +0300 Subject: [PATCH 032/122] Various follow-ups to recent pushes - Update CHANGELOG - Update `.gitignore` for the build directory of the benchmark crate - Remove src/lib from the recently added benchmark crate per https://github.com/andygrove/sqlparser-rs/pull/190#pullrequestreview-425835379 --- .gitignore | 1 + CHANGELOG.md | 2 ++ sqlparser_bench/src/lib.rs | 7 ------- 3 files changed, 3 insertions(+), 7 deletions(-) delete mode 100644 sqlparser_bench/src/lib.rs diff --git a/.gitignore b/.gitignore index 46c66224f..dcc3cbd93 100644 --- a/.gitignore +++ b/.gitignore @@ -1,6 +1,7 @@ # Generated by Cargo # will have compiled files and executables /target/ +/sqlparser_bench/target/ # 
Remove Cargo.lock from gitignore if creating an executable, leave it for libraries # More information here http://doc.crates.io/guide.html#cargotoml-vs-cargolock diff --git a/CHANGELOG.md b/CHANGELOG.md index ab27d94e8..93cfe06b4 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -12,6 +12,8 @@ Check https://github.com/andygrove/sqlparser-rs/commits/master for undocumented - **`Parser::parse_sql` now accepts a `&str` instead of `String` (#182)** - thanks @Dandandan! - Change `Ident` (previously a simple `String`) to store the parsed (unquoted) `value` of the identifier and the `quote_style` separately (#143) - thanks @apparebit! - Support Snowflake's `FROM (table_name)` (#155) - thanks @eyalleshem! +- Add line and column number to TokenizerError (#194) - thanks @Dandandan! +- Make the units keyword following `INTERVAL '...'` optional (#184) - thanks @maxcountryman! ### Added - Support MSSQL `TOP () [ PERCENT ] [ WITH TIES ]` (#150) - thanks @alexkyllo! diff --git a/sqlparser_bench/src/lib.rs b/sqlparser_bench/src/lib.rs deleted file mode 100644 index 31e1bb209..000000000 --- a/sqlparser_bench/src/lib.rs +++ /dev/null @@ -1,7 +0,0 @@ -#[cfg(test)] -mod tests { - #[test] - fn it_works() { - assert_eq!(2 + 2, 4); - } -} From 2f1015339aa9cd007994f8aea51ec96e62945066 Mon Sep 17 00:00:00 2001 From: Taehoon Moon Date: Wed, 10 Jun 2020 18:53:52 +0900 Subject: [PATCH 033/122] Add serde support to AST structs and enums (#196) Apply serde to AST structs and enums to be serializable/deserializable. serde support is optional, can be activated by feature named "serde". --- Cargo.toml | 3 ++- src/ast/data_type.rs | 3 +++ src/ast/ddl.rs | 8 ++++++++ src/ast/mod.rs | 22 ++++++++++++++++++++++ src/ast/operator.rs | 4 ++++ src/ast/query.rs | 20 ++++++++++++++++++++ src/ast/value.rs | 4 ++++ 7 files changed, 63 insertions(+), 1 deletion(-) diff --git a/Cargo.toml b/Cargo.toml index 895f07f6a..3232e6a05 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -19,8 +19,9 @@ name = "sqlparser" path = "src/lib.rs" [dependencies] -bigdecimal = { version = "0.1.0", optional = true } +bigdecimal = { version = "0.1.0", features = ["serde"], optional = true } log = "0.4.5" +serde = { version = "1.0", features = ["derive"], optional = true } [dev-dependencies] simple_logger = "1.0.1" diff --git a/src/ast/data_type.rs b/src/ast/data_type.rs index cfbc2147d..fc8b98c55 100644 --- a/src/ast/data_type.rs +++ b/src/ast/data_type.rs @@ -11,10 +11,13 @@ // limitations under the License. use super::ObjectName; +#[cfg(feature = "serde")] +use serde::{Deserialize, Serialize}; use std::fmt; /// SQL data types #[derive(Debug, Clone, PartialEq, Eq, Hash)] +#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))] pub enum DataType { /// Fixed-length character type e.g. CHAR(10) Char(Option), diff --git a/src/ast/ddl.rs b/src/ast/ddl.rs index 776927669..d7503ba77 100644 --- a/src/ast/ddl.rs +++ b/src/ast/ddl.rs @@ -13,10 +13,13 @@ //! AST types specific to CREATE/ALTER variants of [Statement] //! 
diff --git a/src/ast/data_type.rs b/src/ast/data_type.rs
index cfbc2147d..fc8b98c55 100644
--- a/src/ast/data_type.rs
+++ b/src/ast/data_type.rs
@@ -11,10 +11,13 @@
 // limitations under the License.
 
 use super::ObjectName;
+#[cfg(feature = "serde")]
+use serde::{Deserialize, Serialize};
 use std::fmt;
 
 /// SQL data types
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum DataType {
     /// Fixed-length character type e.g. CHAR(10)
     Char(Option<u64>),
diff --git a/src/ast/ddl.rs b/src/ast/ddl.rs
index 776927669..d7503ba77 100644
--- a/src/ast/ddl.rs
+++ b/src/ast/ddl.rs
@@ -13,10 +13,13 @@
 //! AST types specific to CREATE/ALTER variants of [Statement]
 //! (commonly referred to as Data Definition Language, or DDL)
 use super::{display_comma_separated, DataType, Expr, Ident, ObjectName};
+#[cfg(feature = "serde")]
+use serde::{Deserialize, Serialize};
 use std::fmt;
 
 /// An `ALTER TABLE` (`Statement::AlterTable`) operation
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum AlterTableOperation {
     /// `ADD <table_constraint>`
     AddConstraint(TableConstraint),
@@ -36,6 +39,7 @@ impl fmt::Display for AlterTableOperation {
 /// A table-level constraint, specified in a `CREATE TABLE` or an
 /// `ALTER TABLE ADD <constraint>` statement.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum TableConstraint {
     /// `[ CONSTRAINT <name> ] { PRIMARY KEY | UNIQUE } (<columns>)`
     Unique {
@@ -95,6 +99,7 @@ impl fmt::Display for TableConstraint {
 
 /// SQL column definition
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct ColumnDef {
     pub name: Ident,
     pub data_type: DataType,
@@ -129,6 +134,7 @@ impl fmt::Display for ColumnDef {
 /// non-constraint options, lumping them all together under the umbrella of
 /// "column options," and we allow any column option to be named.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct ColumnOptionDef {
     pub name: Option<Ident>,
     pub option: ColumnOption,
@@ -143,6 +149,7 @@ impl fmt::Display for ColumnOptionDef {
 /// `ColumnOption`s are modifiers that follow a column definition in a `CREATE
 /// TABLE` statement.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum ColumnOption {
     /// `NULL`
     Null,
@@ -220,6 +227,7 @@ fn display_constraint_name<'a>(name: &'a Option<Ident>) -> impl fmt::Display + 'a {
 ///
 /// Used in foreign key constraints in `ON UPDATE` and `ON DELETE` options.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum ReferentialAction {
     Restrict,
     Cascade,
diff --git a/src/ast/mod.rs b/src/ast/mod.rs
index 2dbf42b29..c04fb0269 100644
--- a/src/ast/mod.rs
+++ b/src/ast/mod.rs
@@ -18,6 +18,8 @@ mod operator;
 mod query;
 mod value;
 
+#[cfg(feature = "serde")]
+use serde::{Deserialize, Serialize};
 use std::fmt;
 
 pub use self::data_type::DataType;
@@ -71,6 +73,7 @@ where
 
 /// An identifier, decomposed into its value or character data and the quote style.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct Ident {
     /// The value of the identifier without quotes.
     pub value: String,
@@ -127,6 +130,7 @@ impl fmt::Display for Ident {
 
 /// A name of a table, view, custom type, etc., possibly multi-part, i.e. db.schema.obj
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct ObjectName(pub Vec<Ident>);
 
 impl fmt::Display for ObjectName {
@@ -141,6 +145,7 @@ impl fmt::Display for ObjectName {
 /// (e.g. boolean vs string), so the caller must handle expressions of
 /// inappropriate type, like `WHERE 1` or `SELECT 1=1`, as necessary.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum Expr {
     /// Identifier e.g. table name or column name
     Identifier(Ident),
@@ -308,6 +313,7 @@ impl fmt::Display for Expr {
 
 /// A window specification (i.e. `OVER (PARTITION BY .. ORDER BY .. etc.)`)
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct WindowSpec {
     pub partition_by: Vec<Expr>,
     pub order_by: Vec<OrderByExpr>,
@@ -353,6 +359,7 @@ impl fmt::Display for WindowSpec {
 /// Note: The parser does not validate the specified bounds; the caller should
 /// reject invalid bounds like `ROWS UNBOUNDED FOLLOWING` before execution.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct WindowFrame {
     pub units: WindowFrameUnits,
     pub start_bound: WindowFrameBound,
@@ -364,6 +371,7 @@ pub struct WindowFrame
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum WindowFrameUnits {
     Rows,
     Range,
@@ -398,6 +406,7 @@ impl FromStr for WindowFrameUnits {
 
 /// Specifies [WindowFrame]'s `start_bound` and `end_bound`
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum WindowFrameBound {
     /// `CURRENT ROW`
     CurrentRow,
@@ -422,6 +431,7 @@ impl fmt::Display for WindowFrameBound {
 
 /// A top-level statement (SELECT, INSERT, CREATE, etc.)
 #[allow(clippy::large_enum_variant)]
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum Statement {
     /// SELECT
     Query(Box<Query>),
@@ -766,6 +776,7 @@ impl fmt::Display for Statement {
 
 /// SQL assignment `foo = expr` as used in SQLUpdate
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct Assignment {
     pub id: Ident,
     pub value: Expr,
@@ -779,6 +790,7 @@ impl fmt::Display for Assignment {
 
 /// A function call
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct Function {
     pub name: ObjectName,
     pub args: Vec<Expr>,
@@ -805,6 +817,7 @@ impl fmt::Display for Function {
 
 /// External table's available file format
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum FileFormat {
     TEXTFILE,
     SEQUENCEFILE,
@@ -856,6 +869,7 @@ impl FromStr for FileFormat {
 
 /// A `LISTAGG` invocation `LISTAGG( [ DISTINCT ] <expr>[, <separator> ] [ON OVERFLOW <on_overflow>] ) )
 /// [ WITHIN GROUP (ORDER BY <within_group1>[, ...] ) ]`
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct ListAgg {
     pub distinct: bool,
     pub expr: Box<Expr>,
@@ -892,6 +906,7 @@ impl fmt::Display for ListAgg {
 
 /// The `ON OVERFLOW` clause of a LISTAGG invocation
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum ListAggOnOverflow {
     /// `ON OVERFLOW ERROR`
     Error,
@@ -925,6 +940,7 @@ impl fmt::Display for ListAggOnOverflow {
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum ObjectType {
     Table,
     View,
@@ -944,6 +960,7 @@ impl fmt::Display for ObjectType {
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct SqlOption {
     pub name: Ident,
     pub value: Value,
@@ -956,6 +973,7 @@ impl fmt::Display for SqlOption {
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum TransactionMode {
     AccessMode(TransactionAccessMode),
     IsolationLevel(TransactionIsolationLevel),
@@ -972,6 +990,7 @@ impl fmt::Display for TransactionMode {
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum TransactionAccessMode {
     ReadOnly,
     ReadWrite,
@@ -988,6 +1007,7 @@ impl fmt::Display for TransactionAccessMode {
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum TransactionIsolationLevel {
     ReadUncommitted,
     ReadCommitted,
@@ -1008,6 +1028,7 @@ impl fmt::Display for TransactionIsolationLevel {
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum ShowStatementFilter {
     Like(String),
     Where(Expr),
@@ -1024,6 +1045,7 @@ impl fmt::Display for ShowStatementFilter {
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum SetVariableValue {
     Ident(Ident),
     Literal(Value),
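One practical aside before the remaining files: the `WindowFrame` doc comment above leaves frame-bound validation to the caller. A possible caller-side check could look like the sketch below; `validate_window_frame` is a hypothetical helper, and it assumes `end_bound` is the optional right bound and that a `None` quantity means `UNBOUNDED`, as modeled in this crate's AST.

use sqlparser::ast::{WindowFrame, WindowFrameBound};

// Hypothetical consumer-side check: the parser accepts any bounds, so a
// caller that executes queries should reject frames the standard forbids.
fn validate_window_frame(frame: &WindowFrame) -> Result<(), String> {
    // A frame may not start at UNBOUNDED FOLLOWING, the example called
    // out in the doc comment above...
    if frame.start_bound == WindowFrameBound::Following(None) {
        return Err("window frame cannot start at UNBOUNDED FOLLOWING".into());
    }
    // ...and, symmetrically, may not end at UNBOUNDED PRECEDING.
    if frame.end_bound == Some(WindowFrameBound::Preceding(None)) {
        return Err("window frame cannot end at UNBOUNDED PRECEDING".into());
    }
    Ok(())
}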
diff --git a/src/ast/operator.rs b/src/ast/operator.rs
index c9f5eb2e9..63e75eead 100644
--- a/src/ast/operator.rs
+++ b/src/ast/operator.rs
@@ -10,10 +10,13 @@
 // See the License for the specific language governing permissions and
 // limitations under the License.
 
+#[cfg(feature = "serde")]
+use serde::{Deserialize, Serialize};
 use std::fmt;
 
 /// Unary operators
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum UnaryOperator {
     Plus,
     Minus,
@@ -32,6 +35,7 @@ impl fmt::Display for UnaryOperator {
 
 /// Binary operators
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum BinaryOperator {
     Plus,
     Minus,
diff --git a/src/ast/query.rs b/src/ast/query.rs
index a5918f1a3..73477b126 100644
--- a/src/ast/query.rs
+++ b/src/ast/query.rs
@@ -11,10 +11,13 @@
 // limitations under the License.
 
 use super::*;
+#[cfg(feature = "serde")]
+use serde::{Deserialize, Serialize};
 
 /// The most complete variant of a `SELECT` query expression, optionally
 /// including `WITH`, `UNION` / other set operations, and `ORDER BY`.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub struct Query {
     /// WITH (common table expressions, or CTEs)
     pub ctes: Vec<Cte>,
@@ -55,6 +58,7 @@ impl fmt::Display for Query {
 
 /// A node in a tree, representing a "query body" expression, roughly:
 /// `SELECT ... [ {UNION|EXCEPT|INTERSECT} SELECT ...]`
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 pub enum SetExpr {
     /// Restricted SELECT .. FROM .. HAVING (no ORDER BY or set operations)
     Select(Box