spanner/spansql: add package for parsing Spanner's SQL dialect
This will form a basis for an in-memory fake Spanner, but is also
reusable for building tools.
Updates #1181.
Change-Id: If262e555a867e343e2f5582d4443a0bbda49eb06
Reviewed-on: https://code-review.googlesource.com/c/gocloud/+/43010
Reviewed-by: kokoro <noreply+kokoro@google.com>
Reviewed-by: Knut Olav Løite <koloite@gmail.com>
diff --git a/internal/kokoro/vet.sh b/internal/kokoro/vet.sh
index 24c7fe4..0af1c9c 100755
--- a/internal/kokoro/vet.sh
+++ b/internal/kokoro/vet.sh
@@ -64,6 +64,7 @@
grep -v "internal/trace" | \
grep -v "a blank import should be only in a main or test package" | \
grep -v "method ExecuteSql should be ExecuteSQL" | \
+ grep -vE "spanner/spansql/(sql|types).go:.*should have comment" | \
grep -vE "\.pb\.go:" || true) | tee /dev/stderr | (! read)
# TODO(deklerk): It doesn't seem like it, but is it possible to glob both before
diff --git a/spanner/spansql/parser.go b/spanner/spansql/parser.go
new file mode 100644
index 0000000..282cf36
--- /dev/null
+++ b/spanner/spansql/parser.go
@@ -0,0 +1,1344 @@
+/*
+Copyright 2019 Google LLC
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+
+/*
+Package spansql contains types and a parser for the Cloud Spanner SQL dialect.
+
+To parse, use one of the Parse functions (ParseDDL, ParseDDLStmt, ParseQuery, etc.).
+
+Sources:
+ https://cloud.google.com/spanner/docs/lexical
+ https://cloud.google.com/spanner/docs/query-syntax
+ https://cloud.google.com/spanner/docs/data-definition-language
+*/
+package spansql
+
+/*
+This file is structured as follows:
+
+- There are several exported ParseFoo functions that accept an input string
+ and return a type defined in types.go. This is the principal API of this package.
+ These functions are implemented as wrappers around the lower-level functions,
+ with additional checks to ensure things such as input exhaustion.
+- The token and parser types are defined. These constitute the lexical token
+ and parser machinery. parser.next is the main way that other functions get
+ the next token, with parser.back providing a single token rewind, and
+ parser.sniff and parser.expect providing lookahead helpers.
+- The parseFoo methods are defined, matching the SQL grammar. Each consumes its
+ namesake production from the parser. There are also some fooParser helper vars
+ defined that abbreviate the parsing of some of the regular productions.
+*/
+
+import (
+ "fmt"
+ "io"
+ "os"
+ "strconv"
+ "strings"
+)
+
+const debug = false
+
+func debugf(format string, args ...interface{}) {
+ if !debug {
+ return
+ }
+ fmt.Fprintf(os.Stderr, "spansql debug: "+format+"\n", args...)
+}
+
+// ParseDDL parses a DDL file.
+func ParseDDL(s string) (DDL, error) {
+ p := newParser(s)
+
+ var ddl DDL
+ for {
+ p.skipSpace()
+ if p.done {
+ break
+ }
+
+ stmt, err := p.parseDDLStmt()
+ if err != nil {
+ return DDL{}, err
+ }
+ ddl.List = append(ddl.List, stmt)
+
+ tok := p.next()
+ if tok.err == io.EOF {
+ break
+ } else if tok.err != nil {
+ return DDL{}, tok.err
+ }
+ if tok.value == ";" {
+ continue
+ } else {
+ return DDL{}, p.errorf("unexpected token %q", tok.value)
+ }
+ }
+ if p.Rem() != "" {
+ return DDL{}, fmt.Errorf("unexpected trailing contents %q", p.Rem())
+ }
+ return ddl, nil
+}
+
+// ParseDDLStmt parses a single DDL statement.
+func ParseDDLStmt(s string) (DDLStmt, error) {
+ p := newParser(s)
+ stmt, err := p.parseDDLStmt()
+ if err != nil {
+ return nil, err
+ }
+ if p.Rem() != "" {
+ return nil, fmt.Errorf("unexpected trailing contents %q", p.Rem())
+ }
+ return stmt, nil
+}
+
+// ParseQuery parses a query string.
+func ParseQuery(s string) (Query, error) {
+ p := newParser(s)
+ q, err := p.parseQuery()
+ if err != nil {
+ return Query{}, err
+ }
+ if p.Rem() != "" {
+ return Query{}, fmt.Errorf("unexpected trailing query contents %q", p.Rem())
+ }
+ return q, nil
+}
+
+type token struct {
+ value string
+ err error
+
+ typ tokenType
+ int64 int64
+ float64 float64
+ string string // unquoted form
+}
+
+type tokenType int
+
+const (
+ unknownToken tokenType = iota
+ int64Token
+ float64Token
+ stringToken
+)
+
+func (t *token) String() string {
+ if t.err != nil {
+ return fmt.Sprintf("parse error: %v", t.err)
+ }
+ return strconv.Quote(t.value)
+}
+
+type parser struct {
+ s string // Remaining input.
+ done bool // Whether the parsing is finished (success or error).
+ backed bool // Whether back() was called.
+ cur token
+}
+
+func newParser(s string) *parser {
+ return &parser{
+ s: s,
+ }
+}
+
+// Rem returns the unparsed remainder, ignoring space.
+func (p *parser) Rem() string {
+ rem := p.s
+ if p.backed {
+ rem = p.cur.value + rem
+ }
+ i := 0
+ for ; i < len(rem); i++ {
+ if !isSpace(rem[i]) {
+ break
+ }
+ }
+ return rem[i:]
+}
+
+func (p *parser) String() string {
+ if p.backed {
+ return fmt.Sprintf("next tok: %s (rem: %q)", &p.cur, p.s)
+ }
+ return fmt.Sprintf("rem: %q", p.s)
+}
+
+func (p *parser) errorf(format string, args ...interface{}) error {
+ err := fmt.Errorf(format, args...)
+ p.cur.err = err
+ p.done = true
+ return err
+}
+
+func isInitialIdentifierChar(c byte) bool {
+ // https://cloud.google.com/spanner/docs/lexical#identifiers
+ switch {
+ case 'A' <= c && c <= 'Z':
+ return true
+ case 'a' <= c && c <= 'z':
+ return true
+ case c == '_':
+ return true
+ }
+ return false
+}
+
+func isIdentifierChar(c byte) bool {
+ // https://cloud.google.com/spanner/docs/lexical#identifiers
+ // This doesn't apply the restriction that an identifier cannot start with [0-9],
+ // nor does it check against reserved keywords.
+ switch {
+ case 'A' <= c && c <= 'Z':
+ return true
+ case 'a' <= c && c <= 'z':
+ return true
+ case '0' <= c && c <= '9':
+ return true
+ case c == '_':
+ return true
+ }
+ return false
+}
+
+func (p *parser) consumeNumber() {
+ /*
+ int64_value:
+ { decimal_value | hex_value }
+
+ decimal_value:
+ [-]0—9+
+
+ hex_value:
+ [-]0x{0—9|a—f|A—F}+
+
+ (float64_value is not formally specified)
+
+ float64_value :=
+ [+-]DIGITS.[DIGITS][e[+-]DIGITS]
+ | [DIGITS].DIGITS[e[+-]DIGITS]
+ | DIGITSe[+-]DIGITS
+ */
+
+ i, neg, base := 0, false, 10
+ float, e, dot := false, false, false
+ if p.s[i] == '-' {
+ neg = true
+ i++
+ } else if p.s[i] == '+' {
+ // This isn't in the formal grammar, but is mentioned informally.
+ // https://cloud.google.com/spanner/docs/lexical#integer-literals
+ i++
+ }
+ if strings.HasPrefix(p.s[i:], "0x") {
+ base = 16
+ i += 2
+ }
+ d0 := i
+digitLoop:
+ for i < len(p.s) {
+ switch c := p.s[i]; {
+ case '0' <= c && c <= '9':
+ i++
+ case base == 16 && 'A' <= c && c <= 'F':
+ i++
+ case base == 16 && 'a' <= c && c <= 'f':
+ i++
+ case base == 10 && (c == 'e' || c == 'E'):
+ if e {
+ p.errorf("bad token %q", p.s[:i])
+ return
+ }
+ // Switch to consuming float.
+ float, e = true, true
+ i++
+
+ if i < len(p.s) && (p.s[i] == '+' || p.s[i] == '-') {
+ i++
+ }
+ case base == 10 && c == '.':
+ if dot || e { // any dot must come before E
+ p.errorf("bad token %q", p.s[:i])
+ return
+ }
+ // Switch to consuming float.
+ float, dot = true, true
+ i++
+ default:
+ break digitLoop
+ }
+ }
+ if d0 == i {
+ p.errorf("no digits in numeric literal")
+ return
+ }
+ p.cur.value, p.s = p.s[:i], p.s[i:]
+ var err error
+ if float {
+ p.cur.typ = float64Token
+ p.cur.float64, err = strconv.ParseFloat(p.cur.value[d0:], 64)
+ } else {
+ p.cur.typ = int64Token
+ p.cur.int64, err = strconv.ParseInt(p.cur.value[d0:], base, 64)
+ }
+ if neg {
+ p.cur.float64 = -p.cur.float64
+ p.cur.int64 = -p.cur.int64
+ }
+ if err != nil {
+ p.errorf("bad numeric literal %q: %v", p.cur.value, err)
+ }
+}
+
+func (p *parser) consumeString() {
+ // TODO: support all the other string literal types.
+ // https://cloud.google.com/spanner/docs/lexical#string-and-bytes-literals
+
+ i := 0
+ if p.s[i] != '"' {
+ p.errorf("invalid string literal")
+ return
+ }
+ i++
+
+ for i < len(p.s) {
+ c := p.s[i]
+ i++
+ if c == '"' {
+ break
+ }
+ if c == '\\' && i < len(p.s) {
+ i++
+ }
+ }
+ if i > len(p.s) {
+ p.errorf("unterminated string literal")
+ return
+ }
+ p.cur.value, p.s = p.s[:i], p.s[i:]
+ p.cur.typ = stringToken
+
+ // TODO: this unescaping isn't entirely correct.
+ var err error
+ p.cur.string, err = strconv.Unquote(p.cur.value)
+ if err != nil {
+ p.errorf("invalid string literal [%s]: %v", p.cur.value, err)
+ }
+}
+
+var operators = map[string]bool{
+ // TODO: There's duplication here with symbolicOperators,
+ // but this should go away with more bespoke handling inside parser.advance.
+ "<": true,
+ "<=": true,
+ ">": true,
+ ">=": true,
+ "=": true,
+ "!=": true,
+ "<>": true,
+}
+
+func isSpace(c byte) bool {
+ // Per https://cloud.google.com/spanner/docs/lexical, informally,
+ // whitespace is defined as "space, backspace, tab, newline".
+ switch c {
+ case ' ', '\b', '\t', '\n':
+ return true
+ }
+ return false
+}
+
+// skipSpace skips past any space or comments.
+func (p *parser) skipSpace() bool {
+ i := 0
+ for i < len(p.s) {
+ if isSpace(p.s[i]) {
+ i++
+ continue
+ }
+ // Comments.
+ term := ""
+ if p.s[i] == '#' {
+ term = "\n"
+ } else if i+1 < len(p.s) && p.s[i] == '-' && p.s[i+1] == '-' {
+ term = "\n"
+ } else if i+1 < len(p.s) && p.s[i] == '/' && p.s[i+1] == '*' {
+ term = "*/"
+ }
+ if term == "" {
+ break
+ }
+ ti := strings.Index(p.s[i:], term)
+ if ti < 0 {
+ p.errorf("unterminated comment")
+ return false
+ }
+ i += ti + len(term)
+ }
+ p.s = p.s[i:]
+ if p.s == "" {
+ p.done = true
+ }
+ return i > 0
+}
+
+// advance moves the parser to the next token, which will be available in p.cur.
+func (p *parser) advance() {
+	p.skipSpace()
+	if p.done {
+		return
+	}
+	p.cur.err = nil
+	p.cur.typ = unknownToken
+	// TODO: backtick (`) for quoted identifiers.
+	// TODO: array, struct, date, timestamp literals
+	switch p.s[0] {
+	case ',', ';', '(', ')':
+		// Single character symbol.
+		p.cur.value, p.s = p.s[:1], p.s[1:]
+		return
+	}
+	if p.s[0] == '@' || isInitialIdentifierChar(p.s[0]) {
+		// Start consuming identifier.
+		i := 1
+		for i < len(p.s) && isIdentifierChar(p.s[i]) {
+			i++
+		}
+		p.cur.value, p.s = p.s[:i], p.s[i:]
+		return
+	}
+	if len(p.s) >= 2 && (p.s[0] == '+' || p.s[0] == '-' || p.s[0] == '.') && ('0' <= p.s[1] && p.s[1] <= '9') {
+		// [-+.] followed by a digit.
+		p.consumeNumber()
+		return
+	}
+	if '0' <= p.s[0] && p.s[0] <= '9' {
+		p.consumeNumber()
+		return
+	}
+	// More single character symbols.
+	// These are deliberately below the numeric literal parsing.
+	switch p.s[0] {
+	case '-', '+':
+		p.cur.value, p.s = p.s[:1], p.s[1:]
+		return
+	}
+	if p.s[0] == '"' {
+		p.consumeString()
+		return
+	}
+
+	// Look for operator (two or one bytes); i may equal len(p.s) for an operator at end of input.
+	for i := 2; i >= 1; i-- {
+		if i <= len(p.s) && operators[p.s[:i]] {
+			p.cur.value, p.s = p.s[:i], p.s[i:]
+			return
+		}
+	}
+
+	p.errorf("unexpected byte %#x", p.s[0])
+}
+
+// back steps the parser back one token. It cannot be called twice in succession.
+func (p *parser) back() {
+ if p.backed {
+ panic("parser backed up twice")
+ }
+ p.done = false
+ p.backed = true
+ // If an error was being recovered, we wish to ignore the error.
+ // Don't do that for io.EOF since that'll be returned next.
+ if p.cur.err != io.EOF {
+ p.cur.err = nil
+ }
+}
+
+// next returns the next token.
+func (p *parser) next() *token {
+ if p.backed || p.done {
+ p.backed = false
+ return &p.cur
+ }
+ p.advance()
+ if p.done && p.cur.err == nil {
+ p.cur.value = ""
+ p.cur.err = io.EOF
+ }
+ return &p.cur
+}
+
+// sniff reports whether the next N tokens are as specified.
+func (p *parser) sniff(want ...string) bool {
+ // Store current parser state and restore on the way out.
+ orig := *p
+ defer func() { *p = orig }()
+
+ for _, w := range want {
+ tok := p.next()
+ if tok.err != nil || tok.value != w {
+ return false
+ }
+ }
+ return true
+}
+
+func (p *parser) expect(want string) error {
+ tok := p.next()
+ if tok.err != nil {
+ return tok.err
+ }
+ if tok.value != want {
+ return p.errorf("got %q while expecting %q", tok.value, want)
+ }
+ return nil
+}
+
+func (p *parser) parseDDLStmt() (DDLStmt, error) {
+ debugf("parseDDLStmt: %v", p)
+
+ /*
+ statement:
+ { create_database | create_table | create_index | alter_table | drop_table | drop_index }
+ */
+
+ // TODO: support create_database
+
+ if p.sniff("CREATE", "TABLE") {
+ ct, err := p.parseCreateTable()
+ return ct, err
+ } else if p.sniff("CREATE", "INDEX") {
+ ci, err := p.parseCreateIndex()
+ return ci, err
+ } else if p.sniff("ALTER", "TABLE") {
+ a, err := p.parseAlterTable()
+ return a, err
+ } else if p.sniff("DROP") {
+ // These statements are simple.
+ // DROP TABLE table_name
+ // DROP INDEX index_name
+ p.expect("DROP")
+ tok := p.next()
+ if tok.err != nil {
+ return nil, tok.err
+ }
+ kind := tok.value
+ if kind != "TABLE" && kind != "INDEX" {
+ return nil, p.errorf("got %q, want TABLE or INDEX", kind)
+ }
+ name, err := p.parseTableOrIndexOrColumnName()
+ if err != nil {
+ return nil, err
+ }
+ if kind == "TABLE" {
+ return DropTable{Name: name}, nil
+ }
+ return DropIndex{Name: name}, nil
+ }
+
+ return nil, p.errorf("unknown DDL statement")
+}
+
+func (p *parser) parseCreateTable() (CreateTable, error) {
+	debugf("parseCreateTable: %v", p)
+
+	/*
+		CREATE TABLE table_name(
+			[column_def, ...] )
+			primary_key [, cluster]
+
+		primary_key:
+			PRIMARY KEY ( [key_part, ...] )
+	*/
+
+	if err := p.expect("CREATE"); err != nil {
+		return CreateTable{}, err
+	}
+	if err := p.expect("TABLE"); err != nil {
+		return CreateTable{}, err
+	}
+	tname, err := p.parseTableOrIndexOrColumnName()
+	if err != nil {
+		return CreateTable{}, err
+	}
+	if err := p.expect("("); err != nil {
+		return CreateTable{}, err
+	}
+
+	ct := CreateTable{Name: tname}
+	for {
+		if err := p.expect(")"); err == nil {
+			break
+		}
+		p.back()
+
+		cd, err := p.parseColumnDef()
+		if err != nil {
+			return CreateTable{}, err
+		}
+		ct.Columns = append(ct.Columns, cd)
+
+		// ")" or "," should be next.
+		tok := p.next()
+		if tok.err != nil {
+			return CreateTable{}, tok.err
+		}
+		if tok.value == ")" {
+			break
+		} else if tok.value == "," {
+			continue
+		} else {
+			return CreateTable{}, p.errorf(`got %q, want ")" or ","`, tok.value)
+		}
+	}
+
+	if err := p.expect("PRIMARY"); err != nil {
+		return CreateTable{}, err
+	}
+	if err := p.expect("KEY"); err != nil {
+		return CreateTable{}, err
+	}
+	ct.PrimaryKey, err = p.parseKeyPartList()
+	if err != nil {
+		return CreateTable{}, err
+	}
+	return ct, nil
+}
+
+func (p *parser) parseCreateIndex() (CreateIndex, error) {
+ debugf("parseCreateIndex: %v", p)
+
+ /*
+ CREATE [UNIQUE] [NULL_FILTERED] INDEX index_name
+ ON table_name ( key_part [, ...] ) [ storing_clause ] [ , interleave_clause ]
+
+ index_name:
+ {a—z|A—Z}[{a—z|A—Z|0—9|_}+]
+ */
+
+ if err := p.expect("CREATE"); err != nil {
+ return CreateIndex{}, err
+ }
+ // TODO: UNIQUE, NULL_FILTERED
+ if err := p.expect("INDEX"); err != nil {
+ return CreateIndex{}, err
+ }
+ iname, err := p.parseTableOrIndexOrColumnName()
+ if err != nil {
+ return CreateIndex{}, err
+ }
+ if err := p.expect("ON"); err != nil {
+ return CreateIndex{}, err
+ }
+ tname, err := p.parseTableOrIndexOrColumnName()
+ if err != nil {
+ return CreateIndex{}, err
+ }
+ ci := CreateIndex{Name: iname, Table: tname}
+ ci.Columns, err = p.parseKeyPartList()
+ if err != nil {
+ return CreateIndex{}, err
+ }
+ return ci, nil
+}
+
+func (p *parser) parseAlterTable() (AlterTable, error) {
+ debugf("parseAlterTable: %v", p)
+
+ /*
+ alter_table:
+ ALTER TABLE table_name { table_alteration | table_column_alteration }
+
+ table_alteration:
+ { ADD COLUMN column_def | DROP COLUMN column_name |
+ SET ON DELETE { CASCADE | NO ACTION } }
+
+ table_column_alteration:
+ ALTER COLUMN column_name { { scalar_type | array_type } [NOT NULL] | SET options_def }
+ */
+
+ if err := p.expect("ALTER"); err != nil {
+ return AlterTable{}, err
+ }
+ if err := p.expect("TABLE"); err != nil {
+ return AlterTable{}, err
+ }
+ tname, err := p.parseTableOrIndexOrColumnName()
+ if err != nil {
+ return AlterTable{}, err
+ }
+ a := AlterTable{Name: tname}
+
+ tok := p.next()
+ if tok.err != nil {
+ return AlterTable{}, tok.err
+ }
+ switch tok.value {
+ default:
+ return AlterTable{}, p.errorf("got %q, expected ADD or DROP or SET or ALTER", tok.value)
+ case "ADD":
+ if err := p.expect("COLUMN"); err != nil {
+ return AlterTable{}, err
+ }
+ cd, err := p.parseColumnDef()
+ if err != nil {
+ return AlterTable{}, err
+ }
+ a.Alteration = AddColumn{Def: cd}
+ return a, nil
+ case "DROP":
+ if err := p.expect("COLUMN"); err != nil {
+ return AlterTable{}, err
+ }
+ name, err := p.parseTableOrIndexOrColumnName()
+ if err != nil {
+ return AlterTable{}, err
+ }
+ a.Alteration = DropColumn{Name: name}
+ return a, nil
+ case "SET":
+ if err := p.expect("ON"); err != nil {
+ return AlterTable{}, err
+ }
+ if err := p.expect("DELETE"); err != nil {
+ return AlterTable{}, err
+ }
+ tok := p.next()
+ if tok.err != nil {
+ return AlterTable{}, tok.err
+ }
+ if tok.value == "CASCADE" {
+ a.Alteration = CascadeOnDelete
+ return a, nil
+ }
+ if tok.value != "NO" {
+ return AlterTable{}, p.errorf("got %q, want NO or CASCADE", tok.value)
+ }
+ if err := p.expect("ACTION"); err != nil {
+ return AlterTable{}, err
+ }
+ a.Alteration = NoActionOnDelete
+ return a, nil
+ }
+ // TODO: "ALTER"
+}
+
+func (p *parser) parseColumnDef() (ColumnDef, error) {
+ debugf("parseColumnDef: %v", p)
+
+ /*
+ column_def:
+ column_name {scalar_type | array_type} [NOT NULL] [options_def]
+ */
+
+ name, err := p.parseTableOrIndexOrColumnName()
+ if err != nil {
+ return ColumnDef{}, err
+ }
+
+ cd := ColumnDef{Name: name}
+
+ cd.Type, err = p.parseType()
+ if err != nil {
+ return ColumnDef{}, err
+ }
+
+ tok := p.next()
+ if tok.err != nil || tok.value != "NOT" {
+ // End of the column_def.
+ p.back()
+ return cd, nil
+ }
+ if err := p.expect("NULL"); err != nil {
+ return ColumnDef{}, err
+ }
+ cd.NotNull = true
+
+ return cd, nil
+}
+
+func (p *parser) parseKeyPartList() ([]KeyPart, error) {
+	if err := p.expect("("); err != nil {
+		return nil, err
+	}
+	var list []KeyPart
+	for {
+		if err := p.expect(")"); err == nil {
+			break
+		}
+		p.back()
+
+		kp, err := p.parseKeyPart()
+		if err != nil {
+			return nil, err
+		}
+		list = append(list, kp)
+
+		// ")" or "," should be next.
+		tok := p.next()
+		if tok.err != nil {
+			return nil, tok.err
+		}
+		if tok.value == ")" {
+			break
+		} else if tok.value == "," {
+			continue
+		} else {
+			return nil, p.errorf(`got %q, want ")" or ","`, tok.value)
+		}
+	}
+	return list, nil
+}
+
+func (p *parser) parseKeyPart() (KeyPart, error) {
+ debugf("parseKeyPart: %v", p)
+
+ /*
+ key_part:
+ column_name [{ ASC | DESC }]
+ */
+
+ name, err := p.parseTableOrIndexOrColumnName()
+ if err != nil {
+ return KeyPart{}, err
+ }
+
+ kp := KeyPart{Column: name}
+
+ tok := p.next()
+ if tok.err != nil {
+ // End of the key_part.
+ p.back()
+ return kp, nil
+ }
+ switch tok.value {
+ case "ASC":
+ case "DESC":
+ kp.Desc = true
+ default:
+ p.back()
+ }
+
+ return kp, nil
+}
+
+var baseTypes = map[string]TypeBase{
+ "BOOL": Bool,
+ "INT64": Int64,
+ "FLOAT64": Float64,
+ "STRING": String,
+ "BYTES": Bytes,
+ "DATE": Date,
+ "TIMESTAMP": Timestamp,
+}
+
+func (p *parser) parseType() (Type, error) {
+ debugf("parseType: %v", p)
+
+ /*
+ array_type:
+ ARRAY< scalar_type >
+
+ scalar_type:
+ { BOOL | INT64 | FLOAT64 | STRING( length ) | BYTES( length ) | DATE | TIMESTAMP }
+ length:
+ { int64_value | MAX }
+ */
+
+ var t Type
+
+ tok := p.next()
+ if tok.err != nil {
+ return Type{}, tok.err
+ }
+ if tok.value == "ARRAY" {
+ t.Array = true
+ if err := p.expect("<"); err != nil {
+ return Type{}, err
+ }
+ tok = p.next()
+ if tok.err != nil {
+ return Type{}, tok.err
+ }
+ }
+ base, ok := baseTypes[tok.value]
+ if !ok {
+ return Type{}, p.errorf("got %q, want scalar type", tok.value)
+ }
+ t.Base = base
+
+ if t.Base == String || t.Base == Bytes {
+ if err := p.expect("("); err != nil {
+ return Type{}, err
+ }
+
+ tok = p.next()
+ if tok.err != nil {
+ return Type{}, tok.err
+ }
+ if tok.value == "MAX" {
+ t.Len = MaxLen
+ } else if tok.typ == int64Token {
+ t.Len = tok.int64
+ } else {
+ return Type{}, p.errorf("got %q, want MAX or int64", tok.value)
+ }
+
+ if err := p.expect(")"); err != nil {
+ return Type{}, err
+ }
+ }
+
+ if t.Array {
+ if err := p.expect(">"); err != nil {
+ return Type{}, err
+ }
+ }
+
+ return t, nil
+}
+
+func (p *parser) parseQuery() (Query, error) {
+ debugf("parseQuery: %v", p)
+
+ /*
+ query_statement:
+ [ table_hint_expr ][ join_hint_expr ]
+ query_expr
+
+ query_expr:
+ { select | ( query_expr ) | query_expr set_op query_expr }
+ [ ORDER BY expression [{ ASC | DESC }] [, ...] ]
+ [ LIMIT count [ OFFSET skip_rows ] ]
+ */
+
+ // TODO: hints, sub-selects, etc.
+
+ // TODO: use a case-insensitive select.
+ if err := p.expect("SELECT"); err != nil {
+ return Query{}, err
+ }
+ p.back()
+ sel, err := p.parseSelect()
+ if err != nil {
+ return Query{}, err
+ }
+ q := Query{Select: sel}
+
+ if p.sniff("ORDER", "BY") {
+ p.expect("ORDER")
+ p.expect("BY")
+ for {
+ o, err := p.parseOrder()
+ if err != nil {
+ return Query{}, err
+ }
+ q.Order = append(q.Order, o)
+
+ if !p.sniff(",") {
+ break
+ }
+ p.expect(",")
+ }
+ }
+
+ if p.sniff("LIMIT") {
+ p.expect("LIMIT")
+ lim, err := p.parseLimitCount()
+ if err != nil {
+ return Query{}, err
+ }
+ q.Limit = lim
+ }
+
+ return q, nil
+}
+
+func (p *parser) parseSelect() (Select, error) {
+ debugf("parseSelect: %v", p)
+
+ /*
+ select:
+ SELECT [{ ALL | DISTINCT }]
+ { [ expression. ]* | expression [ [ AS ] alias ] } [, ...]
+ [ FROM from_item [ tablesample_type ] [, ...] ]
+ [ WHERE bool_expression ]
+ [ GROUP BY expression [, ...] ]
+ [ HAVING bool_expression ]
+ */
+ if err := p.expect("SELECT"); err != nil {
+ return Select{}, err
+ }
+
+ var sel Select
+
+ // TODO: ALL|DISTINCT
+
+ // Read expressions for the SELECT list.
+ for {
+ expr, err := p.parseExpr()
+ if err != nil {
+ return Select{}, err
+ }
+ sel.List = append(sel.List, expr)
+
+ if p.sniff(",") {
+ p.expect(",")
+ continue
+ }
+ break
+ }
+
+ if p.sniff("FROM") {
+ p.expect("FROM")
+ for {
+ from, err := p.parseSelectFrom()
+ if err != nil {
+ return Select{}, err
+ }
+ sel.From = append(sel.From, from)
+ if p.sniff(",") {
+ p.expect(",")
+ continue
+ }
+ break
+ }
+ }
+
+ if p.sniff("WHERE") {
+ p.expect("WHERE")
+ where, err := p.parseBoolExpr()
+ if err != nil {
+ return Select{}, err
+ }
+ sel.Where = where
+ }
+
+ // TODO: GROUP BY, HAVING
+
+ return sel, nil
+}
+
+func (p *parser) parseSelectFrom() (SelectFrom, error) {
+ // TODO: support more than a single table name.
+ tname, err := p.parseTableOrIndexOrColumnName()
+ return SelectFrom{Table: tname}, err
+}
+
+func (p *parser) parseOrder() (Order, error) {
+ /*
+ expression [{ ASC | DESC }]
+ */
+
+ expr, err := p.parseExpr()
+ if err != nil {
+ return Order{}, err
+ }
+ o := Order{Expr: expr}
+
+ tok := p.next()
+ switch {
+ case tok.err == nil && tok.value == "ASC":
+ case tok.err == nil && tok.value == "DESC":
+ o.Desc = true
+ default:
+ p.back()
+ }
+
+ return o, nil
+}
+
+func (p *parser) parseLimitCount() (Limit, error) {
+ // "only literal or parameter values"
+ // https://cloud.google.com/spanner/docs/query-syntax#limit-clause-and-offset-clause
+
+ tok := p.next()
+ if tok.err != nil {
+ return nil, tok.err
+ }
+ if tok.typ == int64Token {
+ return IntegerLiteral(tok.int64), nil
+ }
+ // TODO: check character sets.
+ if strings.HasPrefix(tok.value, "@") {
+ return Param(tok.value[1:]), nil
+ }
+ return nil, p.errorf("got %q, want literal or parameter", tok.value)
+}
+
+/*
+Expressions
+
+Cloud Spanner expressions are not formally specified.
+The set of operators and their precedence is listed in
+https://cloud.google.com/spanner/docs/functions-and-operators#operators.
+
+parseExpr works as a classical recursive descent parser, splitting
+precedence levels into separate methods, where the call stack is in
+ascending order of precedence:
+ parseExpr
+ orParser
+ andParser
+ parseIsOp
+ parseComparisonOp
+ parseLit
+
+TODO: there are more levels to break out.
+*/
+
+func (p *parser) parseExpr() (Expr, error) {
+ debugf("parseExpr: %v", p)
+
+ return orParser.parse(p)
+}
+
+// binOpParser is a generic meta-parser for binary operations.
+// It assumes the operation is left associative.
+type binOpParser struct {
+ LHS, RHS func(*parser) (Expr, error)
+ Op string
+ ArgCheck func(Expr) error
+ Combiner func(lhs, rhs Expr) Expr
+}
+
+func (bin binOpParser) parse(p *parser) (Expr, error) {
+ expr, err := bin.LHS(p)
+ if err != nil {
+ return nil, err
+ }
+
+ for {
+ if !p.sniff(bin.Op) {
+ break
+ }
+ p.expect(bin.Op)
+ rhs, err := bin.RHS(p)
+ if err != nil {
+ return nil, err
+ }
+ if bin.ArgCheck != nil {
+ if err := bin.ArgCheck(expr); err != nil {
+ return nil, p.errorf("%v", err)
+ }
+ if err := bin.ArgCheck(rhs); err != nil {
+ return nil, p.errorf("%v", err)
+ }
+ }
+ expr = bin.Combiner(expr, rhs)
+ }
+ return expr, nil
+}
+
+// Break initialisation loop.
+func init() { orParser = orParserShim }
+
+var (
+ boolExprCheck = func(expr Expr) error {
+ if _, ok := expr.(BoolExpr); !ok {
+ return fmt.Errorf("got %T, want a boolean expression", expr)
+ }
+ return nil
+ }
+
+ orParser binOpParser
+
+ orParserShim = binOpParser{
+ LHS: andParser.parse,
+ RHS: andParser.parse,
+ Op: "OR",
+ ArgCheck: boolExprCheck,
+ Combiner: func(lhs, rhs Expr) Expr {
+ return LogicalOp{LHS: lhs.(BoolExpr), Op: Or, RHS: rhs.(BoolExpr)}
+ },
+ }
+ andParser = binOpParser{
+ LHS: (*parser).parseLogicalNot,
+ RHS: (*parser).parseLogicalNot,
+ Op: "AND",
+ ArgCheck: boolExprCheck,
+ Combiner: func(lhs, rhs Expr) Expr {
+ return LogicalOp{LHS: lhs.(BoolExpr), Op: And, RHS: rhs.(BoolExpr)}
+ },
+ }
+)
+
+func (p *parser) parseLogicalNot() (Expr, error) {
+ if !p.sniff("NOT") {
+ return p.parseIsOp()
+ }
+ p.expect("NOT")
+ be, err := p.parseBoolExpr()
+ if err != nil {
+ return nil, err
+ }
+ return LogicalOp{Op: Not, RHS: be}, nil
+}
+
+func (p *parser) parseIsOp() (Expr, error) {
+ debugf("parseIsOp: %v", p)
+
+ expr, err := p.parseComparisonOp()
+ if err != nil {
+ return nil, err
+ }
+
+ tok := p.next()
+ if tok.err != nil || tok.value != "IS" {
+ p.back()
+ return expr, nil
+ }
+
+ isOp := IsOp{LHS: expr}
+ if p.sniff("NOT") {
+ p.expect("NOT")
+ isOp.Neg = true
+ }
+
+ tok = p.next()
+ if tok.err != nil {
+ return nil, tok.err
+ }
+ switch tok.value {
+ case "NULL":
+ isOp.RHS = Null
+ case "TRUE":
+ isOp.RHS = True
+ case "FALSE":
+ isOp.RHS = False
+ default:
+ return nil, p.errorf("got %q, want NULL or TRUE or FALSE", tok.value)
+ }
+
+ return isOp, nil
+}
+
+var symbolicOperators = map[string]ComparisonOperator{
+ "<": Lt,
+ "<=": Le,
+ ">": Gt,
+ ">=": Ge,
+ "=": Eq,
+ "!=": Ne,
+ "<>": Ne,
+}
+
+func (p *parser) parseComparisonOp() (Expr, error) {
+ debugf("parseComparisonOp: %v", p)
+
+ // TODO: this should be parsing bitwise/arithmetic subexpressions.
+
+ expr, err := p.parseLit()
+ if err != nil {
+ return nil, err
+ }
+
+ for {
+ tok := p.next()
+ if tok.err != nil {
+ p.back()
+ break
+ }
+ var op ComparisonOperator
+ var ok bool
+ if tok.value == "NOT" {
+ if err := p.expect("LIKE"); err != nil {
+ // TODO: Does this need to push back two?
+ return nil, err
+ }
+ op, ok = NotLike, true
+ } else if tok.value == "LIKE" {
+ op, ok = Like, true
+ } else {
+ op, ok = symbolicOperators[tok.value]
+ }
+ if !ok {
+ p.back()
+ break
+ }
+
+ rhs, err := p.parseLit()
+ if err != nil {
+ return nil, err
+ }
+ expr = ComparisonOp{LHS: expr, Op: op, RHS: rhs}
+ }
+ return expr, nil
+}
+
+func (p *parser) parseLit() (Expr, error) {
+ tok := p.next()
+ if tok.err != nil {
+ return nil, tok.err
+ }
+
+ switch tok.typ {
+ case int64Token:
+ return IntegerLiteral(tok.int64), nil
+ case float64Token:
+ return FloatLiteral(tok.float64), nil
+ case stringToken:
+ return StringLiteral(tok.string), nil
+ }
+
+ // Handle some reserved keywords that become specific values.
+ // TODO: Handle the other 92 keywords.
+ switch tok.value {
+ case "TRUE":
+ return True, nil
+ case "FALSE":
+ return False, nil
+ case "NULL":
+ return Null, nil
+ }
+
+ // TODO: more types of literals (array, struct, date, timestamp).
+
+ // Try a parameter.
+ // TODO: check character sets.
+ if strings.HasPrefix(tok.value, "@") {
+ return Param(tok.value[1:]), nil
+ }
+ return ID(tok.value), nil
+}
+
+func (p *parser) parseBoolExpr() (BoolExpr, error) {
+ expr, err := p.parseExpr()
+ if err != nil {
+ return nil, err
+ }
+ be, ok := expr.(BoolExpr)
+ if !ok {
+ return nil, p.errorf("got non-bool expression %T", expr)
+ }
+ return be, nil
+}
+
+func (p *parser) parseTableOrIndexOrColumnName() (string, error) {
+ /*
+ table_name and column_name and index_name:
+ {a—z|A—Z}[{a—z|A—Z|0—9|_}+]
+ */
+
+ tok := p.next()
+ if tok.err != nil {
+ return "", tok.err
+ }
+ // TODO: enforce restrictions
+ return tok.value, nil
+}
diff --git a/spanner/spansql/parser_test.go b/spanner/spansql/parser_test.go
new file mode 100644
index 0000000..0a0cde1
--- /dev/null
+++ b/spanner/spansql/parser_test.go
@@ -0,0 +1,233 @@
+/*
+Copyright 2019 Google LLC
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+
+package spansql
+
+import (
+ "reflect"
+ "testing"
+)
+
+// TestParseQuery checks that ParseQuery builds the expected AST for
+// whole queries, including FROM, WHERE, ORDER BY and LIMIT clauses.
+func TestParseQuery(t *testing.T) {
+	tests := []struct {
+		in   string
+		want Query
+	}{
+		{`SELECT 17`, Query{Select: Select{List: []Expr{IntegerLiteral(17)}}}},
+		{`SELECT Alias FROM Characters WHERE Age < @ageLimit AND Alias IS NOT NULL ORDER BY Age DESC LIMIT @limit` + "\n\t",
+			Query{
+				Select: Select{
+					List: []Expr{ID("Alias")},
+					From: []SelectFrom{{
+						Table: "Characters",
+					}},
+					Where: LogicalOp{
+						Op: And,
+						LHS: ComparisonOp{
+							LHS: ID("Age"),
+							Op:  Lt,
+							RHS: Param("ageLimit"),
+						},
+						RHS: IsOp{
+							LHS: ID("Alias"),
+							Neg: true,
+							RHS: Null,
+						},
+					},
+				},
+				Order: []Order{{
+					Expr: ID("Age"),
+					Desc: true,
+				}},
+				Limit: Param("limit"),
+			},
+		},
+	}
+	for _, test := range tests {
+		got, err := ParseQuery(test.in)
+		if err != nil {
+			t.Errorf("ParseQuery(%q): %v", test.in, err)
+			continue
+		}
+		if !reflect.DeepEqual(got, test.want) {
+			t.Errorf("ParseQuery(%q) incorrect.\n got %#v\nwant %#v", test.in, got, test.want)
+		}
+	}
+}
+
+// TestParseExpr checks expression parsing: literals, comparison and
+// logical operators, operator precedence, and reserved keywords.
+func TestParseExpr(t *testing.T) {
+	tests := []struct {
+		in   string
+		want Expr
+	}{
+		{`17`, IntegerLiteral(17)},
+		{`-1`, IntegerLiteral(-1)},
+		{`0xf00d`, IntegerLiteral(0xf00d)},
+		{`-0xbeef`, IntegerLiteral(-0xbeef)},
+		{`123.456e-67`, FloatLiteral(123.456e-67)},
+		{`.1E4`, FloatLiteral(0.1e4)},
+		{`58.`, FloatLiteral(58)},
+		{`4e2`, FloatLiteral(4e2)},
+		{`Count > 0`, ComparisonOp{LHS: ID("Count"), Op: Gt, RHS: IntegerLiteral(0)}},
+		{`Name LIKE "Eve %"`, ComparisonOp{LHS: ID("Name"), Op: Like, RHS: StringLiteral("Eve %")}},
+		{`Speech NOT LIKE "_oo"`, ComparisonOp{LHS: ID("Speech"), Op: NotLike, RHS: StringLiteral("_oo")}},
+		{`A AND NOT B`, LogicalOp{LHS: ID("A"), Op: And, RHS: LogicalOp{Op: Not, RHS: ID("B")}}},
+
+		// OR is lower precedence than AND.
+		{`A AND B OR C`, LogicalOp{LHS: LogicalOp{LHS: ID("A"), Op: And, RHS: ID("B")}, Op: Or, RHS: ID("C")}},
+		{`A OR B AND C`, LogicalOp{LHS: ID("A"), Op: Or, RHS: LogicalOp{LHS: ID("B"), Op: And, RHS: ID("C")}}},
+
+		// This is the same as the WHERE clause from the test in ParseQuery.
+		{`Age < @ageLimit AND Alias IS NOT NULL`,
+			LogicalOp{
+				LHS: ComparisonOp{LHS: ID("Age"), Op: Lt, RHS: Param("ageLimit")},
+				Op:  And,
+				RHS: IsOp{LHS: ID("Alias"), Neg: true, RHS: Null},
+			},
+		},
+
+		// This used to be broken because the lexer didn't reset the token type.
+		{`C < "whelp" AND D IS NOT NULL`,
+			LogicalOp{
+				LHS: ComparisonOp{LHS: ID("C"), Op: Lt, RHS: StringLiteral("whelp")},
+				Op:  And,
+				RHS: IsOp{LHS: ID("D"), Neg: true, RHS: Null},
+			},
+		},
+
+		// Reserved keywords.
+		{`TRUE AND FALSE`, LogicalOp{LHS: True, Op: And, RHS: False}},
+		{`NULL`, Null},
+	}
+	for _, test := range tests {
+		p := newParser(test.in)
+		got, err := p.parseExpr()
+		if err != nil {
+			t.Errorf("[%s]: %v", test.in, err)
+			continue
+		}
+		if !reflect.DeepEqual(got, test.want) {
+			t.Errorf("[%s]: incorrect parse\n got <%T> %#v\nwant <%T> %#v", test.in, got, got, test.want, test.want)
+		}
+		// The expression must consume the entire input.
+		if p.s != "" {
+			t.Errorf("[%s]: Unparsed [%s]", test.in, p.s)
+		}
+	}
+}
+
+// TestParseDDL checks that ParseDDL handles a sequence of DDL
+// statements, including comments in all three supported styles
+// (#, -- and /* */).
+func TestParseDDL(t *testing.T) {
+	tests := []struct {
+		in   string
+		want DDL
+	}{
+		{`CREATE TABLE FooBar (
+		  System STRING(MAX) NOT NULL,  # This is a comment.
+		  RepoPath STRING(MAX) NOT NULL,  -- This is another comment.
+		  Count INT64, /* This is a
+		                * multiline comment. */
+		) PRIMARY KEY(System, RepoPath);
+		CREATE INDEX MyFirstIndex ON FooBar (
+		  Count DESC
+		);
+
+		ALTER TABLE FooBar ADD COLUMN TZ BYTES(20);
+		ALTER TABLE FooBar DROP COLUMN TZ;
+		ALTER TABLE FooBar SET ON DELETE NO ACTION;
+
+		DROP INDEX MyFirstIndex;
+		DROP TABLE FooBar;
+
+		CREATE TABLE NonScalars (
+		  Dummy INT64 NOT NULL,
+		  Ids ARRAY<INT64>,
+		  Names ARRAY<STRING(MAX)>,
+		) PRIMARY KEY (Dummy);
+		`, DDL{List: []DDLStmt{
+			CreateTable{
+				Name: "FooBar",
+				Columns: []ColumnDef{
+					{Name: "System", Type: Type{Base: String, Len: MaxLen}, NotNull: true},
+					{Name: "RepoPath", Type: Type{Base: String, Len: MaxLen}, NotNull: true},
+					{Name: "Count", Type: Type{Base: Int64}},
+				},
+				PrimaryKey: []KeyPart{
+					{Column: "System"},
+					{Column: "RepoPath"},
+				},
+			},
+			CreateIndex{
+				Name:    "MyFirstIndex",
+				Table:   "FooBar",
+				Columns: []KeyPart{{Column: "Count", Desc: true}},
+			},
+			AlterTable{Name: "FooBar", Alteration: AddColumn{
+				Def: ColumnDef{Name: "TZ", Type: Type{Base: Bytes, Len: 20}},
+			}},
+			AlterTable{Name: "FooBar", Alteration: DropColumn{Name: "TZ"}},
+			AlterTable{Name: "FooBar", Alteration: NoActionOnDelete},
+			DropIndex{Name: "MyFirstIndex"},
+			DropTable{Name: "FooBar"},
+			CreateTable{
+				Name: "NonScalars",
+				Columns: []ColumnDef{
+					{Name: "Dummy", Type: Type{Base: Int64}, NotNull: true},
+					{Name: "Ids", Type: Type{Array: true, Base: Int64}},
+					{Name: "Names", Type: Type{Array: true, Base: String, Len: MaxLen}},
+				},
+				PrimaryKey: []KeyPart{{Column: "Dummy"}},
+			},
+		}}},
+		// No trailing comma:
+		{`ALTER TABLE T ADD COLUMN C2 INT64`, DDL{List: []DDLStmt{
+			AlterTable{Name: "T", Alteration: AddColumn{
+				Def: ColumnDef{Name: "C2", Type: Type{Base: Int64}},
+			}},
+		}}},
+	}
+	for _, test := range tests {
+		got, err := ParseDDL(test.in)
+		if err != nil {
+			t.Errorf("ParseDDL(%q): %v", test.in, err)
+			continue
+		}
+		if !reflect.DeepEqual(got, test.want) {
+			t.Errorf("ParseDDL(%q) incorrect.\n got %v\nwant %v", test.in, got, test.want)
+		}
+	}
+}
+
+// TestParseFailures checks inputs that must be rejected. A case only
+// counts as a (test-failing) parse success if no error was returned
+// AND the whole input was consumed.
+func TestParseFailures(t *testing.T) {
+	expr := func(p *parser) error {
+		_, err := p.parseExpr()
+		return err
+	}
+
+	tests := []struct {
+		f    func(p *parser) error
+		in   string
+		desc string
+	}{
+		{expr, `0b337`, "binary literal"},
+		{expr, `"foo\`, "unterminated string"},
+		{expr, `"foo" AND "bar"`, "logical operation on string literals"},
+	}
+	for _, test := range tests {
+		p := newParser(test.in)
+		if test.f(p) == nil && p.Rem() == "" {
+			t.Errorf("%s: parsing [%s] succeeded, should have failed", test.desc, test.in)
+		}
+	}
+}
diff --git a/spanner/spansql/sql.go b/spanner/spansql/sql.go
new file mode 100644
index 0000000..d2553d9
--- /dev/null
+++ b/spanner/spansql/sql.go
@@ -0,0 +1,240 @@
+/*
+Copyright 2019 Google LLC
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+
+package spansql
+
+// This file holds SQL methods for rendering the types in types.go
+// as the SQL dialect that this package parses.
+
+import "strconv"
+
+// SQL renders the CREATE TABLE statement in the SQL dialect
+// that this package parses.
+func (ct CreateTable) SQL() string {
+	str := "CREATE TABLE " + ct.Name + " (\n"
+	for _, c := range ct.Columns {
+		str += "  " + c.SQL() + ",\n"
+	}
+	str += ") PRIMARY KEY("
+	for i, c := range ct.PrimaryKey {
+		if i > 0 {
+			str += ", "
+		}
+		str += c.SQL()
+	}
+	str += ")"
+	return str
+}
+
+// SQL renders the CREATE INDEX statement in the SQL dialect
+// that this package parses.
+func (ci CreateIndex) SQL() string {
+	sql := "CREATE INDEX " + ci.Name + " ON " + ci.Table + "("
+	for i, kp := range ci.Columns {
+		if i > 0 {
+			sql += ", "
+		}
+		sql += kp.SQL()
+	}
+	return sql + ")"
+}
+
+// SQL renders the DROP TABLE statement.
+func (dt DropTable) SQL() string {
+	return "DROP TABLE " + dt.Name
+}
+
+// SQL renders the DROP INDEX statement.
+func (di DropIndex) SQL() string {
+	return "DROP INDEX " + di.Name
+}
+
+// SQL renders the ALTER TABLE statement, delegating to its alteration.
+func (at AlterTable) SQL() string {
+	return "ALTER TABLE " + at.Name + " " + at.Alteration.SQL()
+}
+
+// SQL renders the ADD COLUMN clause of an ALTER TABLE statement.
+func (ac AddColumn) SQL() string {
+	return "ADD COLUMN " + ac.Def.SQL()
+}
+
+// SQL renders the DROP COLUMN clause of an ALTER TABLE statement.
+func (dc DropColumn) SQL() string {
+	return "DROP COLUMN " + dc.Name
+}
+
+// SQL renders the SET ON DELETE clause of an ALTER TABLE statement.
+func (sod SetOnDelete) SQL() string {
+	switch sod {
+	case NoActionOnDelete:
+		return "SET ON DELETE NO ACTION"
+	case CascadeOnDelete:
+		return "SET ON DELETE CASCADE"
+	}
+	panic("unknown SetOnDelete")
+}
+
+// TODO func (ac AlterColumn) SQL() string { }
+
+// SQL renders the column definition as it appears in CREATE TABLE
+// and ALTER TABLE statements.
+func (cd ColumnDef) SQL() string {
+	sql := cd.Name + " " + cd.Type.SQL()
+	if !cd.NotNull {
+		return sql
+	}
+	return sql + " NOT NULL"
+}
+
+// SQL renders the column type, including any length parameter and
+// ARRAY<...> wrapper.
+func (t Type) SQL() string {
+	str := t.Base.SQL()
+	if t.Base == String || t.Base == Bytes {
+		// STRING and BYTES are parameterized by a length, which may be MAX.
+		str += "("
+		if t.Len == MaxLen {
+			str += "MAX"
+		} else {
+			str += strconv.FormatInt(t.Len, 10)
+		}
+		str += ")"
+	}
+	if t.Array {
+		str = "ARRAY<" + str + ">"
+	}
+	return str
+}
+
+// SQL renders the name of the base type.
+func (tb TypeBase) SQL() string {
+	switch tb {
+	case Bool:
+		return "BOOL"
+	case Int64:
+		return "INT64"
+	case Float64:
+		return "FLOAT64"
+	case String:
+		return "STRING"
+	case Bytes:
+		return "BYTES"
+	case Date:
+		return "DATE"
+	case Timestamp:
+		return "TIMESTAMP"
+	}
+	panic("unknown TypeBase")
+}
+
+// SQL renders the key part as it appears in a primary key or
+// index definition.
+func (kp KeyPart) SQL() string {
+	if kp.Desc {
+		return kp.Column + " DESC"
+	}
+	return kp.Column
+}
+
+// SQL renders the query, including its ORDER BY and LIMIT clauses.
+func (q Query) SQL() string {
+	str := q.Select.SQL()
+	if len(q.Order) > 0 {
+		str += " ORDER BY "
+		for i, o := range q.Order {
+			if i > 0 {
+				str += ", "
+			}
+			str += o.SQL()
+		}
+	}
+	if q.Limit != nil {
+		str += " LIMIT " + q.Limit.SQL()
+	}
+	return str
+}
+
+// SQL renders the SELECT statement, including its FROM and WHERE clauses.
+func (sel Select) SQL() string {
+	str := "SELECT "
+	for i, e := range sel.List {
+		if i > 0 {
+			str += ", "
+		}
+		str += e.SQL()
+	}
+	if len(sel.From) > 0 {
+		str += " FROM "
+		for i, f := range sel.From {
+			if i > 0 {
+				str += ", "
+			}
+			str += f.Table
+		}
+	}
+	if sel.Where != nil {
+		str += " WHERE " + sel.Where.SQL()
+	}
+	return str
+}
+
+// SQL renders one term of an ORDER BY clause.
+func (o Order) SQL() string {
+	if o.Desc {
+		return o.Expr.SQL() + " DESC"
+	}
+	return o.Expr.SQL()
+}
+
+// SQL renders the logical operation. NOT is unary and uses only RHS.
+func (lo LogicalOp) SQL() string {
+	switch lo.Op {
+	default:
+		panic("unknown LogicalOp")
+	case And:
+		return lo.LHS.SQL() + " AND " + lo.RHS.SQL()
+	case Or:
+		return lo.LHS.SQL() + " OR " + lo.RHS.SQL()
+	case Not:
+		return "NOT " + lo.RHS.SQL()
+	}
+}
+
+// compOps maps each comparison operator to its SQL spelling.
+var compOps = map[ComparisonOperator]string{
+	Lt:      "<",
+	Le:      "<=",
+	Gt:      ">",
+	Ge:      ">=",
+	Eq:      "=",
+	Ne:      "!=",
+	Like:    "LIKE",
+	NotLike: "NOT LIKE",
+}
+
+// SQL renders the comparison expression.
+func (co ComparisonOp) SQL() string {
+	op, ok := compOps[co.Op]
+	if !ok {
+		panic("unknown ComparisonOp")
+	}
+	return co.LHS.SQL() + " " + op + " " + co.RHS.SQL()
+}
+
+// SQL renders the IS / IS NOT expression.
+func (io IsOp) SQL() string {
+	op := " IS "
+	if io.Neg {
+		op = " IS NOT "
+	}
+	return io.LHS.SQL() + op + io.RHS.SQL()
+}
+
+// SQL renders the identifier.
+func (id ID) SQL() string { return string(id) }
+
+// SQL renders the query parameter with its "@" prefix.
+func (p Param) SQL() string { return "@" + string(p) }
+
+// SQL renders the boolean literal.
+func (b BoolLiteral) SQL() string {
+	if b {
+		return "TRUE"
+	}
+	return "FALSE"
+}
+
+// SQL renders the NULL literal.
+func (n NullLiteral) SQL() string { return "NULL" }
+
+// SQL renders the integer literal in decimal.
+// Use FormatInt rather than Itoa: IntegerLiteral is an int64, and going
+// through int would truncate large values on 32-bit platforms.
+func (il IntegerLiteral) SQL() string { return strconv.FormatInt(int64(il), 10) }
+
+// SQL renders the floating-point literal in shortest round-trip form.
+func (fl FloatLiteral) SQL() string { return strconv.FormatFloat(float64(fl), 'g', -1, 64) }
+
+// SQL renders the string literal as a quoted, escaped string.
+func (sl StringLiteral) SQL() string { return strconv.Quote(string(sl)) }
diff --git a/spanner/spansql/sql_test.go b/spanner/spansql/sql_test.go
new file mode 100644
index 0000000..970f364
--- /dev/null
+++ b/spanner/spansql/sql_test.go
@@ -0,0 +1,185 @@
+/*
+Copyright 2019 Google LLC
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+
+package spansql
+
+import (
+ "reflect"
+ "testing"
+)
+
+// TestSQL checks that the SQL methods render the expected text, and —
+// as a round-trip sanity check — that re-parsing that text reproduces
+// the original value.
+func TestSQL(t *testing.T) {
+	reparseDDL := func(s string) (interface{}, error) {
+		ddl, err := ParseDDLStmt(s)
+		return ddl, err
+	}
+	reparseQuery := func(s string) (interface{}, error) {
+		q, err := ParseQuery(s)
+		return q, err
+	}
+
+	tests := []struct {
+		data    interface{ SQL() string }
+		sql     string
+		reparse func(string) (interface{}, error)
+	}{
+		{
+			CreateTable{
+				Name: "Ta",
+				Columns: []ColumnDef{
+					{Name: "Ca", Type: Type{Base: Bool}, NotNull: true},
+					{Name: "Cb", Type: Type{Base: Int64}},
+					{Name: "Cc", Type: Type{Base: Float64}},
+					{Name: "Cd", Type: Type{Base: String, Len: 17}},
+					{Name: "Ce", Type: Type{Base: String, Len: MaxLen}},
+					{Name: "Cf", Type: Type{Base: Bytes, Len: 4711}},
+					{Name: "Cg", Type: Type{Base: Bytes, Len: MaxLen}},
+					{Name: "Ch", Type: Type{Base: Date}},
+					{Name: "Ci", Type: Type{Base: Timestamp}},
+					{Name: "Cj", Type: Type{Array: true, Base: Int64}},
+					{Name: "Ck", Type: Type{Array: true, Base: String, Len: MaxLen}},
+				},
+				PrimaryKey: []KeyPart{
+					{Column: "Ca"},
+					{Column: "Cb", Desc: true},
+				},
+			},
+			`CREATE TABLE Ta (
+  Ca BOOL NOT NULL,
+  Cb INT64,
+  Cc FLOAT64,
+  Cd STRING(17),
+  Ce STRING(MAX),
+  Cf BYTES(4711),
+  Cg BYTES(MAX),
+  Ch DATE,
+  Ci TIMESTAMP,
+  Cj ARRAY<INT64>,
+  Ck ARRAY<STRING(MAX)>,
+) PRIMARY KEY(Ca, Cb DESC)`,
+			reparseDDL,
+		},
+		{
+			DropTable{
+				Name: "Ta",
+			},
+			"DROP TABLE Ta",
+			reparseDDL,
+		},
+		{
+			CreateIndex{
+				Name:  "Ia",
+				Table: "Ta",
+				Columns: []KeyPart{
+					{Column: "Ca"},
+					{Column: "Cb", Desc: true},
+				},
+			},
+			"CREATE INDEX Ia ON Ta(Ca, Cb DESC)",
+			reparseDDL,
+		},
+		{
+			DropIndex{
+				Name: "Ia",
+			},
+			"DROP INDEX Ia",
+			reparseDDL,
+		},
+		{
+			AlterTable{
+				Name:       "Ta",
+				Alteration: AddColumn{Def: ColumnDef{Name: "Ca", Type: Type{Base: Bool}}},
+			},
+			"ALTER TABLE Ta ADD COLUMN Ca BOOL",
+			reparseDDL,
+		},
+		{
+			AlterTable{
+				Name:       "Ta",
+				Alteration: DropColumn{Name: "Ca"},
+			},
+			"ALTER TABLE Ta DROP COLUMN Ca",
+			reparseDDL,
+		},
+		{
+			AlterTable{
+				Name:       "Ta",
+				Alteration: NoActionOnDelete,
+			},
+			"ALTER TABLE Ta SET ON DELETE NO ACTION",
+			reparseDDL,
+		},
+		{
+			AlterTable{
+				Name:       "Ta",
+				Alteration: CascadeOnDelete,
+			},
+			"ALTER TABLE Ta SET ON DELETE CASCADE",
+			reparseDDL,
+		},
+		{
+			Query{
+				Select: Select{
+					List: []Expr{ID("A"), ID("B")},
+					From: []SelectFrom{{Table: "Table"}},
+					Where: LogicalOp{
+						LHS: ComparisonOp{
+							LHS: ID("C"),
+							Op:  Lt,
+							RHS: StringLiteral("whelp"),
+						},
+						Op: And,
+						RHS: IsOp{
+							LHS: ID("D"),
+							Neg: true,
+							RHS: Null,
+						},
+					},
+				},
+				Order: []Order{{Expr: ID("OCol"), Desc: true}},
+				Limit: IntegerLiteral(1000),
+			},
+			`SELECT A, B FROM Table WHERE C < "whelp" AND D IS NOT NULL ORDER BY OCol DESC LIMIT 1000`,
+			reparseQuery,
+		},
+		{
+			Query{
+				Select: Select{
+					List: []Expr{IntegerLiteral(7)},
+				},
+			},
+			`SELECT 7`,
+			reparseQuery,
+		},
+	}
+	for _, test := range tests {
+		sql := test.data.SQL()
+		if sql != test.sql {
+			t.Errorf("%v.SQL() wrong.\n got %s\nwant %s", test.data, sql, test.sql)
+			continue
+		}
+
+		// As a sanity check, confirm that parsing the SQL produces the original input.
+		data, err := test.reparse(sql)
+		if err != nil {
+			t.Errorf("Reparsing %q: %v", sql, err)
+			continue
+		}
+		if !reflect.DeepEqual(data, test.data) {
+			t.Errorf("Reparsing %q wrong.\n got %v\nwant %v", sql, data, test.data)
+		}
+	}
+}
diff --git a/spanner/spansql/types.go b/spanner/spansql/types.go
new file mode 100644
index 0000000..4718f6d
--- /dev/null
+++ b/spanner/spansql/types.go
@@ -0,0 +1,285 @@
+/*
+Copyright 2019 Google LLC
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+
+package spansql
+
+// This file holds the type definitions for the SQL dialect.
+
+import (
+ "math"
+)
+
+// CreateTable represents a CREATE TABLE statement.
+// https://cloud.google.com/spanner/docs/data-definition-language#create_table
+type CreateTable struct {
+	Name       string
+	Columns    []ColumnDef
+	PrimaryKey []KeyPart
+}
+
+// CreateIndex represents a CREATE INDEX statement.
+// https://cloud.google.com/spanner/docs/data-definition-language#create-index
+type CreateIndex struct {
+	Name    string
+	Table   string
+	Columns []KeyPart
+
+	// TODO: UNIQUE, NULL_FILTERED, storing_clause, interleave_clause
+}
+
+// DropTable represents a DROP TABLE statement.
+// https://cloud.google.com/spanner/docs/data-definition-language#drop_table
+type DropTable struct{ Name string }
+
+// DropIndex represents a DROP INDEX statement.
+// https://cloud.google.com/spanner/docs/data-definition-language#drop-index
+type DropIndex struct{ Name string }
+
+// AlterTable represents an ALTER TABLE statement.
+// https://cloud.google.com/spanner/docs/data-definition-language#alter_table
+type AlterTable struct {
+	Name       string
+	Alteration TableAlteration
+}
+
+// TableAlteration is satisfied by AddColumn, DropColumn and SetOnDelete.
+type TableAlteration interface {
+	isTableAlteration()
+	SQL() string
+}
+
+func (AddColumn) isTableAlteration()   {}
+func (DropColumn) isTableAlteration()  {}
+func (SetOnDelete) isTableAlteration() {}
+
+//func (AlterColumn) isTableAlteration() {}
+
+// AddColumn represents an ADD COLUMN alteration in an ALTER TABLE statement.
+type AddColumn struct{ Def ColumnDef }
+
+// DropColumn represents a DROP COLUMN alteration in an ALTER TABLE statement.
+type DropColumn struct{ Name string }
+
+// SetOnDelete represents a SET ON DELETE alteration in an ALTER TABLE statement.
+type SetOnDelete int
+
+// The ON DELETE behaviors that SetOnDelete may specify.
+const (
+	NoActionOnDelete SetOnDelete = iota
+	CascadeOnDelete
+)
+
+/* TODO
+type AlterColumn struct {
+}
+*/
+
+// ColumnDef represents a column definition as part of a CREATE TABLE
+// or ALTER TABLE statement.
+type ColumnDef struct {
+	Name    string
+	Type    Type
+	NotNull bool
+}
+
+// Type represents a column type.
+type Type struct {
+	Array bool
+	Base  TypeBase // Bool, Int64, Float64, String, Bytes, Date, Timestamp
+	Len   int64    // if Base is String or Bytes; may be MaxLen
+}
+
+// MaxLen is a sentinel for Type's Len field, representing the MAX value.
+const MaxLen = math.MaxInt64
+
+// TypeBase is the base of a column type, ignoring any ARRAY wrapper
+// and length parameter.
+type TypeBase int
+
+// The set of base column types.
+const (
+	Bool TypeBase = iota
+	Int64
+	Float64
+	String
+	Bytes
+	Date
+	Timestamp
+)
+
+// KeyPart represents a column specification as part of a primary key or index definition.
+type KeyPart struct {
+	Column string
+	Desc   bool
+}
+
+// Query represents a query statement.
+// https://cloud.google.com/spanner/docs/query-syntax#sql-syntax
+type Query struct {
+	Select Select
+	Order  []Order
+	Limit  Limit
+}
+
+// Select represents a SELECT statement.
+// https://cloud.google.com/spanner/docs/query-syntax#select-list
+type Select struct {
+	List  []Expr
+	From  []SelectFrom
+	Where BoolExpr
+	// TODO: GroupBy, Having
+}
+
+// SelectFrom represents one element of a SELECT statement's FROM clause.
+type SelectFrom struct {
+	// This only supports a FROM clause directly from a table.
+	Table string
+}
+
+// Order represents one term of an ORDER BY clause.
+type Order struct {
+	Expr Expr
+	Desc bool
+}
+
+// BoolExpr is an expression that evaluates to a boolean.
+type BoolExpr interface {
+	isBoolExpr()
+	Expr
+}
+
+// Expr is an expression in a SQL statement.
+type Expr interface {
+	isExpr()
+	SQL() string
+}
+
+// Limit is a value that may appear in a LIMIT clause.
+type Limit interface {
+	isLimit()
+	SQL() string
+}
+
+// LogicalOp represents a logical operation (AND, OR, NOT).
+type LogicalOp struct {
+	Op       LogicalOperator
+	LHS, RHS BoolExpr // only RHS is set for Not
+}
+
+func (LogicalOp) isBoolExpr() {}
+func (LogicalOp) isExpr()     {}
+
+// LogicalOperator enumerates the logical operators.
+type LogicalOperator int
+
+const (
+	And LogicalOperator = iota
+	Or
+	Not
+)
+
+// ComparisonOp represents a comparison operation such as "<" or LIKE.
+type ComparisonOp struct {
+	LHS, RHS Expr
+	Op       ComparisonOperator
+
+	// TODO: BETWEEN; it needs a third operand.
+}
+
+func (ComparisonOp) isBoolExpr() {}
+func (ComparisonOp) isExpr()     {}
+
+// ComparisonOperator enumerates the comparison operators.
+type ComparisonOperator int
+
+const (
+	Lt ComparisonOperator = iota
+	Le
+	Gt
+	Ge
+	Eq
+	Ne // both "!=" and "<>"
+	Like
+	NotLike
+)
+
+// IsOp represents an IS or IS NOT operation.
+type IsOp struct {
+	LHS Expr
+	Neg bool
+	RHS IsExpr
+}
+
+func (IsOp) isBoolExpr() {}
+func (IsOp) isExpr()     {}
+
+// IsExpr is an expression that may appear on the right-hand side of
+// an IS or IS NOT operation.
+type IsExpr interface {
+	isIsExpr()
+	isExpr()
+	SQL() string
+}
+
+// ID represents an identifier.
+type ID string
+
+func (ID) isBoolExpr() {} // possibly bool
+func (ID) isExpr()     {}
+
+// Param represents a query parameter.
+type Param string
+
+func (Param) isBoolExpr() {} // possibly bool
+func (Param) isExpr()     {}
+func (Param) isLimit()    {}
+
+// BoolLiteral represents the TRUE and FALSE literals.
+type BoolLiteral bool
+
+const (
+	True  = BoolLiteral(true)
+	False = BoolLiteral(false)
+)
+
+func (BoolLiteral) isBoolExpr() {}
+func (BoolLiteral) isIsExpr()   {}
+func (BoolLiteral) isExpr()     {}
+
+// NullLiteral represents the NULL literal.
+type NullLiteral int
+
+// Null is the NULL literal.
+const Null = NullLiteral(0)
+
+func (NullLiteral) isIsExpr() {}
+func (NullLiteral) isExpr()   {}
+
+// IntegerLiteral represents an integer literal.
+// https://cloud.google.com/spanner/docs/lexical#integer-literals
+type IntegerLiteral int64
+
+func (IntegerLiteral) isLimit() {}
+func (IntegerLiteral) isExpr()  {}
+
+// FloatLiteral represents a floating point literal.
+// https://cloud.google.com/spanner/docs/lexical#floating-point-literals
+type FloatLiteral float64
+
+func (FloatLiteral) isExpr() {}
+
+// StringLiteral represents a string literal.
+// https://cloud.google.com/spanner/docs/lexical#string-and-bytes-literals
+type StringLiteral string
+
+func (StringLiteral) isExpr() {}
+
+// DDL
+// https://cloud.google.com/spanner/docs/data-definition-language#ddl_syntax
+
+// DDL represents a Data Definition Language (DDL) file.
+type DDL struct {
+	List []DDLStmt
+}
+
+// DDLStmt is satisfied by a type that can appear in a DDL.
+type DDLStmt interface {
+	isDDLStmt()
+	SQL() string
+}
+
+// The set of statement types that may appear in a DDL file.
+func (CreateTable) isDDLStmt() {}
+func (CreateIndex) isDDLStmt() {}
+func (AlterTable) isDDLStmt()  {}
+func (DropTable) isDDLStmt()   {}
+func (DropIndex) isDDLStmt()   {}