Skip to content

Commit 5abefc6

Browse files
committed
squash-merge: mssql-go-keyword
1 parent 59f62a6 commit 5abefc6

File tree

7 files changed

+369
-6
lines changed

7 files changed

+369
-6
lines changed

src/ast/mod.rs

Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4339,6 +4339,12 @@ pub enum Statement {
43394339
///
43404340
/// See [ReturnStatement]
43414341
Return(ReturnStatement),
4342+
/// Go (MsSql)
4343+
///
4344+
/// GO is not a Transact-SQL statement; it is a command recognized by various tools as a batch delimiter
4345+
///
4346+
/// See: <https://learn.microsoft.com/en-us/sql/t-sql/language-elements/sql-server-utilities-statements-go>
4347+
Go(GoStatement),
43424348
}
43434349

43444350
/// ```sql
@@ -6166,6 +6172,7 @@ impl fmt::Display for Statement {
61666172
Ok(())
61676173
}
61686174
Statement::Print(s) => write!(f, "{s}"),
6175+
Statement::Go(s) => write!(f, "{s}"),
61696176
Statement::Return(r) => write!(f, "{r}"),
61706177
Statement::List(command) => write!(f, "LIST {command}"),
61716178
Statement::Remove(command) => write!(f, "REMOVE {command}"),
@@ -10074,6 +10081,26 @@ impl fmt::Display for MemberOf {
1007410081
}
1007510082
}
1007610083

10084+
/// A `GO` batch delimiter, optionally followed by a count.
///
/// [MsSql](https://learn.microsoft.com/en-us/sql/t-sql/language-elements/sql-server-utilities-statements-go)
#[derive(Debug, Clone, PartialEq, PartialOrd, Eq, Ord, Hash)]
#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
#[cfg_attr(feature = "visitor", derive(Visit, VisitMut))]
pub struct GoStatement {
    /// The integer written after `GO`, or `None` when `GO` stands alone.
    pub count: Option<u64>,
}

impl Display for GoStatement {
    /// Writes `GO`, followed by a space and the count when one is present.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        match self.count {
            Some(count) => write!(f, "GO {count}"),
            None => write!(f, "GO"),
        }
    }
}
10103+
1007710104
#[cfg(test)]
1007810105
mod tests {
1007910106
use crate::tokenizer::Location;

src/ast/spans.rs

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -530,6 +530,7 @@ impl Spanned for Statement {
530530
Statement::RaisError { .. } => Span::empty(),
531531
Statement::Print { .. } => Span::empty(),
532532
Statement::Return { .. } => Span::empty(),
533+
Statement::Go { .. } => Span::empty(),
533534
Statement::List(..) | Statement::Remove(..) => Span::empty(),
534535
}
535536
}

src/dialect/mssql.rs

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -132,7 +132,13 @@ impl Dialect for MsSqlDialect {
132132
&[GranteesType::Public]
133133
}
134134

135-
fn is_column_alias(&self, kw: &Keyword, _parser: &mut Parser) -> bool {
135+
fn is_column_alias(&self, kw: &Keyword, parser: &mut Parser) -> bool {
136+
// if we find maybe whitespace then a newline looking backward, then `GO` ISN'T a column alias
137+
// if we can't find a newline then we assume that `GO` IS a column alias
138+
if kw == &Keyword::GO && parser.prev_only_whitespace_until_newline() {
139+
return false;
140+
}
141+
136142
!keywords::RESERVED_FOR_COLUMN_ALIAS.contains(kw) && !RESERVED_FOR_COLUMN_ALIAS.contains(kw)
137143
}
138144

src/keywords.rs

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -404,6 +404,7 @@ define_keywords!(
404404
GIN,
405405
GIST,
406406
GLOBAL,
407+
GO,
407408
GRANT,
408409
GRANTED,
409410
GRANTS,

src/parser/mod.rs

Lines changed: 142 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -498,12 +498,23 @@ impl<'a> Parser<'a> {
498498
match self.peek_token().token {
499499
Token::EOF => break,
500500

501+
// end of statement
502+
Token::Word(word) => {
503+
if expecting_statement_delimiter && word.keyword == Keyword::END {
504+
break;
505+
}
506+
507+
if expecting_statement_delimiter && word.keyword == Keyword::GO {
508+
expecting_statement_delimiter = false;
509+
}
510+
},
511+
501512
// don't expect a semicolon statement delimiter after a newline when not otherwise required
502513
Token::Whitespace(Whitespace::Newline) => {
503514
if !self.options.require_semicolon_stmt_delimiter {
504515
expecting_statement_delimiter = false;
505516
}
506-
}
517+
},
507518
_ => {}
508519
}
509520

@@ -512,8 +523,9 @@ impl<'a> Parser<'a> {
512523
}
513524

514525
let statement = self.parse_statement()?;
526+
// Treat batch delimiter as an end of statement, so no additional statement delimiter expected here
527+
expecting_statement_delimiter = !matches!(statement, Statement::Go(_)) && self.options.require_semicolon_stmt_delimiter;
515528
stmts.push(statement);
516-
expecting_statement_delimiter = self.options.require_semicolon_stmt_delimiter;
517529
}
518530
Ok(stmts)
519531
}
@@ -653,6 +665,10 @@ impl<'a> Parser<'a> {
653665
Keyword::COMMENT if self.dialect.supports_comment_on() => self.parse_comment(),
654666
Keyword::PRINT => self.parse_print(),
655667
Keyword::RETURN => self.parse_return(),
668+
Keyword::GO => {
669+
self.prev_token();
670+
self.parse_go()
671+
}
656672
_ => self.expected("an SQL statement", next_token),
657673
},
658674
Token::LParen => {
@@ -4039,6 +4055,17 @@ impl<'a> Parser<'a> {
40394055
})
40404056
}
40414057

4058+
/// Return nth previous token, possibly whitespace
4059+
/// (or [`Token::EOF`] when before the beginning of the stream).
4060+
pub(crate) fn peek_prev_nth_token_no_skip_ref(&self, n: usize) -> &TokenWithSpan {
4061+
// 0 = next token, -1 = current token, -2 = previous token
4062+
let peek_index = self.index.saturating_sub(1).saturating_sub(n);
4063+
if peek_index == 0 {
4064+
return &EOF_TOKEN;
4065+
}
4066+
self.tokens.get(peek_index).unwrap_or(&EOF_TOKEN)
4067+
}
4068+
40424069
/// Return true if the next tokens exactly `expected`
40434070
///
40444071
/// Does not advance the current token.
@@ -4155,6 +4182,29 @@ impl<'a> Parser<'a> {
41554182
)
41564183
}
41574184

4185+
/// Look backwards in the token stream and expect that there was only whitespace tokens until the previous newline or beginning of string
4186+
pub(crate) fn prev_only_whitespace_until_newline(&mut self) -> bool {
4187+
let mut look_back_count = 1;
4188+
loop {
4189+
let prev_token = self.peek_prev_nth_token_no_skip_ref(look_back_count);
4190+
match prev_token.token {
4191+
Token::EOF => break true,
4192+
Token::Whitespace(ref w) => match w {
4193+
Whitespace::Newline => break true,
4194+
// special consideration required for single line comments since that string includes the newline
4195+
Whitespace::SingleLineComment { comment, prefix: _ } => {
4196+
if comment.ends_with('\n') {
4197+
break true;
4198+
}
4199+
look_back_count += 1;
4200+
}
4201+
_ => look_back_count += 1,
4202+
},
4203+
_ => break false,
4204+
};
4205+
}
4206+
}
4207+
41584208
/// If the current token is the `expected` keyword, consume it and returns
41594209
/// true. Otherwise, no tokens are consumed and returns false.
41604210
#[must_use]
@@ -16440,6 +16490,71 @@ impl<'a> Parser<'a> {
1644016490
}
1644116491
}
1644216492

16493+
/// Parse [Statement::Go]
16494+
fn parse_go(&mut self) -> Result<Statement, ParserError> {
16495+
self.expect_keyword_is(Keyword::GO)?;
16496+
16497+
// disambiguate between GO as batch delimiter & GO as identifier (etc)
16498+
// compare:
16499+
// ```sql
16500+
// select 1 go
16501+
// ```
16502+
// vs
16503+
// ```sql
16504+
// select 1
16505+
// go
16506+
// ```
16507+
if !self.prev_only_whitespace_until_newline() {
16508+
parser_err!(
16509+
"GO may only be preceded by whitespace on a line",
16510+
self.peek_token().span.start
16511+
)?;
16512+
}
16513+
16514+
let count = loop {
16515+
// using this peek function because we want to halt this statement parsing upon newline
16516+
let next_token = self.peek_token_no_skip();
16517+
match next_token.token {
16518+
Token::EOF => break None::<u64>,
16519+
Token::Whitespace(ref w) => match w {
16520+
Whitespace::Newline => break None,
16521+
_ => _ = self.next_token_no_skip(),
16522+
},
16523+
Token::Number(s, _) => {
16524+
let value = Some(Self::parse::<u64>(s, next_token.span.start)?);
16525+
self.advance_token();
16526+
break value;
16527+
}
16528+
_ => self.expected("literal int or newline", next_token)?,
16529+
};
16530+
};
16531+
16532+
loop {
16533+
let next_token = self.peek_token_no_skip();
16534+
match next_token.token {
16535+
Token::EOF => break,
16536+
Token::Whitespace(ref w) => match w {
16537+
Whitespace::Newline => break,
16538+
Whitespace::SingleLineComment { comment, prefix: _ } => {
16539+
if comment.ends_with('\n') {
16540+
break;
16541+
}
16542+
_ = self.next_token_no_skip();
16543+
}
16544+
_ => _ = self.next_token_no_skip(),
16545+
},
16546+
_ => {
16547+
parser_err!(
16548+
"GO must be followed by a newline or EOF",
16549+
self.peek_token().span.start
16550+
)?;
16551+
}
16552+
};
16553+
}
16554+
16555+
Ok(Statement::Go(GoStatement { count }))
16556+
}
16557+
1644316558
/// Consume the parser and return its underlying token buffer
1644416559
pub fn into_tokens(self) -> Vec<TokenWithSpan> {
1644516560
self.tokens
@@ -16681,6 +16796,31 @@ mod tests {
1668116796
})
1668216797
}
1668316798

16799+
#[test]
fn test_peek_prev_nth_token_no_skip_ref() {
    let sql = "SELECT 1;\n-- a comment\nRAISERROR('test', 16, 0);";
    all_dialects().run_parser_method(sql, |p| {
        // With index 1 and n = 0 the lookup resolves to position 0, which is
        // reported as EOF; peeking must not move the cursor.
        p.index = 1;
        assert_eq!(p.peek_prev_nth_token_no_skip_ref(0), &Token::EOF);
        assert_eq!(p.index, 1);

        // Place the cursor just past `RAISERROR` and confirm that is the
        // current token.
        p.index = 7;
        let expected_current = Token::Word(Word {
            value: "RAISERROR".to_string(),
            quote_style: None,
            keyword: Keyword::RAISERROR,
        });
        assert_eq!(p.token_at(p.index - 1).token, expected_current);

        // Two tokens back, past the single-line comment, is the newline that
        // follows `SELECT 1;`.
        assert_eq!(
            p.peek_prev_nth_token_no_skip_ref(2),
            &Token::Whitespace(Whitespace::Newline)
        );
    });
}
16823+
1668416824
#[cfg(test)]
1668516825
mod test_parse_data_type {
1668616826
use crate::ast::{

src/test_utils.rs

Lines changed: 9 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -153,7 +153,7 @@ impl TestedDialects {
153153
/// 2. re-serializing the result of parsing `sql` produces the same
154154
/// `canonical` sql string
155155
///
156-
/// For multiple statements, use [`statements_parse_to`].
156+
/// For multiple statements, use [`statements_parse_to`].
157157
pub fn one_statement_parses_to(&self, sql: &str, canonical: &str) -> Statement {
158158
let mut statements = self.parse_sql_statements(sql).expect(sql);
159159
assert_eq!(statements.len(), 1);
@@ -170,8 +170,15 @@ impl TestedDialects {
170170
}
171171

172172
/// The same as [`one_statement_parses_to`] but it works for multiple statements
173-
pub fn statements_parse_to(&self, sql: &str, canonical: &str) -> Vec<Statement> {
173+
pub fn statements_parse_to(
174+
&self,
175+
sql: &str,
176+
statement_count: usize,
177+
canonical: &str,
178+
) -> Vec<Statement> {
174179
let statements = self.parse_sql_statements(sql).expect(sql);
180+
assert_eq!(statements.len(), statement_count);
181+
175182
if !canonical.is_empty() && sql != canonical {
176183
assert_eq!(self.parse_sql_statements(canonical).unwrap(), statements);
177184
} else {

0 commit comments

Comments
 (0)