src/dialect/postgresql.rs - datafusion-sqlparser-rs - Git at Google

 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 // http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.
 use log::debug;

 use crate::ast::{CommentObject, Statement};
 use crate::dialect::{Dialect, Precedence};
 use crate::keywords::Keyword;
 use crate::parser::{Parser, ParserError};
 use crate::tokenizer::Token;

 /// A [`Dialect`] for [PostgreSQL](https://www.postgresql.org/)
 ///
 /// The struct has no fields; all PostgreSQL-specific behaviour lives in its
 /// [`Dialect`] implementation.
 #[derive(Debug)]
 pub struct PostgreSqlDialect {}

 // Precedence values handed out by `PostgreSqlDialect::prec_value` and
 // `PostgreSqlDialect::get_next_precedence`, listed from the largest value to the smallest.
 // NOTE(review): the ordering appears to follow the operator-precedence table in the
 // PostgreSQL manual (section "Operator Precedence") — confirm before changing any value.
 const DOUBLE_COLON_PREC: u8 = 140;
 const BRACKET_PREC: u8 = 130;
 const COLLATE_PREC: u8 = 120;
 const AT_TZ_PREC: u8 = 110;
 const CARET_PREC: u8 = 100;
 const MUL_DIV_MOD_OP_PREC: u8 = 90;
 const PLUS_MINUS_PREC: u8 = 80;
 // there's no XOR operator in PostgreSQL, but support it here to avoid breaking tests
 const XOR_PREC: u8 = 75;
 // Shared by `Precedence::Ampersand`, `Precedence::Pipe`, `Precedence::PgOther` and the
 // operator tokens matched in `get_next_precedence`.
 const PG_OTHER_PREC: u8 = 70;
 // Shared by `Precedence::Between` and `Precedence::Like`.
 const BETWEEN_LIKE_PREC: u8 = 60;
 const EQ_PREC: u8 = 50;
 const IS_PREC: u8 = 40;
 const NOT_PREC: u8 = 30;
 const AND_PREC: u8 = 20;
 const OR_PREC: u8 = 10;

 impl Dialect for PostgreSqlDialect {
     /// Identifiers are quoted with a double quote, regardless of the identifier given.
     fn identifier_quote_style(&self, _identifier: &str) -> Option<char> {
         Some('"')
     }

     /// Only a double quote opens a delimited identifier; Postgres does not support
     /// backticks to quote identifiers.
     fn is_delimited_identifier_start(&self, ch: char) -> bool {
         matches!(ch, '"')
     }

     /// Returns `true` when `ch` may begin an unquoted identifier: an underscore or any
     /// character accepted by [`char::is_alphabetic`].
     ///
     /// See <https://www.postgresql.org/docs/11/sql-syntax-lexical.html#SQL-SYNTAX-IDENTIFIERS>
     fn is_identifier_start(&self, ch: char) -> bool {
         ch == '_' || ch.is_alphabetic()
     }

     /// Returns `true` when `ch` may continue an unquoted identifier: `$`, `_`, an ASCII
     /// digit, or any character accepted by [`char::is_alphabetic`].
     fn is_identifier_part(&self, ch: char) -> bool {
         matches!(ch, '$' | '_') || ch.is_ascii_digit() || ch.is_alphabetic()
     }

     /// This dialect reports support for Unicode string literals.
     fn supports_unicode_string_literal(&self) -> bool {
         true
     }

     /// Returns `true` when `ch` is one of the characters accepted as part of a custom
     /// operator.
     ///
     /// See <https://www.postgresql.org/docs/current/sql-createoperator.html>
     fn is_custom_operator_part(&self, ch: char) -> bool {
         matches!(
             ch,
             '+' | '-'
                 | '*'
                 | '/'
                 | '%'
                 | '^'
                 | '<'
                 | '>'
                 | '='
                 | '&'
                 | '|'
                 | '~'
                 | '!'
                 | '@'
                 | '#'
                 | '`'
                 | '?'
         )
     }

     /// Peeks at the next token and returns a dialect-specific precedence for it, or
     /// `None` when this dialect has nothing custom to say about the token.
     fn get_next_precedence(&self, parser: &Parser) -> Option<Result<u8, ParserError>> {
         let next = parser.peek_token();
         debug!("get_next_precedence() {:?}", next);

         // A custom value is produced only when the behaviour (not merely the numeric
         // value) differs from the default implementation; every other token yields `None`.
         let precedence = match next.token {
             Token::LBracket => BRACKET_PREC,
             Token::Word(w) if w.keyword == Keyword::COLLATE => COLLATE_PREC,
             Token::Arrow
             | Token::LongArrow
             | Token::HashArrow
             | Token::HashLongArrow
             | Token::AtArrow
             | Token::ArrowAt
             | Token::HashMinus
             | Token::AtQuestion
             | Token::AtAt
             | Token::Question
             | Token::QuestionAnd
             | Token::QuestionPipe
             | Token::ExclamationMark
             | Token::Overlap
             | Token::CaretAt
             | Token::StringConcat
             | Token::Sharp
             | Token::ShiftRight
             | Token::ShiftLeft
             | Token::CustomBinaryOperator(_) => PG_OTHER_PREC,
             _ => return None,
         };
         Some(Ok(precedence))
     }

     /// Handles statements starting with the `COMMENT` keyword by delegating to
     /// [`parse_comment`]; returns `None` for anything else.
     fn parse_statement(&self, parser: &mut Parser) -> Option<Result<Statement, ParserError>> {
         if !parser.parse_keyword(Keyword::COMMENT) {
             return None;
         }
         Some(parse_comment(parser))
     }

     /// This dialect reports support for `FILTER` during aggregation.
     fn supports_filter_during_aggregation(&self) -> bool {
         true
     }

     /// This dialect reports support for expressions in `GROUP BY`.
     fn supports_group_by_expr(&self) -> bool {
         true
     }

     /// Maps each [`Precedence`] level onto this dialect's numeric precedence constant.
     fn prec_value(&self, prec: Precedence) -> u8 {
         match prec {
             Precedence::DoubleColon => DOUBLE_COLON_PREC,
             Precedence::AtTz => AT_TZ_PREC,
             Precedence::Caret => CARET_PREC,
             Precedence::MulDivModOp => MUL_DIV_MOD_OP_PREC,
             Precedence::PlusMinus => PLUS_MINUS_PREC,
             Precedence::Xor => XOR_PREC,
             Precedence::Ampersand | Precedence::Pipe | Precedence::PgOther => PG_OTHER_PREC,
             Precedence::Between | Precedence::Like => BETWEEN_LIKE_PREC,
             Precedence::Eq => EQ_PREC,
             Precedence::Is => IS_PREC,
             Precedence::UnaryNot => NOT_PREC,
             Precedence::And => AND_PREC,
             Precedence::Or => OR_PREC,
         }
     }
 }

 /// Parses the remainder of a `COMMENT` statement, starting right after the `COMMENT`
 /// keyword: `[IF EXISTS] ON {COLUMN | TABLE} <object name> IS {NULL | '<text>'}`.
 ///
 /// # Errors
 ///
 /// Returns a [`ParserError`] when `ON` or `IS` is missing, when the object type is
 /// neither `COLUMN` nor `TABLE`, or when the object name or comment literal fails to parse.
 pub fn parse_comment(parser: &mut Parser) -> Result<Statement, ParserError> {
     let if_exists = parser.parse_keywords(&[Keyword::IF, Keyword::EXISTS]);
     parser.expect_keyword(Keyword::ON)?;

     // The token after `ON` selects the kind of object being commented on.
     let kind_token = parser.next_token();
     let object_type = match kind_token.token {
         Token::Word(w) if w.keyword == Keyword::COLUMN => CommentObject::Column,
         Token::Word(w) if w.keyword == Keyword::TABLE => CommentObject::Table,
         _ => return parser.expected("comment object_type", kind_token),
     };
     let object_name = parser.parse_object_name(false)?;

     parser.expect_keyword(Keyword::IS)?;
     // `IS NULL` carries no comment text; otherwise a string literal must follow.
     let is_null = parser.parse_keyword(Keyword::NULL);
     let comment = if is_null {
         None
     } else {
         Some(parser.parse_literal_string()?)
     };

     Ok(Statement::Comment {
         object_type,
         object_name,
         comment,
         if_exists,
     })
 }
	// Licensed under the Apache License, Version 2.0 (the "License");
	// you may not use this file except in compliance with the License.
	// You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS,
	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	// See the License for the specific language governing permissions and
	// limitations under the License.
	use log::debug;

	use crate::ast::{CommentObject, Statement};
	use crate::dialect::{Dialect, Precedence};
	use crate::keywords::Keyword;
	use crate::parser::{Parser, ParserError};
	use crate::tokenizer::Token;

	/// A [`Dialect`] for [PostgreSQL](https://www.postgresql.org/)
	///
	/// The struct has no fields; all PostgreSQL-specific behaviour lives in its
	/// [`Dialect`] implementation.
	#[derive(Debug)]
	pub struct PostgreSqlDialect {}

	// Precedence values handed out by `PostgreSqlDialect::prec_value` and
	// `PostgreSqlDialect::get_next_precedence`, listed from the largest value to the smallest.
	// NOTE(review): the ordering appears to follow the operator-precedence table in the
	// PostgreSQL manual (section "Operator Precedence") — confirm before changing any value.
	const DOUBLE_COLON_PREC: u8 = 140;
	const BRACKET_PREC: u8 = 130;
	const COLLATE_PREC: u8 = 120;
	const AT_TZ_PREC: u8 = 110;
	const CARET_PREC: u8 = 100;
	const MUL_DIV_MOD_OP_PREC: u8 = 90;
	const PLUS_MINUS_PREC: u8 = 80;
	// there's no XOR operator in PostgreSQL, but support it here to avoid breaking tests
	const XOR_PREC: u8 = 75;
	// Shared by `Precedence::Ampersand`, `Precedence::Pipe`, `Precedence::PgOther` and the
	// operator tokens matched in `get_next_precedence`.
	const PG_OTHER_PREC: u8 = 70;
	// Shared by `Precedence::Between` and `Precedence::Like`.
	const BETWEEN_LIKE_PREC: u8 = 60;
	const EQ_PREC: u8 = 50;
	const IS_PREC: u8 = 40;
	const NOT_PREC: u8 = 30;
	const AND_PREC: u8 = 20;
	const OR_PREC: u8 = 10;

	impl Dialect for PostgreSqlDialect {
	fn identifier_quote_style(&self, _identifier: &str) -> Option<char> {
	Some('"')
	}

	fn is_delimited_identifier_start(&self, ch: char) -> bool {
	ch == '"' // Postgres does not support backticks to quote identifiers
	}

	fn is_identifier_start(&self, ch: char) -> bool {
	// See https://www.postgresql.org/docs/11/sql-syntax-lexical.html#SQL-SYNTAX-IDENTIFIERS
	// We don't yet support identifiers beginning with "letters with
	// diacritical marks"
	ch.is_alphabetic() \|\| ch == '_'
	}

	fn is_identifier_part(&self, ch: char) -> bool {
	ch.is_alphabetic() \|\| ch.is_ascii_digit() \|\| ch == '$' \|\| ch == '_'
	}

	fn supports_unicode_string_literal(&self) -> bool {
	true
	}

	/// See <https://www.postgresql.org/docs/current/sql-createoperator.html>
	fn is_custom_operator_part(&self, ch: char) -> bool {
	matches!(
	ch,
	'+' \| '-'
	\| '*'
	\| '/'
	\| '<'
	\| '>'
	\| '='
	\| '~'
	\| '!'
	\| '@'
	\| '#'
	\| '%'
	\| '^'
	\| '&'
	\| '\|'
	\| '`'
	\| '?'
	)
	}

	fn get_next_precedence(&self, parser: &Parser) -> Option<Result<u8, ParserError>> {
	let token = parser.peek_token();
	debug!("get_next_precedence() {:?}", token);

	// we only return some custom value here when the behaviour (not merely the numeric value) differs
	// from the default implementation
	match token.token {
	Token::Word(w) if w.keyword == Keyword::COLLATE => Some(Ok(COLLATE_PREC)),
	Token::LBracket => Some(Ok(BRACKET_PREC)),
	Token::Arrow
	\| Token::LongArrow
	\| Token::HashArrow
	\| Token::HashLongArrow
	\| Token::AtArrow
	\| Token::ArrowAt
	\| Token::HashMinus
	\| Token::AtQuestion
	\| Token::AtAt
	\| Token::Question
	\| Token::QuestionAnd
	\| Token::QuestionPipe
	\| Token::ExclamationMark
	\| Token::Overlap
	\| Token::CaretAt
	\| Token::StringConcat
	\| Token::Sharp
	\| Token::ShiftRight
	\| Token::ShiftLeft
	\| Token::CustomBinaryOperator(_) => Some(Ok(PG_OTHER_PREC)),
	_ => None,
	}
	}

	fn parse_statement(&self, parser: &mut Parser) -> Option<Result<Statement, ParserError>> {
	if parser.parse_keyword(Keyword::COMMENT) {
	Some(parse_comment(parser))
	} else {
	None
	}
	}

	fn supports_filter_during_aggregation(&self) -> bool {
	true
	}

	fn supports_group_by_expr(&self) -> bool {
	true
	}

	fn prec_value(&self, prec: Precedence) -> u8 {
	match prec {
	Precedence::DoubleColon => DOUBLE_COLON_PREC,
	Precedence::AtTz => AT_TZ_PREC,
	Precedence::MulDivModOp => MUL_DIV_MOD_OP_PREC,
	Precedence::PlusMinus => PLUS_MINUS_PREC,
	Precedence::Xor => XOR_PREC,
	Precedence::Ampersand => PG_OTHER_PREC,
	Precedence::Caret => CARET_PREC,
	Precedence::Pipe => PG_OTHER_PREC,
	Precedence::Between => BETWEEN_LIKE_PREC,
	Precedence::Eq => EQ_PREC,
	Precedence::Like => BETWEEN_LIKE_PREC,
	Precedence::Is => IS_PREC,
	Precedence::PgOther => PG_OTHER_PREC,
	Precedence::UnaryNot => NOT_PREC,
	Precedence::And => AND_PREC,
	Precedence::Or => OR_PREC,
	}
	}
	}

	/// Parses the remainder of a `COMMENT` statement, starting right after the `COMMENT`
	/// keyword: `[IF EXISTS] ON {COLUMN | TABLE} <object name> IS {NULL | '<text>'}`.
	///
	/// # Errors
	///
	/// Returns a [`ParserError`] when `ON` or `IS` is missing, when the object type is
	/// neither `COLUMN` nor `TABLE`, or when the object name or comment literal fails to parse.
	pub fn parse_comment(parser: &mut Parser) -> Result<Statement, ParserError> {
	    let if_exists = parser.parse_keywords(&[Keyword::IF, Keyword::EXISTS]);
	    parser.expect_keyword(Keyword::ON)?;

	    // The token after `ON` selects the kind of object being commented on.
	    let kind_token = parser.next_token();
	    let object_type = match kind_token.token {
	        Token::Word(w) if w.keyword == Keyword::COLUMN => CommentObject::Column,
	        Token::Word(w) if w.keyword == Keyword::TABLE => CommentObject::Table,
	        _ => return parser.expected("comment object_type", kind_token),
	    };
	    let object_name = parser.parse_object_name(false)?;

	    parser.expect_keyword(Keyword::IS)?;
	    // `IS NULL` carries no comment text; otherwise a string literal must follow.
	    let is_null = parser.parse_keyword(Keyword::NULL);
	    let comment = if is_null {
	        None
	    } else {
	        Some(parser.parse_literal_string()?)
	    };

	    Ok(Statement::Comment {
	        object_type,
	        object_name,
	        comment,
	        if_exists,
	    })
	}