summaryrefslogtreecommitdiffstats
path: root/sqlglot/generator.py
diff options
context:
space:
mode:
Diffstat (limited to 'sqlglot/generator.py')
-rw-r--r--sqlglot/generator.py1124
1 files changed, 1124 insertions, 0 deletions
diff --git a/sqlglot/generator.py b/sqlglot/generator.py
new file mode 100644
index 0000000..793cff0
--- /dev/null
+++ b/sqlglot/generator.py
@@ -0,0 +1,1124 @@
+import logging
+
+from sqlglot import exp
+from sqlglot.errors import ErrorLevel, UnsupportedError, concat_errors
+from sqlglot.helper import apply_index_offset, csv, ensure_list
+from sqlglot.time import format_time
+from sqlglot.tokens import TokenType
+
+logger = logging.getLogger("sqlglot")
+
+
+class Generator:
+ """
+ Generator interprets the given syntax tree and produces a SQL string as an output.
+
+ Args
+ time_mapping (dict): the dictionary of custom time mappings in which the key
+ represents a python time format and the output the target time format
+ time_trie (trie): a trie of the time_mapping keys
+ pretty (bool): if set to True the returned string will be formatted. Default: False.
+ quote_start (str): specifies which starting character to use to delimit quotes. Default: '.
+ quote_end (str): specifies which ending character to use to delimit quotes. Default: '.
+ identifier_start (str): specifies which starting character to use to delimit identifiers. Default: ".
+ identifier_end (str): specifies which ending character to use to delimit identifiers. Default: ".
+ identify (bool): if set to True all identifiers will be delimited by the corresponding
+ character.
+ normalize (bool): if set to True all identifiers will lower cased
+ escape (str): specifies an escape character. Default: '.
+ pad (int): determines padding in a formatted string. Default: 2.
+ indent (int): determines the size of indentation in a formatted string. Default: 4.
+ unnest_column_only (bool): if true unnest table aliases are considered only as column aliases
+ normalize_functions (str): normalize function names, "upper", "lower", or None
+ Default: "upper"
+ alias_post_tablesample (bool): if the table alias comes after tablesample
+ Default: False
+ unsupported_level (ErrorLevel): determines the generator's behavior when it encounters
+ unsupported expressions. Default ErrorLevel.WARN.
+ null_ordering (str): Indicates the default null ordering method to use if not explicitly set.
+ Options are "nulls_are_small", "nulls_are_large", "nulls_are_last".
+ Default: "nulls_are_small"
+ max_unsupported (int): Maximum number of unsupported messages to include in a raised UnsupportedError.
+ This is only relevant if unsupported_level is ErrorLevel.RAISE.
+ Default: 3
+ """
+
+ TRANSFORMS = {
+ exp.AnonymousProperty: lambda self, e: self.property_sql(e),
+ exp.AutoIncrementProperty: lambda self, e: f"AUTO_INCREMENT={self.sql(e, 'value')}",
+ exp.CharacterSetProperty: lambda self, e: f"{'DEFAULT ' if e.args['default'] else ''}CHARACTER SET={self.sql(e, 'value')}",
+ exp.CollateProperty: lambda self, e: f"COLLATE={self.sql(e, 'value')}",
+ exp.DateAdd: lambda self, e: f"DATE_ADD({self.sql(e, 'this')}, {self.sql(e, 'expression')}, {self.sql(e, 'unit')})",
+ exp.DateDiff: lambda self, e: f"DATE_DIFF({self.sql(e, 'this')}, {self.sql(e, 'expression')})",
+ exp.EngineProperty: lambda self, e: f"ENGINE={self.sql(e, 'value')}",
+ exp.FileFormatProperty: lambda self, e: f"FORMAT={self.sql(e, 'value')}",
+ exp.LocationProperty: lambda self, e: f"LOCATION {self.sql(e, 'value')}",
+ exp.PartitionedByProperty: lambda self, e: f"PARTITIONED_BY={self.sql(e.args['value'])}",
+ exp.SchemaCommentProperty: lambda self, e: f"COMMENT={self.sql(e, 'value')}",
+ exp.TableFormatProperty: lambda self, e: f"TABLE_FORMAT={self.sql(e, 'value')}",
+ exp.TsOrDsAdd: lambda self, e: f"TS_OR_DS_ADD({self.sql(e, 'this')}, {self.sql(e, 'expression')}, {self.sql(e, 'unit')})",
+ }
+
+ NULL_ORDERING_SUPPORTED = True
+
+ TYPE_MAPPING = {
+ exp.DataType.Type.NCHAR: "CHAR",
+ exp.DataType.Type.NVARCHAR: "VARCHAR",
+ }
+
+ TOKEN_MAPPING = {}
+
+ STRUCT_DELIMITER = ("<", ">")
+
+ ROOT_PROPERTIES = [
+ exp.AutoIncrementProperty,
+ exp.CharacterSetProperty,
+ exp.CollateProperty,
+ exp.EngineProperty,
+ exp.SchemaCommentProperty,
+ ]
+ WITH_PROPERTIES = [
+ exp.AnonymousProperty,
+ exp.FileFormatProperty,
+ exp.PartitionedByProperty,
+ exp.TableFormatProperty,
+ ]
+
+ __slots__ = (
+ "time_mapping",
+ "time_trie",
+ "pretty",
+ "configured_pretty",
+ "quote_start",
+ "quote_end",
+ "identifier_start",
+ "identifier_end",
+ "identify",
+ "normalize",
+ "escape",
+ "pad",
+ "index_offset",
+ "unnest_column_only",
+ "alias_post_tablesample",
+ "normalize_functions",
+ "unsupported_level",
+ "unsupported_messages",
+ "null_ordering",
+ "max_unsupported",
+ "_indent",
+ "_replace_backslash",
+ "_escaped_quote_end",
+ )
+
+ def __init__(
+ self,
+ time_mapping=None,
+ time_trie=None,
+ pretty=None,
+ quote_start=None,
+ quote_end=None,
+ identifier_start=None,
+ identifier_end=None,
+ identify=False,
+ normalize=False,
+ escape=None,
+ pad=2,
+ indent=2,
+ index_offset=0,
+ unnest_column_only=False,
+ alias_post_tablesample=False,
+ normalize_functions="upper",
+ unsupported_level=ErrorLevel.WARN,
+ null_ordering=None,
+ max_unsupported=3,
+ ):
+ import sqlglot
+
+ self.time_mapping = time_mapping or {}
+ self.time_trie = time_trie
+ self.pretty = pretty if pretty is not None else sqlglot.pretty
+ self.configured_pretty = self.pretty
+ self.quote_start = quote_start or "'"
+ self.quote_end = quote_end or "'"
+ self.identifier_start = identifier_start or '"'
+ self.identifier_end = identifier_end or '"'
+ self.identify = identify
+ self.normalize = normalize
+ self.escape = escape or "'"
+ self.pad = pad
+ self.index_offset = index_offset
+ self.unnest_column_only = unnest_column_only
+ self.alias_post_tablesample = alias_post_tablesample
+ self.normalize_functions = normalize_functions
+ self.unsupported_level = unsupported_level
+ self.unsupported_messages = []
+ self.max_unsupported = max_unsupported
+ self.null_ordering = null_ordering
+ self._indent = indent
+ self._replace_backslash = self.escape == "\\"
+ self._escaped_quote_end = self.escape + self.quote_end
+
+ def generate(self, expression):
+ """
+ Generates a SQL string by interpreting the given syntax tree.
+
+ Args
+ expression (Expression): the syntax tree.
+
+ Returns
+ the SQL string.
+ """
+ self.unsupported_messages = []
+ sql = self.sql(expression).strip()
+
+ if self.unsupported_level == ErrorLevel.IGNORE:
+ return sql
+
+ if self.unsupported_level == ErrorLevel.WARN:
+ for msg in self.unsupported_messages:
+ logger.warning(msg)
+ elif self.unsupported_level == ErrorLevel.RAISE and self.unsupported_messages:
+ raise UnsupportedError(
+ concat_errors(self.unsupported_messages, self.max_unsupported)
+ )
+
+ return sql
+
+ def unsupported(self, message):
+ if self.unsupported_level == ErrorLevel.IMMEDIATE:
+ raise UnsupportedError(message)
+ self.unsupported_messages.append(message)
+
+ def sep(self, sep=" "):
+ return f"{sep.strip()}\n" if self.pretty else sep
+
+ def seg(self, sql, sep=" "):
+ return f"{self.sep(sep)}{sql}"
+
+ def wrap(self, expression):
+ this_sql = self.indent(
+ self.sql(expression)
+ if isinstance(expression, (exp.Select, exp.Union))
+ else self.sql(expression, "this"),
+ level=1,
+ pad=0,
+ )
+ return f"({self.sep('')}{this_sql}{self.seg(')', sep='')}"
+
+ def no_identify(self, func):
+ original = self.identify
+ self.identify = False
+ result = func()
+ self.identify = original
+ return result
+
+ def normalize_func(self, name):
+ if self.normalize_functions == "upper":
+ return name.upper()
+ if self.normalize_functions == "lower":
+ return name.lower()
+ return name
+
+ def indent(self, sql, level=0, pad=None, skip_first=False, skip_last=False):
+ if not self.pretty:
+ return sql
+
+ pad = self.pad if pad is None else pad
+ lines = sql.split("\n")
+
+ return "\n".join(
+ line
+ if (skip_first and i == 0) or (skip_last and i == len(lines) - 1)
+ else f"{' ' * (level * self._indent + pad)}{line}"
+ for i, line in enumerate(lines)
+ )
+
+ def sql(self, expression, key=None):
+ if not expression:
+ return ""
+
+ if isinstance(expression, str):
+ return expression
+
+ if key:
+ return self.sql(expression.args.get(key))
+
+ transform = self.TRANSFORMS.get(expression.__class__)
+
+ if callable(transform):
+ return transform(self, expression)
+ if transform:
+ return transform
+
+ if not isinstance(expression, exp.Expression):
+ raise ValueError(
+ f"Expected an Expression. Received {type(expression)}: {expression}"
+ )
+
+ exp_handler_name = f"{expression.key}_sql"
+ if hasattr(self, exp_handler_name):
+ return getattr(self, exp_handler_name)(expression)
+
+ if isinstance(expression, exp.Func):
+ return self.function_fallback_sql(expression)
+
+ raise ValueError(f"Unsupported expression type {expression.__class__.__name__}")
+
+ def annotation_sql(self, expression):
+ return self.sql(expression, "expression")
+
+ def uncache_sql(self, expression):
+ table = self.sql(expression, "this")
+ exists_sql = " IF EXISTS" if expression.args.get("exists") else ""
+ return f"UNCACHE TABLE{exists_sql} {table}"
+
+ def cache_sql(self, expression):
+ lazy = " LAZY" if expression.args.get("lazy") else ""
+ table = self.sql(expression, "this")
+ options = expression.args.get("options")
+ options = (
+ f" OPTIONS({self.sql(options[0])} = {self.sql(options[1])})"
+ if options
+ else ""
+ )
+ sql = self.sql(expression, "expression")
+ sql = f" AS{self.sep()}{sql}" if sql else ""
+ sql = f"CACHE{lazy} TABLE {table}{options}{sql}"
+ return self.prepend_ctes(expression, sql)
+
+ def characterset_sql(self, expression):
+ if isinstance(expression.parent, exp.Cast):
+ return f"CHAR CHARACTER SET {self.sql(expression, 'this')}"
+ default = "DEFAULT " if expression.args.get("default") else ""
+ return f"{default}CHARACTER SET={self.sql(expression, 'this')}"
+
+ def column_sql(self, expression):
+ return ".".join(
+ part
+ for part in [
+ self.sql(expression, "db"),
+ self.sql(expression, "table"),
+ self.sql(expression, "this"),
+ ]
+ if part
+ )
+
+ def columndef_sql(self, expression):
+ column = self.sql(expression, "this")
+ kind = self.sql(expression, "kind")
+ constraints = self.expressions(
+ expression, key="constraints", sep=" ", flat=True
+ )
+
+ if not constraints:
+ return f"{column} {kind}"
+ return f"{column} {kind} {constraints}"
+
+ def columnconstraint_sql(self, expression):
+ this = self.sql(expression, "this")
+ kind_sql = self.sql(expression, "kind")
+ return f"CONSTRAINT {this} {kind_sql}" if this else kind_sql
+
+ def autoincrementcolumnconstraint_sql(self, _):
+ return self.token_sql(TokenType.AUTO_INCREMENT)
+
+ def checkcolumnconstraint_sql(self, expression):
+ this = self.sql(expression, "this")
+ return f"CHECK ({this})"
+
+ def commentcolumnconstraint_sql(self, expression):
+ comment = self.sql(expression, "this")
+ return f"COMMENT {comment}"
+
+ def collatecolumnconstraint_sql(self, expression):
+ collate = self.sql(expression, "this")
+ return f"COLLATE {collate}"
+
+ def defaultcolumnconstraint_sql(self, expression):
+ default = self.sql(expression, "this")
+ return f"DEFAULT {default}"
+
+ def notnullcolumnconstraint_sql(self, _):
+ return "NOT NULL"
+
+ def primarykeycolumnconstraint_sql(self, _):
+ return "PRIMARY KEY"
+
+ def uniquecolumnconstraint_sql(self, _):
+ return "UNIQUE"
+
+ def create_sql(self, expression):
+ this = self.sql(expression, "this")
+ kind = self.sql(expression, "kind").upper()
+ expression_sql = self.sql(expression, "expression")
+ expression_sql = f"AS{self.sep()}{expression_sql}" if expression_sql else ""
+ temporary = " TEMPORARY" if expression.args.get("temporary") else ""
+ replace = " OR REPLACE" if expression.args.get("replace") else ""
+ exists_sql = " IF NOT EXISTS" if expression.args.get("exists") else ""
+ unique = " UNIQUE" if expression.args.get("unique") else ""
+ properties = self.sql(expression, "properties")
+
+ expression_sql = f"CREATE{replace}{temporary}{unique} {kind}{exists_sql} {this}{properties} {expression_sql}"
+ return self.prepend_ctes(expression, expression_sql)
+
+ def prepend_ctes(self, expression, sql):
+ with_ = self.sql(expression, "with")
+ if with_:
+ sql = f"{with_}{self.sep()}{sql}"
+ return sql
+
+ def with_sql(self, expression):
+ sql = self.expressions(expression, flat=True)
+ recursive = "RECURSIVE " if expression.args.get("recursive") else ""
+
+ return f"WITH {recursive}{sql}"
+
+ def cte_sql(self, expression):
+ alias = self.sql(expression, "alias")
+ return f"{alias} AS {self.wrap(expression)}"
+
+ def tablealias_sql(self, expression):
+ alias = self.sql(expression, "this")
+ columns = self.expressions(expression, key="columns", flat=True)
+ columns = f"({columns})" if columns else ""
+ return f"{alias}{columns}"
+
+ def bitstring_sql(self, expression):
+ return f"b'{self.sql(expression, 'this')}'"
+
+ def datatype_sql(self, expression):
+ type_value = expression.this
+ type_sql = self.TYPE_MAPPING.get(type_value, type_value.value)
+ nested = ""
+ interior = self.expressions(expression, flat=True)
+ if interior:
+ nested = (
+ f"{self.STRUCT_DELIMITER[0]}{interior}{self.STRUCT_DELIMITER[1]}"
+ if expression.args.get("nested")
+ else f"({interior})"
+ )
+ return f"{type_sql}{nested}"
+
+ def delete_sql(self, expression):
+ this = self.sql(expression, "this")
+ where_sql = self.sql(expression, "where")
+ sql = f"DELETE FROM {this}{where_sql}"
+ return self.prepend_ctes(expression, sql)
+
+ def drop_sql(self, expression):
+ this = self.sql(expression, "this")
+ kind = expression.args["kind"]
+ exists_sql = " IF EXISTS " if expression.args.get("exists") else " "
+ return f"DROP {kind}{exists_sql}{this}"
+
+ def except_sql(self, expression):
+ return self.prepend_ctes(
+ expression,
+ self.set_operation(expression, self.except_op(expression)),
+ )
+
+ def except_op(self, expression):
+ return f"EXCEPT{'' if expression.args.get('distinct') else ' ALL'}"
+
+ def fetch_sql(self, expression):
+ direction = expression.args.get("direction")
+ direction = f" {direction.upper()}" if direction else ""
+ count = expression.args.get("count")
+ count = f" {count}" if count else ""
+ return f"{self.seg('FETCH')}{direction}{count} ROWS ONLY"
+
+ def filter_sql(self, expression):
+ this = self.sql(expression, "this")
+ where = self.sql(expression, "expression")[1:] # where has a leading space
+ return f"{this} FILTER({where})"
+
+ def hint_sql(self, expression):
+ if self.sql(expression, "this"):
+ self.unsupported("Hints are not supported")
+ return ""
+
+ def index_sql(self, expression):
+ this = self.sql(expression, "this")
+ table = self.sql(expression, "table")
+ columns = self.sql(expression, "columns")
+ return f"{this} ON {table} {columns}"
+
+ def identifier_sql(self, expression):
+ value = expression.name
+ value = value.lower() if self.normalize else value
+ if expression.args.get("quoted") or self.identify:
+ return f"{self.identifier_start}{value}{self.identifier_end}"
+ return value
+
+ def partition_sql(self, expression):
+ keys = csv(
+ *[
+ f"{k.args['this']}='{v.args['this']}'" if v else k.args["this"]
+ for k, v in expression.args.get("this")
+ ]
+ )
+ return f"PARTITION({keys})"
+
+ def properties_sql(self, expression):
+ root_properties = []
+ with_properties = []
+
+ for p in expression.expressions:
+ p_class = p.__class__
+ if p_class in self.ROOT_PROPERTIES:
+ root_properties.append(p)
+ elif p_class in self.WITH_PROPERTIES:
+ with_properties.append(p)
+
+ return self.root_properties(
+ exp.Properties(expressions=root_properties)
+ ) + self.with_properties(exp.Properties(expressions=with_properties))
+
+ def root_properties(self, properties):
+ if properties.expressions:
+ return self.sep() + self.expressions(
+ properties,
+ indent=False,
+ sep=" ",
+ )
+ return ""
+
+ def properties(self, properties, prefix="", sep=", "):
+ if properties.expressions:
+ expressions = self.expressions(
+ properties,
+ sep=sep,
+ indent=False,
+ )
+ return f"{self.seg(prefix)}{' ' if prefix else ''}{self.wrap(expressions)}"
+ return ""
+
+ def with_properties(self, properties):
+ return self.properties(
+ properties,
+ prefix="WITH",
+ )
+
+ def property_sql(self, expression):
+ key = expression.name
+ value = self.sql(expression, "value")
+ return f"{key} = {value}"
+
+ def insert_sql(self, expression):
+ kind = "OVERWRITE TABLE" if expression.args.get("overwrite") else "INTO"
+ this = self.sql(expression, "this")
+ exists = " IF EXISTS " if expression.args.get("exists") else " "
+ partition_sql = (
+ self.sql(expression, "partition")
+ if expression.args.get("partition")
+ else ""
+ )
+ expression_sql = self.sql(expression, "expression")
+ sep = self.sep() if partition_sql else ""
+ sql = f"INSERT {kind} {this}{exists}{partition_sql}{sep}{expression_sql}"
+ return self.prepend_ctes(expression, sql)
+
+ def intersect_sql(self, expression):
+ return self.prepend_ctes(
+ expression,
+ self.set_operation(expression, self.intersect_op(expression)),
+ )
+
+ def intersect_op(self, expression):
+ return f"INTERSECT{'' if expression.args.get('distinct') else ' ALL'}"
+
+ def introducer_sql(self, expression):
+ return f"{self.sql(expression, 'this')} {self.sql(expression, 'expression')}"
+
+ def table_sql(self, expression):
+ return ".".join(
+ part
+ for part in [
+ self.sql(expression, "catalog"),
+ self.sql(expression, "db"),
+ self.sql(expression, "this"),
+ ]
+ if part
+ )
+
+ def tablesample_sql(self, expression):
+ if self.alias_post_tablesample and isinstance(expression.this, exp.Alias):
+ this = self.sql(expression.this, "this")
+ alias = f" AS {self.sql(expression.this, 'alias')}"
+ else:
+ this = self.sql(expression, "this")
+ alias = ""
+ method = self.sql(expression, "method")
+ method = f" {method.upper()} " if method else ""
+ numerator = self.sql(expression, "bucket_numerator")
+ denominator = self.sql(expression, "bucket_denominator")
+ field = self.sql(expression, "bucket_field")
+ field = f" ON {field}" if field else ""
+ bucket = f"BUCKET {numerator} OUT OF {denominator}{field}" if numerator else ""
+ percent = self.sql(expression, "percent")
+ percent = f"{percent} PERCENT" if percent else ""
+ rows = self.sql(expression, "rows")
+ rows = f"{rows} ROWS" if rows else ""
+ size = self.sql(expression, "size")
+ return f"{this} TABLESAMPLE{method}({bucket}{percent}{rows}{size}){alias}"
+
+ def tuple_sql(self, expression):
+ return f"({self.expressions(expression, flat=True)})"
+
+ def update_sql(self, expression):
+ this = self.sql(expression, "this")
+ set_sql = self.expressions(expression, flat=True)
+ from_sql = self.sql(expression, "from")
+ where_sql = self.sql(expression, "where")
+ sql = f"UPDATE {this} SET {set_sql}{from_sql}{where_sql}"
+ return self.prepend_ctes(expression, sql)
+
+ def values_sql(self, expression):
+ return f"VALUES{self.seg('')}{self.expressions(expression)}"
+
+ def var_sql(self, expression):
+ return self.sql(expression, "this")
+
+ def from_sql(self, expression):
+ expressions = self.expressions(expression, flat=True)
+ return f"{self.seg('FROM')} {expressions}"
+
+ def group_sql(self, expression):
+ group_by = self.op_expressions("GROUP BY", expression)
+ grouping_sets = self.expressions(expression, key="grouping_sets", indent=False)
+ grouping_sets = (
+ f"{self.seg('GROUPING SETS')} {self.wrap(grouping_sets)}"
+ if grouping_sets
+ else ""
+ )
+ cube = self.expressions(expression, key="cube", indent=False)
+ cube = f"{self.seg('CUBE')} {self.wrap(cube)}" if cube else ""
+ rollup = self.expressions(expression, key="rollup", indent=False)
+ rollup = f"{self.seg('ROLLUP')} {self.wrap(rollup)}" if rollup else ""
+ return f"{group_by}{grouping_sets}{cube}{rollup}"
+
+ def having_sql(self, expression):
+ this = self.indent(self.sql(expression, "this"))
+ return f"{self.seg('HAVING')}{self.sep()}{this}"
+
+ def join_sql(self, expression):
+ op_sql = self.seg(
+ " ".join(op for op in (expression.side, expression.kind, "JOIN") if op)
+ )
+ on_sql = self.sql(expression, "on")
+ using = expression.args.get("using")
+
+ if not on_sql and using:
+ on_sql = csv(*(self.sql(column) for column in using))
+
+ if on_sql:
+ on_sql = self.indent(on_sql, skip_first=True)
+ space = self.seg(" " * self.pad) if self.pretty else " "
+ if using:
+ on_sql = f"{space}USING ({on_sql})"
+ else:
+ on_sql = f"{space}ON {on_sql}"
+
+ expression_sql = self.sql(expression, "expression")
+ this_sql = self.sql(expression, "this")
+ return f"{expression_sql}{op_sql} {this_sql}{on_sql}"
+
+ def lambda_sql(self, expression):
+ args = self.expressions(expression, flat=True)
+ args = f"({args})" if len(args.split(",")) > 1 else args
+ return self.no_identify(lambda: f"{args} -> {self.sql(expression, 'this')}")
+
+ def lateral_sql(self, expression):
+ this = self.sql(expression, "this")
+ op_sql = self.seg(
+ f"LATERAL VIEW{' OUTER' if expression.args.get('outer') else ''}"
+ )
+ alias = expression.args["alias"]
+ table = alias.name
+ table = f" {table}" if table else table
+ columns = self.expressions(alias, key="columns", flat=True)
+ columns = f" AS {columns}" if columns else ""
+ return f"{op_sql}{self.sep()}{this}{table}{columns}"
+
+ def limit_sql(self, expression):
+ this = self.sql(expression, "this")
+ return f"{this}{self.seg('LIMIT')} {self.sql(expression, 'expression')}"
+
+ def offset_sql(self, expression):
+ this = self.sql(expression, "this")
+ return f"{this}{self.seg('OFFSET')} {self.sql(expression, 'expression')}"
+
+ def literal_sql(self, expression):
+ text = expression.this or ""
+ if expression.is_string:
+ if self._replace_backslash:
+ text = text.replace("\\", "\\\\")
+ text = text.replace(self.quote_end, self._escaped_quote_end)
+ return f"{self.quote_start}{text}{self.quote_end}"
+ return text
+
+ def null_sql(self, *_):
+ return "NULL"
+
+ def boolean_sql(self, expression):
+ return "TRUE" if expression.this else "FALSE"
+
+ def order_sql(self, expression, flat=False):
+ this = self.sql(expression, "this")
+ this = f"{this} " if this else this
+ return self.op_expressions(f"{this}ORDER BY", expression, flat=this or flat)
+
+ def cluster_sql(self, expression):
+ return self.op_expressions("CLUSTER BY", expression)
+
+ def distribute_sql(self, expression):
+ return self.op_expressions("DISTRIBUTE BY", expression)
+
+ def sort_sql(self, expression):
+ return self.op_expressions("SORT BY", expression)
+
+ def ordered_sql(self, expression):
+ desc = expression.args.get("desc")
+ asc = not desc
+ nulls_first = expression.args.get("nulls_first")
+ nulls_last = not nulls_first
+ nulls_are_large = self.null_ordering == "nulls_are_large"
+ nulls_are_small = self.null_ordering == "nulls_are_small"
+ nulls_are_last = self.null_ordering == "nulls_are_last"
+
+ sort_order = " DESC" if desc else ""
+ nulls_sort_change = ""
+ if nulls_first and (
+ (asc and nulls_are_large) or (desc and nulls_are_small) or nulls_are_last
+ ):
+ nulls_sort_change = " NULLS FIRST"
+ elif (
+ nulls_last
+ and ((asc and nulls_are_small) or (desc and nulls_are_large))
+ and not nulls_are_last
+ ):
+ nulls_sort_change = " NULLS LAST"
+
+ if nulls_sort_change and not self.NULL_ORDERING_SUPPORTED:
+ self.unsupported(
+ "Sorting in an ORDER BY on NULLS FIRST/NULLS LAST is not supported by this dialect"
+ )
+ nulls_sort_change = ""
+
+ return f"{self.sql(expression, 'this')}{sort_order}{nulls_sort_change}"
+
+ def query_modifiers(self, expression, *sqls):
+ return csv(
+ *sqls,
+ *[self.sql(sql) for sql in expression.args.get("laterals", [])],
+ *[self.sql(sql) for sql in expression.args.get("joins", [])],
+ self.sql(expression, "where"),
+ self.sql(expression, "group"),
+ self.sql(expression, "having"),
+ self.sql(expression, "qualify"),
+ self.sql(expression, "window"),
+ self.sql(expression, "distribute"),
+ self.sql(expression, "sort"),
+ self.sql(expression, "cluster"),
+ self.sql(expression, "order"),
+ self.sql(expression, "limit"),
+ self.sql(expression, "offset"),
+ sep="",
+ )
+
+ def select_sql(self, expression):
+ hint = self.sql(expression, "hint")
+ distinct = self.sql(expression, "distinct")
+ distinct = f" {distinct}" if distinct else ""
+ expressions = self.expressions(expression)
+ expressions = f"{self.sep()}{expressions}" if expressions else expressions
+ sql = self.query_modifiers(
+ expression,
+ f"SELECT{hint}{distinct}{expressions}",
+ self.sql(expression, "from"),
+ )
+ return self.prepend_ctes(expression, sql)
+
+ def schema_sql(self, expression):
+ this = self.sql(expression, "this")
+ this = f"{this} " if this else ""
+ sql = f"({self.sep('')}{self.expressions(expression)}{self.seg(')', sep='')}"
+ return f"{this}{sql}"
+
+ def star_sql(self, expression):
+ except_ = self.expressions(expression, key="except", flat=True)
+ except_ = f"{self.seg('EXCEPT')} ({except_})" if except_ else ""
+ replace = self.expressions(expression, key="replace", flat=True)
+ replace = f"{self.seg('REPLACE')} ({replace})" if replace else ""
+ return f"*{except_}{replace}"
+
+ def structkwarg_sql(self, expression):
+ return f"{self.sql(expression, 'this')} {self.sql(expression, 'expression')}"
+
+ def placeholder_sql(self, *_):
+ return "?"
+
+ def subquery_sql(self, expression):
+ alias = self.sql(expression, "alias")
+
+ return self.query_modifiers(
+ expression,
+ self.wrap(expression),
+ f" AS {alias}" if alias else "",
+ )
+
+ def qualify_sql(self, expression):
+ this = self.indent(self.sql(expression, "this"))
+ return f"{self.seg('QUALIFY')}{self.sep()}{this}"
+
+ def union_sql(self, expression):
+ return self.prepend_ctes(
+ expression,
+ self.set_operation(expression, self.union_op(expression)),
+ )
+
+ def union_op(self, expression):
+ return f"UNION{'' if expression.args.get('distinct') else ' ALL'}"
+
+ def unnest_sql(self, expression):
+ args = self.expressions(expression, flat=True)
+ alias = expression.args.get("alias")
+ if alias and self.unnest_column_only:
+ columns = alias.columns
+ alias = self.sql(columns[0]) if columns else ""
+ else:
+ alias = self.sql(expression, "alias")
+ alias = f" AS {alias}" if alias else alias
+ ordinality = " WITH ORDINALITY" if expression.args.get("ordinality") else ""
+ return f"UNNEST({args}){ordinality}{alias}"
+
+ def where_sql(self, expression):
+ this = self.indent(self.sql(expression, "this"))
+ return f"{self.seg('WHERE')}{self.sep()}{this}"
+
+ def window_sql(self, expression):
+ this = self.sql(expression, "this")
+ partition = self.expressions(expression, key="partition_by", flat=True)
+ partition = f"PARTITION BY {partition}" if partition else ""
+ order = expression.args.get("order")
+ order_sql = self.order_sql(order, flat=True) if order else ""
+ partition_sql = partition + " " if partition and order else partition
+ spec = expression.args.get("spec")
+ spec_sql = " " + self.window_spec_sql(spec) if spec else ""
+ alias = self.sql(expression, "alias")
+ if expression.arg_key == "window":
+ this = this = f"{self.seg('WINDOW')} {this} AS"
+ else:
+ this = f"{this} OVER"
+
+ if not partition and not order and not spec and alias:
+ return f"{this} {alias}"
+
+ return f"{this} ({alias}{partition_sql}{order_sql}{spec_sql})"
+
+ def window_spec_sql(self, expression):
+ kind = self.sql(expression, "kind")
+ start = csv(
+ self.sql(expression, "start"), self.sql(expression, "start_side"), sep=" "
+ )
+ end = (
+ csv(self.sql(expression, "end"), self.sql(expression, "end_side"), sep=" ")
+ or "CURRENT ROW"
+ )
+ return f"{kind} BETWEEN {start} AND {end}"
+
+ def withingroup_sql(self, expression):
+ this = self.sql(expression, "this")
+ expression = self.sql(expression, "expression")[1:] # order has a leading space
+ return f"{this} WITHIN GROUP ({expression})"
+
+ def between_sql(self, expression):
+ this = self.sql(expression, "this")
+ low = self.sql(expression, "low")
+ high = self.sql(expression, "high")
+ return f"{this} BETWEEN {low} AND {high}"
+
+ def bracket_sql(self, expression):
+ expressions = apply_index_offset(expression.expressions, self.index_offset)
+ expressions = ", ".join(self.sql(e) for e in expressions)
+
+ return f"{self.sql(expression, 'this')}[{expressions}]"
+
+ def all_sql(self, expression):
+ return f"ALL {self.wrap(expression)}"
+
+ def any_sql(self, expression):
+ return f"ANY {self.wrap(expression)}"
+
+ def exists_sql(self, expression):
+ return f"EXISTS{self.wrap(expression)}"
+
+ def case_sql(self, expression):
+ this = self.indent(self.sql(expression, "this"), skip_first=True)
+ this = f" {this}" if this else ""
+ ifs = []
+
+ for e in expression.args["ifs"]:
+ ifs.append(self.indent(f"WHEN {self.sql(e, 'this')}"))
+ ifs.append(self.indent(f"THEN {self.sql(e, 'true')}"))
+
+ if expression.args.get("default") is not None:
+ ifs.append(self.indent(f"ELSE {self.sql(expression, 'default')}"))
+
+ ifs = "".join(self.seg(self.indent(e, skip_first=True)) for e in ifs)
+ statement = f"CASE{this}{ifs}{self.seg('END')}"
+ return statement
+
+ def constraint_sql(self, expression):
+ this = self.sql(expression, "this")
+ expressions = self.expressions(expression, flat=True)
+ return f"CONSTRAINT {this} {expressions}"
+
+ def extract_sql(self, expression):
+ this = self.sql(expression, "this")
+ expression_sql = self.sql(expression, "expression")
+ return f"EXTRACT({this} FROM {expression_sql})"
+
+ def check_sql(self, expression):
+ this = self.sql(expression, key="this")
+ return f"CHECK ({this})"
+
+ def foreignkey_sql(self, expression):
+ expressions = self.expressions(expression, flat=True)
+ reference = self.sql(expression, "reference")
+ reference = f" {reference}" if reference else ""
+ delete = self.sql(expression, "delete")
+ delete = f" ON DELETE {delete}" if delete else ""
+ update = self.sql(expression, "update")
+ update = f" ON UPDATE {update}" if update else ""
+ return f"FOREIGN KEY ({expressions}){reference}{delete}{update}"
+
+ def unique_sql(self, expression):
+ columns = self.expressions(expression, key="expressions")
+ return f"UNIQUE ({columns})"
+
+ def if_sql(self, expression):
+ return self.case_sql(
+ exp.Case(ifs=[expression], default=expression.args.get("false"))
+ )
+
+ def in_sql(self, expression):
+ query = expression.args.get("query")
+ unnest = expression.args.get("unnest")
+ if query:
+ in_sql = self.wrap(query)
+ elif unnest:
+ in_sql = self.in_unnest_op(unnest)
+ else:
+ in_sql = f"({self.expressions(expression, flat=True)})"
+ return f"{self.sql(expression, 'this')} IN {in_sql}"
+
+ def in_unnest_op(self, unnest):
+ return f"(SELECT {self.sql(unnest)})"
+
+ def interval_sql(self, expression):
+ return f"INTERVAL {self.sql(expression, 'this')} {self.sql(expression, 'unit')}"
+
+ def reference_sql(self, expression):
+ this = self.sql(expression, "this")
+ expressions = self.expressions(expression, flat=True)
+ return f"REFERENCES {this}({expressions})"
+
+ def anonymous_sql(self, expression):
+ args = self.indent(
+ self.expressions(expression, flat=True), skip_first=True, skip_last=True
+ )
+ return f"{self.normalize_func(self.sql(expression, 'this'))}({args})"
+
+ def paren_sql(self, expression):
+ if isinstance(expression.unnest(), exp.Select):
+ return self.wrap(expression)
+ sql = self.seg(self.indent(self.sql(expression, "this")), sep="")
+ return f"({sql}{self.seg(')', sep='')}"
+
+ def neg_sql(self, expression):
+ return f"-{self.sql(expression, 'this')}"
+
+ def not_sql(self, expression):
+ return f"NOT {self.sql(expression, 'this')}"
+
+ def alias_sql(self, expression):
+ to_sql = self.sql(expression, "alias")
+ to_sql = f" AS {to_sql}" if to_sql else ""
+ return f"{self.sql(expression, 'this')}{to_sql}"
+
+ def aliases_sql(self, expression):
+ return f"{self.sql(expression, 'this')} AS ({self.expressions(expression, flat=True)})"
+
+ def attimezone_sql(self, expression):
+ this = self.sql(expression, "this")
+ zone = self.sql(expression, "zone")
+ return f"{this} AT TIME ZONE {zone}"
+
+ def add_sql(self, expression):
+ return self.binary(expression, "+")
+
+ def and_sql(self, expression):
+ return self.connector_sql(expression, "AND")
+
+ def connector_sql(self, expression, op):
+ if not self.pretty:
+ return self.binary(expression, op)
+
+ return f"\n{op} ".join(self.sql(e) for e in expression.flatten(unnest=False))
+
+ def bitwiseand_sql(self, expression):
+ return self.binary(expression, "&")
+
+ def bitwiseleftshift_sql(self, expression):
+ return self.binary(expression, "<<")
+
+ def bitwisenot_sql(self, expression):
+ return f"~{self.sql(expression, 'this')}"
+
+ def bitwiseor_sql(self, expression):
+ return self.binary(expression, "|")
+
+ def bitwiserightshift_sql(self, expression):
+ return self.binary(expression, ">>")
+
+ def bitwisexor_sql(self, expression):
+ return self.binary(expression, "^")
+
+ def cast_sql(self, expression):
+ return f"CAST({self.sql(expression, 'this')} AS {self.sql(expression, 'to')})"
+
+ def currentdate_sql(self, expression):
+ zone = self.sql(expression, "this")
+ return f"CURRENT_DATE({zone})" if zone else "CURRENT_DATE"
+
+ def command_sql(self, expression):
+ return f"{self.sql(expression, 'this').upper()} {expression.text('expression').strip()}"
+
+ def distinct_sql(self, expression):
+ this = self.sql(expression, "this")
+ this = f" {this}" if this else ""
+
+ on = self.sql(expression, "on")
+ on = f" ON {on}" if on else ""
+ return f"DISTINCT{this}{on}"
+
+ def ignorenulls_sql(self, expression):
+ return f"{self.sql(expression, 'this')} IGNORE NULLS"
+
+ def intdiv_sql(self, expression):
+ return self.sql(
+ exp.Cast(
+ this=exp.Div(
+ this=expression.args["this"],
+ expression=expression.args["expression"],
+ ),
+ to=exp.DataType(this=exp.DataType.Type.INT),
+ )
+ )
+
+ def dpipe_sql(self, expression):
+ return self.binary(expression, "||")
+
+ def div_sql(self, expression):
+ return self.binary(expression, "/")
+
+ def dot_sql(self, expression):
+ return f"{self.sql(expression, 'this')}.{self.sql(expression, 'expression')}"
+
+ def eq_sql(self, expression):
+ return self.binary(expression, "=")
+
+ def escape_sql(self, expression):
+ return self.binary(expression, "ESCAPE")
+
+ def gt_sql(self, expression):
+ return self.binary(expression, ">")
+
+ def gte_sql(self, expression):
+ return self.binary(expression, ">=")
+
+ def ilike_sql(self, expression):
+ return self.binary(expression, "ILIKE")
+
+ def is_sql(self, expression):
+ return self.binary(expression, "IS")
+
+ def like_sql(self, expression):
+ return self.binary(expression, "LIKE")
+
+ def lt_sql(self, expression):
+ return self.binary(expression, "<")
+
+ def lte_sql(self, expression):
+ return self.binary(expression, "<=")
+
+ def mod_sql(self, expression):
+ return self.binary(expression, "%")
+
+ def mul_sql(self, expression):
+ return self.binary(expression, "*")
+
+ def neq_sql(self, expression):
+ return self.binary(expression, "<>")
+
+ def or_sql(self, expression):
+ return self.connector_sql(expression, "OR")
+
+ def sub_sql(self, expression):
+ return self.binary(expression, "-")
+
+ def trycast_sql(self, expression):
+ return (
+ f"TRY_CAST({self.sql(expression, 'this')} AS {self.sql(expression, 'to')})"
+ )
+
+ def binary(self, expression, op):
+ return (
+ f"{self.sql(expression, 'this')} {op} {self.sql(expression, 'expression')}"
+ )
+
+ def function_fallback_sql(self, expression):
+ args = []
+ for arg_key in expression.arg_types:
+ arg_value = ensure_list(expression.args.get(arg_key) or [])
+ for a in arg_value:
+ args.append(self.sql(a))
+
+ args_str = self.indent(", ".join(args), skip_first=True, skip_last=True)
+ return f"{self.normalize_func(expression.sql_name())}({args_str})"
+
+ def format_time(self, expression):
+ return format_time(
+ self.sql(expression, "format"), self.time_mapping, self.time_trie
+ )
+
+ def expressions(self, expression, key=None, flat=False, indent=True, sep=", "):
+ expressions = expression.args.get(key or "expressions")
+
+ if not expressions:
+ return ""
+
+ if flat:
+ return sep.join(self.sql(e) for e in expressions)
+
+ expressions = self.sep(sep).join(self.sql(e) for e in expressions)
+ if indent:
+ return self.indent(expressions, skip_first=False)
+ return expressions
+
+ def op_expressions(self, op, expression, flat=False):
+ expressions_sql = self.expressions(expression, flat=flat)
+ if flat:
+ return f"{op} {expressions_sql}"
+ return f"{self.seg(op)}{self.sep() if expressions_sql else ''}{expressions_sql}"
+
+ def set_operation(self, expression, op):
+ this = self.sql(expression, "this")
+ op = self.seg(op)
+ return self.query_modifiers(
+ expression, f"{this}{op}{self.sep()}{self.sql(expression, 'expression')}"
+ )
+
+ def token_sql(self, token_type):
+ return self.TOKEN_MAPPING.get(token_type, token_type.name)