sqlglot.dialects.snowflake
from __future__ import annotations

import typing as t

from sqlglot import exp, generator, parser, tokens
from sqlglot.dialects.dialect import (
    Dialect,
    date_trunc_to_time,
    datestrtodate_sql,
    format_time_lambda,
    inline_array_sql,
    max_or_greatest,
    min_or_least,
    rename_func,
    timestamptrunc_sql,
    timestrtotime_sql,
    ts_or_ds_to_date_sql,
    var_map_sql,
)
from sqlglot.expressions import Literal
from sqlglot.helper import flatten, seq_get
from sqlglot.parser import binary_range_parser
from sqlglot.tokens import TokenType


def _check_int(s):
    if s[0] in ("-", "+"):
        return s[1:].isdigit()
    return s.isdigit()


# from https://docs.snowflake.com/en/sql-reference/functions/to_timestamp.html
def _snowflake_to_timestamp(args):
    if len(args) == 2:
        first_arg, second_arg = args
        if second_arg.is_string:
            # case: <string_expr> [ , <format> ]
            return format_time_lambda(exp.StrToTime, "snowflake")(args)

        # case: <numeric_expr> [ , <scale> ]
        if second_arg.name not in ["0", "3", "9"]:
            raise ValueError(
                f"Scale for snowflake numeric timestamp is {second_arg}, but should be 0, 3, or 9"
            )

        if second_arg.name == "0":
            timescale = exp.UnixToTime.SECONDS
        elif second_arg.name == "3":
            timescale = exp.UnixToTime.MILLIS
        elif second_arg.name == "9":
            timescale = exp.UnixToTime.MICROS

        return exp.UnixToTime(this=first_arg, scale=timescale)

    first_arg = seq_get(args, 0)
    if not isinstance(first_arg, Literal):
        # case: <variant_expr>
        return format_time_lambda(exp.StrToTime, "snowflake", default=True)(args)

    if first_arg.is_string:
        if _check_int(first_arg.this):
            # case: <integer>
            return exp.UnixToTime.from_arg_list(args)

        # case: <date_expr>
        return format_time_lambda(exp.StrToTime, "snowflake", default=True)(args)

    # case: <numeric_expr>
    return exp.UnixToTime.from_arg_list(args)


def _unix_to_time_sql(self, expression):
    scale = expression.args.get("scale")
    timestamp = self.sql(expression, "this")
    if scale in [None, exp.UnixToTime.SECONDS]:
        return f"TO_TIMESTAMP({timestamp})"
    if scale == exp.UnixToTime.MILLIS:
        return f"TO_TIMESTAMP({timestamp}, 3)"
    if scale == exp.UnixToTime.MICROS:
        return f"TO_TIMESTAMP({timestamp}, 9)"

    raise ValueError("Improper scale for timestamp")


# https://docs.snowflake.com/en/sql-reference/functions/date_part.html
# https://docs.snowflake.com/en/sql-reference/functions-date-time.html#label-supported-date-time-parts
def _parse_date_part(self):
    this = self._parse_var() or self._parse_type()
    self._match(TokenType.COMMA)
    expression = self._parse_bitwise()

    name = this.name.upper()
    if name.startswith("EPOCH"):
        if name.startswith("EPOCH_MILLISECOND"):
            scale = 10**3
        elif name.startswith("EPOCH_MICROSECOND"):
            scale = 10**6
        elif name.startswith("EPOCH_NANOSECOND"):
            scale = 10**9
        else:
            scale = None

        ts = self.expression(exp.Cast, this=expression, to=exp.DataType.build("TIMESTAMP"))
        to_unix = self.expression(exp.TimeToUnix, this=ts)

        if scale:
            to_unix = exp.Mul(this=to_unix, expression=exp.Literal.number(scale))

        return to_unix

    return self.expression(exp.Extract, this=this, expression=expression)


# https://docs.snowflake.com/en/sql-reference/functions/div0
def _div0_to_if(args):
    cond = exp.EQ(this=seq_get(args, 1), expression=exp.Literal.number(0))
    true = exp.Literal.number(0)
    false = exp.Div(this=seq_get(args, 0), expression=seq_get(args, 1))
    return exp.If(this=cond, true=true, false=false)


# https://docs.snowflake.com/en/sql-reference/functions/zeroifnull
def _zeroifnull_to_if(args):
    cond = exp.Is(this=seq_get(args, 0), expression=exp.Null())
    return exp.If(this=cond, true=exp.Literal.number(0), false=seq_get(args, 0))


# https://docs.snowflake.com/en/sql-reference/functions/nullifzero
def _nullifzero_to_if(args):
    cond = exp.EQ(this=seq_get(args, 0), expression=exp.Literal.number(0))
    return exp.If(this=cond, true=exp.Null(), false=seq_get(args, 0))


def _datatype_sql(self, expression):
    if expression.this == exp.DataType.Type.ARRAY:
        return "ARRAY"
    elif expression.this == exp.DataType.Type.MAP:
        return "OBJECT"
    return self.datatype_sql(expression)


class Snowflake(Dialect):
    null_ordering = "nulls_are_large"
    time_format = "'yyyy-mm-dd hh24:mi:ss'"

    time_mapping = {
        "YYYY": "%Y",
        "yyyy": "%Y",
        "YY": "%y",
        "yy": "%y",
        "MMMM": "%B",
        "mmmm": "%B",
        "MON": "%b",
        "mon": "%b",
        "MM": "%m",
        "mm": "%m",
        "DD": "%d",
        "dd": "%d",
        "d": "%-d",
        "DY": "%w",
        "dy": "%w",
        "HH24": "%H",
        "hh24": "%H",
        "HH12": "%I",
        "hh12": "%I",
        "MI": "%M",
        "mi": "%M",
        "SS": "%S",
        "ss": "%S",
        "FF": "%f",
        "ff": "%f",
        "FF6": "%f",
        "ff6": "%f",
    }

    class Parser(parser.Parser):
        FUNCTIONS = {
            **parser.Parser.FUNCTIONS,
            "ARRAYAGG": exp.ArrayAgg.from_arg_list,
            "ARRAY_CONSTRUCT": exp.Array.from_arg_list,
            "ARRAY_TO_STRING": exp.ArrayJoin.from_arg_list,
            "DATE_TRUNC": date_trunc_to_time,
            "DATEADD": lambda args: exp.DateAdd(
                this=seq_get(args, 2),
                expression=seq_get(args, 1),
                unit=seq_get(args, 0),
            ),
            "DATEDIFF": lambda args: exp.DateDiff(
                this=seq_get(args, 2),
                expression=seq_get(args, 1),
                unit=seq_get(args, 0),
            ),
            "DECODE": exp.Matches.from_arg_list,
            "DIV0": _div0_to_if,
            "IFF": exp.If.from_arg_list,
            "NULLIFZERO": _nullifzero_to_if,
            "OBJECT_CONSTRUCT": parser.parse_var_map,
            "RLIKE": exp.RegexpLike.from_arg_list,
            "SQUARE": lambda args: exp.Pow(this=seq_get(args, 0), expression=exp.Literal.number(2)),
            "TO_ARRAY": exp.Array.from_arg_list,
            "TO_VARCHAR": exp.ToChar.from_arg_list,
            "TO_TIMESTAMP": _snowflake_to_timestamp,
            "ZEROIFNULL": _zeroifnull_to_if,
        }

        FUNCTION_PARSERS = {
            **parser.Parser.FUNCTION_PARSERS,
            "DATE_PART": _parse_date_part,
        }
        FUNCTION_PARSERS.pop("TRIM")

        FUNC_TOKENS = {
            *parser.Parser.FUNC_TOKENS,
            TokenType.RLIKE,
            TokenType.TABLE,
        }

        COLUMN_OPERATORS = {
            **parser.Parser.COLUMN_OPERATORS,  # type: ignore
            TokenType.COLON: lambda self, this, path: self.expression(
                exp.Bracket,
                this=this,
                expressions=[path],
            ),
        }

        RANGE_PARSERS = {
            **parser.Parser.RANGE_PARSERS,  # type: ignore
            TokenType.LIKE_ANY: binary_range_parser(exp.LikeAny),
            TokenType.ILIKE_ANY: binary_range_parser(exp.ILikeAny),
        }

        ALTER_PARSERS = {
            **parser.Parser.ALTER_PARSERS,  # type: ignore
            "UNSET": lambda self: self._parse_alter_table_set_tag(unset=True),
            "SET": lambda self: self._parse_alter_table_set_tag(),
        }

        def _parse_alter_table_set_tag(self, unset: bool = False) -> exp.Expression:
            self._match_text_seq("TAG")
            parser = t.cast(t.Callable, self._parse_id_var if unset else self._parse_conjunction)
            return self.expression(exp.SetTag, expressions=self._parse_csv(parser), unset=unset)

    class Tokenizer(tokens.Tokenizer):
        QUOTES = ["'", "$$"]
        STRING_ESCAPES = ["\\", "'"]

        KEYWORDS = {
            **tokens.Tokenizer.KEYWORDS,
            "EXCLUDE": TokenType.EXCEPT,
            "ILIKE ANY": TokenType.ILIKE_ANY,
            "LIKE ANY": TokenType.LIKE_ANY,
            "MATCH_RECOGNIZE": TokenType.MATCH_RECOGNIZE,
            "PUT": TokenType.COMMAND,
            "RENAME": TokenType.REPLACE,
            "TIMESTAMP_LTZ": TokenType.TIMESTAMPLTZ,
            "TIMESTAMP_NTZ": TokenType.TIMESTAMP,
            "TIMESTAMP_TZ": TokenType.TIMESTAMPTZ,
            "TIMESTAMPNTZ": TokenType.TIMESTAMP,
            "MINUS": TokenType.EXCEPT,
            "SAMPLE": TokenType.TABLE_SAMPLE,
        }

        SINGLE_TOKENS = {
            **tokens.Tokenizer.SINGLE_TOKENS,
            "$": TokenType.PARAMETER,
        }

    class Generator(generator.Generator):
        PARAMETER_TOKEN = "$"
        MATCHED_BY_SOURCE = False

        TRANSFORMS = {
            **generator.Generator.TRANSFORMS,  # type: ignore
            exp.Array: inline_array_sql,
            exp.ArrayConcat: rename_func("ARRAY_CAT"),
            exp.ArrayJoin: rename_func("ARRAY_TO_STRING"),
            exp.DateAdd: lambda self, e: self.func("DATEADD", e.text("unit"), e.expression, e.this),
            exp.DateDiff: lambda self, e: self.func(
                "DATEDIFF", e.text("unit"), e.expression, e.this
            ),
            exp.DateStrToDate: datestrtodate_sql,
            exp.DataType: _datatype_sql,
            exp.If: rename_func("IFF"),
            exp.Map: lambda self, e: var_map_sql(self, e, "OBJECT_CONSTRUCT"),
            exp.LogicalOr: rename_func("BOOLOR_AGG"),
            exp.LogicalAnd: rename_func("BOOLAND_AGG"),
            exp.VarMap: lambda self, e: var_map_sql(self, e, "OBJECT_CONSTRUCT"),
            exp.PartitionedByProperty: lambda self, e: f"PARTITION BY {self.sql(e, 'this')}",
            exp.Matches: rename_func("DECODE"),
            exp.StrPosition: lambda self, e: self.func(
                "POSITION", e.args.get("substr"), e.this, e.args.get("position")
            ),
            exp.StrToTime: lambda self, e: f"TO_TIMESTAMP({self.sql(e, 'this')}, {self.format_time(e)})",
            exp.TimestampTrunc: timestamptrunc_sql,
            exp.TimeStrToTime: timestrtotime_sql,
            exp.TimeToUnix: lambda self, e: f"EXTRACT(epoch_second FROM {self.sql(e, 'this')})",
            exp.Trim: lambda self, e: self.func("TRIM", e.this, e.expression),
            exp.ToChar: lambda self, e: self.function_fallback_sql(e),
            exp.TsOrDsToDate: ts_or_ds_to_date_sql("snowflake"),
            exp.UnixToTime: _unix_to_time_sql,
            exp.DayOfWeek: rename_func("DAYOFWEEK"),
            exp.Max: max_or_greatest,
            exp.Min: min_or_least,
        }

        TYPE_MAPPING = {
            **generator.Generator.TYPE_MAPPING,  # type: ignore
            exp.DataType.Type.TIMESTAMP: "TIMESTAMPNTZ",
        }

        STAR_MAPPING = {
            "except": "EXCLUDE",
            "replace": "RENAME",
        }

        PROPERTIES_LOCATION = {
            **generator.Generator.PROPERTIES_LOCATION,  # type: ignore
            exp.SetProperty: exp.Properties.Location.UNSUPPORTED,
        }

        def ilikeany_sql(self, expression: exp.ILikeAny) -> str:
            return self.binary(expression, "ILIKE ANY")

        def likeany_sql(self, expression: exp.LikeAny) -> str:
            return self.binary(expression, "LIKE ANY")

        def except_op(self, expression):
            if not expression.args.get("distinct", False):
                self.unsupported("EXCEPT with All is not supported in Snowflake")
            return super().except_op(expression)

        def intersect_op(self, expression):
            if not expression.args.get("distinct", False):
                self.unsupported("INTERSECT with All is not supported in Snowflake")
            return super().intersect_op(expression)

        def values_sql(self, expression: exp.Values) -> str:
            """Due to a bug in Snowflake we want to make sure that all columns in a VALUES table alias are unquoted.

            We also want to make sure that after we find matches where we need to unquote a column that we prevent users
            from adding quotes to the column by using the `identify` argument when generating the SQL.
            """
            alias = expression.args.get("alias")
            if alias and alias.args.get("columns"):
                expression = expression.transform(
                    lambda node: exp.Identifier(**{**node.args, "quoted": False})
                    if isinstance(node, exp.Identifier)
                    and isinstance(node.parent, exp.TableAlias)
                    and node.arg_key == "columns"
                    else node,
                )
                return self.no_identify(lambda: super(self.__class__, self).values_sql(expression))
            return super().values_sql(expression)

        def settag_sql(self, expression: exp.SetTag) -> str:
            action = "UNSET" if expression.args.get("unset") else "SET"
            return f"{action} TAG {self.expressions(expression)}"

        def select_sql(self, expression: exp.Select) -> str:
            """Due to a bug in Snowflake we want to make sure that all columns in a VALUES table alias are unquoted and also
            that all columns in a SELECT are unquoted. We also want to make sure that after we find matches where we need
            to unquote a column that we prevent users from adding quotes to the column by using the `identify` argument when
            generating the SQL.

            Note: We make an assumption that any columns referenced in a VALUES expression should be unquoted throughout the
            expression. This might not be true in a case where the same column name can be sourced from another table that can
            properly quote but should be true in most cases.
            """
            values_identifiers = set(
                flatten(
                    (v.args.get("alias") or exp.Alias()).args.get("columns", [])
                    for v in expression.find_all(exp.Values)
                )
            )
            if values_identifiers:
                expression = expression.transform(
                    lambda node: exp.Identifier(**{**node.args, "quoted": False})
                    if isinstance(node, exp.Identifier) and node in values_identifiers
                    else node,
                )
                return self.no_identify(lambda: super(self.__class__, self).select_sql(expression))
            return super().select_sql(expression)

        def describe_sql(self, expression: exp.Describe) -> str:
            # Default to table if kind is unknown
            kind_value = expression.args.get("kind") or "TABLE"
            kind = f" {kind_value}" if kind_value else ""
            this = f" {self.sql(expression, 'this')}"
            return f"DESCRIBE{kind}{this}"

        def generatedasidentitycolumnconstraint_sql(
            self, expression: exp.GeneratedAsIdentityColumnConstraint
        ) -> str:
            start = expression.args.get("start")
            start = f" START {start}" if start else ""
            increment = expression.args.get("increment")
            increment = f" INCREMENT {increment}" if increment else ""
            return f"AUTOINCREMENT{start}{increment}"
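The dialect is normally exercised through sqlglot's top-level API rather than used directly. A minimal sketch of the parse-time rewrites described in the helpers above (table and column names such as orders and amount are invented, and the exact output strings depend on the sqlglot version):

    import sqlglot

    # DIV0(a, b) is rewritten at parse time into IF(b = 0, 0, a / b) by _div0_to_if.
    ast = sqlglot.parse_one("SELECT DIV0(amount, quantity) FROM orders", read="snowflake")
    print(repr(ast))

    # TO_TIMESTAMP with a numeric argument and scale 3 is treated as a
    # millisecond-precision epoch by _snowflake_to_timestamp.
    print(sqlglot.transpile("SELECT TO_TIMESTAMP(1659981729000, 3)", read="snowflake", write="duckdb"))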
class Snowflake(sqlglot.dialects.dialect.Dialect)
class Snowflake.Parser(sqlglot.parser.Parser)
Parser consumes a list of tokens produced by the sqlglot.tokens.Tokenizer and produces a parsed syntax tree.

Arguments:
- error_level: the desired error level. Default: ErrorLevel.RAISE.
- error_message_context: determines the amount of context to capture from a query string when displaying the error message (in number of characters). Default: 50.
- index_offset: index offset for arrays, e.g. ARRAY[0] vs ARRAY[1] as the head of a list. Default: 0.
- alias_post_tablesample: if set to True, the table alias comes after tablesample. Default: False.
- max_errors: maximum number of error messages to include in a raised ParseError. This is only relevant if error_level is ErrorLevel.RAISE. Default: 3.
- null_ordering: indicates the default null ordering method to use if not explicitly set. Options are "nulls_are_small", "nulls_are_large", "nulls_are_last". Default: "nulls_are_small".
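The overrides shown in the module source rewrite several Snowflake-specific constructs during parsing. A short, hedged sketch (identifiers such as payload and events are invented, and the printed tree representation varies between sqlglot versions):

    import sqlglot
    from sqlglot import exp

    # The COLON column operator maps semi-structured access (col:path) onto a Bracket node.
    print(repr(sqlglot.parse_one("SELECT payload:city FROM events", read="snowflake").find(exp.Bracket)))

    # DATEADD(unit, value, expr) is reordered into a DateAdd node with this/expression/unit args.
    print(repr(sqlglot.parse_one("SELECT DATEADD(day, 5, created_at) FROM t", read="snowflake").find(exp.DateAdd)))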
class Snowflake.Tokenizer(sqlglot.tokens.Tokenizer)
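The tokenizer overrides register $$ as an additional string quote and $ as a single-character parameter token, alongside the keyword remappings shown in the module source. A hedged round-trip sketch (whether $my_var refers to anything meaningful depends on the session, and the exact output depends on the sqlglot version):

    import sqlglot

    # $$ ... $$ is tokenized as an ordinary string literal, and $my_var as a parameter.
    print(sqlglot.transpile("SELECT $$a 'quoted' value$$, $my_var",
                            read="snowflake", write="snowflake"))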
class Snowflake.Generator(sqlglot.generator.Generator)
Generator interprets the given syntax tree and produces a SQL string as an output.

Arguments:
- time_mapping (dict): the dictionary of custom time mappings in which the key represents a Python time format and the value represents the target time format.
- time_trie (trie): a trie of the time_mapping keys.
- pretty (bool): if set to True the returned string will be formatted. Default: False.
- quote_start (str): specifies which starting character to use to delimit quotes. Default: '.
- quote_end (str): specifies which ending character to use to delimit quotes. Default: '.
- identifier_start (str): specifies which starting character to use to delimit identifiers. Default: ".
- identifier_end (str): specifies which ending character to use to delimit identifiers. Default: ".
- identify (bool | str): 'always' always quotes; 'safe' only quotes identifiers that don't contain an uppercase character; True defaults to 'always'.
- normalize (bool): if set to True all identifiers will be lower cased.
- string_escape (str): specifies a string escape character. Default: '.
- identifier_escape (str): specifies an identifier escape character. Default: ".
- pad (int): determines the padding in a formatted string. Default: 2.
- indent (int): determines the size of indentation in a formatted string. Default: 4.
- unnest_column_only (bool): if set to True, UNNEST table aliases are considered only as column aliases.
- normalize_functions (str): normalize function names to "upper" or "lower", or None to keep them as written. Default: "upper".
- alias_post_tablesample (bool): if set to True, the table alias comes after tablesample. Default: False.
- unsupported_level (ErrorLevel): determines the generator's behavior when it encounters unsupported expressions. Default: ErrorLevel.WARN.
- null_ordering (str): indicates the default null ordering method to use if not explicitly set. Options are "nulls_are_small", "nulls_are_large", "nulls_are_last". Default: "nulls_are_small".
- max_unsupported (int): maximum number of unsupported messages to include in a raised UnsupportedError. This is only relevant if unsupported_level is ErrorLevel.RAISE. Default: 3.
- leading_comma (bool): if set to True, the comma is leading rather than trailing in select statements. Default: False.
- max_text_width (int): the maximum number of characters in a segment before creating new lines in pretty mode. The default is on the smaller end because the length only represents a segment and not the true line length. Default: 80.
- comments (bool): whether or not to preserve comments in the output SQL code. Default: True.
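In practice the generator is reached by transpiling into Snowflake. A minimal sketch exercising two of the TRANSFORMS / TYPE_MAPPING entries listed in the module source (table and column names are placeholders; the exact output may differ by sqlglot version):

    import sqlglot

    # exp.If is rendered as IFF, and the plain TIMESTAMP type as TIMESTAMPNTZ.
    print(sqlglot.transpile("SELECT IF(x = 0, NULL, 1), CAST(col AS TIMESTAMP) FROM t",
                            write="snowflake"))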
def values_sql(self, expression: exp.Values) -> str
Due to a bug in Snowflake, we make sure that all columns in a VALUES table alias are unquoted.
Once we find columns that need to be unquoted, we also prevent the `identify` argument from adding quotes back to them when generating the SQL.
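A hedged illustration of this behaviour, assuming the identify option is forwarded to the generator through sqlglot.transpile (the quoting of the remaining identifiers in the output depends on the sqlglot version):

    import sqlglot

    # The column aliases attached to the VALUES clause stay unquoted even though
    # identify=True would normally quote every identifier.
    print(sqlglot.transpile('SELECT * FROM (VALUES (1, 2)) AS t("a", "b")',
                            read="snowflake", write="snowflake", identify=True))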
def select_sql(self, expression: exp.Select) -> str
Due to a bug in Snowflake, we make sure that all columns in a VALUES table alias are unquoted, and that all columns referencing them in the SELECT are unquoted as well. Once we find columns that need to be unquoted, we also prevent the `identify` argument from adding quotes back to them when generating the SQL.

Note: we assume that any column referenced in a VALUES expression should be unquoted throughout the expression. This might not hold when the same column name can also be sourced from another table that can be quoted properly, but it should be true in most cases.
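A companion sketch for the SELECT-level behaviour, under the same assumptions as the values_sql example above:

    import sqlglot

    # "a" is defined by the VALUES alias, so it is unquoted both in the alias and
    # in the SELECT list, even with identify=True.
    print(sqlglot.transpile('SELECT "a" FROM (VALUES (1)) AS t("a")',
                            read="snowflake", write="snowflake", identify=True))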
def generatedasidentitycolumnconstraint_sql(self, expression: exp.GeneratedAsIdentityColumnConstraint) -> str
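This override renders identity columns with Snowflake's AUTOINCREMENT [START n] [INCREMENT n] syntax. A hedged sketch, assuming the source dialect (T-SQL here) parses IDENTITY(start, increment) into a GeneratedAsIdentityColumnConstraint with start and increment arguments:

    import sqlglot

    # Expected to come out roughly as AUTOINCREMENT START 1 INCREMENT 1,
    # assuming IDENTITY(1, 1) is parsed into start/increment args.
    print(sqlglot.transpile("CREATE TABLE t (id INTEGER IDENTITY(1, 1))",
                            read="tsql", write="snowflake"))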
Inherited Members
- sqlglot.generator.Generator
- Generator
- generate
- unsupported
- sep
- seg
- pad_comment
- maybe_comment
- wrap
- no_identify
- normalize_func
- indent
- sql
- uncache_sql
- cache_sql
- characterset_sql
- column_sql
- columndef_sql
- columnconstraint_sql
- autoincrementcolumnconstraint_sql
- compresscolumnconstraint_sql
- notnullcolumnconstraint_sql
- primarykeycolumnconstraint_sql
- uniquecolumnconstraint_sql
- create_sql
- prepend_ctes
- with_sql
- cte_sql
- tablealias_sql
- bitstring_sql
- hexstring_sql
- datatype_sql
- directory_sql
- delete_sql
- drop_sql
- except_sql
- fetch_sql
- filter_sql
- hint_sql
- index_sql
- identifier_sql
- national_sql
- partition_sql
- properties_sql
- root_properties
- properties
- with_properties
- locate_properties
- property_sql
- likeproperty_sql
- fallbackproperty_sql
- journalproperty_sql
- freespaceproperty_sql
- afterjournalproperty_sql
- checksumproperty_sql
- mergeblockratioproperty_sql
- datablocksizeproperty_sql
- blockcompressionproperty_sql
- isolatedloadingproperty_sql
- lockingproperty_sql
- withdataproperty_sql
- insert_sql
- intersect_sql
- introducer_sql
- pseudotype_sql
- returning_sql
- rowformatdelimitedproperty_sql
- table_sql
- tablesample_sql
- pivot_sql
- tuple_sql
- update_sql
- var_sql
- into_sql
- from_sql
- group_sql
- having_sql
- join_sql
- lambda_sql
- lateral_sql
- limit_sql
- offset_sql
- setitem_sql
- set_sql
- pragma_sql
- lock_sql
- literal_sql
- loaddata_sql
- null_sql
- boolean_sql
- order_sql
- cluster_sql
- distribute_sql
- sort_sql
- ordered_sql
- matchrecognize_sql
- query_modifiers
- schema_sql
- star_sql
- structkwarg_sql
- parameter_sql
- sessionparameter_sql
- placeholder_sql
- subquery_sql
- qualify_sql
- union_sql
- union_op
- unnest_sql
- where_sql
- window_sql
- partition_by_sql
- window_spec_sql
- withingroup_sql
- between_sql
- bracket_sql
- all_sql
- any_sql
- exists_sql
- case_sql
- constraint_sql
- extract_sql
- trim_sql
- concat_sql
- check_sql
- foreignkey_sql
- primarykey_sql
- unique_sql
- if_sql
- jsonkeyvalue_sql
- jsonobject_sql
- in_sql
- in_unnest_op
- interval_sql
- return_sql
- reference_sql
- anonymous_sql
- paren_sql
- neg_sql
- not_sql
- alias_sql
- aliases_sql
- attimezone_sql
- add_sql
- and_sql
- connector_sql
- bitwiseand_sql
- bitwiseleftshift_sql
- bitwisenot_sql
- bitwiseor_sql
- bitwiserightshift_sql
- bitwisexor_sql
- cast_sql
- currentdate_sql
- collate_sql
- command_sql
- comment_sql
- transaction_sql
- commit_sql
- rollback_sql
- altercolumn_sql
- renametable_sql
- altertable_sql
- droppartition_sql
- addconstraint_sql
- distinct_sql
- ignorenulls_sql
- respectnulls_sql
- intdiv_sql
- dpipe_sql
- div_sql
- overlaps_sql
- distance_sql
- dot_sql
- eq_sql
- escape_sql
- glob_sql
- gt_sql
- gte_sql
- ilike_sql
- is_sql
- like_sql
- similarto_sql
- lt_sql
- lte_sql
- mod_sql
- mul_sql
- neq_sql
- nullsafeeq_sql
- nullsafeneq_sql
- or_sql
- slice_sql
- sub_sql
- trycast_sql
- use_sql
- binary
- function_fallback_sql
- func
- format_args
- text_width
- format_time
- expressions
- op_expressions
- naked_property
- set_operation
- tag_sql
- token_sql
- userdefinedfunction_sql
- joinhint_sql
- kwarg_sql
- when_sql
- merge_sql
- tochar_sql