Edit on GitHub

sqlglot.dialects.bigquery

  1from __future__ import annotations
  2
  3import logging
  4import re
  5import typing as t
  6
  7from sqlglot import exp, generator, parser, tokens, transforms
  8from sqlglot.dialects.dialect import (
  9    Dialect,
 10    NormalizationStrategy,
 11    arg_max_or_min_no_count,
 12    binary_from_function,
 13    date_add_interval_sql,
 14    datestrtodate_sql,
 15    format_time_lambda,
 16    if_sql,
 17    inline_array_sql,
 18    max_or_greatest,
 19    min_or_least,
 20    no_ilike_sql,
 21    parse_date_delta_with_interval,
 22    path_to_jsonpath,
 23    regexp_replace_sql,
 24    rename_func,
 25    timestrtotime_sql,
 26    ts_or_ds_add_cast,
 27)
 28from sqlglot.helper import seq_get, split_num_words
 29from sqlglot.tokens import TokenType
 30
 31if t.TYPE_CHECKING:
 32    from sqlglot._typing import E, Lit
 33
 34logger = logging.getLogger("sqlglot")
 35
 36
 37def _derived_table_values_to_unnest(self: BigQuery.Generator, expression: exp.Values) -> str:
 38    if not expression.find_ancestor(exp.From, exp.Join):
 39        return self.values_sql(expression)
 40
 41    alias = expression.args.get("alias")
 42
 43    structs = [
 44        exp.Struct(
 45            expressions=[
 46                exp.alias_(value, column_name)
 47                for value, column_name in zip(
 48                    t.expressions,
 49                    (
 50                        alias.columns
 51                        if alias and alias.columns
 52                        else (f"_c{i}" for i in range(len(t.expressions)))
 53                    ),
 54                )
 55            ]
 56        )
 57        for t in expression.find_all(exp.Tuple)
 58    ]
 59
 60    return self.unnest_sql(exp.Unnest(expressions=[exp.Array(expressions=structs)]))
 61
 62
 63def _returnsproperty_sql(self: BigQuery.Generator, expression: exp.ReturnsProperty) -> str:
 64    this = expression.this
 65    if isinstance(this, exp.Schema):
 66        this = f"{this.this} <{self.expressions(this)}>"
 67    else:
 68        this = self.sql(this)
 69    return f"RETURNS {this}"
 70
 71
 72def _create_sql(self: BigQuery.Generator, expression: exp.Create) -> str:
 73    kind = expression.args["kind"]
 74    returns = expression.find(exp.ReturnsProperty)
 75
 76    if kind.upper() == "FUNCTION" and returns and returns.args.get("is_table"):
 77        expression.set("kind", "TABLE FUNCTION")
 78
 79        if isinstance(expression.expression, (exp.Subquery, exp.Literal)):
 80            expression.set("expression", expression.expression.this)
 81
 82        return self.create_sql(expression)
 83
 84    return self.create_sql(expression)
 85
 86
 87def _unqualify_unnest(expression: exp.Expression) -> exp.Expression:
 88    """Remove references to unnest table aliases since bigquery doesn't allow them.
 89
 90    These are added by the optimizer's qualify_column step.
 91    """
 92    from sqlglot.optimizer.scope import find_all_in_scope
 93
 94    if isinstance(expression, exp.Select):
 95        unnest_aliases = {
 96            unnest.alias
 97            for unnest in find_all_in_scope(expression, exp.Unnest)
 98            if isinstance(unnest.parent, (exp.From, exp.Join))
 99        }
100        if unnest_aliases:
101            for column in expression.find_all(exp.Column):
102                if column.table in unnest_aliases:
103                    column.set("table", None)
104                elif column.db in unnest_aliases:
105                    column.set("db", None)
106
107    return expression
108
109
110# https://issuetracker.google.com/issues/162294746
111# workaround for bigquery bug when grouping by an expression and then ordering
112# WITH x AS (SELECT 1 y)
113# SELECT y + 1 z
114# FROM x
115# GROUP BY x + 1
116# ORDER by z
117def _alias_ordered_group(expression: exp.Expression) -> exp.Expression:
118    if isinstance(expression, exp.Select):
119        group = expression.args.get("group")
120        order = expression.args.get("order")
121
122        if group and order:
123            aliases = {
124                select.this: select.args["alias"]
125                for select in expression.selects
126                if isinstance(select, exp.Alias)
127            }
128
129            for e in group.expressions:
130                alias = aliases.get(e)
131
132                if alias:
133                    e.replace(exp.column(alias))
134
135    return expression
136
137
138def _pushdown_cte_column_names(expression: exp.Expression) -> exp.Expression:
139    """BigQuery doesn't allow column names when defining a CTE, so we try to push them down."""
140    if isinstance(expression, exp.CTE) and expression.alias_column_names:
141        cte_query = expression.this
142
143        if cte_query.is_star:
144            logger.warning(
145                "Can't push down CTE column names for star queries. Run the query through"
146                " the optimizer or use 'qualify' to expand the star projections first."
147            )
148            return expression
149
150        column_names = expression.alias_column_names
151        expression.args["alias"].set("columns", None)
152
153        for name, select in zip(column_names, cte_query.selects):
154            to_replace = select
155
156            if isinstance(select, exp.Alias):
157                select = select.this
158
159            # Inner aliases are shadowed by the CTE column names
160            to_replace.replace(exp.alias_(select, name))
161
162    return expression
163
164
165def _parse_timestamp(args: t.List) -> exp.StrToTime:
166    this = format_time_lambda(exp.StrToTime, "bigquery")([seq_get(args, 1), seq_get(args, 0)])
167    this.set("zone", seq_get(args, 2))
168    return this
169
170
171def _parse_date(args: t.List) -> exp.Date | exp.DateFromParts:
172    expr_type = exp.DateFromParts if len(args) == 3 else exp.Date
173    return expr_type.from_arg_list(args)
174
175
176def _parse_to_hex(args: t.List) -> exp.Hex | exp.MD5:
177    # TO_HEX(MD5(..)) is common in BigQuery, so it's parsed into MD5 to simplify its transpilation
178    arg = seq_get(args, 0)
179    return exp.MD5(this=arg.this) if isinstance(arg, exp.MD5Digest) else exp.Hex(this=arg)
180
181
182def _array_contains_sql(self: BigQuery.Generator, expression: exp.ArrayContains) -> str:
183    return self.sql(
184        exp.Exists(
185            this=exp.select("1")
186            .from_(exp.Unnest(expressions=[expression.left]).as_("_unnest", table=["_col"]))
187            .where(exp.column("_col").eq(expression.right))
188        )
189    )
190
191
192def _ts_or_ds_add_sql(self: BigQuery.Generator, expression: exp.TsOrDsAdd) -> str:
193    return date_add_interval_sql("DATE", "ADD")(self, ts_or_ds_add_cast(expression))
194
195
196def _ts_or_ds_diff_sql(self: BigQuery.Generator, expression: exp.TsOrDsDiff) -> str:
197    expression.this.replace(exp.cast(expression.this, "TIMESTAMP", copy=True))
198    expression.expression.replace(exp.cast(expression.expression, "TIMESTAMP", copy=True))
199    unit = expression.args.get("unit") or "DAY"
200    return self.func("DATE_DIFF", expression.this, expression.expression, unit)
201
202
203def _unix_to_time_sql(self: BigQuery.Generator, expression: exp.UnixToTime) -> str:
204    scale = expression.args.get("scale")
205    timestamp = self.sql(expression, "this")
206    if scale in (None, exp.UnixToTime.SECONDS):
207        return f"TIMESTAMP_SECONDS({timestamp})"
208    if scale == exp.UnixToTime.MILLIS:
209        return f"TIMESTAMP_MILLIS({timestamp})"
210    if scale == exp.UnixToTime.MICROS:
211        return f"TIMESTAMP_MICROS({timestamp})"
212
213    return f"TIMESTAMP_SECONDS(CAST({timestamp} / POW(10, {scale}) AS INT64))"
214
215
216def _parse_time(args: t.List) -> exp.Func:
217    if len(args) == 1:
218        return exp.TsOrDsToTime(this=args[0])
219    if len(args) == 3:
220        return exp.TimeFromParts.from_arg_list(args)
221
222    return exp.Anonymous(this="TIME", expressions=args)
223
224
225class BigQuery(Dialect):
226    WEEK_OFFSET = -1
227    UNNEST_COLUMN_ONLY = True
228    SUPPORTS_USER_DEFINED_TYPES = False
229    SUPPORTS_SEMI_ANTI_JOIN = False
230    LOG_BASE_FIRST = False
231
232    # https://cloud.google.com/bigquery/docs/reference/standard-sql/lexical#case_sensitivity
233    NORMALIZATION_STRATEGY = NormalizationStrategy.CASE_INSENSITIVE
234
235    # bigquery udfs are case sensitive
236    NORMALIZE_FUNCTIONS = False
237
238    TIME_MAPPING = {
239        "%D": "%m/%d/%y",
240    }
241
242    ESCAPE_SEQUENCES = {
243        "\\a": "\a",
244        "\\b": "\b",
245        "\\f": "\f",
246        "\\n": "\n",
247        "\\r": "\r",
248        "\\t": "\t",
249        "\\v": "\v",
250    }
251
252    FORMAT_MAPPING = {
253        "DD": "%d",
254        "MM": "%m",
255        "MON": "%b",
256        "MONTH": "%B",
257        "YYYY": "%Y",
258        "YY": "%y",
259        "HH": "%I",
260        "HH12": "%I",
261        "HH24": "%H",
262        "MI": "%M",
263        "SS": "%S",
264        "SSSSS": "%f",
265        "TZH": "%z",
266    }
267
268    # The _PARTITIONTIME and _PARTITIONDATE pseudo-columns are not returned by a SELECT * statement
269    # https://cloud.google.com/bigquery/docs/querying-partitioned-tables#query_an_ingestion-time_partitioned_table
270    PSEUDOCOLUMNS = {"_PARTITIONTIME", "_PARTITIONDATE"}
271
272    def normalize_identifier(self, expression: E) -> E:
273        if isinstance(expression, exp.Identifier):
274            parent = expression.parent
275            while isinstance(parent, exp.Dot):
276                parent = parent.parent
277
278            # In BigQuery, CTEs aren't case-sensitive, but table names are (by default, at least).
279            # The following check is essentially a heuristic to detect tables based on whether or
280            # not they're qualified. It also avoids normalizing UDFs, because they're case-sensitive.
281            if (
282                not isinstance(parent, exp.UserDefinedFunction)
283                and not (isinstance(parent, exp.Table) and parent.db)
284                and not expression.meta.get("is_table")
285            ):
286                expression.set("this", expression.this.lower())
287
288        return expression
289
290    class Tokenizer(tokens.Tokenizer):
291        QUOTES = ["'", '"', '"""', "'''"]
292        COMMENTS = ["--", "#", ("/*", "*/")]
293        IDENTIFIERS = ["`"]
294        STRING_ESCAPES = ["\\"]
295
296        HEX_STRINGS = [("0x", ""), ("0X", "")]
297
298        BYTE_STRINGS = [
299            (prefix + q, q) for q in t.cast(t.List[str], QUOTES) for prefix in ("b", "B")
300        ]
301
302        RAW_STRINGS = [
303            (prefix + q, q) for q in t.cast(t.List[str], QUOTES) for prefix in ("r", "R")
304        ]
305
306        KEYWORDS = {
307            **tokens.Tokenizer.KEYWORDS,
308            "ANY TYPE": TokenType.VARIANT,
309            "BEGIN": TokenType.COMMAND,
310            "BEGIN TRANSACTION": TokenType.BEGIN,
311            "BYTES": TokenType.BINARY,
312            "CURRENT_DATETIME": TokenType.CURRENT_DATETIME,
313            "DECLARE": TokenType.COMMAND,
314            "FLOAT64": TokenType.DOUBLE,
315            "FOR SYSTEM_TIME": TokenType.TIMESTAMP_SNAPSHOT,
316            "MODEL": TokenType.MODEL,
317            "NOT DETERMINISTIC": TokenType.VOLATILE,
318            "RECORD": TokenType.STRUCT,
319            "TIMESTAMP": TokenType.TIMESTAMPTZ,
320        }
321        KEYWORDS.pop("DIV")
322
323    class Parser(parser.Parser):
324        PREFIXED_PIVOT_COLUMNS = True
325
326        LOG_DEFAULTS_TO_LN = True
327
328        FUNCTIONS = {
329            **parser.Parser.FUNCTIONS,
330            "DATE": _parse_date,
331            "DATE_ADD": parse_date_delta_with_interval(exp.DateAdd),
332            "DATE_SUB": parse_date_delta_with_interval(exp.DateSub),
333            "DATE_TRUNC": lambda args: exp.DateTrunc(
334                unit=exp.Literal.string(str(seq_get(args, 1))),
335                this=seq_get(args, 0),
336            ),
337            "DATETIME_ADD": parse_date_delta_with_interval(exp.DatetimeAdd),
338            "DATETIME_SUB": parse_date_delta_with_interval(exp.DatetimeSub),
339            "DIV": binary_from_function(exp.IntDiv),
340            "FORMAT_DATE": lambda args: exp.TimeToStr(
341                this=exp.TsOrDsToDate(this=seq_get(args, 1)), format=seq_get(args, 0)
342            ),
343            "GENERATE_ARRAY": exp.GenerateSeries.from_arg_list,
344            "JSON_EXTRACT_SCALAR": lambda args: exp.JSONExtractScalar(
345                this=seq_get(args, 0), expression=seq_get(args, 1) or exp.Literal.string("$")
346            ),
347            "MD5": exp.MD5Digest.from_arg_list,
348            "TO_HEX": _parse_to_hex,
349            "PARSE_DATE": lambda args: format_time_lambda(exp.StrToDate, "bigquery")(
350                [seq_get(args, 1), seq_get(args, 0)]
351            ),
352            "PARSE_TIMESTAMP": _parse_timestamp,
353            "REGEXP_CONTAINS": exp.RegexpLike.from_arg_list,
354            "REGEXP_EXTRACT": lambda args: exp.RegexpExtract(
355                this=seq_get(args, 0),
356                expression=seq_get(args, 1),
357                position=seq_get(args, 2),
358                occurrence=seq_get(args, 3),
359                group=exp.Literal.number(1) if re.compile(args[1].name).groups == 1 else None,
360            ),
361            "SHA256": lambda args: exp.SHA2(this=seq_get(args, 0), length=exp.Literal.number(256)),
362            "SHA512": lambda args: exp.SHA2(this=seq_get(args, 0), length=exp.Literal.number(512)),
363            "SPLIT": lambda args: exp.Split(
364                # https://cloud.google.com/bigquery/docs/reference/standard-sql/string_functions#split
365                this=seq_get(args, 0),
366                expression=seq_get(args, 1) or exp.Literal.string(","),
367            ),
368            "TIME": _parse_time,
369            "TIME_ADD": parse_date_delta_with_interval(exp.TimeAdd),
370            "TIME_SUB": parse_date_delta_with_interval(exp.TimeSub),
371            "TIMESTAMP_ADD": parse_date_delta_with_interval(exp.TimestampAdd),
372            "TIMESTAMP_SUB": parse_date_delta_with_interval(exp.TimestampSub),
373            "TIMESTAMP_MICROS": lambda args: exp.UnixToTime(
374                this=seq_get(args, 0), scale=exp.UnixToTime.MICROS
375            ),
376            "TIMESTAMP_MILLIS": lambda args: exp.UnixToTime(
377                this=seq_get(args, 0), scale=exp.UnixToTime.MILLIS
378            ),
379            "TIMESTAMP_SECONDS": lambda args: exp.UnixToTime(this=seq_get(args, 0)),
380            "TO_JSON_STRING": exp.JSONFormat.from_arg_list,
381        }
382
383        FUNCTION_PARSERS = {
384            **parser.Parser.FUNCTION_PARSERS,
385            "ARRAY": lambda self: self.expression(exp.Array, expressions=[self._parse_statement()]),
386        }
387        FUNCTION_PARSERS.pop("TRIM")
388
389        NO_PAREN_FUNCTIONS = {
390            **parser.Parser.NO_PAREN_FUNCTIONS,
391            TokenType.CURRENT_DATETIME: exp.CurrentDatetime,
392        }
393
394        NESTED_TYPE_TOKENS = {
395            *parser.Parser.NESTED_TYPE_TOKENS,
396            TokenType.TABLE,
397        }
398
399        ID_VAR_TOKENS = {
400            *parser.Parser.ID_VAR_TOKENS,
401            TokenType.VALUES,
402        }
403
404        PROPERTY_PARSERS = {
405            **parser.Parser.PROPERTY_PARSERS,
406            "NOT DETERMINISTIC": lambda self: self.expression(
407                exp.StabilityProperty, this=exp.Literal.string("VOLATILE")
408            ),
409            "OPTIONS": lambda self: self._parse_with_property(),
410        }
411
412        CONSTRAINT_PARSERS = {
413            **parser.Parser.CONSTRAINT_PARSERS,
414            "OPTIONS": lambda self: exp.Properties(expressions=self._parse_with_property()),
415        }
416
417        RANGE_PARSERS = parser.Parser.RANGE_PARSERS.copy()
418        RANGE_PARSERS.pop(TokenType.OVERLAPS, None)
419
420        NULL_TOKENS = {TokenType.NULL, TokenType.UNKNOWN}
421
422        STATEMENT_PARSERS = {
423            **parser.Parser.STATEMENT_PARSERS,
424            TokenType.END: lambda self: self._parse_as_command(self._prev),
425            TokenType.FOR: lambda self: self._parse_for_in(),
426        }
427
428        BRACKET_OFFSETS = {
429            "OFFSET": (0, False),
430            "ORDINAL": (1, False),
431            "SAFE_OFFSET": (0, True),
432            "SAFE_ORDINAL": (1, True),
433        }
434
435        def _parse_for_in(self) -> exp.ForIn:
436            this = self._parse_range()
437            self._match_text_seq("DO")
438            return self.expression(exp.ForIn, this=this, expression=self._parse_statement())
439
440        def _parse_table_part(self, schema: bool = False) -> t.Optional[exp.Expression]:
441            this = super()._parse_table_part(schema=schema) or self._parse_number()
442
443            # https://cloud.google.com/bigquery/docs/reference/standard-sql/lexical#table_names
444            if isinstance(this, exp.Identifier):
445                table_name = this.name
446                while self._match(TokenType.DASH, advance=False) and self._next:
447                    self._advance(2)
448                    table_name += f"-{self._prev.text}"
449
450                this = exp.Identifier(this=table_name, quoted=this.args.get("quoted"))
451            elif isinstance(this, exp.Literal):
452                table_name = this.name
453
454                if self._is_connected() and self._parse_var(any_token=True):
455                    table_name += self._prev.text
456
457                this = exp.Identifier(this=table_name, quoted=True)
458
459            return this
460
461        def _parse_table_parts(self, schema: bool = False) -> exp.Table:
462            table = super()._parse_table_parts(schema=schema)
463            if isinstance(table.this, exp.Identifier) and "." in table.name:
464                catalog, db, this, *rest = (
465                    t.cast(t.Optional[exp.Expression], exp.to_identifier(x))
466                    for x in split_num_words(table.name, ".", 3)
467                )
468
469                if rest and this:
470                    this = exp.Dot.build(t.cast(t.List[exp.Expression], [this, *rest]))
471
472                table = exp.Table(this=this, db=db, catalog=catalog)
473
474            return table
475
476        @t.overload
477        def _parse_json_object(self, agg: Lit[False]) -> exp.JSONObject: ...
478
479        @t.overload
480        def _parse_json_object(self, agg: Lit[True]) -> exp.JSONObjectAgg: ...
481
482        def _parse_json_object(self, agg=False):
483            json_object = super()._parse_json_object()
484            array_kv_pair = seq_get(json_object.expressions, 0)
485
486            # Converts BQ's "signature 2" of JSON_OBJECT into SQLGlot's canonical representation
487            # https://cloud.google.com/bigquery/docs/reference/standard-sql/json_functions#json_object_signature2
488            if (
489                array_kv_pair
490                and isinstance(array_kv_pair.this, exp.Array)
491                and isinstance(array_kv_pair.expression, exp.Array)
492            ):
493                keys = array_kv_pair.this.expressions
494                values = array_kv_pair.expression.expressions
495
496                json_object.set(
497                    "expressions",
498                    [exp.JSONKeyValue(this=k, expression=v) for k, v in zip(keys, values)],
499                )
500
501            return json_object
502
503        def _parse_bracket(self, this: t.Optional[exp.Expression]) -> t.Optional[exp.Expression]:
504            bracket = super()._parse_bracket(this)
505
506            if this is bracket:
507                return bracket
508
509            if isinstance(bracket, exp.Bracket):
510                for expression in bracket.expressions:
511                    name = expression.name.upper()
512
513                    if name not in self.BRACKET_OFFSETS:
514                        break
515
516                    offset, safe = self.BRACKET_OFFSETS[name]
517                    bracket.set("offset", offset)
518                    bracket.set("safe", safe)
519                    expression.replace(expression.expressions[0])
520
521            return bracket
522
523    class Generator(generator.Generator):
524        EXPLICIT_UNION = True
525        INTERVAL_ALLOWS_PLURAL_FORM = False
526        JOIN_HINTS = False
527        QUERY_HINTS = False
528        TABLE_HINTS = False
529        LIMIT_FETCH = "LIMIT"
530        RENAME_TABLE_WITH_DB = False
531        NVL2_SUPPORTED = False
532        UNNEST_WITH_ORDINALITY = False
533        COLLATE_IS_FUNC = True
534        LIMIT_ONLY_LITERALS = True
535        SUPPORTS_TABLE_ALIAS_COLUMNS = False
536        UNPIVOT_ALIASES_ARE_IDENTIFIERS = False
537        JSON_KEY_VALUE_PAIR_SEP = ","
538        NULL_ORDERING_SUPPORTED = False
539
540        TRANSFORMS = {
541            **generator.Generator.TRANSFORMS,
542            exp.ApproxDistinct: rename_func("APPROX_COUNT_DISTINCT"),
543            exp.ArgMax: arg_max_or_min_no_count("MAX_BY"),
544            exp.ArgMin: arg_max_or_min_no_count("MIN_BY"),
545            exp.ArrayContains: _array_contains_sql,
546            exp.ArraySize: rename_func("ARRAY_LENGTH"),
547            exp.Cast: transforms.preprocess([transforms.remove_precision_parameterized_types]),
548            exp.CollateProperty: lambda self, e: (
549                f"DEFAULT COLLATE {self.sql(e, 'this')}"
550                if e.args.get("default")
551                else f"COLLATE {self.sql(e, 'this')}"
552            ),
553            exp.CountIf: rename_func("COUNTIF"),
554            exp.Create: _create_sql,
555            exp.CTE: transforms.preprocess([_pushdown_cte_column_names]),
556            exp.DateAdd: date_add_interval_sql("DATE", "ADD"),
557            exp.DateDiff: lambda self, e: f"DATE_DIFF({self.sql(e, 'this')}, {self.sql(e, 'expression')}, {self.sql(e.args.get('unit', 'DAY'))})",
558            exp.DateFromParts: rename_func("DATE"),
559            exp.DateStrToDate: datestrtodate_sql,
560            exp.DateSub: date_add_interval_sql("DATE", "SUB"),
561            exp.DatetimeAdd: date_add_interval_sql("DATETIME", "ADD"),
562            exp.DatetimeSub: date_add_interval_sql("DATETIME", "SUB"),
563            exp.DateTrunc: lambda self, e: self.func("DATE_TRUNC", e.this, e.text("unit")),
564            exp.FromTimeZone: lambda self, e: self.func(
565                "DATETIME", self.func("TIMESTAMP", e.this, e.args.get("zone")), "'UTC'"
566            ),
567            exp.GenerateSeries: rename_func("GENERATE_ARRAY"),
568            exp.GetPath: path_to_jsonpath(),
569            exp.GroupConcat: rename_func("STRING_AGG"),
570            exp.Hex: rename_func("TO_HEX"),
571            exp.If: if_sql(false_value="NULL"),
572            exp.ILike: no_ilike_sql,
573            exp.IntDiv: rename_func("DIV"),
574            exp.JSONFormat: rename_func("TO_JSON_STRING"),
575            exp.Max: max_or_greatest,
576            exp.MD5: lambda self, e: self.func("TO_HEX", self.func("MD5", e.this)),
577            exp.MD5Digest: rename_func("MD5"),
578            exp.Min: min_or_least,
579            exp.PartitionedByProperty: lambda self, e: f"PARTITION BY {self.sql(e, 'this')}",
580            exp.RegexpExtract: lambda self, e: self.func(
581                "REGEXP_EXTRACT",
582                e.this,
583                e.expression,
584                e.args.get("position"),
585                e.args.get("occurrence"),
586            ),
587            exp.RegexpReplace: regexp_replace_sql,
588            exp.RegexpLike: rename_func("REGEXP_CONTAINS"),
589            exp.ReturnsProperty: _returnsproperty_sql,
590            exp.Select: transforms.preprocess(
591                [
592                    transforms.explode_to_unnest(),
593                    _unqualify_unnest,
594                    transforms.eliminate_distinct_on,
595                    _alias_ordered_group,
596                    transforms.eliminate_semi_and_anti_joins,
597                ]
598            ),
599            exp.SHA2: lambda self, e: self.func(
600                f"SHA256" if e.text("length") == "256" else "SHA512", e.this
601            ),
602            exp.StabilityProperty: lambda self, e: (
603                f"DETERMINISTIC" if e.name == "IMMUTABLE" else "NOT DETERMINISTIC"
604            ),
605            exp.StrToDate: lambda self, e: f"PARSE_DATE({self.format_time(e)}, {self.sql(e, 'this')})",
606            exp.StrToTime: lambda self, e: self.func(
607                "PARSE_TIMESTAMP", self.format_time(e), e.this, e.args.get("zone")
608            ),
609            exp.TimeAdd: date_add_interval_sql("TIME", "ADD"),
610            exp.TimeFromParts: rename_func("TIME"),
611            exp.TimeSub: date_add_interval_sql("TIME", "SUB"),
612            exp.TimestampAdd: date_add_interval_sql("TIMESTAMP", "ADD"),
613            exp.TimestampSub: date_add_interval_sql("TIMESTAMP", "SUB"),
614            exp.TimeStrToTime: timestrtotime_sql,
615            exp.Trim: lambda self, e: self.func(f"TRIM", e.this, e.expression),
616            exp.TsOrDsAdd: _ts_or_ds_add_sql,
617            exp.TsOrDsDiff: _ts_or_ds_diff_sql,
618            exp.TsOrDsToTime: rename_func("TIME"),
619            exp.Unhex: rename_func("FROM_HEX"),
620            exp.UnixDate: rename_func("UNIX_DATE"),
621            exp.UnixToTime: _unix_to_time_sql,
622            exp.Values: _derived_table_values_to_unnest,
623            exp.VariancePop: rename_func("VAR_POP"),
624        }
625
626        TYPE_MAPPING = {
627            **generator.Generator.TYPE_MAPPING,
628            exp.DataType.Type.BIGDECIMAL: "BIGNUMERIC",
629            exp.DataType.Type.BIGINT: "INT64",
630            exp.DataType.Type.BINARY: "BYTES",
631            exp.DataType.Type.BOOLEAN: "BOOL",
632            exp.DataType.Type.CHAR: "STRING",
633            exp.DataType.Type.DECIMAL: "NUMERIC",
634            exp.DataType.Type.DOUBLE: "FLOAT64",
635            exp.DataType.Type.FLOAT: "FLOAT64",
636            exp.DataType.Type.INT: "INT64",
637            exp.DataType.Type.NCHAR: "STRING",
638            exp.DataType.Type.NVARCHAR: "STRING",
639            exp.DataType.Type.SMALLINT: "INT64",
640            exp.DataType.Type.TEXT: "STRING",
641            exp.DataType.Type.TIMESTAMP: "DATETIME",
642            exp.DataType.Type.TIMESTAMPTZ: "TIMESTAMP",
643            exp.DataType.Type.TIMESTAMPLTZ: "TIMESTAMP",
644            exp.DataType.Type.TINYINT: "INT64",
645            exp.DataType.Type.VARBINARY: "BYTES",
646            exp.DataType.Type.VARCHAR: "STRING",
647            exp.DataType.Type.VARIANT: "ANY TYPE",
648        }
649
650        PROPERTIES_LOCATION = {
651            **generator.Generator.PROPERTIES_LOCATION,
652            exp.PartitionedByProperty: exp.Properties.Location.POST_SCHEMA,
653            exp.VolatileProperty: exp.Properties.Location.UNSUPPORTED,
654        }
655
656        # from: https://cloud.google.com/bigquery/docs/reference/standard-sql/lexical#reserved_keywords
657        RESERVED_KEYWORDS = {
658            *generator.Generator.RESERVED_KEYWORDS,
659            "all",
660            "and",
661            "any",
662            "array",
663            "as",
664            "asc",
665            "assert_rows_modified",
666            "at",
667            "between",
668            "by",
669            "case",
670            "cast",
671            "collate",
672            "contains",
673            "create",
674            "cross",
675            "cube",
676            "current",
677            "default",
678            "define",
679            "desc",
680            "distinct",
681            "else",
682            "end",
683            "enum",
684            "escape",
685            "except",
686            "exclude",
687            "exists",
688            "extract",
689            "false",
690            "fetch",
691            "following",
692            "for",
693            "from",
694            "full",
695            "group",
696            "grouping",
697            "groups",
698            "hash",
699            "having",
700            "if",
701            "ignore",
702            "in",
703            "inner",
704            "intersect",
705            "interval",
706            "into",
707            "is",
708            "join",
709            "lateral",
710            "left",
711            "like",
712            "limit",
713            "lookup",
714            "merge",
715            "natural",
716            "new",
717            "no",
718            "not",
719            "null",
720            "nulls",
721            "of",
722            "on",
723            "or",
724            "order",
725            "outer",
726            "over",
727            "partition",
728            "preceding",
729            "proto",
730            "qualify",
731            "range",
732            "recursive",
733            "respect",
734            "right",
735            "rollup",
736            "rows",
737            "select",
738            "set",
739            "some",
740            "struct",
741            "tablesample",
742            "then",
743            "to",
744            "treat",
745            "true",
746            "unbounded",
747            "union",
748            "unnest",
749            "using",
750            "when",
751            "where",
752            "window",
753            "with",
754            "within",
755        }
756
757        def timetostr_sql(self, expression: exp.TimeToStr) -> str:
758            if isinstance(expression.this, exp.TsOrDsToDate):
759                this: exp.Expression = expression.this
760            else:
761                this = expression
762
763            return f"FORMAT_DATE({self.format_time(expression)}, {self.sql(this, 'this')})"
764
765        def struct_sql(self, expression: exp.Struct) -> str:
766            args = []
767            for expr in expression.expressions:
768                if isinstance(expr, self.KEY_VALUE_DEFINITIONS):
769                    arg = f"{self.sql(expr, 'expression')} AS {expr.this.name}"
770                else:
771                    arg = self.sql(expr)
772
773                args.append(arg)
774
775            return self.func("STRUCT", *args)
776
777        def eq_sql(self, expression: exp.EQ) -> str:
778            # Operands of = cannot be NULL in BigQuery
779            if isinstance(expression.left, exp.Null) or isinstance(expression.right, exp.Null):
780                if not isinstance(expression.parent, exp.Update):
781                    return "NULL"
782
783            return self.binary(expression, "=")
784
785        def attimezone_sql(self, expression: exp.AtTimeZone) -> str:
786            parent = expression.parent
787
788            # BigQuery allows CAST(.. AS {STRING|TIMESTAMP} [FORMAT <fmt> [AT TIME ZONE <tz>]]).
789            # Only the TIMESTAMP one should use the below conversion, when AT TIME ZONE is included.
790            if not isinstance(parent, exp.Cast) or not parent.to.is_type("text"):
791                return self.func(
792                    "TIMESTAMP", self.func("DATETIME", expression.this, expression.args.get("zone"))
793                )
794
795            return super().attimezone_sql(expression)
796
797        def trycast_sql(self, expression: exp.TryCast) -> str:
798            return self.cast_sql(expression, safe_prefix="SAFE_")
799
800        def cte_sql(self, expression: exp.CTE) -> str:
801            if expression.alias_column_names:
802                self.unsupported("Column names in CTE definition are not supported.")
803            return super().cte_sql(expression)
804
805        def array_sql(self, expression: exp.Array) -> str:
806            first_arg = seq_get(expression.expressions, 0)
807            if isinstance(first_arg, exp.Subqueryable):
808                return f"ARRAY{self.wrap(self.sql(first_arg))}"
809
810            return inline_array_sql(self, expression)
811
812        def bracket_sql(self, expression: exp.Bracket) -> str:
813            this = self.sql(expression, "this")
814            expressions = expression.expressions
815
816            if len(expressions) == 1:
817                arg = expressions[0]
818                if arg.type is None:
819                    from sqlglot.optimizer.annotate_types import annotate_types
820
821                    arg = annotate_types(arg)
822
823                if arg.type and arg.type.this in exp.DataType.TEXT_TYPES:
824                    # BQ doesn't support bracket syntax with string values
825                    return f"{this}.{arg.name}"
826
827            expressions_sql = ", ".join(self.sql(e) for e in expressions)
828            offset = expression.args.get("offset")
829
830            if offset == 0:
831                expressions_sql = f"OFFSET({expressions_sql})"
832            elif offset == 1:
833                expressions_sql = f"ORDINAL({expressions_sql})"
834            elif offset is not None:
835                self.unsupported(f"Unsupported array offset: {offset}")
836
837            if expression.args.get("safe"):
838                expressions_sql = f"SAFE_{expressions_sql}"
839
840            return f"{this}[{expressions_sql}]"
841
842        def transaction_sql(self, *_) -> str:
843            return "BEGIN TRANSACTION"
844
845        def commit_sql(self, *_) -> str:
846            return "COMMIT TRANSACTION"
847
848        def rollback_sql(self, *_) -> str:
849            return "ROLLBACK TRANSACTION"
850
851        def in_unnest_op(self, expression: exp.Unnest) -> str:
852            return self.sql(expression)
853
854        def except_op(self, expression: exp.Except) -> str:
855            if not expression.args.get("distinct", False):
856                self.unsupported("EXCEPT without DISTINCT is not supported in BigQuery")
857            return f"EXCEPT{' DISTINCT' if expression.args.get('distinct') else ' ALL'}"
858
859        def intersect_op(self, expression: exp.Intersect) -> str:
860            if not expression.args.get("distinct", False):
861                self.unsupported("INTERSECT without DISTINCT is not supported in BigQuery")
862            return f"INTERSECT{' DISTINCT' if expression.args.get('distinct') else ' ALL'}"
863
864        def with_properties(self, properties: exp.Properties) -> str:
865            return self.properties(properties, prefix=self.seg("OPTIONS"))
866
867        def version_sql(self, expression: exp.Version) -> str:
868            if expression.name == "TIMESTAMP":
869                expression.set("this", "SYSTEM_TIME")
870            return super().version_sql(expression)
logger = <Logger sqlglot (WARNING)>
class BigQuery(sqlglot.dialects.dialect.Dialect):
226class BigQuery(Dialect):
227    WEEK_OFFSET = -1
228    UNNEST_COLUMN_ONLY = True
229    SUPPORTS_USER_DEFINED_TYPES = False
230    SUPPORTS_SEMI_ANTI_JOIN = False
231    LOG_BASE_FIRST = False
232
233    # https://cloud.google.com/bigquery/docs/reference/standard-sql/lexical#case_sensitivity
234    NORMALIZATION_STRATEGY = NormalizationStrategy.CASE_INSENSITIVE
235
236    # bigquery udfs are case sensitive
237    NORMALIZE_FUNCTIONS = False
238
239    TIME_MAPPING = {
240        "%D": "%m/%d/%y",
241    }
242
243    ESCAPE_SEQUENCES = {
244        "\\a": "\a",
245        "\\b": "\b",
246        "\\f": "\f",
247        "\\n": "\n",
248        "\\r": "\r",
249        "\\t": "\t",
250        "\\v": "\v",
251    }
252
253    FORMAT_MAPPING = {
254        "DD": "%d",
255        "MM": "%m",
256        "MON": "%b",
257        "MONTH": "%B",
258        "YYYY": "%Y",
259        "YY": "%y",
260        "HH": "%I",
261        "HH12": "%I",
262        "HH24": "%H",
263        "MI": "%M",
264        "SS": "%S",
265        "SSSSS": "%f",
266        "TZH": "%z",
267    }
268
269    # The _PARTITIONTIME and _PARTITIONDATE pseudo-columns are not returned by a SELECT * statement
270    # https://cloud.google.com/bigquery/docs/querying-partitioned-tables#query_an_ingestion-time_partitioned_table
271    PSEUDOCOLUMNS = {"_PARTITIONTIME", "_PARTITIONDATE"}
272
273    def normalize_identifier(self, expression: E) -> E:
274        if isinstance(expression, exp.Identifier):
275            parent = expression.parent
276            while isinstance(parent, exp.Dot):
277                parent = parent.parent
278
279            # In BigQuery, CTEs aren't case-sensitive, but table names are (by default, at least).
280            # The following check is essentially a heuristic to detect tables based on whether or
281            # not they're qualified. It also avoids normalizing UDFs, because they're case-sensitive.
282            if (
283                not isinstance(parent, exp.UserDefinedFunction)
284                and not (isinstance(parent, exp.Table) and parent.db)
285                and not expression.meta.get("is_table")
286            ):
287                expression.set("this", expression.this.lower())
288
289        return expression
290
291    class Tokenizer(tokens.Tokenizer):
292        QUOTES = ["'", '"', '"""', "'''"]
293        COMMENTS = ["--", "#", ("/*", "*/")]
294        IDENTIFIERS = ["`"]
295        STRING_ESCAPES = ["\\"]
296
297        HEX_STRINGS = [("0x", ""), ("0X", "")]
298
299        BYTE_STRINGS = [
300            (prefix + q, q) for q in t.cast(t.List[str], QUOTES) for prefix in ("b", "B")
301        ]
302
303        RAW_STRINGS = [
304            (prefix + q, q) for q in t.cast(t.List[str], QUOTES) for prefix in ("r", "R")
305        ]
306
307        KEYWORDS = {
308            **tokens.Tokenizer.KEYWORDS,
309            "ANY TYPE": TokenType.VARIANT,
310            "BEGIN": TokenType.COMMAND,
311            "BEGIN TRANSACTION": TokenType.BEGIN,
312            "BYTES": TokenType.BINARY,
313            "CURRENT_DATETIME": TokenType.CURRENT_DATETIME,
314            "DECLARE": TokenType.COMMAND,
315            "FLOAT64": TokenType.DOUBLE,
316            "FOR SYSTEM_TIME": TokenType.TIMESTAMP_SNAPSHOT,
317            "MODEL": TokenType.MODEL,
318            "NOT DETERMINISTIC": TokenType.VOLATILE,
319            "RECORD": TokenType.STRUCT,
320            "TIMESTAMP": TokenType.TIMESTAMPTZ,
321        }
322        KEYWORDS.pop("DIV")
323
324    class Parser(parser.Parser):
325        PREFIXED_PIVOT_COLUMNS = True
326
327        LOG_DEFAULTS_TO_LN = True
328
329        FUNCTIONS = {
330            **parser.Parser.FUNCTIONS,
331            "DATE": _parse_date,
332            "DATE_ADD": parse_date_delta_with_interval(exp.DateAdd),
333            "DATE_SUB": parse_date_delta_with_interval(exp.DateSub),
334            "DATE_TRUNC": lambda args: exp.DateTrunc(
335                unit=exp.Literal.string(str(seq_get(args, 1))),
336                this=seq_get(args, 0),
337            ),
338            "DATETIME_ADD": parse_date_delta_with_interval(exp.DatetimeAdd),
339            "DATETIME_SUB": parse_date_delta_with_interval(exp.DatetimeSub),
340            "DIV": binary_from_function(exp.IntDiv),
341            "FORMAT_DATE": lambda args: exp.TimeToStr(
342                this=exp.TsOrDsToDate(this=seq_get(args, 1)), format=seq_get(args, 0)
343            ),
344            "GENERATE_ARRAY": exp.GenerateSeries.from_arg_list,
345            "JSON_EXTRACT_SCALAR": lambda args: exp.JSONExtractScalar(
346                this=seq_get(args, 0), expression=seq_get(args, 1) or exp.Literal.string("$")
347            ),
348            "MD5": exp.MD5Digest.from_arg_list,
349            "TO_HEX": _parse_to_hex,
350            "PARSE_DATE": lambda args: format_time_lambda(exp.StrToDate, "bigquery")(
351                [seq_get(args, 1), seq_get(args, 0)]
352            ),
353            "PARSE_TIMESTAMP": _parse_timestamp,
354            "REGEXP_CONTAINS": exp.RegexpLike.from_arg_list,
355            "REGEXP_EXTRACT": lambda args: exp.RegexpExtract(
356                this=seq_get(args, 0),
357                expression=seq_get(args, 1),
358                position=seq_get(args, 2),
359                occurrence=seq_get(args, 3),
360                group=exp.Literal.number(1) if re.compile(args[1].name).groups == 1 else None,
361            ),
362            "SHA256": lambda args: exp.SHA2(this=seq_get(args, 0), length=exp.Literal.number(256)),
363            "SHA512": lambda args: exp.SHA2(this=seq_get(args, 0), length=exp.Literal.number(512)),
364            "SPLIT": lambda args: exp.Split(
365                # https://cloud.google.com/bigquery/docs/reference/standard-sql/string_functions#split
366                this=seq_get(args, 0),
367                expression=seq_get(args, 1) or exp.Literal.string(","),
368            ),
369            "TIME": _parse_time,
370            "TIME_ADD": parse_date_delta_with_interval(exp.TimeAdd),
371            "TIME_SUB": parse_date_delta_with_interval(exp.TimeSub),
372            "TIMESTAMP_ADD": parse_date_delta_with_interval(exp.TimestampAdd),
373            "TIMESTAMP_SUB": parse_date_delta_with_interval(exp.TimestampSub),
374            "TIMESTAMP_MICROS": lambda args: exp.UnixToTime(
375                this=seq_get(args, 0), scale=exp.UnixToTime.MICROS
376            ),
377            "TIMESTAMP_MILLIS": lambda args: exp.UnixToTime(
378                this=seq_get(args, 0), scale=exp.UnixToTime.MILLIS
379            ),
380            "TIMESTAMP_SECONDS": lambda args: exp.UnixToTime(this=seq_get(args, 0)),
381            "TO_JSON_STRING": exp.JSONFormat.from_arg_list,
382        }
383
384        FUNCTION_PARSERS = {
385            **parser.Parser.FUNCTION_PARSERS,
386            "ARRAY": lambda self: self.expression(exp.Array, expressions=[self._parse_statement()]),
387        }
388        FUNCTION_PARSERS.pop("TRIM")
389
390        NO_PAREN_FUNCTIONS = {
391            **parser.Parser.NO_PAREN_FUNCTIONS,
392            TokenType.CURRENT_DATETIME: exp.CurrentDatetime,
393        }
394
395        NESTED_TYPE_TOKENS = {
396            *parser.Parser.NESTED_TYPE_TOKENS,
397            TokenType.TABLE,
398        }
399
400        ID_VAR_TOKENS = {
401            *parser.Parser.ID_VAR_TOKENS,
402            TokenType.VALUES,
403        }
404
405        PROPERTY_PARSERS = {
406            **parser.Parser.PROPERTY_PARSERS,
407            "NOT DETERMINISTIC": lambda self: self.expression(
408                exp.StabilityProperty, this=exp.Literal.string("VOLATILE")
409            ),
410            "OPTIONS": lambda self: self._parse_with_property(),
411        }
412
413        CONSTRAINT_PARSERS = {
414            **parser.Parser.CONSTRAINT_PARSERS,
415            "OPTIONS": lambda self: exp.Properties(expressions=self._parse_with_property()),
416        }
417
418        RANGE_PARSERS = parser.Parser.RANGE_PARSERS.copy()
419        RANGE_PARSERS.pop(TokenType.OVERLAPS, None)
420
421        NULL_TOKENS = {TokenType.NULL, TokenType.UNKNOWN}
422
423        STATEMENT_PARSERS = {
424            **parser.Parser.STATEMENT_PARSERS,
425            TokenType.END: lambda self: self._parse_as_command(self._prev),
426            TokenType.FOR: lambda self: self._parse_for_in(),
427        }
428
429        BRACKET_OFFSETS = {
430            "OFFSET": (0, False),
431            "ORDINAL": (1, False),
432            "SAFE_OFFSET": (0, True),
433            "SAFE_ORDINAL": (1, True),
434        }
435
436        def _parse_for_in(self) -> exp.ForIn:
437            this = self._parse_range()
438            self._match_text_seq("DO")
439            return self.expression(exp.ForIn, this=this, expression=self._parse_statement())
440
441        def _parse_table_part(self, schema: bool = False) -> t.Optional[exp.Expression]:
442            this = super()._parse_table_part(schema=schema) or self._parse_number()
443
444            # https://cloud.google.com/bigquery/docs/reference/standard-sql/lexical#table_names
445            if isinstance(this, exp.Identifier):
446                table_name = this.name
447                while self._match(TokenType.DASH, advance=False) and self._next:
448                    self._advance(2)
449                    table_name += f"-{self._prev.text}"
450
451                this = exp.Identifier(this=table_name, quoted=this.args.get("quoted"))
452            elif isinstance(this, exp.Literal):
453                table_name = this.name
454
455                if self._is_connected() and self._parse_var(any_token=True):
456                    table_name += self._prev.text
457
458                this = exp.Identifier(this=table_name, quoted=True)
459
460            return this
461
462        def _parse_table_parts(self, schema: bool = False) -> exp.Table:
463            table = super()._parse_table_parts(schema=schema)
464            if isinstance(table.this, exp.Identifier) and "." in table.name:
465                catalog, db, this, *rest = (
466                    t.cast(t.Optional[exp.Expression], exp.to_identifier(x))
467                    for x in split_num_words(table.name, ".", 3)
468                )
469
470                if rest and this:
471                    this = exp.Dot.build(t.cast(t.List[exp.Expression], [this, *rest]))
472
473                table = exp.Table(this=this, db=db, catalog=catalog)
474
475            return table
476
477        @t.overload
478        def _parse_json_object(self, agg: Lit[False]) -> exp.JSONObject: ...
479
480        @t.overload
481        def _parse_json_object(self, agg: Lit[True]) -> exp.JSONObjectAgg: ...
482
483        def _parse_json_object(self, agg=False):
484            json_object = super()._parse_json_object()
485            array_kv_pair = seq_get(json_object.expressions, 0)
486
487            # Converts BQ's "signature 2" of JSON_OBJECT into SQLGlot's canonical representation
488            # https://cloud.google.com/bigquery/docs/reference/standard-sql/json_functions#json_object_signature2
489            if (
490                array_kv_pair
491                and isinstance(array_kv_pair.this, exp.Array)
492                and isinstance(array_kv_pair.expression, exp.Array)
493            ):
494                keys = array_kv_pair.this.expressions
495                values = array_kv_pair.expression.expressions
496
497                json_object.set(
498                    "expressions",
499                    [exp.JSONKeyValue(this=k, expression=v) for k, v in zip(keys, values)],
500                )
501
502            return json_object
503
504        def _parse_bracket(self, this: t.Optional[exp.Expression]) -> t.Optional[exp.Expression]:
505            bracket = super()._parse_bracket(this)
506
507            if this is bracket:
508                return bracket
509
510            if isinstance(bracket, exp.Bracket):
511                for expression in bracket.expressions:
512                    name = expression.name.upper()
513
514                    if name not in self.BRACKET_OFFSETS:
515                        break
516
517                    offset, safe = self.BRACKET_OFFSETS[name]
518                    bracket.set("offset", offset)
519                    bracket.set("safe", safe)
520                    expression.replace(expression.expressions[0])
521
522            return bracket
523
524    class Generator(generator.Generator):
525        EXPLICIT_UNION = True
526        INTERVAL_ALLOWS_PLURAL_FORM = False
527        JOIN_HINTS = False
528        QUERY_HINTS = False
529        TABLE_HINTS = False
530        LIMIT_FETCH = "LIMIT"
531        RENAME_TABLE_WITH_DB = False
532        NVL2_SUPPORTED = False
533        UNNEST_WITH_ORDINALITY = False
534        COLLATE_IS_FUNC = True
535        LIMIT_ONLY_LITERALS = True
536        SUPPORTS_TABLE_ALIAS_COLUMNS = False
537        UNPIVOT_ALIASES_ARE_IDENTIFIERS = False
538        JSON_KEY_VALUE_PAIR_SEP = ","
539        NULL_ORDERING_SUPPORTED = False
540
541        TRANSFORMS = {
542            **generator.Generator.TRANSFORMS,
543            exp.ApproxDistinct: rename_func("APPROX_COUNT_DISTINCT"),
544            exp.ArgMax: arg_max_or_min_no_count("MAX_BY"),
545            exp.ArgMin: arg_max_or_min_no_count("MIN_BY"),
546            exp.ArrayContains: _array_contains_sql,
547            exp.ArraySize: rename_func("ARRAY_LENGTH"),
548            exp.Cast: transforms.preprocess([transforms.remove_precision_parameterized_types]),
549            exp.CollateProperty: lambda self, e: (
550                f"DEFAULT COLLATE {self.sql(e, 'this')}"
551                if e.args.get("default")
552                else f"COLLATE {self.sql(e, 'this')}"
553            ),
554            exp.CountIf: rename_func("COUNTIF"),
555            exp.Create: _create_sql,
556            exp.CTE: transforms.preprocess([_pushdown_cte_column_names]),
557            exp.DateAdd: date_add_interval_sql("DATE", "ADD"),
558            exp.DateDiff: lambda self, e: f"DATE_DIFF({self.sql(e, 'this')}, {self.sql(e, 'expression')}, {self.sql(e.args.get('unit', 'DAY'))})",
559            exp.DateFromParts: rename_func("DATE"),
560            exp.DateStrToDate: datestrtodate_sql,
561            exp.DateSub: date_add_interval_sql("DATE", "SUB"),
562            exp.DatetimeAdd: date_add_interval_sql("DATETIME", "ADD"),
563            exp.DatetimeSub: date_add_interval_sql("DATETIME", "SUB"),
564            exp.DateTrunc: lambda self, e: self.func("DATE_TRUNC", e.this, e.text("unit")),
565            exp.FromTimeZone: lambda self, e: self.func(
566                "DATETIME", self.func("TIMESTAMP", e.this, e.args.get("zone")), "'UTC'"
567            ),
568            exp.GenerateSeries: rename_func("GENERATE_ARRAY"),
569            exp.GetPath: path_to_jsonpath(),
570            exp.GroupConcat: rename_func("STRING_AGG"),
571            exp.Hex: rename_func("TO_HEX"),
572            exp.If: if_sql(false_value="NULL"),
573            exp.ILike: no_ilike_sql,
574            exp.IntDiv: rename_func("DIV"),
575            exp.JSONFormat: rename_func("TO_JSON_STRING"),
576            exp.Max: max_or_greatest,
577            exp.MD5: lambda self, e: self.func("TO_HEX", self.func("MD5", e.this)),
578            exp.MD5Digest: rename_func("MD5"),
579            exp.Min: min_or_least,
580            exp.PartitionedByProperty: lambda self, e: f"PARTITION BY {self.sql(e, 'this')}",
581            exp.RegexpExtract: lambda self, e: self.func(
582                "REGEXP_EXTRACT",
583                e.this,
584                e.expression,
585                e.args.get("position"),
586                e.args.get("occurrence"),
587            ),
588            exp.RegexpReplace: regexp_replace_sql,
589            exp.RegexpLike: rename_func("REGEXP_CONTAINS"),
590            exp.ReturnsProperty: _returnsproperty_sql,
591            exp.Select: transforms.preprocess(
592                [
593                    transforms.explode_to_unnest(),
594                    _unqualify_unnest,
595                    transforms.eliminate_distinct_on,
596                    _alias_ordered_group,
597                    transforms.eliminate_semi_and_anti_joins,
598                ]
599            ),
600            exp.SHA2: lambda self, e: self.func(
601                f"SHA256" if e.text("length") == "256" else "SHA512", e.this
602            ),
603            exp.StabilityProperty: lambda self, e: (
604                f"DETERMINISTIC" if e.name == "IMMUTABLE" else "NOT DETERMINISTIC"
605            ),
606            exp.StrToDate: lambda self, e: f"PARSE_DATE({self.format_time(e)}, {self.sql(e, 'this')})",
607            exp.StrToTime: lambda self, e: self.func(
608                "PARSE_TIMESTAMP", self.format_time(e), e.this, e.args.get("zone")
609            ),
610            exp.TimeAdd: date_add_interval_sql("TIME", "ADD"),
611            exp.TimeFromParts: rename_func("TIME"),
612            exp.TimeSub: date_add_interval_sql("TIME", "SUB"),
613            exp.TimestampAdd: date_add_interval_sql("TIMESTAMP", "ADD"),
614            exp.TimestampSub: date_add_interval_sql("TIMESTAMP", "SUB"),
615            exp.TimeStrToTime: timestrtotime_sql,
616            exp.Trim: lambda self, e: self.func(f"TRIM", e.this, e.expression),
617            exp.TsOrDsAdd: _ts_or_ds_add_sql,
618            exp.TsOrDsDiff: _ts_or_ds_diff_sql,
619            exp.TsOrDsToTime: rename_func("TIME"),
620            exp.Unhex: rename_func("FROM_HEX"),
621            exp.UnixDate: rename_func("UNIX_DATE"),
622            exp.UnixToTime: _unix_to_time_sql,
623            exp.Values: _derived_table_values_to_unnest,
624            exp.VariancePop: rename_func("VAR_POP"),
625        }
626
627        TYPE_MAPPING = {
628            **generator.Generator.TYPE_MAPPING,
629            exp.DataType.Type.BIGDECIMAL: "BIGNUMERIC",
630            exp.DataType.Type.BIGINT: "INT64",
631            exp.DataType.Type.BINARY: "BYTES",
632            exp.DataType.Type.BOOLEAN: "BOOL",
633            exp.DataType.Type.CHAR: "STRING",
634            exp.DataType.Type.DECIMAL: "NUMERIC",
635            exp.DataType.Type.DOUBLE: "FLOAT64",
636            exp.DataType.Type.FLOAT: "FLOAT64",
637            exp.DataType.Type.INT: "INT64",
638            exp.DataType.Type.NCHAR: "STRING",
639            exp.DataType.Type.NVARCHAR: "STRING",
640            exp.DataType.Type.SMALLINT: "INT64",
641            exp.DataType.Type.TEXT: "STRING",
642            exp.DataType.Type.TIMESTAMP: "DATETIME",
643            exp.DataType.Type.TIMESTAMPTZ: "TIMESTAMP",
644            exp.DataType.Type.TIMESTAMPLTZ: "TIMESTAMP",
645            exp.DataType.Type.TINYINT: "INT64",
646            exp.DataType.Type.VARBINARY: "BYTES",
647            exp.DataType.Type.VARCHAR: "STRING",
648            exp.DataType.Type.VARIANT: "ANY TYPE",
649        }
650
651        PROPERTIES_LOCATION = {
652            **generator.Generator.PROPERTIES_LOCATION,
653            exp.PartitionedByProperty: exp.Properties.Location.POST_SCHEMA,
654            exp.VolatileProperty: exp.Properties.Location.UNSUPPORTED,
655        }
656
657        # from: https://cloud.google.com/bigquery/docs/reference/standard-sql/lexical#reserved_keywords
658        RESERVED_KEYWORDS = {
659            *generator.Generator.RESERVED_KEYWORDS,
660            "all",
661            "and",
662            "any",
663            "array",
664            "as",
665            "asc",
666            "assert_rows_modified",
667            "at",
668            "between",
669            "by",
670            "case",
671            "cast",
672            "collate",
673            "contains",
674            "create",
675            "cross",
676            "cube",
677            "current",
678            "default",
679            "define",
680            "desc",
681            "distinct",
682            "else",
683            "end",
684            "enum",
685            "escape",
686            "except",
687            "exclude",
688            "exists",
689            "extract",
690            "false",
691            "fetch",
692            "following",
693            "for",
694            "from",
695            "full",
696            "group",
697            "grouping",
698            "groups",
699            "hash",
700            "having",
701            "if",
702            "ignore",
703            "in",
704            "inner",
705            "intersect",
706            "interval",
707            "into",
708            "is",
709            "join",
710            "lateral",
711            "left",
712            "like",
713            "limit",
714            "lookup",
715            "merge",
716            "natural",
717            "new",
718            "no",
719            "not",
720            "null",
721            "nulls",
722            "of",
723            "on",
724            "or",
725            "order",
726            "outer",
727            "over",
728            "partition",
729            "preceding",
730            "proto",
731            "qualify",
732            "range",
733            "recursive",
734            "respect",
735            "right",
736            "rollup",
737            "rows",
738            "select",
739            "set",
740            "some",
741            "struct",
742            "tablesample",
743            "then",
744            "to",
745            "treat",
746            "true",
747            "unbounded",
748            "union",
749            "unnest",
750            "using",
751            "when",
752            "where",
753            "window",
754            "with",
755            "within",
756        }
757
758        def timetostr_sql(self, expression: exp.TimeToStr) -> str:
759            if isinstance(expression.this, exp.TsOrDsToDate):
760                this: exp.Expression = expression.this
761            else:
762                this = expression
763
764            return f"FORMAT_DATE({self.format_time(expression)}, {self.sql(this, 'this')})"
765
766        def struct_sql(self, expression: exp.Struct) -> str:
767            args = []
768            for expr in expression.expressions:
769                if isinstance(expr, self.KEY_VALUE_DEFINITIONS):
770                    arg = f"{self.sql(expr, 'expression')} AS {expr.this.name}"
771                else:
772                    arg = self.sql(expr)
773
774                args.append(arg)
775
776            return self.func("STRUCT", *args)
777
778        def eq_sql(self, expression: exp.EQ) -> str:
779            # Operands of = cannot be NULL in BigQuery
780            if isinstance(expression.left, exp.Null) or isinstance(expression.right, exp.Null):
781                if not isinstance(expression.parent, exp.Update):
782                    return "NULL"
783
784            return self.binary(expression, "=")
785
786        def attimezone_sql(self, expression: exp.AtTimeZone) -> str:
787            parent = expression.parent
788
789            # BigQuery allows CAST(.. AS {STRING|TIMESTAMP} [FORMAT <fmt> [AT TIME ZONE <tz>]]).
790            # Only the TIMESTAMP one should use the below conversion, when AT TIME ZONE is included.
791            if not isinstance(parent, exp.Cast) or not parent.to.is_type("text"):
792                return self.func(
793                    "TIMESTAMP", self.func("DATETIME", expression.this, expression.args.get("zone"))
794                )
795
796            return super().attimezone_sql(expression)
797
798        def trycast_sql(self, expression: exp.TryCast) -> str:
799            return self.cast_sql(expression, safe_prefix="SAFE_")
800
801        def cte_sql(self, expression: exp.CTE) -> str:
802            if expression.alias_column_names:
803                self.unsupported("Column names in CTE definition are not supported.")
804            return super().cte_sql(expression)
805
806        def array_sql(self, expression: exp.Array) -> str:
807            first_arg = seq_get(expression.expressions, 0)
808            if isinstance(first_arg, exp.Subqueryable):
809                return f"ARRAY{self.wrap(self.sql(first_arg))}"
810
811            return inline_array_sql(self, expression)
812
813        def bracket_sql(self, expression: exp.Bracket) -> str:
814            this = self.sql(expression, "this")
815            expressions = expression.expressions
816
817            if len(expressions) == 1:
818                arg = expressions[0]
819                if arg.type is None:
820                    from sqlglot.optimizer.annotate_types import annotate_types
821
822                    arg = annotate_types(arg)
823
824                if arg.type and arg.type.this in exp.DataType.TEXT_TYPES:
825                    # BQ doesn't support bracket syntax with string values
826                    return f"{this}.{arg.name}"
827
828            expressions_sql = ", ".join(self.sql(e) for e in expressions)
829            offset = expression.args.get("offset")
830
831            if offset == 0:
832                expressions_sql = f"OFFSET({expressions_sql})"
833            elif offset == 1:
834                expressions_sql = f"ORDINAL({expressions_sql})"
835            elif offset is not None:
836                self.unsupported(f"Unsupported array offset: {offset}")
837
838            if expression.args.get("safe"):
839                expressions_sql = f"SAFE_{expressions_sql}"
840
841            return f"{this}[{expressions_sql}]"
842
843        def transaction_sql(self, *_) -> str:
844            return "BEGIN TRANSACTION"
845
846        def commit_sql(self, *_) -> str:
847            return "COMMIT TRANSACTION"
848
849        def rollback_sql(self, *_) -> str:
850            return "ROLLBACK TRANSACTION"
851
852        def in_unnest_op(self, expression: exp.Unnest) -> str:
853            return self.sql(expression)
854
855        def except_op(self, expression: exp.Except) -> str:
856            if not expression.args.get("distinct", False):
857                self.unsupported("EXCEPT without DISTINCT is not supported in BigQuery")
858            return f"EXCEPT{' DISTINCT' if expression.args.get('distinct') else ' ALL'}"
859
860        def intersect_op(self, expression: exp.Intersect) -> str:
861            if not expression.args.get("distinct", False):
862                self.unsupported("INTERSECT without DISTINCT is not supported in BigQuery")
863            return f"INTERSECT{' DISTINCT' if expression.args.get('distinct') else ' ALL'}"
864
865        def with_properties(self, properties: exp.Properties) -> str:
866            return self.properties(properties, prefix=self.seg("OPTIONS"))
867
868        def version_sql(self, expression: exp.Version) -> str:
869            if expression.name == "TIMESTAMP":
870                expression.set("this", "SYSTEM_TIME")
871            return super().version_sql(expression)
WEEK_OFFSET = -1

Determines the day of week of DATE_TRUNC(week). Defaults to 0 (Monday). -1 would be Sunday.

UNNEST_COLUMN_ONLY = True

Determines whether or not UNNEST table aliases are treated as column aliases.

SUPPORTS_USER_DEFINED_TYPES = False

Determines whether or not user-defined data types are supported.

SUPPORTS_SEMI_ANTI_JOIN = False

Determines whether or not SEMI or ANTI joins are supported.

LOG_BASE_FIRST = False

Determines whether the base comes first in the LOG function.

NORMALIZATION_STRATEGY = <NormalizationStrategy.CASE_INSENSITIVE: 'CASE_INSENSITIVE'>

Specifies the strategy according to which identifiers should be normalized.

NORMALIZE_FUNCTIONS: bool | str = False

Determines how function names are going to be normalized.

TIME_MAPPING: Dict[str, str] = {'%D': '%m/%d/%y'}

Associates this dialect's time formats with their equivalent Python strftime format.

ESCAPE_SEQUENCES: Dict[str, str] = {'\\a': '\x07', '\\b': '\x08', '\\f': '\x0c', '\\n': '\n', '\\r': '\r', '\\t': '\t', '\\v': '\x0b'}

Mapping of an unescaped escape sequence to the corresponding character.

FORMAT_MAPPING: Dict[str, str] = {'DD': '%d', 'MM': '%m', 'MON': '%b', 'MONTH': '%B', 'YYYY': '%Y', 'YY': '%y', 'HH': '%I', 'HH12': '%I', 'HH24': '%H', 'MI': '%M', 'SS': '%S', 'SSSSS': '%f', 'TZH': '%z'}

Helper which is used for parsing the special syntax CAST(x AS DATE FORMAT 'yyyy'). If empty, the corresponding trie will be constructed off of TIME_MAPPING.

PSEUDOCOLUMNS: Set[str] = {'_PARTITIONDATE', '_PARTITIONTIME'}

Columns that are auto-generated by the engine corresponding to this dialect. For example, such columns may be excluded from SELECT * queries.

def normalize_identifier(self, expression: ~E) -> ~E:
273    def normalize_identifier(self, expression: E) -> E:
274        if isinstance(expression, exp.Identifier):
275            parent = expression.parent
276            while isinstance(parent, exp.Dot):
277                parent = parent.parent
278
279            # In BigQuery, CTEs aren't case-sensitive, but table names are (by default, at least).
280            # The following check is essentially a heuristic to detect tables based on whether or
281            # not they're qualified. It also avoids normalizing UDFs, because they're case-sensitive.
282            if (
283                not isinstance(parent, exp.UserDefinedFunction)
284                and not (isinstance(parent, exp.Table) and parent.db)
285                and not expression.meta.get("is_table")
286            ):
287                expression.set("this", expression.this.lower())
288
289        return expression

Transforms an identifier in a way that resembles how it'd be resolved by this dialect.

For example, an identifier like FoO would be resolved as foo in Postgres, because it lowercases all unquoted identifiers. On the other hand, Snowflake uppercases them, so it would resolve it as FOO. If it was quoted, it'd need to be treated as case-sensitive, and so any normalization would be prohibited in order to avoid "breaking" the identifier.

There are also dialects like Spark, which are case-insensitive even when quotes are present, and dialects like MySQL, whose resolution rules match those employed by the underlying operating system, for example they may always be case-sensitive in Linux.

Finally, the normalization behavior of some engines can even be controlled through flags, like in Redshift's case, where users can explicitly set enable_case_sensitive_identifier.

SQLGlot aims to understand and handle all of these different behaviors gracefully, so that it can analyze queries in the optimizer and successfully capture their semantics.

tokenizer_class = <class 'BigQuery.Tokenizer'>
parser_class = <class 'BigQuery.Parser'>
generator_class = <class 'BigQuery.Generator'>
TIME_TRIE: Dict = {'%': {'D': {0: True}}}
FORMAT_TRIE: Dict = {'D': {'D': {0: True}}, 'M': {'M': {0: True}, 'O': {'N': {0: True, 'T': {'H': {0: True}}}}, 'I': {0: True}}, 'Y': {'Y': {'Y': {'Y': {0: True}}, 0: True}}, 'H': {'H': {0: True, '1': {'2': {0: True}}, '2': {'4': {0: True}}}}, 'S': {'S': {0: True, 'S': {'S': {'S': {0: True}}}}}, 'T': {'Z': {'H': {0: True}}}}
INVERSE_TIME_MAPPING: Dict[str, str] = {'%m/%d/%y': '%D'}
INVERSE_TIME_TRIE: Dict = {'%': {'m': {'/': {'%': {'d': {'/': {'%': {'y': {0: True}}}}}}}}}
INVERSE_ESCAPE_SEQUENCES: Dict[str, str] = {'\x07': '\\a', '\x08': '\\b', '\x0c': '\\f', '\n': '\\n', '\r': '\\r', '\t': '\\t', '\x0b': '\\v'}
QUOTE_START = "'"
QUOTE_END = "'"
IDENTIFIER_START = '`'
IDENTIFIER_END = '`'
BIT_START: Optional[str] = None
BIT_END: Optional[str] = None
HEX_START: Optional[str] = '0x'
HEX_END: Optional[str] = ''
BYTE_START: Optional[str] = "b'"
BYTE_END: Optional[str] = "'"
UNICODE_START: Optional[str] = None
UNICODE_END: Optional[str] = None
class BigQuery.Tokenizer(sqlglot.tokens.Tokenizer):
291    class Tokenizer(tokens.Tokenizer):
292        QUOTES = ["'", '"', '"""', "'''"]
293        COMMENTS = ["--", "#", ("/*", "*/")]
294        IDENTIFIERS = ["`"]
295        STRING_ESCAPES = ["\\"]
296
297        HEX_STRINGS = [("0x", ""), ("0X", "")]
298
299        BYTE_STRINGS = [
300            (prefix + q, q) for q in t.cast(t.List[str], QUOTES) for prefix in ("b", "B")
301        ]
302
303        RAW_STRINGS = [
304            (prefix + q, q) for q in t.cast(t.List[str], QUOTES) for prefix in ("r", "R")
305        ]
306
307        KEYWORDS = {
308            **tokens.Tokenizer.KEYWORDS,
309            "ANY TYPE": TokenType.VARIANT,
310            "BEGIN": TokenType.COMMAND,
311            "BEGIN TRANSACTION": TokenType.BEGIN,
312            "BYTES": TokenType.BINARY,
313            "CURRENT_DATETIME": TokenType.CURRENT_DATETIME,
314            "DECLARE": TokenType.COMMAND,
315            "FLOAT64": TokenType.DOUBLE,
316            "FOR SYSTEM_TIME": TokenType.TIMESTAMP_SNAPSHOT,
317            "MODEL": TokenType.MODEL,
318            "NOT DETERMINISTIC": TokenType.VOLATILE,
319            "RECORD": TokenType.STRUCT,
320            "TIMESTAMP": TokenType.TIMESTAMPTZ,
321        }
322        KEYWORDS.pop("DIV")
QUOTES = ["'", '"', '"""', "'''"]
COMMENTS = ['--', '#', ('/*', '*/')]
IDENTIFIERS = ['`']
STRING_ESCAPES = ['\\']
HEX_STRINGS = [('0x', ''), ('0X', '')]
BYTE_STRINGS = [("b'", "'"), ("B'", "'"), ('b"', '"'), ('B"', '"'), ('b"""', '"""'), ('B"""', '"""'), ("b'''", "'''"), ("B'''", "'''")]
RAW_STRINGS = [("r'", "'"), ("R'", "'"), ('r"', '"'), ('R"', '"'), ('r"""', '"""'), ('R"""', '"""'), ("r'''", "'''"), ("R'''", "'''")]
KEYWORDS = {'{%': <TokenType.BLOCK_START: 'BLOCK_START'>, '{%+': <TokenType.BLOCK_START: 'BLOCK_START'>, '{%-': <TokenType.BLOCK_START: 'BLOCK_START'>, '%}': <TokenType.BLOCK_END: 'BLOCK_END'>, '+%}': <TokenType.BLOCK_END: 'BLOCK_END'>, '-%}': <TokenType.BLOCK_END: 'BLOCK_END'>, '{{+': <TokenType.BLOCK_START: 'BLOCK_START'>, '{{-': <TokenType.BLOCK_START: 'BLOCK_START'>, '+}}': <TokenType.BLOCK_END: 'BLOCK_END'>, '-}}': <TokenType.BLOCK_END: 'BLOCK_END'>, '/*+': <TokenType.HINT: 'HINT'>, '==': <TokenType.EQ: 'EQ'>, '::': <TokenType.DCOLON: 'DCOLON'>, '||': <TokenType.DPIPE: 'DPIPE'>, '>=': <TokenType.GTE: 'GTE'>, '<=': <TokenType.LTE: 'LTE'>, '<>': <TokenType.NEQ: 'NEQ'>, '!=': <TokenType.NEQ: 'NEQ'>, ':=': <TokenType.COLON_EQ: 'COLON_EQ'>, '<=>': <TokenType.NULLSAFE_EQ: 'NULLSAFE_EQ'>, '->': <TokenType.ARROW: 'ARROW'>, '->>': <TokenType.DARROW: 'DARROW'>, '=>': <TokenType.FARROW: 'FARROW'>, '#>': <TokenType.HASH_ARROW: 'HASH_ARROW'>, '#>>': <TokenType.DHASH_ARROW: 'DHASH_ARROW'>, '<->': <TokenType.LR_ARROW: 'LR_ARROW'>, '&&': <TokenType.DAMP: 'DAMP'>, '??': <TokenType.DQMARK: 'DQMARK'>, 'ALL': <TokenType.ALL: 'ALL'>, 'ALWAYS': <TokenType.ALWAYS: 'ALWAYS'>, 'AND': <TokenType.AND: 'AND'>, 'ANTI': <TokenType.ANTI: 'ANTI'>, 'ANY': <TokenType.ANY: 'ANY'>, 'ASC': <TokenType.ASC: 'ASC'>, 'AS': <TokenType.ALIAS: 'ALIAS'>, 'ASOF': <TokenType.ASOF: 'ASOF'>, 'AUTOINCREMENT': <TokenType.AUTO_INCREMENT: 'AUTO_INCREMENT'>, 'AUTO_INCREMENT': <TokenType.AUTO_INCREMENT: 'AUTO_INCREMENT'>, 'BEGIN': <TokenType.COMMAND: 'COMMAND'>, 'BETWEEN': <TokenType.BETWEEN: 'BETWEEN'>, 'CACHE': <TokenType.CACHE: 'CACHE'>, 'UNCACHE': <TokenType.UNCACHE: 'UNCACHE'>, 'CASE': <TokenType.CASE: 'CASE'>, 'CHARACTER SET': <TokenType.CHARACTER_SET: 'CHARACTER_SET'>, 'CLUSTER BY': <TokenType.CLUSTER_BY: 'CLUSTER_BY'>, 'COLLATE': <TokenType.COLLATE: 'COLLATE'>, 'COLUMN': <TokenType.COLUMN: 'COLUMN'>, 'COMMIT': <TokenType.COMMIT: 'COMMIT'>, 'CONNECT BY': <TokenType.CONNECT_BY: 'CONNECT_BY'>, 'CONSTRAINT': <TokenType.CONSTRAINT: 'CONSTRAINT'>, 'CREATE': <TokenType.CREATE: 'CREATE'>, 'CROSS': <TokenType.CROSS: 'CROSS'>, 'CUBE': <TokenType.CUBE: 'CUBE'>, 'CURRENT_DATE': <TokenType.CURRENT_DATE: 'CURRENT_DATE'>, 'CURRENT_TIME': <TokenType.CURRENT_TIME: 'CURRENT_TIME'>, 'CURRENT_TIMESTAMP': <TokenType.CURRENT_TIMESTAMP: 'CURRENT_TIMESTAMP'>, 'CURRENT_USER': <TokenType.CURRENT_USER: 'CURRENT_USER'>, 'DATABASE': <TokenType.DATABASE: 'DATABASE'>, 'DEFAULT': <TokenType.DEFAULT: 'DEFAULT'>, 'DELETE': <TokenType.DELETE: 'DELETE'>, 'DESC': <TokenType.DESC: 'DESC'>, 'DESCRIBE': <TokenType.DESCRIBE: 'DESCRIBE'>, 'DISTINCT': <TokenType.DISTINCT: 'DISTINCT'>, 'DISTRIBUTE BY': <TokenType.DISTRIBUTE_BY: 'DISTRIBUTE_BY'>, 'DROP': <TokenType.DROP: 'DROP'>, 'ELSE': <TokenType.ELSE: 'ELSE'>, 'END': <TokenType.END: 'END'>, 'ESCAPE': <TokenType.ESCAPE: 'ESCAPE'>, 'EXCEPT': <TokenType.EXCEPT: 'EXCEPT'>, 'EXECUTE': <TokenType.EXECUTE: 'EXECUTE'>, 'EXISTS': <TokenType.EXISTS: 'EXISTS'>, 'FALSE': <TokenType.FALSE: 'FALSE'>, 'FETCH': <TokenType.FETCH: 'FETCH'>, 'FILTER': <TokenType.FILTER: 'FILTER'>, 'FIRST': <TokenType.FIRST: 'FIRST'>, 'FULL': <TokenType.FULL: 'FULL'>, 'FUNCTION': <TokenType.FUNCTION: 'FUNCTION'>, 'FOR': <TokenType.FOR: 'FOR'>, 'FOREIGN KEY': <TokenType.FOREIGN_KEY: 'FOREIGN_KEY'>, 'FORMAT': <TokenType.FORMAT: 'FORMAT'>, 'FROM': <TokenType.FROM: 'FROM'>, 'GEOGRAPHY': <TokenType.GEOGRAPHY: 'GEOGRAPHY'>, 'GEOMETRY': <TokenType.GEOMETRY: 'GEOMETRY'>, 'GLOB': <TokenType.GLOB: 'GLOB'>, 'GROUP BY': <TokenType.GROUP_BY: 'GROUP_BY'>, 'GROUPING SETS': <TokenType.GROUPING_SETS: 'GROUPING_SETS'>, 'HAVING': <TokenType.HAVING: 'HAVING'>, 'ILIKE': <TokenType.ILIKE: 'ILIKE'>, 'IN': <TokenType.IN: 'IN'>, 'INDEX': <TokenType.INDEX: 'INDEX'>, 'INET': <TokenType.INET: 'INET'>, 'INNER': <TokenType.INNER: 'INNER'>, 'INSERT': <TokenType.INSERT: 'INSERT'>, 'INTERVAL': <TokenType.INTERVAL: 'INTERVAL'>, 'INTERSECT': <TokenType.INTERSECT: 'INTERSECT'>, 'INTO': <TokenType.INTO: 'INTO'>, 'IS': <TokenType.IS: 'IS'>, 'ISNULL': <TokenType.ISNULL: 'ISNULL'>, 'JOIN': <TokenType.JOIN: 'JOIN'>, 'KEEP': <TokenType.KEEP: 'KEEP'>, 'KILL': <TokenType.KILL: 'KILL'>, 'LATERAL': <TokenType.LATERAL: 'LATERAL'>, 'LEFT': <TokenType.LEFT: 'LEFT'>, 'LIKE': <TokenType.LIKE: 'LIKE'>, 'LIMIT': <TokenType.LIMIT: 'LIMIT'>, 'LOAD': <TokenType.LOAD: 'LOAD'>, 'LOCK': <TokenType.LOCK: 'LOCK'>, 'MERGE': <TokenType.MERGE: 'MERGE'>, 'NATURAL': <TokenType.NATURAL: 'NATURAL'>, 'NEXT': <TokenType.NEXT: 'NEXT'>, 'NOT': <TokenType.NOT: 'NOT'>, 'NOTNULL': <TokenType.NOTNULL: 'NOTNULL'>, 'NULL': <TokenType.NULL: 'NULL'>, 'OBJECT': <TokenType.OBJECT: 'OBJECT'>, 'OFFSET': <TokenType.OFFSET: 'OFFSET'>, 'ON': <TokenType.ON: 'ON'>, 'OR': <TokenType.OR: 'OR'>, 'XOR': <TokenType.XOR: 'XOR'>, 'ORDER BY': <TokenType.ORDER_BY: 'ORDER_BY'>, 'ORDINALITY': <TokenType.ORDINALITY: 'ORDINALITY'>, 'OUTER': <TokenType.OUTER: 'OUTER'>, 'OVER': <TokenType.OVER: 'OVER'>, 'OVERLAPS': <TokenType.OVERLAPS: 'OVERLAPS'>, 'OVERWRITE': <TokenType.OVERWRITE: 'OVERWRITE'>, 'PARTITION': <TokenType.PARTITION: 'PARTITION'>, 'PARTITION BY': <TokenType.PARTITION_BY: 'PARTITION_BY'>, 'PARTITIONED BY': <TokenType.PARTITION_BY: 'PARTITION_BY'>, 'PARTITIONED_BY': <TokenType.PARTITION_BY: 'PARTITION_BY'>, 'PERCENT': <TokenType.PERCENT: 'PERCENT'>, 'PIVOT': <TokenType.PIVOT: 'PIVOT'>, 'PRAGMA': <TokenType.PRAGMA: 'PRAGMA'>, 'PRIMARY KEY': <TokenType.PRIMARY_KEY: 'PRIMARY_KEY'>, 'PROCEDURE': <TokenType.PROCEDURE: 'PROCEDURE'>, 'QUALIFY': <TokenType.QUALIFY: 'QUALIFY'>, 'RANGE': <TokenType.RANGE: 'RANGE'>, 'RECURSIVE': <TokenType.RECURSIVE: 'RECURSIVE'>, 'REGEXP': <TokenType.RLIKE: 'RLIKE'>, 'REPLACE': <TokenType.REPLACE: 'REPLACE'>, 'RETURNING': <TokenType.RETURNING: 'RETURNING'>, 'REFERENCES': <TokenType.REFERENCES: 'REFERENCES'>, 'RIGHT': <TokenType.RIGHT: 'RIGHT'>, 'RLIKE': <TokenType.RLIKE: 'RLIKE'>, 'ROLLBACK': <TokenType.ROLLBACK: 'ROLLBACK'>, 'ROLLUP': <TokenType.ROLLUP: 'ROLLUP'>, 'ROW': <TokenType.ROW: 'ROW'>, 'ROWS': <TokenType.ROWS: 'ROWS'>, 'SCHEMA': <TokenType.SCHEMA: 'SCHEMA'>, 'SELECT': <TokenType.SELECT: 'SELECT'>, 'SEMI': <TokenType.SEMI: 'SEMI'>, 'SET': <TokenType.SET: 'SET'>, 'SETTINGS': <TokenType.SETTINGS: 'SETTINGS'>, 'SHOW': <TokenType.SHOW: 'SHOW'>, 'SIMILAR TO': <TokenType.SIMILAR_TO: 'SIMILAR_TO'>, 'SOME': <TokenType.SOME: 'SOME'>, 'SORT BY': <TokenType.SORT_BY: 'SORT_BY'>, 'START WITH': <TokenType.START_WITH: 'START_WITH'>, 'TABLE': <TokenType.TABLE: 'TABLE'>, 'TABLESAMPLE': <TokenType.TABLE_SAMPLE: 'TABLE_SAMPLE'>, 'TEMP': <TokenType.TEMPORARY: 'TEMPORARY'>, 'TEMPORARY': <TokenType.TEMPORARY: 'TEMPORARY'>, 'THEN': <TokenType.THEN: 'THEN'>, 'TRUE': <TokenType.TRUE: 'TRUE'>, 'UNION': <TokenType.UNION: 'UNION'>, 'UNKNOWN': <TokenType.UNKNOWN: 'UNKNOWN'>, 'UNNEST': <TokenType.UNNEST: 'UNNEST'>, 'UNPIVOT': <TokenType.UNPIVOT: 'UNPIVOT'>, 'UPDATE': <TokenType.UPDATE: 'UPDATE'>, 'USE': <TokenType.USE: 'USE'>, 'USING': <TokenType.USING: 'USING'>, 'UUID': <TokenType.UUID: 'UUID'>, 'VALUES': <TokenType.VALUES: 'VALUES'>, 'VIEW': <TokenType.VIEW: 'VIEW'>, 'VOLATILE': <TokenType.VOLATILE: 'VOLATILE'>, 'WHEN': <TokenType.WHEN: 'WHEN'>, 'WHERE': <TokenType.WHERE: 'WHERE'>, 'WINDOW': <TokenType.WINDOW: 'WINDOW'>, 'WITH': <TokenType.WITH: 'WITH'>, 'APPLY': <TokenType.APPLY: 'APPLY'>, 'ARRAY': <TokenType.ARRAY: 'ARRAY'>, 'BIT': <TokenType.BIT: 'BIT'>, 'BOOL': <TokenType.BOOLEAN: 'BOOLEAN'>, 'BOOLEAN': <TokenType.BOOLEAN: 'BOOLEAN'>, 'BYTE': <TokenType.TINYINT: 'TINYINT'>, 'MEDIUMINT': <TokenType.MEDIUMINT: 'MEDIUMINT'>, 'INT1': <TokenType.TINYINT: 'TINYINT'>, 'TINYINT': <TokenType.TINYINT: 'TINYINT'>, 'INT16': <TokenType.SMALLINT: 'SMALLINT'>, 'SHORT': <TokenType.SMALLINT: 'SMALLINT'>, 'SMALLINT': <TokenType.SMALLINT: 'SMALLINT'>, 'INT128': <TokenType.INT128: 'INT128'>, 'HUGEINT': <TokenType.INT128: 'INT128'>, 'INT2': <TokenType.SMALLINT: 'SMALLINT'>, 'INTEGER': <TokenType.INT: 'INT'>, 'INT': <TokenType.INT: 'INT'>, 'INT4': <TokenType.INT: 'INT'>, 'INT32': <TokenType.INT: 'INT'>, 'INT64': <TokenType.BIGINT: 'BIGINT'>, 'LONG': <TokenType.BIGINT: 'BIGINT'>, 'BIGINT': <TokenType.BIGINT: 'BIGINT'>, 'INT8': <TokenType.TINYINT: 'TINYINT'>, 'DEC': <TokenType.DECIMAL: 'DECIMAL'>, 'DECIMAL': <TokenType.DECIMAL: 'DECIMAL'>, 'BIGDECIMAL': <TokenType.BIGDECIMAL: 'BIGDECIMAL'>, 'BIGNUMERIC': <TokenType.BIGDECIMAL: 'BIGDECIMAL'>, 'MAP': <TokenType.MAP: 'MAP'>, 'NULLABLE': <TokenType.NULLABLE: 'NULLABLE'>, 'NUMBER': <TokenType.DECIMAL: 'DECIMAL'>, 'NUMERIC': <TokenType.DECIMAL: 'DECIMAL'>, 'FIXED': <TokenType.DECIMAL: 'DECIMAL'>, 'REAL': <TokenType.FLOAT: 'FLOAT'>, 'FLOAT': <TokenType.FLOAT: 'FLOAT'>, 'FLOAT4': <TokenType.FLOAT: 'FLOAT'>, 'FLOAT8': <TokenType.DOUBLE: 'DOUBLE'>, 'DOUBLE': <TokenType.DOUBLE: 'DOUBLE'>, 'DOUBLE PRECISION': <TokenType.DOUBLE: 'DOUBLE'>, 'JSON': <TokenType.JSON: 'JSON'>, 'CHAR': <TokenType.CHAR: 'CHAR'>, 'CHARACTER': <TokenType.CHAR: 'CHAR'>, 'NCHAR': <TokenType.NCHAR: 'NCHAR'>, 'VARCHAR': <TokenType.VARCHAR: 'VARCHAR'>, 'VARCHAR2': <TokenType.VARCHAR: 'VARCHAR'>, 'NVARCHAR': <TokenType.NVARCHAR: 'NVARCHAR'>, 'NVARCHAR2': <TokenType.NVARCHAR: 'NVARCHAR'>, 'STR': <TokenType.TEXT: 'TEXT'>, 'STRING': <TokenType.TEXT: 'TEXT'>, 'TEXT': <TokenType.TEXT: 'TEXT'>, 'LONGTEXT': <TokenType.LONGTEXT: 'LONGTEXT'>, 'MEDIUMTEXT': <TokenType.MEDIUMTEXT: 'MEDIUMTEXT'>, 'TINYTEXT': <TokenType.TINYTEXT: 'TINYTEXT'>, 'CLOB': <TokenType.TEXT: 'TEXT'>, 'LONGVARCHAR': <TokenType.TEXT: 'TEXT'>, 'BINARY': <TokenType.BINARY: 'BINARY'>, 'BLOB': <TokenType.VARBINARY: 'VARBINARY'>, 'LONGBLOB': <TokenType.LONGBLOB: 'LONGBLOB'>, 'MEDIUMBLOB': <TokenType.MEDIUMBLOB: 'MEDIUMBLOB'>, 'TINYBLOB': <TokenType.TINYBLOB: 'TINYBLOB'>, 'BYTEA': <TokenType.VARBINARY: 'VARBINARY'>, 'VARBINARY': <TokenType.VARBINARY: 'VARBINARY'>, 'TIME': <TokenType.TIME: 'TIME'>, 'TIMETZ': <TokenType.TIMETZ: 'TIMETZ'>, 'TIMESTAMP': <TokenType.TIMESTAMPTZ: 'TIMESTAMPTZ'>, 'TIMESTAMPTZ': <TokenType.TIMESTAMPTZ: 'TIMESTAMPTZ'>, 'TIMESTAMPLTZ': <TokenType.TIMESTAMPLTZ: 'TIMESTAMPLTZ'>, 'DATE': <TokenType.DATE: 'DATE'>, 'DATETIME': <TokenType.DATETIME: 'DATETIME'>, 'INT4RANGE': <TokenType.INT4RANGE: 'INT4RANGE'>, 'INT4MULTIRANGE': <TokenType.INT4MULTIRANGE: 'INT4MULTIRANGE'>, 'INT8RANGE': <TokenType.INT8RANGE: 'INT8RANGE'>, 'INT8MULTIRANGE': <TokenType.INT8MULTIRANGE: 'INT8MULTIRANGE'>, 'NUMRANGE': <TokenType.NUMRANGE: 'NUMRANGE'>, 'NUMMULTIRANGE': <TokenType.NUMMULTIRANGE: 'NUMMULTIRANGE'>, 'TSRANGE': <TokenType.TSRANGE: 'TSRANGE'>, 'TSMULTIRANGE': <TokenType.TSMULTIRANGE: 'TSMULTIRANGE'>, 'TSTZRANGE': <TokenType.TSTZRANGE: 'TSTZRANGE'>, 'TSTZMULTIRANGE': <TokenType.TSTZMULTIRANGE: 'TSTZMULTIRANGE'>, 'DATERANGE': <TokenType.DATERANGE: 'DATERANGE'>, 'DATEMULTIRANGE': <TokenType.DATEMULTIRANGE: 'DATEMULTIRANGE'>, 'UNIQUE': <TokenType.UNIQUE: 'UNIQUE'>, 'STRUCT': <TokenType.STRUCT: 'STRUCT'>, 'VARIANT': <TokenType.VARIANT: 'VARIANT'>, 'ALTER': <TokenType.ALTER: 'ALTER'>, 'ANALYZE': <TokenType.COMMAND: 'COMMAND'>, 'CALL': <TokenType.COMMAND: 'COMMAND'>, 'COMMENT': <TokenType.COMMENT: 'COMMENT'>, 'COPY': <TokenType.COMMAND: 'COMMAND'>, 'EXPLAIN': <TokenType.COMMAND: 'COMMAND'>, 'GRANT': <TokenType.COMMAND: 'COMMAND'>, 'OPTIMIZE': <TokenType.COMMAND: 'COMMAND'>, 'PREPARE': <TokenType.COMMAND: 'COMMAND'>, 'TRUNCATE': <TokenType.COMMAND: 'COMMAND'>, 'VACUUM': <TokenType.COMMAND: 'COMMAND'>, 'USER-DEFINED': <TokenType.USERDEFINED: 'USERDEFINED'>, 'FOR VERSION': <TokenType.VERSION_SNAPSHOT: 'VERSION_SNAPSHOT'>, 'FOR TIMESTAMP': <TokenType.TIMESTAMP_SNAPSHOT: 'TIMESTAMP_SNAPSHOT'>, 'ANY TYPE': <TokenType.VARIANT: 'VARIANT'>, 'BEGIN TRANSACTION': <TokenType.BEGIN: 'BEGIN'>, 'BYTES': <TokenType.BINARY: 'BINARY'>, 'CURRENT_DATETIME': <TokenType.CURRENT_DATETIME: 'CURRENT_DATETIME'>, 'DECLARE': <TokenType.COMMAND: 'COMMAND'>, 'FLOAT64': <TokenType.DOUBLE: 'DOUBLE'>, 'FOR SYSTEM_TIME': <TokenType.TIMESTAMP_SNAPSHOT: 'TIMESTAMP_SNAPSHOT'>, 'MODEL': <TokenType.MODEL: 'MODEL'>, 'NOT DETERMINISTIC': <TokenType.VOLATILE: 'VOLATILE'>, 'RECORD': <TokenType.STRUCT: 'STRUCT'>}
class BigQuery.Parser(sqlglot.parser.Parser):
324    class Parser(parser.Parser):
325        PREFIXED_PIVOT_COLUMNS = True
326
327        LOG_DEFAULTS_TO_LN = True
328
329        FUNCTIONS = {
330            **parser.Parser.FUNCTIONS,
331            "DATE": _parse_date,
332            "DATE_ADD": parse_date_delta_with_interval(exp.DateAdd),
333            "DATE_SUB": parse_date_delta_with_interval(exp.DateSub),
334            "DATE_TRUNC": lambda args: exp.DateTrunc(
335                unit=exp.Literal.string(str(seq_get(args, 1))),
336                this=seq_get(args, 0),
337            ),
338            "DATETIME_ADD": parse_date_delta_with_interval(exp.DatetimeAdd),
339            "DATETIME_SUB": parse_date_delta_with_interval(exp.DatetimeSub),
340            "DIV": binary_from_function(exp.IntDiv),
341            "FORMAT_DATE": lambda args: exp.TimeToStr(
342                this=exp.TsOrDsToDate(this=seq_get(args, 1)), format=seq_get(args, 0)
343            ),
344            "GENERATE_ARRAY": exp.GenerateSeries.from_arg_list,
345            "JSON_EXTRACT_SCALAR": lambda args: exp.JSONExtractScalar(
346                this=seq_get(args, 0), expression=seq_get(args, 1) or exp.Literal.string("$")
347            ),
348            "MD5": exp.MD5Digest.from_arg_list,
349            "TO_HEX": _parse_to_hex,
350            "PARSE_DATE": lambda args: format_time_lambda(exp.StrToDate, "bigquery")(
351                [seq_get(args, 1), seq_get(args, 0)]
352            ),
353            "PARSE_TIMESTAMP": _parse_timestamp,
354            "REGEXP_CONTAINS": exp.RegexpLike.from_arg_list,
355            "REGEXP_EXTRACT": lambda args: exp.RegexpExtract(
356                this=seq_get(args, 0),
357                expression=seq_get(args, 1),
358                position=seq_get(args, 2),
359                occurrence=seq_get(args, 3),
360                group=exp.Literal.number(1) if re.compile(args[1].name).groups == 1 else None,
361            ),
362            "SHA256": lambda args: exp.SHA2(this=seq_get(args, 0), length=exp.Literal.number(256)),
363            "SHA512": lambda args: exp.SHA2(this=seq_get(args, 0), length=exp.Literal.number(512)),
364            "SPLIT": lambda args: exp.Split(
365                # https://cloud.google.com/bigquery/docs/reference/standard-sql/string_functions#split
366                this=seq_get(args, 0),
367                expression=seq_get(args, 1) or exp.Literal.string(","),
368            ),
369            "TIME": _parse_time,
370            "TIME_ADD": parse_date_delta_with_interval(exp.TimeAdd),
371            "TIME_SUB": parse_date_delta_with_interval(exp.TimeSub),
372            "TIMESTAMP_ADD": parse_date_delta_with_interval(exp.TimestampAdd),
373            "TIMESTAMP_SUB": parse_date_delta_with_interval(exp.TimestampSub),
374            "TIMESTAMP_MICROS": lambda args: exp.UnixToTime(
375                this=seq_get(args, 0), scale=exp.UnixToTime.MICROS
376            ),
377            "TIMESTAMP_MILLIS": lambda args: exp.UnixToTime(
378                this=seq_get(args, 0), scale=exp.UnixToTime.MILLIS
379            ),
380            "TIMESTAMP_SECONDS": lambda args: exp.UnixToTime(this=seq_get(args, 0)),
381            "TO_JSON_STRING": exp.JSONFormat.from_arg_list,
382        }
383
384        FUNCTION_PARSERS = {
385            **parser.Parser.FUNCTION_PARSERS,
386            "ARRAY": lambda self: self.expression(exp.Array, expressions=[self._parse_statement()]),
387        }
388        FUNCTION_PARSERS.pop("TRIM")
389
390        NO_PAREN_FUNCTIONS = {
391            **parser.Parser.NO_PAREN_FUNCTIONS,
392            TokenType.CURRENT_DATETIME: exp.CurrentDatetime,
393        }
394
395        NESTED_TYPE_TOKENS = {
396            *parser.Parser.NESTED_TYPE_TOKENS,
397            TokenType.TABLE,
398        }
399
400        ID_VAR_TOKENS = {
401            *parser.Parser.ID_VAR_TOKENS,
402            TokenType.VALUES,
403        }
404
405        PROPERTY_PARSERS = {
406            **parser.Parser.PROPERTY_PARSERS,
407            "NOT DETERMINISTIC": lambda self: self.expression(
408                exp.StabilityProperty, this=exp.Literal.string("VOLATILE")
409            ),
410            "OPTIONS": lambda self: self._parse_with_property(),
411        }
412
413        CONSTRAINT_PARSERS = {
414            **parser.Parser.CONSTRAINT_PARSERS,
415            "OPTIONS": lambda self: exp.Properties(expressions=self._parse_with_property()),
416        }
417
418        RANGE_PARSERS = parser.Parser.RANGE_PARSERS.copy()
419        RANGE_PARSERS.pop(TokenType.OVERLAPS, None)
420
421        NULL_TOKENS = {TokenType.NULL, TokenType.UNKNOWN}
422
423        STATEMENT_PARSERS = {
424            **parser.Parser.STATEMENT_PARSERS,
425            TokenType.END: lambda self: self._parse_as_command(self._prev),
426            TokenType.FOR: lambda self: self._parse_for_in(),
427        }
428
429        BRACKET_OFFSETS = {
430            "OFFSET": (0, False),
431            "ORDINAL": (1, False),
432            "SAFE_OFFSET": (0, True),
433            "SAFE_ORDINAL": (1, True),
434        }
435
436        def _parse_for_in(self) -> exp.ForIn:
437            this = self._parse_range()
438            self._match_text_seq("DO")
439            return self.expression(exp.ForIn, this=this, expression=self._parse_statement())
440
441        def _parse_table_part(self, schema: bool = False) -> t.Optional[exp.Expression]:
442            this = super()._parse_table_part(schema=schema) or self._parse_number()
443
444            # https://cloud.google.com/bigquery/docs/reference/standard-sql/lexical#table_names
445            if isinstance(this, exp.Identifier):
446                table_name = this.name
447                while self._match(TokenType.DASH, advance=False) and self._next:
448                    self._advance(2)
449                    table_name += f"-{self._prev.text}"
450
451                this = exp.Identifier(this=table_name, quoted=this.args.get("quoted"))
452            elif isinstance(this, exp.Literal):
453                table_name = this.name
454
455                if self._is_connected() and self._parse_var(any_token=True):
456                    table_name += self._prev.text
457
458                this = exp.Identifier(this=table_name, quoted=True)
459
460            return this
461
462        def _parse_table_parts(self, schema: bool = False) -> exp.Table:
463            table = super()._parse_table_parts(schema=schema)
464            if isinstance(table.this, exp.Identifier) and "." in table.name:
465                catalog, db, this, *rest = (
466                    t.cast(t.Optional[exp.Expression], exp.to_identifier(x))
467                    for x in split_num_words(table.name, ".", 3)
468                )
469
470                if rest and this:
471                    this = exp.Dot.build(t.cast(t.List[exp.Expression], [this, *rest]))
472
473                table = exp.Table(this=this, db=db, catalog=catalog)
474
475            return table
476
477        @t.overload
478        def _parse_json_object(self, agg: Lit[False]) -> exp.JSONObject: ...
479
480        @t.overload
481        def _parse_json_object(self, agg: Lit[True]) -> exp.JSONObjectAgg: ...
482
483        def _parse_json_object(self, agg=False):
484            json_object = super()._parse_json_object()
485            array_kv_pair = seq_get(json_object.expressions, 0)
486
487            # Converts BQ's "signature 2" of JSON_OBJECT into SQLGlot's canonical representation
488            # https://cloud.google.com/bigquery/docs/reference/standard-sql/json_functions#json_object_signature2
489            if (
490                array_kv_pair
491                and isinstance(array_kv_pair.this, exp.Array)
492                and isinstance(array_kv_pair.expression, exp.Array)
493            ):
494                keys = array_kv_pair.this.expressions
495                values = array_kv_pair.expression.expressions
496
497                json_object.set(
498                    "expressions",
499                    [exp.JSONKeyValue(this=k, expression=v) for k, v in zip(keys, values)],
500                )
501
502            return json_object
503
504        def _parse_bracket(self, this: t.Optional[exp.Expression]) -> t.Optional[exp.Expression]:
505            bracket = super()._parse_bracket(this)
506
507            if this is bracket:
508                return bracket
509
510            if isinstance(bracket, exp.Bracket):
511                for expression in bracket.expressions:
512                    name = expression.name.upper()
513
514                    if name not in self.BRACKET_OFFSETS:
515                        break
516
517                    offset, safe = self.BRACKET_OFFSETS[name]
518                    bracket.set("offset", offset)
519                    bracket.set("safe", safe)
520                    expression.replace(expression.expressions[0])
521
522            return bracket

Parser consumes a list of tokens produced by the Tokenizer and produces a parsed syntax tree.

Arguments:
  • error_level: The desired error level. Default: ErrorLevel.IMMEDIATE
  • error_message_context: Determines the amount of context to capture from a query string when displaying the error message (in number of characters). Default: 100
  • max_errors: Maximum number of error messages to include in a raised ParseError. This is only relevant if error_level is ErrorLevel.RAISE. Default: 3
PREFIXED_PIVOT_COLUMNS = True
LOG_DEFAULTS_TO_LN = True
FUNCTIONS = {'ABS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Abs'>>, 'ANONYMOUS_AGG_FUNC': <bound method Func.from_arg_list of <class 'sqlglot.expressions.AnonymousAggFunc'>>, 'ANY_VALUE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.AnyValue'>>, 'APPROX_DISTINCT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ApproxDistinct'>>, 'APPROX_COUNT_DISTINCT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ApproxDistinct'>>, 'APPROX_QUANTILE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ApproxQuantile'>>, 'APPROX_TOP_K': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ApproxTopK'>>, 'ARG_MAX': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArgMax'>>, 'ARGMAX': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArgMax'>>, 'MAX_BY': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArgMax'>>, 'ARG_MIN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArgMin'>>, 'ARGMIN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArgMin'>>, 'MIN_BY': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArgMin'>>, 'ARRAY': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Array'>>, 'ARRAY_AGG': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayAgg'>>, 'ARRAY_ALL': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayAll'>>, 'ARRAY_ANY': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayAny'>>, 'ARRAY_CONCAT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayConcat'>>, 'ARRAY_CAT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayConcat'>>, 'ARRAY_CONTAINS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayContains'>>, 'FILTER': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayFilter'>>, 'ARRAY_FILTER': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayFilter'>>, 'ARRAY_JOIN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayJoin'>>, 'ARRAY_SIZE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArraySize'>>, 'ARRAY_SORT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArraySort'>>, 'ARRAY_SUM': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArraySum'>>, 'ARRAY_UNION_AGG': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayUnionAgg'>>, 'ARRAY_UNIQUE_AGG': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ArrayUniqueAgg'>>, 'AVG': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Avg'>>, 'CASE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Case'>>, 'CAST': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Cast'>>, 'CAST_TO_STR_TYPE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.CastToStrType'>>, 'CEIL': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Ceil'>>, 'CEILING': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Ceil'>>, 'CHR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Chr'>>, 'CHAR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Chr'>>, 'COALESCE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Coalesce'>>, 'IFNULL': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Coalesce'>>, 'NVL': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Coalesce'>>, 'COLLATE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Collate'>>, 'COMBINED_AGG_FUNC': <bound method Func.from_arg_list of <class 'sqlglot.expressions.CombinedAggFunc'>>, 'COMBINED_PARAMETERIZED_AGG': <bound method Func.from_arg_list of <class 'sqlglot.expressions.CombinedParameterizedAgg'>>, 'CONCAT': <function Parser.<lambda>>, 'CONCAT_WS': <function Parser.<lambda>>, 'COUNT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Count'>>, 'COUNT_IF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.CountIf'>>, 'COUNTIF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.CountIf'>>, 'CURRENT_DATE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.CurrentDate'>>, 'CURRENT_DATETIME': <bound method Func.from_arg_list of <class 'sqlglot.expressions.CurrentDatetime'>>, 'CURRENT_TIME': <bound method Func.from_arg_list of <class 'sqlglot.expressions.CurrentTime'>>, 'CURRENT_TIMESTAMP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.CurrentTimestamp'>>, 'CURRENT_USER': <bound method Func.from_arg_list of <class 'sqlglot.expressions.CurrentUser'>>, 'DATE': <function _parse_date>, 'DATE_ADD': <function parse_date_delta_with_interval.<locals>.func>, 'DATEDIFF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DateDiff'>>, 'DATE_DIFF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DateDiff'>>, 'DATE_FROM_PARTS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DateFromParts'>>, 'DATEFROMPARTS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DateFromParts'>>, 'DATE_STR_TO_DATE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DateStrToDate'>>, 'DATE_SUB': <function parse_date_delta_with_interval.<locals>.func>, 'DATE_TO_DATE_STR': <function Parser.<lambda>>, 'DATE_TO_DI': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DateToDi'>>, 'DATE_TRUNC': <function BigQuery.Parser.<lambda>>, 'DATETIME_ADD': <function parse_date_delta_with_interval.<locals>.func>, 'DATETIME_DIFF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DatetimeDiff'>>, 'DATETIME_SUB': <function parse_date_delta_with_interval.<locals>.func>, 'DATETIME_TRUNC': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DatetimeTrunc'>>, 'DAY': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Day'>>, 'DAY_OF_MONTH': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DayOfMonth'>>, 'DAYOFMONTH': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DayOfMonth'>>, 'DAY_OF_WEEK': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DayOfWeek'>>, 'DAYOFWEEK': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DayOfWeek'>>, 'DAY_OF_YEAR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DayOfYear'>>, 'DAYOFYEAR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DayOfYear'>>, 'DECODE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Decode'>>, 'DI_TO_DATE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.DiToDate'>>, 'ENCODE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Encode'>>, 'EXP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Exp'>>, 'EXPLODE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Explode'>>, 'EXPLODE_OUTER': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ExplodeOuter'>>, 'EXTRACT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Extract'>>, 'FIRST': <bound method Func.from_arg_list of <class 'sqlglot.expressions.First'>>, 'FLATTEN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Flatten'>>, 'FLOOR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Floor'>>, 'FROM_BASE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.FromBase'>>, 'FROM_BASE64': <bound method Func.from_arg_list of <class 'sqlglot.expressions.FromBase64'>>, 'GENERATE_SERIES': <bound method Func.from_arg_list of <class 'sqlglot.expressions.GenerateSeries'>>, 'GET_PATH': <bound method Func.from_arg_list of <class 'sqlglot.expressions.GetPath'>>, 'GREATEST': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Greatest'>>, 'GROUP_CONCAT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.GroupConcat'>>, 'HEX': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Hex'>>, 'HLL': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Hll'>>, 'IF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.If'>>, 'INITCAP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Initcap'>>, 'IS_INF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.IsInf'>>, 'ISINF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.IsInf'>>, 'IS_NAN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.IsNan'>>, 'ISNAN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.IsNan'>>, 'J_S_O_N_ARRAY': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONArray'>>, 'J_S_O_N_ARRAY_AGG': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONArrayAgg'>>, 'JSON_ARRAY_CONTAINS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONArrayContains'>>, 'JSONB_EXTRACT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONBExtract'>>, 'JSONB_EXTRACT_SCALAR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONBExtractScalar'>>, 'JSON_EXTRACT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONExtract'>>, 'JSON_EXTRACT_SCALAR': <function BigQuery.Parser.<lambda>>, 'JSON_FORMAT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONFormat'>>, 'J_S_O_N_OBJECT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONObject'>>, 'J_S_O_N_OBJECT_AGG': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONObjectAgg'>>, 'J_S_O_N_TABLE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONTable'>>, 'LAST': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Last'>>, 'LAST_DAY': <bound method Func.from_arg_list of <class 'sqlglot.expressions.LastDay'>>, 'LAST_DAY_OF_MONTH': <bound method Func.from_arg_list of <class 'sqlglot.expressions.LastDay'>>, 'LEAST': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Least'>>, 'LEFT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Left'>>, 'LENGTH': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Length'>>, 'LEN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Length'>>, 'LEVENSHTEIN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Levenshtein'>>, 'LN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Ln'>>, 'LOG': <function parse_logarithm>, 'LOG10': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Log10'>>, 'LOG2': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Log2'>>, 'LOGICAL_AND': <bound method Func.from_arg_list of <class 'sqlglot.expressions.LogicalAnd'>>, 'BOOL_AND': <bound method Func.from_arg_list of <class 'sqlglot.expressions.LogicalAnd'>>, 'BOOLAND_AGG': <bound method Func.from_arg_list of <class 'sqlglot.expressions.LogicalAnd'>>, 'LOGICAL_OR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.LogicalOr'>>, 'BOOL_OR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.LogicalOr'>>, 'BOOLOR_AGG': <bound method Func.from_arg_list of <class 'sqlglot.expressions.LogicalOr'>>, 'LOWER': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Lower'>>, 'LCASE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Lower'>>, 'MD5': <bound method Func.from_arg_list of <class 'sqlglot.expressions.MD5Digest'>>, 'MD5_DIGEST': <bound method Func.from_arg_list of <class 'sqlglot.expressions.MD5Digest'>>, 'MAP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Map'>>, 'MAP_FROM_ENTRIES': <bound method Func.from_arg_list of <class 'sqlglot.expressions.MapFromEntries'>>, 'MATCH_AGAINST': <bound method Func.from_arg_list of <class 'sqlglot.expressions.MatchAgainst'>>, 'MAX': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Max'>>, 'MIN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Min'>>, 'MONTH': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Month'>>, 'MONTHS_BETWEEN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.MonthsBetween'>>, 'NEXT_VALUE_FOR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.NextValueFor'>>, 'NULLIF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Nullif'>>, 'NUMBER_TO_STR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.NumberToStr'>>, 'NVL2': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Nvl2'>>, 'OPEN_J_S_O_N': <bound method Func.from_arg_list of <class 'sqlglot.expressions.OpenJSON'>>, 'PARAMETERIZED_AGG': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ParameterizedAgg'>>, 'PARSE_JSON': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ParseJSON'>>, 'JSON_PARSE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ParseJSON'>>, 'PERCENTILE_CONT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.PercentileCont'>>, 'PERCENTILE_DISC': <bound method Func.from_arg_list of <class 'sqlglot.expressions.PercentileDisc'>>, 'POSEXPLODE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Posexplode'>>, 'POSEXPLODE_OUTER': <bound method Func.from_arg_list of <class 'sqlglot.expressions.PosexplodeOuter'>>, 'POWER': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Pow'>>, 'POW': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Pow'>>, 'PREDICT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Predict'>>, 'QUANTILE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Quantile'>>, 'RAND': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Rand'>>, 'RANDOM': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Rand'>>, 'RANDN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Randn'>>, 'RANGE_N': <bound method Func.from_arg_list of <class 'sqlglot.expressions.RangeN'>>, 'READ_CSV': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ReadCSV'>>, 'REDUCE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Reduce'>>, 'REGEXP_EXTRACT': <function BigQuery.Parser.<lambda>>, 'REGEXP_I_LIKE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.RegexpILike'>>, 'REGEXP_LIKE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.RegexpLike'>>, 'REGEXP_REPLACE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.RegexpReplace'>>, 'REGEXP_SPLIT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.RegexpSplit'>>, 'REPEAT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Repeat'>>, 'RIGHT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Right'>>, 'ROUND': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Round'>>, 'ROW_NUMBER': <bound method Func.from_arg_list of <class 'sqlglot.expressions.RowNumber'>>, 'SHA': <bound method Func.from_arg_list of <class 'sqlglot.expressions.SHA'>>, 'SHA1': <bound method Func.from_arg_list of <class 'sqlglot.expressions.SHA'>>, 'SHA2': <bound method Func.from_arg_list of <class 'sqlglot.expressions.SHA2'>>, 'SAFE_DIVIDE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.SafeDivide'>>, 'SORT_ARRAY': <bound method Func.from_arg_list of <class 'sqlglot.expressions.SortArray'>>, 'SPLIT': <function BigQuery.Parser.<lambda>>, 'SQRT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Sqrt'>>, 'STANDARD_HASH': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StandardHash'>>, 'STAR_MAP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StarMap'>>, 'STARTS_WITH': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StartsWith'>>, 'STARTSWITH': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StartsWith'>>, 'STDDEV': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Stddev'>>, 'STDDEV_POP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StddevPop'>>, 'STDDEV_SAMP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StddevSamp'>>, 'STR_POSITION': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StrPosition'>>, 'STR_TO_DATE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StrToDate'>>, 'STR_TO_MAP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StrToMap'>>, 'STR_TO_TIME': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StrToTime'>>, 'STR_TO_UNIX': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StrToUnix'>>, 'STRUCT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Struct'>>, 'STRUCT_EXTRACT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.StructExtract'>>, 'STUFF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Stuff'>>, 'INSERT': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Stuff'>>, 'SUBSTRING': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Substring'>>, 'SUM': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Sum'>>, 'TIME_ADD': <function parse_date_delta_with_interval.<locals>.func>, 'TIME_DIFF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimeDiff'>>, 'TIME_FROM_PARTS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimeFromParts'>>, 'TIMEFROMPARTS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimeFromParts'>>, 'TIME_STR_TO_DATE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimeStrToDate'>>, 'TIME_STR_TO_TIME': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimeStrToTime'>>, 'TIME_STR_TO_UNIX': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimeStrToUnix'>>, 'TIME_SUB': <function parse_date_delta_with_interval.<locals>.func>, 'TIME_TO_STR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimeToStr'>>, 'TIME_TO_TIME_STR': <function Parser.<lambda>>, 'TIME_TO_UNIX': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimeToUnix'>>, 'TIME_TRUNC': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimeTrunc'>>, 'TIMESTAMP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Timestamp'>>, 'TIMESTAMP_ADD': <function parse_date_delta_with_interval.<locals>.func>, 'TIMESTAMP_DIFF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimestampDiff'>>, 'TIMESTAMP_FROM_PARTS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimestampFromParts'>>, 'TIMESTAMPFROMPARTS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimestampFromParts'>>, 'TIMESTAMP_SUB': <function parse_date_delta_with_interval.<locals>.func>, 'TIMESTAMP_TRUNC': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TimestampTrunc'>>, 'TO_ARRAY': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ToArray'>>, 'TO_BASE64': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ToBase64'>>, 'TO_CHAR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ToChar'>>, 'TO_DAYS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.ToDays'>>, 'TRANSFORM': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Transform'>>, 'TRIM': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Trim'>>, 'TRY_CAST': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TryCast'>>, 'TS_OR_DI_TO_DI': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TsOrDiToDi'>>, 'TS_OR_DS_ADD': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TsOrDsAdd'>>, 'TS_OR_DS_DIFF': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TsOrDsDiff'>>, 'TS_OR_DS_TO_DATE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TsOrDsToDate'>>, 'TS_OR_DS_TO_DATE_STR': <function Parser.<lambda>>, 'TS_OR_DS_TO_TIME': <bound method Func.from_arg_list of <class 'sqlglot.expressions.TsOrDsToTime'>>, 'UNHEX': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Unhex'>>, 'UNIX_DATE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.UnixDate'>>, 'UNIX_TO_STR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.UnixToStr'>>, 'UNIX_TO_TIME': <bound method Func.from_arg_list of <class 'sqlglot.expressions.UnixToTime'>>, 'UNIX_TO_TIME_STR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.UnixToTimeStr'>>, 'UPPER': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Upper'>>, 'UCASE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Upper'>>, 'VAR_MAP': <function parse_var_map>, 'VARIANCE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Variance'>>, 'VARIANCE_SAMP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Variance'>>, 'VAR_SAMP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Variance'>>, 'VARIANCE_POP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.VariancePop'>>, 'VAR_POP': <bound method Func.from_arg_list of <class 'sqlglot.expressions.VariancePop'>>, 'WEEK': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Week'>>, 'WEEK_OF_YEAR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.WeekOfYear'>>, 'WEEKOFYEAR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.WeekOfYear'>>, 'WHEN': <bound method Func.from_arg_list of <class 'sqlglot.expressions.When'>>, 'X_M_L_TABLE': <bound method Func.from_arg_list of <class 'sqlglot.expressions.XMLTable'>>, 'XOR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Xor'>>, 'YEAR': <bound method Func.from_arg_list of <class 'sqlglot.expressions.Year'>>, 'GLOB': <function Parser.<lambda>>, 'LIKE': <function parse_like>, 'DIV': <function binary_from_function.<locals>.<lambda>>, 'FORMAT_DATE': <function BigQuery.Parser.<lambda>>, 'GENERATE_ARRAY': <bound method Func.from_arg_list of <class 'sqlglot.expressions.GenerateSeries'>>, 'TO_HEX': <function _parse_to_hex>, 'PARSE_DATE': <function BigQuery.Parser.<lambda>>, 'PARSE_TIMESTAMP': <function _parse_timestamp>, 'REGEXP_CONTAINS': <bound method Func.from_arg_list of <class 'sqlglot.expressions.RegexpLike'>>, 'SHA256': <function BigQuery.Parser.<lambda>>, 'SHA512': <function BigQuery.Parser.<lambda>>, 'TIME': <function _parse_time>, 'TIMESTAMP_MICROS': <function BigQuery.Parser.<lambda>>, 'TIMESTAMP_MILLIS': <function BigQuery.Parser.<lambda>>, 'TIMESTAMP_SECONDS': <function BigQuery.Parser.<lambda>>, 'TO_JSON_STRING': <bound method Func.from_arg_list of <class 'sqlglot.expressions.JSONFormat'>>}
FUNCTION_PARSERS = {'ANY_VALUE': <function Parser.<lambda>>, 'CAST': <function Parser.<lambda>>, 'CONVERT': <function Parser.<lambda>>, 'DECODE': <function Parser.<lambda>>, 'EXTRACT': <function Parser.<lambda>>, 'JSON_OBJECT': <function Parser.<lambda>>, 'JSON_OBJECTAGG': <function Parser.<lambda>>, 'JSON_TABLE': <function Parser.<lambda>>, 'MATCH': <function Parser.<lambda>>, 'OPENJSON': <function Parser.<lambda>>, 'POSITION': <function Parser.<lambda>>, 'PREDICT': <function Parser.<lambda>>, 'SAFE_CAST': <function Parser.<lambda>>, 'STRING_AGG': <function Parser.<lambda>>, 'SUBSTRING': <function Parser.<lambda>>, 'TRY_CAST': <function Parser.<lambda>>, 'TRY_CONVERT': <function Parser.<lambda>>, 'ARRAY': <function BigQuery.Parser.<lambda>>}
NO_PAREN_FUNCTIONS = {<TokenType.CURRENT_DATE: 'CURRENT_DATE'>: <class 'sqlglot.expressions.CurrentDate'>, <TokenType.CURRENT_DATETIME: 'CURRENT_DATETIME'>: <class 'sqlglot.expressions.CurrentDatetime'>, <TokenType.CURRENT_TIME: 'CURRENT_TIME'>: <class 'sqlglot.expressions.CurrentTime'>, <TokenType.CURRENT_TIMESTAMP: 'CURRENT_TIMESTAMP'>: <class 'sqlglot.expressions.CurrentTimestamp'>, <TokenType.CURRENT_USER: 'CURRENT_USER'>: <class 'sqlglot.expressions.CurrentUser'>}
NESTED_TYPE_TOKENS = {<TokenType.MAP: 'MAP'>, <TokenType.ARRAY: 'ARRAY'>, <TokenType.STRUCT: 'STRUCT'>, <TokenType.NESTED: 'NESTED'>, <TokenType.TABLE: 'TABLE'>, <TokenType.NULLABLE: 'NULLABLE'>, <TokenType.LOWCARDINALITY: 'LOWCARDINALITY'>}
ID_VAR_TOKENS = {<TokenType.TOP: 'TOP'>, <TokenType.ANTI: 'ANTI'>, <TokenType.PIVOT: 'PIVOT'>, <TokenType.BINARY: 'BINARY'>, <TokenType.UTINYINT: 'UTINYINT'>, <TokenType.BEGIN: 'BEGIN'>, <TokenType.CURRENT_DATETIME: 'CURRENT_DATETIME'>, <TokenType.OBJECT: 'OBJECT'>, <TokenType.VAR: 'VAR'>, <TokenType.OVERWRITE: 'OVERWRITE'>, <TokenType.PARTITION: 'PARTITION'>, <TokenType.EXISTS: 'EXISTS'>, <TokenType.DIV: 'DIV'>, <TokenType.TSMULTIRANGE: 'TSMULTIRANGE'>, <TokenType.PSEUDO_TYPE: 'PSEUDO_TYPE'>, <TokenType.VARIANT: 'VARIANT'>, <TokenType.FALSE: 'FALSE'>, <TokenType.UMEDIUMINT: 'UMEDIUMINT'>, <TokenType.MERGE: 'MERGE'>, <TokenType.DATETIME64: 'DATETIME64'>, <TokenType.COMMENT: 'COMMENT'>, <TokenType.FLOAT: 'FLOAT'>, <TokenType.MEDIUMBLOB: 'MEDIUMBLOB'>, <TokenType.TIMETZ: 'TIMETZ'>, <TokenType.MODEL: 'MODEL'>, <TokenType.BIT: 'BIT'>, <TokenType.RIGHT: 'RIGHT'>, <TokenType.UUID: 'UUID'>, <TokenType.DATE32: 'DATE32'>, <TokenType.VALUES: 'VALUES'>, <TokenType.ESCAPE: 'ESCAPE'>, <TokenType.MEDIUMTEXT: 'MEDIUMTEXT'>, <TokenType.LOWCARDINALITY: 'LOWCARDINALITY'>, <TokenType.COLUMN: 'COLUMN'>, <TokenType.IPV4: 'IPV4'>, <TokenType.COMMIT: 'COMMIT'>, <TokenType.UINT: 'UINT'>, <TokenType.ALL: 'ALL'>, <TokenType.UDECIMAL: 'UDECIMAL'>, <TokenType.TSTZMULTIRANGE: 'TSTZMULTIRANGE'>, <TokenType.USMALLINT: 'USMALLINT'>, <TokenType.NULL: 'NULL'>, <TokenType.SEMI: 'SEMI'>, <TokenType.VARCHAR: 'VARCHAR'>, <TokenType.FIRST: 'FIRST'>, <TokenType.PRAGMA: 'PRAGMA'>, <TokenType.EXECUTE: 'EXECUTE'>, <TokenType.INTERVAL: 'INTERVAL'>, <TokenType.NEXT: 'NEXT'>, <TokenType.UINT128: 'UINT128'>, <TokenType.DATEMULTIRANGE: 'DATEMULTIRANGE'>, <TokenType.ROW: 'ROW'>, <TokenType.DEFAULT: 'DEFAULT'>, <TokenType.KEEP: 'KEEP'>, <TokenType.TIMESTAMP_S: 'TIMESTAMP_S'>, <TokenType.ENUM: 'ENUM'>, <TokenType.TIMESTAMP_NS: 'TIMESTAMP_NS'>, <TokenType.NCHAR: 'NCHAR'>, <TokenType.TABLE: 'TABLE'>, <TokenType.MEDIUMINT: 'MEDIUMINT'>, <TokenType.TIMESTAMPTZ: 'TIMESTAMPTZ'>, <TokenType.SUPER: 'SUPER'>, <TokenType.AGGREGATEFUNCTION: 'AGGREGATEFUNCTION'>, <TokenType.FOREIGN_KEY: 'FOREIGN_KEY'>, <TokenType.IPADDRESS: 'IPADDRESS'>, <TokenType.INT4MULTIRANGE: 'INT4MULTIRANGE'>, <TokenType.UBIGINT: 'UBIGINT'>, <TokenType.VIEW: 'VIEW'>, <TokenType.BIGINT: 'BIGINT'>, <TokenType.XML: 'XML'>, <TokenType.COLLATE: 'COLLATE'>, <TokenType.FORMAT: 'FORMAT'>, <TokenType.JSON: 'JSON'>, <TokenType.HSTORE: 'HSTORE'>, <TokenType.SOME: 'SOME'>, <TokenType.ISNULL: 'ISNULL'>, <TokenType.UNPIVOT: 'UNPIVOT'>, <TokenType.SIMPLEAGGREGATEFUNCTION: 'SIMPLEAGGREGATEFUNCTION'>, <TokenType.TSRANGE: 'TSRANGE'>, <TokenType.IMAGE: 'IMAGE'>, <TokenType.IPPREFIX: 'IPPREFIX'>, <TokenType.CASE: 'CASE'>, <TokenType.CONSTRAINT: 'CONSTRAINT'>, <TokenType.TSTZRANGE: 'TSTZRANGE'>, <TokenType.TRUE: 'TRUE'>, <TokenType.DATERANGE: 'DATERANGE'>, <TokenType.INT8RANGE: 'INT8RANGE'>, <TokenType.INT128: 'INT128'>, <TokenType.REFRESH: 'REFRESH'>, <TokenType.INT: 'INT'>, <TokenType.TEXT: 'TEXT'>, <TokenType.FIXEDSTRING: 'FIXEDSTRING'>, <TokenType.TIMESTAMP: 'TIMESTAMP'>, <TokenType.END: 'END'>, <TokenType.SMALLINT: 'SMALLINT'>, <TokenType.HLLSKETCH: 'HLLSKETCH'>, <TokenType.CURRENT_DATE: 'CURRENT_DATE'>, <TokenType.ENUM16: 'ENUM16'>, <TokenType.IPV6: 'IPV6'>, <TokenType.STRUCT: 'STRUCT'>, <TokenType.NULLABLE: 'NULLABLE'>, <TokenType.CURRENT_TIMESTAMP: 'CURRENT_TIMESTAMP'>, <TokenType.RANGE: 'RANGE'>, <TokenType.FUNCTION: 'FUNCTION'>, <TokenType.SCHEMA: 'SCHEMA'>, <TokenType.ASC: 'ASC'>, <TokenType.DESCRIBE: 'DESCRIBE'>, <TokenType.OFFSET: 'OFFSET'>, <TokenType.APPLY: 'APPLY'>, <TokenType.UPDATE: 'UPDATE'>, <TokenType.NATURAL: 'NATURAL'>, <TokenType.NUMMULTIRANGE: 'NUMMULTIRANGE'>, <TokenType.WINDOW: 'WINDOW'>, <TokenType.ROWS: 'ROWS'>, <TokenType.COMMAND: 'COMMAND'>, <TokenType.INT8MULTIRANGE: 'INT8MULTIRANGE'>, <TokenType.BIGDECIMAL: 'BIGDECIMAL'>, <TokenType.LOAD: 'LOAD'>, <TokenType.USE: 'USE'>, <TokenType.UNIQUEIDENTIFIER: 'UNIQUEIDENTIFIER'>, <TokenType.INT4RANGE: 'INT4RANGE'>, <TokenType.SMALLSERIAL: 'SMALLSERIAL'>, <TokenType.ROWVERSION: 'ROWVERSION'>, <TokenType.ARRAY: 'ARRAY'>, <TokenType.INDEX: 'INDEX'>, <TokenType.NUMRANGE: 'NUMRANGE'>, <TokenType.PROCEDURE: 'PROCEDURE'>, <TokenType.CACHE: 'CACHE'>, <TokenType.UNKNOWN: 'UNKNOWN'>, <TokenType.KILL: 'KILL'>, <TokenType.SET: 'SET'>, <TokenType.JSONB: 'JSONB'>, <TokenType.PERCENT: 'PERCENT'>, <TokenType.SETTINGS: 'SETTINGS'>, <TokenType.REFERENCES: 'REFERENCES'>, <TokenType.ENUM8: 'ENUM8'>, <TokenType.NESTED: 'NESTED'>, <TokenType.TIME: 'TIME'>, <TokenType.BOOLEAN: 'BOOLEAN'>, <TokenType.DATETIME: 'DATETIME'>, <TokenType.DELETE: 'DELETE'>, <TokenType.INET: 'INET'>, <TokenType.CURRENT_USER: 'CURRENT_USER'>, <TokenType.DESC: 'DESC'>, <TokenType.FULL: 'FULL'>, <TokenType.TIMESTAMP_MS: 'TIMESTAMP_MS'>, <TokenType.SMALLMONEY: 'SMALLMONEY'>, <TokenType.DATE: 'DATE'>, <TokenType.ORDINALITY: 'ORDINALITY'>, <TokenType.VARBINARY: 'VARBINARY'>, <TokenType.LEFT: 'LEFT'>, <TokenType.BIGSERIAL: 'BIGSERIAL'>, <TokenType.OPERATOR: 'OPERATOR'>, <TokenType.TIMESTAMPLTZ: 'TIMESTAMPLTZ'>, <TokenType.GEOMETRY: 'GEOMETRY'>, <TokenType.MAP: 'MAP'>, <TokenType.FINAL: 'FINAL'>, <TokenType.DECIMAL: 'DECIMAL'>, <TokenType.UINT256: 'UINT256'>, <TokenType.IS: 'IS'>, <TokenType.NVARCHAR: 'NVARCHAR'>, <TokenType.INT256: 'INT256'>, <TokenType.TINYBLOB: 'TINYBLOB'>, <TokenType.MONEY: 'MONEY'>, <TokenType.REPLACE: 'REPLACE'>, <TokenType.DATABASE: 'DATABASE'>, <TokenType.ANY: 'ANY'>, <TokenType.UNIQUE: 'UNIQUE'>, <TokenType.OBJECT_IDENTIFIER: 'OBJECT_IDENTIFIER'>, <TokenType.YEAR: 'YEAR'>, <TokenType.CHAR: 'CHAR'>, <TokenType.DICTIONARY: 'DICTIONARY'>, <TokenType.USERDEFINED: 'USERDEFINED'>, <TokenType.OVERLAPS: 'OVERLAPS'>, <TokenType.SERIAL: 'SERIAL'>, <TokenType.FILTER: 'FILTER'>, <TokenType.DOUBLE: 'DOUBLE'>, <TokenType.AUTO_INCREMENT: 'AUTO_INCREMENT'>, <TokenType.RECURSIVE: 'RECURSIVE'>, <TokenType.VOLATILE: 'VOLATILE'>, <TokenType.SHOW: 'SHOW'>, <TokenType.LONGTEXT: 'LONGTEXT'>, <TokenType.CURRENT_TIME: 'CURRENT_TIME'>, <TokenType.TINYINT: 'TINYINT'>, <TokenType.TEMPORARY: 'TEMPORARY'>, <TokenType.GEOGRAPHY: 'GEOGRAPHY'>, <TokenType.LONGBLOB: 'LONGBLOB'>, <TokenType.TINYTEXT: 'TINYTEXT'>}
PROPERTY_PARSERS = {'ALGORITHM': <function Parser.<lambda>>, 'AUTO': <function Parser.<lambda>>, 'AUTO_INCREMENT': <function Parser.<lambda>>, 'BLOCKCOMPRESSION': <function Parser.<lambda>>, 'CHARSET': <function Parser.<lambda>>, 'CHARACTER SET': <function Parser.<lambda>>, 'CHECKSUM': <function Parser.<lambda>>, 'CLUSTER BY': <function Parser.<lambda>>, 'CLUSTERED': <function Parser.<lambda>>, 'COLLATE': <function Parser.<lambda>>, 'COMMENT': <function Parser.<lambda>>, 'CONTAINS': <function Parser.<lambda>>, 'COPY': <function Parser.<lambda>>, 'DATABLOCKSIZE': <function Parser.<lambda>>, 'DEFINER': <function Parser.<lambda>>, 'DETERMINISTIC': <function Parser.<lambda>>, 'DISTKEY': <function Parser.<lambda>>, 'DISTSTYLE': <function Parser.<lambda>>, 'ENGINE': <function Parser.<lambda>>, 'EXECUTE': <function Parser.<lambda>>, 'EXTERNAL': <function Parser.<lambda>>, 'FALLBACK': <function Parser.<lambda>>, 'FORMAT': <function Parser.<lambda>>, 'FREESPACE': <function Parser.<lambda>>, 'HEAP': <function Parser.<lambda>>, 'IMMUTABLE': <function Parser.<lambda>>, 'INHERITS': <function Parser.<lambda>>, 'INPUT': <function Parser.<lambda>>, 'JOURNAL': <function Parser.<lambda>>, 'LANGUAGE': <function Parser.<lambda>>, 'LAYOUT': <function Parser.<lambda>>, 'LIFETIME': <function Parser.<lambda>>, 'LIKE': <function Parser.<lambda>>, 'LOCATION': <function Parser.<lambda>>, 'LOCK': <function Parser.<lambda>>, 'LOCKING': <function Parser.<lambda>>, 'LOG': <function Parser.<lambda>>, 'MATERIALIZED': <function Parser.<lambda>>, 'MERGEBLOCKRATIO': <function Parser.<lambda>>, 'MODIFIES': <function Parser.<lambda>>, 'MULTISET': <function Parser.<lambda>>, 'NO': <function Parser.<lambda>>, 'ON': <function Parser.<lambda>>, 'ORDER BY': <function Parser.<lambda>>, 'OUTPUT': <function Parser.<lambda>>, 'PARTITION': <function Parser.<lambda>>, 'PARTITION BY': <function Parser.<lambda>>, 'PARTITIONED BY': <function Parser.<lambda>>, 'PARTITIONED_BY': <function Parser.<lambda>>, 'PRIMARY KEY': <function Parser.<lambda>>, 'RANGE': <function Parser.<lambda>>, 'READS': <function Parser.<lambda>>, 'REMOTE': <function Parser.<lambda>>, 'RETURNS': <function Parser.<lambda>>, 'ROW': <function Parser.<lambda>>, 'ROW_FORMAT': <function Parser.<lambda>>, 'SAMPLE': <function Parser.<lambda>>, 'SET': <function Parser.<lambda>>, 'SETTINGS': <function Parser.<lambda>>, 'SORTKEY': <function Parser.<lambda>>, 'SOURCE': <function Parser.<lambda>>, 'STABLE': <function Parser.<lambda>>, 'STORED': <function Parser.<lambda>>, 'SYSTEM_VERSIONING': <function Parser.<lambda>>, 'TBLPROPERTIES': <function Parser.<lambda>>, 'TEMP': <function Parser.<lambda>>, 'TEMPORARY': <function Parser.<lambda>>, 'TO': <function Parser.<lambda>>, 'TRANSIENT': <function Parser.<lambda>>, 'TRANSFORM': <function Parser.<lambda>>, 'TTL': <function Parser.<lambda>>, 'USING': <function Parser.<lambda>>, 'VOLATILE': <function Parser.<lambda>>, 'WITH': <function Parser.<lambda>>, 'NOT DETERMINISTIC': <function BigQuery.Parser.<lambda>>, 'OPTIONS': <function BigQuery.Parser.<lambda>>}
CONSTRAINT_PARSERS = {'AUTOINCREMENT': <function Parser.<lambda>>, 'AUTO_INCREMENT': <function Parser.<lambda>>, 'CASESPECIFIC': <function Parser.<lambda>>, 'CHARACTER SET': <function Parser.<lambda>>, 'CHECK': <function Parser.<lambda>>, 'COLLATE': <function Parser.<lambda>>, 'COMMENT': <function Parser.<lambda>>, 'COMPRESS': <function Parser.<lambda>>, 'CLUSTERED': <function Parser.<lambda>>, 'NONCLUSTERED': <function Parser.<lambda>>, 'DEFAULT': <function Parser.<lambda>>, 'ENCODE': <function Parser.<lambda>>, 'FOREIGN KEY': <function Parser.<lambda>>, 'FORMAT': <function Parser.<lambda>>, 'GENERATED': <function Parser.<lambda>>, 'IDENTITY': <function Parser.<lambda>>, 'INLINE': <function Parser.<lambda>>, 'LIKE': <function Parser.<lambda>>, 'NOT': <function Parser.<lambda>>, 'NULL': <function Parser.<lambda>>, 'ON': <function Parser.<lambda>>, 'PATH': <function Parser.<lambda>>, 'PERIOD': <function Parser.<lambda>>, 'PRIMARY KEY': <function Parser.<lambda>>, 'REFERENCES': <function Parser.<lambda>>, 'TITLE': <function Parser.<lambda>>, 'TTL': <function Parser.<lambda>>, 'UNIQUE': <function Parser.<lambda>>, 'UPPERCASE': <function Parser.<lambda>>, 'WITH': <function Parser.<lambda>>, 'OPTIONS': <function BigQuery.Parser.<lambda>>}
RANGE_PARSERS = {<TokenType.BETWEEN: 'BETWEEN'>: <function Parser.<lambda>>, <TokenType.GLOB: 'GLOB'>: <function binary_range_parser.<locals>.<lambda>>, <TokenType.ILIKE: 'ILIKE'>: <function binary_range_parser.<locals>.<lambda>>, <TokenType.IN: 'IN'>: <function Parser.<lambda>>, <TokenType.IRLIKE: 'IRLIKE'>: <function binary_range_parser.<locals>.<lambda>>, <TokenType.IS: 'IS'>: <function Parser.<lambda>>, <TokenType.LIKE: 'LIKE'>: <function binary_range_parser.<locals>.<lambda>>, <TokenType.RLIKE: 'RLIKE'>: <function binary_range_parser.<locals>.<lambda>>, <TokenType.SIMILAR_TO: 'SIMILAR_TO'>: <function binary_range_parser.<locals>.<lambda>>, <TokenType.FOR: 'FOR'>: <function Parser.<lambda>>}
NULL_TOKENS = {<TokenType.NULL: 'NULL'>, <TokenType.UNKNOWN: 'UNKNOWN'>}
STATEMENT_PARSERS = {<TokenType.ALTER: 'ALTER'>: <function Parser.<lambda>>, <TokenType.BEGIN: 'BEGIN'>: <function Parser.<lambda>>, <TokenType.CACHE: 'CACHE'>: <function Parser.<lambda>>, <TokenType.COMMIT: 'COMMIT'>: <function Parser.<lambda>>, <TokenType.COMMENT: 'COMMENT'>: <function Parser.<lambda>>, <TokenType.CREATE: 'CREATE'>: <function Parser.<lambda>>, <TokenType.DELETE: 'DELETE'>: <function Parser.<lambda>>, <TokenType.DESC: 'DESC'>: <function Parser.<lambda>>, <TokenType.DESCRIBE: 'DESCRIBE'>: <function Parser.<lambda>>, <TokenType.DROP: 'DROP'>: <function Parser.<lambda>>, <TokenType.INSERT: 'INSERT'>: <function Parser.<lambda>>, <TokenType.KILL: 'KILL'>: <function Parser.<lambda>>, <TokenType.LOAD: 'LOAD'>: <function Parser.<lambda>>, <TokenType.MERGE: 'MERGE'>: <function Parser.<lambda>>, <TokenType.PIVOT: 'PIVOT'>: <function Parser.<lambda>>, <TokenType.PRAGMA: 'PRAGMA'>: <function Parser.<lambda>>, <TokenType.REFRESH: 'REFRESH'>: <function Parser.<lambda>>, <TokenType.ROLLBACK: 'ROLLBACK'>: <function Parser.<lambda>>, <TokenType.SET: 'SET'>: <function Parser.<lambda>>, <TokenType.UNCACHE: 'UNCACHE'>: <function Parser.<lambda>>, <TokenType.UPDATE: 'UPDATE'>: <function Parser.<lambda>>, <TokenType.USE: 'USE'>: <function Parser.<lambda>>, <TokenType.END: 'END'>: <function BigQuery.Parser.<lambda>>, <TokenType.FOR: 'FOR'>: <function BigQuery.Parser.<lambda>>}
BRACKET_OFFSETS = {'OFFSET': (0, False), 'ORDINAL': (1, False), 'SAFE_OFFSET': (0, True), 'SAFE_ORDINAL': (1, True)}
TABLE_ALIAS_TOKENS = {<TokenType.TOP: 'TOP'>, <TokenType.PIVOT: 'PIVOT'>, <TokenType.BINARY: 'BINARY'>, <TokenType.ANTI: 'ANTI'>, <TokenType.UTINYINT: 'UTINYINT'>, <TokenType.BEGIN: 'BEGIN'>, <TokenType.CURRENT_DATETIME: 'CURRENT_DATETIME'>, <TokenType.OBJECT: 'OBJECT'>, <TokenType.VAR: 'VAR'>, <TokenType.OVERWRITE: 'OVERWRITE'>, <TokenType.PARTITION: 'PARTITION'>, <TokenType.EXISTS: 'EXISTS'>, <TokenType.DIV: 'DIV'>, <TokenType.TSMULTIRANGE: 'TSMULTIRANGE'>, <TokenType.PSEUDO_TYPE: 'PSEUDO_TYPE'>, <TokenType.VARIANT: 'VARIANT'>, <TokenType.FALSE: 'FALSE'>, <TokenType.UMEDIUMINT: 'UMEDIUMINT'>, <TokenType.MERGE: 'MERGE'>, <TokenType.DATETIME64: 'DATETIME64'>, <TokenType.COMMENT: 'COMMENT'>, <TokenType.FLOAT: 'FLOAT'>, <TokenType.MEDIUMBLOB: 'MEDIUMBLOB'>, <TokenType.TIMETZ: 'TIMETZ'>, <TokenType.MODEL: 'MODEL'>, <TokenType.BIT: 'BIT'>, <TokenType.UUID: 'UUID'>, <TokenType.DATE32: 'DATE32'>, <TokenType.ESCAPE: 'ESCAPE'>, <TokenType.MEDIUMTEXT: 'MEDIUMTEXT'>, <TokenType.LOWCARDINALITY: 'LOWCARDINALITY'>, <TokenType.COLUMN: 'COLUMN'>, <TokenType.IPV4: 'IPV4'>, <TokenType.COMMIT: 'COMMIT'>, <TokenType.UINT: 'UINT'>, <TokenType.ALL: 'ALL'>, <TokenType.UDECIMAL: 'UDECIMAL'>, <TokenType.TSTZMULTIRANGE: 'TSTZMULTIRANGE'>, <TokenType.USMALLINT: 'USMALLINT'>, <TokenType.NULL: 'NULL'>, <TokenType.VARCHAR: 'VARCHAR'>, <TokenType.SEMI: 'SEMI'>, <TokenType.FIRST: 'FIRST'>, <TokenType.PRAGMA: 'PRAGMA'>, <TokenType.EXECUTE: 'EXECUTE'>, <TokenType.TINYTEXT: 'TINYTEXT'>, <TokenType.INTERVAL: 'INTERVAL'>, <TokenType.NEXT: 'NEXT'>, <TokenType.UINT128: 'UINT128'>, <TokenType.DATEMULTIRANGE: 'DATEMULTIRANGE'>, <TokenType.ROW: 'ROW'>, <TokenType.DEFAULT: 'DEFAULT'>, <TokenType.KEEP: 'KEEP'>, <TokenType.TIMESTAMP_S: 'TIMESTAMP_S'>, <TokenType.ENUM: 'ENUM'>, <TokenType.TIMESTAMP_NS: 'TIMESTAMP_NS'>, <TokenType.NCHAR: 'NCHAR'>, <TokenType.TABLE: 'TABLE'>, <TokenType.MEDIUMINT: 'MEDIUMINT'>, <TokenType.TIMESTAMPTZ: 'TIMESTAMPTZ'>, <TokenType.SUPER: 'SUPER'>, <TokenType.AGGREGATEFUNCTION: 'AGGREGATEFUNCTION'>, <TokenType.FOREIGN_KEY: 'FOREIGN_KEY'>, <TokenType.IPADDRESS: 'IPADDRESS'>, <TokenType.INT4MULTIRANGE: 'INT4MULTIRANGE'>, <TokenType.UBIGINT: 'UBIGINT'>, <TokenType.VIEW: 'VIEW'>, <TokenType.BIGINT: 'BIGINT'>, <TokenType.XML: 'XML'>, <TokenType.COLLATE: 'COLLATE'>, <TokenType.FORMAT: 'FORMAT'>, <TokenType.JSON: 'JSON'>, <TokenType.HSTORE: 'HSTORE'>, <TokenType.SOME: 'SOME'>, <TokenType.ISNULL: 'ISNULL'>, <TokenType.UNPIVOT: 'UNPIVOT'>, <TokenType.SIMPLEAGGREGATEFUNCTION: 'SIMPLEAGGREGATEFUNCTION'>, <TokenType.TSRANGE: 'TSRANGE'>, <TokenType.IMAGE: 'IMAGE'>, <TokenType.IPPREFIX: 'IPPREFIX'>, <TokenType.CASE: 'CASE'>, <TokenType.CONSTRAINT: 'CONSTRAINT'>, <TokenType.TSTZRANGE: 'TSTZRANGE'>, <TokenType.TRUE: 'TRUE'>, <TokenType.DATERANGE: 'DATERANGE'>, <TokenType.INT8RANGE: 'INT8RANGE'>, <TokenType.INT128: 'INT128'>, <TokenType.REFRESH: 'REFRESH'>, <TokenType.INT: 'INT'>, <TokenType.TEXT: 'TEXT'>, <TokenType.FIXEDSTRING: 'FIXEDSTRING'>, <TokenType.TIMESTAMP: 'TIMESTAMP'>, <TokenType.END: 'END'>, <TokenType.SMALLINT: 'SMALLINT'>, <TokenType.HLLSKETCH: 'HLLSKETCH'>, <TokenType.CURRENT_DATE: 'CURRENT_DATE'>, <TokenType.ENUM16: 'ENUM16'>, <TokenType.IPV6: 'IPV6'>, <TokenType.STRUCT: 'STRUCT'>, <TokenType.NULLABLE: 'NULLABLE'>, <TokenType.RANGE: 'RANGE'>, <TokenType.FUNCTION: 'FUNCTION'>, <TokenType.SCHEMA: 'SCHEMA'>, <TokenType.ASC: 'ASC'>, <TokenType.DESCRIBE: 'DESCRIBE'>, <TokenType.UPDATE: 'UPDATE'>, <TokenType.NUMMULTIRANGE: 'NUMMULTIRANGE'>, <TokenType.ROWS: 'ROWS'>, <TokenType.COMMAND: 'COMMAND'>, <TokenType.INT8MULTIRANGE: 'INT8MULTIRANGE'>, <TokenType.BIGDECIMAL: 'BIGDECIMAL'>, <TokenType.LOAD: 'LOAD'>, <TokenType.USE: 'USE'>, <TokenType.UNIQUEIDENTIFIER: 'UNIQUEIDENTIFIER'>, <TokenType.INT4RANGE: 'INT4RANGE'>, <TokenType.SMALLSERIAL: 'SMALLSERIAL'>, <TokenType.ROWVERSION: 'ROWVERSION'>, <TokenType.ARRAY: 'ARRAY'>, <TokenType.INDEX: 'INDEX'>, <TokenType.NUMRANGE: 'NUMRANGE'>, <TokenType.PROCEDURE: 'PROCEDURE'>, <TokenType.CACHE: 'CACHE'>, <TokenType.UNKNOWN: 'UNKNOWN'>, <TokenType.KILL: 'KILL'>, <TokenType.SET: 'SET'>, <TokenType.JSONB: 'JSONB'>, <TokenType.PERCENT: 'PERCENT'>, <TokenType.SETTINGS: 'SETTINGS'>, <TokenType.REFERENCES: 'REFERENCES'>, <TokenType.ENUM8: 'ENUM8'>, <TokenType.NESTED: 'NESTED'>, <TokenType.TIME: 'TIME'>, <TokenType.BOOLEAN: 'BOOLEAN'>, <TokenType.DATETIME: 'DATETIME'>, <TokenType.DELETE: 'DELETE'>, <TokenType.INET: 'INET'>, <TokenType.CURRENT_USER: 'CURRENT_USER'>, <TokenType.DESC: 'DESC'>, <TokenType.TIMESTAMP_MS: 'TIMESTAMP_MS'>, <TokenType.SMALLMONEY: 'SMALLMONEY'>, <TokenType.DATE: 'DATE'>, <TokenType.ORDINALITY: 'ORDINALITY'>, <TokenType.VARBINARY: 'VARBINARY'>, <TokenType.BIGSERIAL: 'BIGSERIAL'>, <TokenType.OPERATOR: 'OPERATOR'>, <TokenType.TIMESTAMPLTZ: 'TIMESTAMPLTZ'>, <TokenType.GEOMETRY: 'GEOMETRY'>, <TokenType.MAP: 'MAP'>, <TokenType.FINAL: 'FINAL'>, <TokenType.DECIMAL: 'DECIMAL'>, <TokenType.UINT256: 'UINT256'>, <TokenType.IS: 'IS'>, <TokenType.NVARCHAR: 'NVARCHAR'>, <TokenType.INT256: 'INT256'>, <TokenType.TINYBLOB: 'TINYBLOB'>, <TokenType.MONEY: 'MONEY'>, <TokenType.REPLACE: 'REPLACE'>, <TokenType.DATABASE: 'DATABASE'>, <TokenType.ANY: 'ANY'>, <TokenType.UNIQUE: 'UNIQUE'>, <TokenType.OBJECT_IDENTIFIER: 'OBJECT_IDENTIFIER'>, <TokenType.YEAR: 'YEAR'>, <TokenType.CHAR: 'CHAR'>, <TokenType.DICTIONARY: 'DICTIONARY'>, <TokenType.USERDEFINED: 'USERDEFINED'>, <TokenType.OVERLAPS: 'OVERLAPS'>, <TokenType.SERIAL: 'SERIAL'>, <TokenType.FILTER: 'FILTER'>, <TokenType.DOUBLE: 'DOUBLE'>, <TokenType.AUTO_INCREMENT: 'AUTO_INCREMENT'>, <TokenType.RECURSIVE: 'RECURSIVE'>, <TokenType.VOLATILE: 'VOLATILE'>, <TokenType.SHOW: 'SHOW'>, <TokenType.LONGTEXT: 'LONGTEXT'>, <TokenType.CURRENT_TIME: 'CURRENT_TIME'>, <TokenType.TINYINT: 'TINYINT'>, <TokenType.TEMPORARY: 'TEMPORARY'>, <TokenType.GEOGRAPHY: 'GEOGRAPHY'>, <TokenType.LONGBLOB: 'LONGBLOB'>, <TokenType.CURRENT_TIMESTAMP: 'CURRENT_TIMESTAMP'>}
SHOW_TRIE: Dict = {}
SET_TRIE: Dict = {'GLOBAL': {0: True}, 'LOCAL': {0: True}, 'SESSION': {0: True}, 'TRANSACTION': {0: True}}
class BigQuery.Generator(sqlglot.generator.Generator):
524    class Generator(generator.Generator):
525        EXPLICIT_UNION = True
526        INTERVAL_ALLOWS_PLURAL_FORM = False
527        JOIN_HINTS = False
528        QUERY_HINTS = False
529        TABLE_HINTS = False
530        LIMIT_FETCH = "LIMIT"
531        RENAME_TABLE_WITH_DB = False
532        NVL2_SUPPORTED = False
533        UNNEST_WITH_ORDINALITY = False
534        COLLATE_IS_FUNC = True
535        LIMIT_ONLY_LITERALS = True
536        SUPPORTS_TABLE_ALIAS_COLUMNS = False
537        UNPIVOT_ALIASES_ARE_IDENTIFIERS = False
538        JSON_KEY_VALUE_PAIR_SEP = ","
539        NULL_ORDERING_SUPPORTED = False
540
541        TRANSFORMS = {
542            **generator.Generator.TRANSFORMS,
543            exp.ApproxDistinct: rename_func("APPROX_COUNT_DISTINCT"),
544            exp.ArgMax: arg_max_or_min_no_count("MAX_BY"),
545            exp.ArgMin: arg_max_or_min_no_count("MIN_BY"),
546            exp.ArrayContains: _array_contains_sql,
547            exp.ArraySize: rename_func("ARRAY_LENGTH"),
548            exp.Cast: transforms.preprocess([transforms.remove_precision_parameterized_types]),
549            exp.CollateProperty: lambda self, e: (
550                f"DEFAULT COLLATE {self.sql(e, 'this')}"
551                if e.args.get("default")
552                else f"COLLATE {self.sql(e, 'this')}"
553            ),
554            exp.CountIf: rename_func("COUNTIF"),
555            exp.Create: _create_sql,
556            exp.CTE: transforms.preprocess([_pushdown_cte_column_names]),
557            exp.DateAdd: date_add_interval_sql("DATE", "ADD"),
558            exp.DateDiff: lambda self, e: f"DATE_DIFF({self.sql(e, 'this')}, {self.sql(e, 'expression')}, {self.sql(e.args.get('unit', 'DAY'))})",
559            exp.DateFromParts: rename_func("DATE"),
560            exp.DateStrToDate: datestrtodate_sql,
561            exp.DateSub: date_add_interval_sql("DATE", "SUB"),
562            exp.DatetimeAdd: date_add_interval_sql("DATETIME", "ADD"),
563            exp.DatetimeSub: date_add_interval_sql("DATETIME", "SUB"),
564            exp.DateTrunc: lambda self, e: self.func("DATE_TRUNC", e.this, e.text("unit")),
565            exp.FromTimeZone: lambda self, e: self.func(
566                "DATETIME", self.func("TIMESTAMP", e.this, e.args.get("zone")), "'UTC'"
567            ),
568            exp.GenerateSeries: rename_func("GENERATE_ARRAY"),
569            exp.GetPath: path_to_jsonpath(),
570            exp.GroupConcat: rename_func("STRING_AGG"),
571            exp.Hex: rename_func("TO_HEX"),
572            exp.If: if_sql(false_value="NULL"),
573            exp.ILike: no_ilike_sql,
574            exp.IntDiv: rename_func("DIV"),
575            exp.JSONFormat: rename_func("TO_JSON_STRING"),
576            exp.Max: max_or_greatest,
577            exp.MD5: lambda self, e: self.func("TO_HEX", self.func("MD5", e.this)),
578            exp.MD5Digest: rename_func("MD5"),
579            exp.Min: min_or_least,
580            exp.PartitionedByProperty: lambda self, e: f"PARTITION BY {self.sql(e, 'this')}",
581            exp.RegexpExtract: lambda self, e: self.func(
582                "REGEXP_EXTRACT",
583                e.this,
584                e.expression,
585                e.args.get("position"),
586                e.args.get("occurrence"),
587            ),
588            exp.RegexpReplace: regexp_replace_sql,
589            exp.RegexpLike: rename_func("REGEXP_CONTAINS"),
590            exp.ReturnsProperty: _returnsproperty_sql,
591            exp.Select: transforms.preprocess(
592                [
593                    transforms.explode_to_unnest(),
594                    _unqualify_unnest,
595                    transforms.eliminate_distinct_on,
596                    _alias_ordered_group,
597                    transforms.eliminate_semi_and_anti_joins,
598                ]
599            ),
600            exp.SHA2: lambda self, e: self.func(
601                f"SHA256" if e.text("length") == "256" else "SHA512", e.this
602            ),
603            exp.StabilityProperty: lambda self, e: (
604                f"DETERMINISTIC" if e.name == "IMMUTABLE" else "NOT DETERMINISTIC"
605            ),
606            exp.StrToDate: lambda self, e: f"PARSE_DATE({self.format_time(e)}, {self.sql(e, 'this')})",
607            exp.StrToTime: lambda self, e: self.func(
608                "PARSE_TIMESTAMP", self.format_time(e), e.this, e.args.get("zone")
609            ),
610            exp.TimeAdd: date_add_interval_sql("TIME", "ADD"),
611            exp.TimeFromParts: rename_func("TIME"),
612            exp.TimeSub: date_add_interval_sql("TIME", "SUB"),
613            exp.TimestampAdd: date_add_interval_sql("TIMESTAMP", "ADD"),
614            exp.TimestampSub: date_add_interval_sql("TIMESTAMP", "SUB"),
615            exp.TimeStrToTime: timestrtotime_sql,
616            exp.Trim: lambda self, e: self.func(f"TRIM", e.this, e.expression),
617            exp.TsOrDsAdd: _ts_or_ds_add_sql,
618            exp.TsOrDsDiff: _ts_or_ds_diff_sql,
619            exp.TsOrDsToTime: rename_func("TIME"),
620            exp.Unhex: rename_func("FROM_HEX"),
621            exp.UnixDate: rename_func("UNIX_DATE"),
622            exp.UnixToTime: _unix_to_time_sql,
623            exp.Values: _derived_table_values_to_unnest,
624            exp.VariancePop: rename_func("VAR_POP"),
625        }
626
627        TYPE_MAPPING = {
628            **generator.Generator.TYPE_MAPPING,
629            exp.DataType.Type.BIGDECIMAL: "BIGNUMERIC",
630            exp.DataType.Type.BIGINT: "INT64",
631            exp.DataType.Type.BINARY: "BYTES",
632            exp.DataType.Type.BOOLEAN: "BOOL",
633            exp.DataType.Type.CHAR: "STRING",
634            exp.DataType.Type.DECIMAL: "NUMERIC",
635            exp.DataType.Type.DOUBLE: "FLOAT64",
636            exp.DataType.Type.FLOAT: "FLOAT64",
637            exp.DataType.Type.INT: "INT64",
638            exp.DataType.Type.NCHAR: "STRING",
639            exp.DataType.Type.NVARCHAR: "STRING",
640            exp.DataType.Type.SMALLINT: "INT64",
641            exp.DataType.Type.TEXT: "STRING",
642            exp.DataType.Type.TIMESTAMP: "DATETIME",
643            exp.DataType.Type.TIMESTAMPTZ: "TIMESTAMP",
644            exp.DataType.Type.TIMESTAMPLTZ: "TIMESTAMP",
645            exp.DataType.Type.TINYINT: "INT64",
646            exp.DataType.Type.VARBINARY: "BYTES",
647            exp.DataType.Type.VARCHAR: "STRING",
648            exp.DataType.Type.VARIANT: "ANY TYPE",
649        }
650
651        PROPERTIES_LOCATION = {
652            **generator.Generator.PROPERTIES_LOCATION,
653            exp.PartitionedByProperty: exp.Properties.Location.POST_SCHEMA,
654            exp.VolatileProperty: exp.Properties.Location.UNSUPPORTED,
655        }
656
657        # from: https://cloud.google.com/bigquery/docs/reference/standard-sql/lexical#reserved_keywords
658        RESERVED_KEYWORDS = {
659            *generator.Generator.RESERVED_KEYWORDS,
660            "all",
661            "and",
662            "any",
663            "array",
664            "as",
665            "asc",
666            "assert_rows_modified",
667            "at",
668            "between",
669            "by",
670            "case",
671            "cast",
672            "collate",
673            "contains",
674            "create",
675            "cross",
676            "cube",
677            "current",
678            "default",
679            "define",
680            "desc",
681            "distinct",
682            "else",
683            "end",
684            "enum",
685            "escape",
686            "except",
687            "exclude",
688            "exists",
689            "extract",
690            "false",
691            "fetch",
692            "following",
693            "for",
694            "from",
695            "full",
696            "group",
697            "grouping",
698            "groups",
699            "hash",
700            "having",
701            "if",
702            "ignore",
703            "in",
704            "inner",
705            "intersect",
706            "interval",
707            "into",
708            "is",
709            "join",
710            "lateral",
711            "left",
712            "like",
713            "limit",
714            "lookup",
715            "merge",
716            "natural",
717            "new",
718            "no",
719            "not",
720            "null",
721            "nulls",
722            "of",
723            "on",
724            "or",
725            "order",
726            "outer",
727            "over",
728            "partition",
729            "preceding",
730            "proto",
731            "qualify",
732            "range",
733            "recursive",
734            "respect",
735            "right",
736            "rollup",
737            "rows",
738            "select",
739            "set",
740            "some",
741            "struct",
742            "tablesample",
743            "then",
744            "to",
745            "treat",
746            "true",
747            "unbounded",
748            "union",
749            "unnest",
750            "using",
751            "when",
752            "where",
753            "window",
754            "with",
755            "within",
756        }
757
758        def timetostr_sql(self, expression: exp.TimeToStr) -> str:
759            if isinstance(expression.this, exp.TsOrDsToDate):
760                this: exp.Expression = expression.this
761            else:
762                this = expression
763
764            return f"FORMAT_DATE({self.format_time(expression)}, {self.sql(this, 'this')})"
765
766        def struct_sql(self, expression: exp.Struct) -> str:
767            args = []
768            for expr in expression.expressions:
769                if isinstance(expr, self.KEY_VALUE_DEFINITIONS):
770                    arg = f"{self.sql(expr, 'expression')} AS {expr.this.name}"
771                else:
772                    arg = self.sql(expr)
773
774                args.append(arg)
775
776            return self.func("STRUCT", *args)
777
778        def eq_sql(self, expression: exp.EQ) -> str:
779            # Operands of = cannot be NULL in BigQuery
780            if isinstance(expression.left, exp.Null) or isinstance(expression.right, exp.Null):
781                if not isinstance(expression.parent, exp.Update):
782                    return "NULL"
783
784            return self.binary(expression, "=")
785
786        def attimezone_sql(self, expression: exp.AtTimeZone) -> str:
787            parent = expression.parent
788
789            # BigQuery allows CAST(.. AS {STRING|TIMESTAMP} [FORMAT <fmt> [AT TIME ZONE <tz>]]).
790            # Only the TIMESTAMP one should use the below conversion, when AT TIME ZONE is included.
791            if not isinstance(parent, exp.Cast) or not parent.to.is_type("text"):
792                return self.func(
793                    "TIMESTAMP", self.func("DATETIME", expression.this, expression.args.get("zone"))
794                )
795
796            return super().attimezone_sql(expression)
797
798        def trycast_sql(self, expression: exp.TryCast) -> str:
799            return self.cast_sql(expression, safe_prefix="SAFE_")
800
801        def cte_sql(self, expression: exp.CTE) -> str:
802            if expression.alias_column_names:
803                self.unsupported("Column names in CTE definition are not supported.")
804            return super().cte_sql(expression)
805
806        def array_sql(self, expression: exp.Array) -> str:
807            first_arg = seq_get(expression.expressions, 0)
808            if isinstance(first_arg, exp.Subqueryable):
809                return f"ARRAY{self.wrap(self.sql(first_arg))}"
810
811            return inline_array_sql(self, expression)
812
813        def bracket_sql(self, expression: exp.Bracket) -> str:
814            this = self.sql(expression, "this")
815            expressions = expression.expressions
816
817            if len(expressions) == 1:
818                arg = expressions[0]
819                if arg.type is None:
820                    from sqlglot.optimizer.annotate_types import annotate_types
821
822                    arg = annotate_types(arg)
823
824                if arg.type and arg.type.this in exp.DataType.TEXT_TYPES:
825                    # BQ doesn't support bracket syntax with string values
826                    return f"{this}.{arg.name}"
827
828            expressions_sql = ", ".join(self.sql(e) for e in expressions)
829            offset = expression.args.get("offset")
830
831            if offset == 0:
832                expressions_sql = f"OFFSET({expressions_sql})"
833            elif offset == 1:
834                expressions_sql = f"ORDINAL({expressions_sql})"
835            elif offset is not None:
836                self.unsupported(f"Unsupported array offset: {offset}")
837
838            if expression.args.get("safe"):
839                expressions_sql = f"SAFE_{expressions_sql}"
840
841            return f"{this}[{expressions_sql}]"
842
843        def transaction_sql(self, *_) -> str:
844            return "BEGIN TRANSACTION"
845
846        def commit_sql(self, *_) -> str:
847            return "COMMIT TRANSACTION"
848
849        def rollback_sql(self, *_) -> str:
850            return "ROLLBACK TRANSACTION"
851
852        def in_unnest_op(self, expression: exp.Unnest) -> str:
853            return self.sql(expression)
854
855        def except_op(self, expression: exp.Except) -> str:
856            if not expression.args.get("distinct", False):
857                self.unsupported("EXCEPT without DISTINCT is not supported in BigQuery")
858            return f"EXCEPT{' DISTINCT' if expression.args.get('distinct') else ' ALL'}"
859
860        def intersect_op(self, expression: exp.Intersect) -> str:
861            if not expression.args.get("distinct", False):
862                self.unsupported("INTERSECT without DISTINCT is not supported in BigQuery")
863            return f"INTERSECT{' DISTINCT' if expression.args.get('distinct') else ' ALL'}"
864
865        def with_properties(self, properties: exp.Properties) -> str:
866            return self.properties(properties, prefix=self.seg("OPTIONS"))
867
868        def version_sql(self, expression: exp.Version) -> str:
869            if expression.name == "TIMESTAMP":
870                expression.set("this", "SYSTEM_TIME")
871            return super().version_sql(expression)

Generator converts a given syntax tree to the corresponding SQL string.

Arguments:
  • pretty: Whether or not to format the produced SQL string. Default: False.
  • identify: Determines when an identifier should be quoted. Possible values are: False (default): Never quote, except in cases where it's mandatory by the dialect. True or 'always': Always quote. 'safe': Only quote identifiers that are case insensitive.
  • normalize: Whether or not to normalize identifiers to lowercase. Default: False.
  • pad: Determines the pad size in a formatted string. Default: 2.
  • indent: Determines the indentation size in a formatted string. Default: 2.
  • normalize_functions: Whether or not to normalize all function names. Possible values are: "upper" or True (default): Convert names to uppercase. "lower": Convert names to lowercase. False: Disables function name normalization.
  • unsupported_level: Determines the generator's behavior when it encounters unsupported expressions. Default ErrorLevel.WARN.
  • max_unsupported: Maximum number of unsupported messages to include in a raised UnsupportedError. This is only relevant if unsupported_level is ErrorLevel.RAISE. Default: 3
  • leading_comma: Determines whether or not the comma is leading or trailing in select expressions. This is only relevant when generating in pretty mode. Default: False
  • max_text_width: The max number of characters in a segment before creating new lines in pretty mode. The default is on the smaller end because the length only represents a segment and not the true line length. Default: 80
  • comments: Whether or not to preserve comments in the output SQL code. Default: True
EXPLICIT_UNION = True
INTERVAL_ALLOWS_PLURAL_FORM = False
JOIN_HINTS = False
QUERY_HINTS = False
TABLE_HINTS = False
LIMIT_FETCH = 'LIMIT'
RENAME_TABLE_WITH_DB = False
NVL2_SUPPORTED = False
UNNEST_WITH_ORDINALITY = False
COLLATE_IS_FUNC = True
LIMIT_ONLY_LITERALS = True
SUPPORTS_TABLE_ALIAS_COLUMNS = False
UNPIVOT_ALIASES_ARE_IDENTIFIERS = False
JSON_KEY_VALUE_PAIR_SEP = ','
NULL_ORDERING_SUPPORTED = False
TRANSFORMS = {<class 'sqlglot.expressions.DateAdd'>: <function date_add_interval_sql.<locals>.func>, <class 'sqlglot.expressions.CaseSpecificColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.CharacterSetColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.CharacterSetProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.CheckColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.ClusteredColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.CollateColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.AutoRefreshProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.CopyGrantsProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.CommentColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.DateFormatColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.DefaultColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.EncodeColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.ExecuteAsProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.ExternalProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.HeapProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.InheritsProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.InlineLengthColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.InputModelProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.IntervalSpan'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.LanguageProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.LocationProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.LogProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.MaterializedProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.NoPrimaryIndexProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.NonClusteredColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.NotForReplicationColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.OnCommitProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.OnProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.OnUpdateColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.OutputModelProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.PathColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.RemoteWithConnectionModelProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.ReturnsProperty'>: <function _returnsproperty_sql>, <class 'sqlglot.expressions.SampleProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.SetProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.SetConfigProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.SettingsProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.SqlReadWriteProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.SqlSecurityProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.StabilityProperty'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.TemporaryProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.ToTableProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.TransientProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.TransformModelProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.TitleColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.UppercaseColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.VarMap'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.VolatileProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.WithJournalTableProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.ApproxDistinct'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.ArgMax'>: <function arg_max_or_min_no_count.<locals>._arg_max_or_min_sql>, <class 'sqlglot.expressions.ArgMin'>: <function arg_max_or_min_no_count.<locals>._arg_max_or_min_sql>, <class 'sqlglot.expressions.ArrayContains'>: <function _array_contains_sql>, <class 'sqlglot.expressions.ArraySize'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.Cast'>: <function preprocess.<locals>._to_sql>, <class 'sqlglot.expressions.CollateProperty'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.CountIf'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.Create'>: <function _create_sql>, <class 'sqlglot.expressions.CTE'>: <function preprocess.<locals>._to_sql>, <class 'sqlglot.expressions.DateDiff'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.DateFromParts'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.DateStrToDate'>: <function datestrtodate_sql>, <class 'sqlglot.expressions.DateSub'>: <function date_add_interval_sql.<locals>.func>, <class 'sqlglot.expressions.DatetimeAdd'>: <function date_add_interval_sql.<locals>.func>, <class 'sqlglot.expressions.DatetimeSub'>: <function date_add_interval_sql.<locals>.func>, <class 'sqlglot.expressions.DateTrunc'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.FromTimeZone'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.GenerateSeries'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.GetPath'>: <function path_to_jsonpath.<locals>._transform>, <class 'sqlglot.expressions.GroupConcat'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.Hex'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.If'>: <function if_sql.<locals>._if_sql>, <class 'sqlglot.expressions.ILike'>: <function no_ilike_sql>, <class 'sqlglot.expressions.IntDiv'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.JSONFormat'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.Max'>: <function max_or_greatest>, <class 'sqlglot.expressions.MD5'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.MD5Digest'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.Min'>: <function min_or_least>, <class 'sqlglot.expressions.PartitionedByProperty'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.RegexpExtract'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.RegexpReplace'>: <function regexp_replace_sql>, <class 'sqlglot.expressions.RegexpLike'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.Select'>: <function preprocess.<locals>._to_sql>, <class 'sqlglot.expressions.SHA2'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.StrToDate'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.StrToTime'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.TimeAdd'>: <function date_add_interval_sql.<locals>.func>, <class 'sqlglot.expressions.TimeFromParts'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.TimeSub'>: <function date_add_interval_sql.<locals>.func>, <class 'sqlglot.expressions.TimestampAdd'>: <function date_add_interval_sql.<locals>.func>, <class 'sqlglot.expressions.TimestampSub'>: <function date_add_interval_sql.<locals>.func>, <class 'sqlglot.expressions.TimeStrToTime'>: <function timestrtotime_sql>, <class 'sqlglot.expressions.Trim'>: <function BigQuery.Generator.<lambda>>, <class 'sqlglot.expressions.TsOrDsAdd'>: <function _ts_or_ds_add_sql>, <class 'sqlglot.expressions.TsOrDsDiff'>: <function _ts_or_ds_diff_sql>, <class 'sqlglot.expressions.TsOrDsToTime'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.Unhex'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.UnixDate'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.UnixToTime'>: <function _unix_to_time_sql>, <class 'sqlglot.expressions.Values'>: <function _derived_table_values_to_unnest>, <class 'sqlglot.expressions.VariancePop'>: <function rename_func.<locals>.<lambda>>}
TYPE_MAPPING = {<Type.NCHAR: 'NCHAR'>: 'STRING', <Type.NVARCHAR: 'NVARCHAR'>: 'STRING', <Type.MEDIUMTEXT: 'MEDIUMTEXT'>: 'TEXT', <Type.LONGTEXT: 'LONGTEXT'>: 'TEXT', <Type.TINYTEXT: 'TINYTEXT'>: 'TEXT', <Type.MEDIUMBLOB: 'MEDIUMBLOB'>: 'BLOB', <Type.LONGBLOB: 'LONGBLOB'>: 'BLOB', <Type.TINYBLOB: 'TINYBLOB'>: 'BLOB', <Type.INET: 'INET'>: 'INET', <Type.BIGDECIMAL: 'BIGDECIMAL'>: 'BIGNUMERIC', <Type.BIGINT: 'BIGINT'>: 'INT64', <Type.BINARY: 'BINARY'>: 'BYTES', <Type.BOOLEAN: 'BOOLEAN'>: 'BOOL', <Type.CHAR: 'CHAR'>: 'STRING', <Type.DECIMAL: 'DECIMAL'>: 'NUMERIC', <Type.DOUBLE: 'DOUBLE'>: 'FLOAT64', <Type.FLOAT: 'FLOAT'>: 'FLOAT64', <Type.INT: 'INT'>: 'INT64', <Type.SMALLINT: 'SMALLINT'>: 'INT64', <Type.TEXT: 'TEXT'>: 'STRING', <Type.TIMESTAMP: 'TIMESTAMP'>: 'DATETIME', <Type.TIMESTAMPTZ: 'TIMESTAMPTZ'>: 'TIMESTAMP', <Type.TIMESTAMPLTZ: 'TIMESTAMPLTZ'>: 'TIMESTAMP', <Type.TINYINT: 'TINYINT'>: 'INT64', <Type.VARBINARY: 'VARBINARY'>: 'BYTES', <Type.VARCHAR: 'VARCHAR'>: 'STRING', <Type.VARIANT: 'VARIANT'>: 'ANY TYPE'}
PROPERTIES_LOCATION = {<class 'sqlglot.expressions.AlgorithmProperty'>: <Location.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.AutoIncrementProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.AutoRefreshProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.BlockCompressionProperty'>: <Location.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.CharacterSetProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.ChecksumProperty'>: <Location.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.CollateProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.CopyGrantsProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.Cluster'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.ClusteredByProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.DataBlocksizeProperty'>: <Location.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.DefinerProperty'>: <Location.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.DictRange'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.DictProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.DistKeyProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.DistStyleProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.EngineProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.ExecuteAsProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.ExternalProperty'>: <Location.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.FallbackProperty'>: <Location.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.FileFormatProperty'>: <Location.POST_WITH: 'POST_WITH'>, <class 'sqlglot.expressions.FreespaceProperty'>: <Location.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.HeapProperty'>: <Location.POST_WITH: 'POST_WITH'>, <class 'sqlglot.expressions.InheritsProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.InputModelProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.IsolatedLoadingProperty'>: <Location.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.JournalProperty'>: <Location.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.LanguageProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.LikeProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.LocationProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.LockingProperty'>: <Location.POST_ALIAS: 'POST_ALIAS'>, <class 'sqlglot.expressions.LogProperty'>: <Location.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.MaterializedProperty'>: <Location.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.MergeBlockRatioProperty'>: <Location.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.NoPrimaryIndexProperty'>: <Location.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.OnProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.OnCommitProperty'>: <Location.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.Order'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.OutputModelProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.PartitionedByProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.PartitionedOfProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.PrimaryKey'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.Property'>: <Location.POST_WITH: 'POST_WITH'>, <class 'sqlglot.expressions.RemoteWithConnectionModelProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.ReturnsProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.RowFormatProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.RowFormatDelimitedProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.RowFormatSerdeProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.SampleProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.SchemaCommentProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.SerdeProperties'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.Set'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.SettingsProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.SetProperty'>: <Location.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.SetConfigProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.SortKeyProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.SqlReadWriteProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.SqlSecurityProperty'>: <Location.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.StabilityProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.TemporaryProperty'>: <Location.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.ToTableProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.TransientProperty'>: <Location.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.TransformModelProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.MergeTreeTTL'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.VolatileProperty'>: <Location.UNSUPPORTED: 'UNSUPPORTED'>, <class 'sqlglot.expressions.WithDataProperty'>: <Location.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.WithJournalTableProperty'>: <Location.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.WithSystemVersioningProperty'>: <Location.POST_SCHEMA: 'POST_SCHEMA'>}
RESERVED_KEYWORDS = {'like', 'intersect', 'recursive', 'and', 'when', 'rows', 'by', 'all', 'fetch', 'case', 'left', 'end', 'limit', 'unnest', 'cast', 'any', 'asc', 'distinct', 'union', 'qualify', 'within', 'from', 'no', 'set', 'interval', 'inner', 'some', 'range', 'as', 'exists', 'contains', 'group', 'create', 'for', 'unbounded', 'rollup', 'except', 'join', 'window', 'merge', 'extract', 'assert_rows_modified', 'full', 'array', 'enum', 'else', 'hash', 'not', 'new', 'following', 'lookup', 'exclude', 'order', 'escape', 'groups', 'default', 'right', 'desc', 'true', 'where', 'null', 'on', 'proto', 'if', 'then', 'at', 'using', 'outer', 'or', 'in', 'grouping', 'cross', 'struct', 'collate', 'over', 'with', 'natural', 'nulls', 'tablesample', 'of', 'having', 'lateral', 'false', 'is', 'treat', 'respect', 'into', 'current', 'partition', 'define', 'to', 'select', 'between', 'preceding', 'cube', 'ignore'}
def timetostr_sql(self, expression: sqlglot.expressions.TimeToStr) -> str:
758        def timetostr_sql(self, expression: exp.TimeToStr) -> str:
759            if isinstance(expression.this, exp.TsOrDsToDate):
760                this: exp.Expression = expression.this
761            else:
762                this = expression
763
764            return f"FORMAT_DATE({self.format_time(expression)}, {self.sql(this, 'this')})"
def struct_sql(self, expression: sqlglot.expressions.Struct) -> str:
766        def struct_sql(self, expression: exp.Struct) -> str:
767            args = []
768            for expr in expression.expressions:
769                if isinstance(expr, self.KEY_VALUE_DEFINITIONS):
770                    arg = f"{self.sql(expr, 'expression')} AS {expr.this.name}"
771                else:
772                    arg = self.sql(expr)
773
774                args.append(arg)
775
776            return self.func("STRUCT", *args)
def eq_sql(self, expression: sqlglot.expressions.EQ) -> str:
778        def eq_sql(self, expression: exp.EQ) -> str:
779            # Operands of = cannot be NULL in BigQuery
780            if isinstance(expression.left, exp.Null) or isinstance(expression.right, exp.Null):
781                if not isinstance(expression.parent, exp.Update):
782                    return "NULL"
783
784            return self.binary(expression, "=")
def attimezone_sql(self, expression: sqlglot.expressions.AtTimeZone) -> str:
786        def attimezone_sql(self, expression: exp.AtTimeZone) -> str:
787            parent = expression.parent
788
789            # BigQuery allows CAST(.. AS {STRING|TIMESTAMP} [FORMAT <fmt> [AT TIME ZONE <tz>]]).
790            # Only the TIMESTAMP one should use the below conversion, when AT TIME ZONE is included.
791            if not isinstance(parent, exp.Cast) or not parent.to.is_type("text"):
792                return self.func(
793                    "TIMESTAMP", self.func("DATETIME", expression.this, expression.args.get("zone"))
794                )
795
796            return super().attimezone_sql(expression)
def trycast_sql(self, expression: sqlglot.expressions.TryCast) -> str:
798        def trycast_sql(self, expression: exp.TryCast) -> str:
799            return self.cast_sql(expression, safe_prefix="SAFE_")
def cte_sql(self, expression: sqlglot.expressions.CTE) -> str:
801        def cte_sql(self, expression: exp.CTE) -> str:
802            if expression.alias_column_names:
803                self.unsupported("Column names in CTE definition are not supported.")
804            return super().cte_sql(expression)
def array_sql(self, expression: sqlglot.expressions.Array) -> str:
806        def array_sql(self, expression: exp.Array) -> str:
807            first_arg = seq_get(expression.expressions, 0)
808            if isinstance(first_arg, exp.Subqueryable):
809                return f"ARRAY{self.wrap(self.sql(first_arg))}"
810
811            return inline_array_sql(self, expression)
def bracket_sql(self, expression: sqlglot.expressions.Bracket) -> str:
813        def bracket_sql(self, expression: exp.Bracket) -> str:
814            this = self.sql(expression, "this")
815            expressions = expression.expressions
816
817            if len(expressions) == 1:
818                arg = expressions[0]
819                if arg.type is None:
820                    from sqlglot.optimizer.annotate_types import annotate_types
821
822                    arg = annotate_types(arg)
823
824                if arg.type and arg.type.this in exp.DataType.TEXT_TYPES:
825                    # BQ doesn't support bracket syntax with string values
826                    return f"{this}.{arg.name}"
827
828            expressions_sql = ", ".join(self.sql(e) for e in expressions)
829            offset = expression.args.get("offset")
830
831            if offset == 0:
832                expressions_sql = f"OFFSET({expressions_sql})"
833            elif offset == 1:
834                expressions_sql = f"ORDINAL({expressions_sql})"
835            elif offset is not None:
836                self.unsupported(f"Unsupported array offset: {offset}")
837
838            if expression.args.get("safe"):
839                expressions_sql = f"SAFE_{expressions_sql}"
840
841            return f"{this}[{expressions_sql}]"
def transaction_sql(self, *_) -> str:
843        def transaction_sql(self, *_) -> str:
844            return "BEGIN TRANSACTION"
def commit_sql(self, *_) -> str:
846        def commit_sql(self, *_) -> str:
847            return "COMMIT TRANSACTION"
def rollback_sql(self, *_) -> str:
849        def rollback_sql(self, *_) -> str:
850            return "ROLLBACK TRANSACTION"
def in_unnest_op(self, expression: sqlglot.expressions.Unnest) -> str:
852        def in_unnest_op(self, expression: exp.Unnest) -> str:
853            return self.sql(expression)
def except_op(self, expression: sqlglot.expressions.Except) -> str:
855        def except_op(self, expression: exp.Except) -> str:
856            if not expression.args.get("distinct", False):
857                self.unsupported("EXCEPT without DISTINCT is not supported in BigQuery")
858            return f"EXCEPT{' DISTINCT' if expression.args.get('distinct') else ' ALL'}"
def intersect_op(self, expression: sqlglot.expressions.Intersect) -> str:
860        def intersect_op(self, expression: exp.Intersect) -> str:
861            if not expression.args.get("distinct", False):
862                self.unsupported("INTERSECT without DISTINCT is not supported in BigQuery")
863            return f"INTERSECT{' DISTINCT' if expression.args.get('distinct') else ' ALL'}"
def with_properties(self, properties: sqlglot.expressions.Properties) -> str:
865        def with_properties(self, properties: exp.Properties) -> str:
866            return self.properties(properties, prefix=self.seg("OPTIONS"))
def version_sql(self, expression: sqlglot.expressions.Version) -> str:
868        def version_sql(self, expression: exp.Version) -> str:
869            if expression.name == "TIMESTAMP":
870                expression.set("this", "SYSTEM_TIME")
871            return super().version_sql(expression)
Inherited Members
sqlglot.generator.Generator
Generator
LOCKING_READS_SUPPORTED
WRAP_DERIVED_VALUES
CREATE_FUNCTION_RETURN_AS
MATCHED_BY_SOURCE
SINGLE_STRING_INTERVAL
GROUPINGS_SEP
INDEX_ON
QUERY_HINT_SEP
IS_BOOL_ALLOWED
DUPLICATE_KEY_UPDATE_WITH_SET
LIMIT_IS_TOP
RETURNING_END
COLUMN_JOIN_MARKS_SUPPORTED
EXTRACT_ALLOWS_QUOTES
TZ_TO_WITH_TIME_ZONE
SELECT_KINDS
VALUES_AS_TABLE
ALTER_TABLE_INCLUDE_COLUMN_KEYWORD
AGGREGATE_FILTER_SUPPORTED
SEMI_ANTI_JOIN_WITH_SIDE
COMPUTED_COLUMN_WITH_TYPE
SUPPORTS_TABLE_COPY
TABLESAMPLE_REQUIRES_PARENS
TABLESAMPLE_SIZE_IS_ROWS
TABLESAMPLE_KEYWORDS
TABLESAMPLE_WITH_METHOD
TABLESAMPLE_SEED_KEYWORD
DATA_TYPE_SPECIFIERS_ALLOWED
ENSURE_BOOLS
CTE_RECURSIVE_KEYWORD_REQUIRED
SUPPORTS_SINGLE_ARG_CONCAT
LAST_DAY_SUPPORTS_DATE_PART
INSERT_OVERWRITE
SUPPORTS_SELECT_INTO
SUPPORTS_UNLOGGED_TABLES
STAR_MAPPING
TIME_PART_SINGULARS
TOKEN_MAPPING
STRUCT_DELIMITER
PARAMETER_TOKEN
WITH_SEPARATED_COMMENTS
EXCLUDE_COMMENTS
UNWRAPPED_INTERVAL_VALUES
EXPRESSIONS_WITHOUT_NESTED_CTES
KEY_VALUE_DEFINITIONS
SENTINEL_LINE_BREAK
pretty
identify
normalize
pad
unsupported_level
max_unsupported
leading_comma
max_text_width
comments
dialect
normalize_functions
unsupported_messages
generate
preprocess
unsupported
sep
seg
pad_comment
maybe_comment
wrap
no_identify
normalize_func
indent
sql
uncache_sql
cache_sql
characterset_sql
column_sql
columnposition_sql
columndef_sql
columnconstraint_sql
computedcolumnconstraint_sql
autoincrementcolumnconstraint_sql
compresscolumnconstraint_sql
generatedasidentitycolumnconstraint_sql
generatedasrowcolumnconstraint_sql
periodforsystemtimeconstraint_sql
notnullcolumnconstraint_sql
transformcolumnconstraint_sql
primarykeycolumnconstraint_sql
uniquecolumnconstraint_sql
createable_sql
create_sql
clone_sql
describe_sql
heredoc_sql
prepend_ctes
with_sql
tablealias_sql
bitstring_sql
hexstring_sql
bytestring_sql
unicodestring_sql
rawstring_sql
datatypeparam_sql
datatype_sql
directory_sql
delete_sql
drop_sql
except_sql
fetch_sql
filter_sql
hint_sql
index_sql
identifier_sql
inputoutputformat_sql
national_sql
partition_sql
properties_sql
root_properties
properties
locate_properties
property_name
property_sql
likeproperty_sql
fallbackproperty_sql
journalproperty_sql
freespaceproperty_sql
checksumproperty_sql
mergeblockratioproperty_sql
datablocksizeproperty_sql
blockcompressionproperty_sql
isolatedloadingproperty_sql
partitionboundspec_sql
partitionedofproperty_sql
lockingproperty_sql
withdataproperty_sql
withsystemversioningproperty_sql
insert_sql
intersect_sql
introducer_sql
kill_sql
pseudotype_sql
objectidentifier_sql
onconflict_sql
returning_sql
rowformatdelimitedproperty_sql
withtablehint_sql
indextablehint_sql
historicaldata_sql
table_sql
tablesample_sql
pivot_sql
tuple_sql
update_sql
values_sql
var_sql
into_sql
from_sql
group_sql
having_sql
connect_sql
prior_sql
join_sql
lambda_sql
lateral_op
lateral_sql
limit_sql
offset_sql
setitem_sql
set_sql
pragma_sql
lock_sql
literal_sql
escape_str
loaddata_sql
null_sql
boolean_sql
order_sql
withfill_sql
cluster_sql
distribute_sql
sort_sql
ordered_sql
matchrecognize_sql
query_modifiers
offset_limit_modifiers
after_having_modifiers
after_limit_modifiers
select_sql
schema_sql
schema_columns_sql
star_sql
parameter_sql
sessionparameter_sql
placeholder_sql
subquery_sql
qualify_sql
union_sql
union_op
unnest_sql
where_sql
window_sql
partition_by_sql
windowspec_sql
withingroup_sql
between_sql
all_sql
any_sql
exists_sql
case_sql
constraint_sql
nextvaluefor_sql
extract_sql
trim_sql
convert_concat_args
concat_sql
concatws_sql
check_sql
foreignkey_sql
primarykey_sql
if_sql
matchagainst_sql
jsonkeyvalue_sql
formatjson_sql
jsonobject_sql
jsonobjectagg_sql
jsonarray_sql
jsonarrayagg_sql
jsoncolumndef_sql
jsonschema_sql
jsontable_sql
openjsoncolumndef_sql
openjson_sql
in_sql
interval_sql
return_sql
reference_sql
anonymous_sql
paren_sql
neg_sql
not_sql
alias_sql
pivotalias_sql
aliases_sql
atindex_sql
fromtimezone_sql
add_sql
and_sql
xor_sql
connector_sql
bitwiseand_sql
bitwiseleftshift_sql
bitwisenot_sql
bitwiseor_sql
bitwiserightshift_sql
bitwisexor_sql
cast_sql
currentdate_sql
collate_sql
command_sql
comment_sql
mergetreettlaction_sql
mergetreettl_sql
altercolumn_sql
renametable_sql
renamecolumn_sql
altertable_sql
add_column_sql
droppartition_sql
addconstraint_sql
distinct_sql
ignorenulls_sql
respectnulls_sql
intdiv_sql
dpipe_sql
div_sql
overlaps_sql
distance_sql
dot_sql
propertyeq_sql
escape_sql
glob_sql
gt_sql
gte_sql
ilike_sql
ilikeany_sql
is_sql
like_sql
likeany_sql
similarto_sql
lt_sql
lte_sql
mod_sql
mul_sql
neq_sql
nullsafeeq_sql
nullsafeneq_sql
or_sql
slice_sql
sub_sql
log_sql
use_sql
binary
function_fallback_sql
func
format_args
text_width
format_time
expressions
op_expressions
naked_property
set_operation
tag_sql
token_sql
userdefinedfunction_sql
joinhint_sql
kwarg_sql
when_sql
merge_sql
tochar_sql
dictproperty_sql
dictrange_sql
dictsubproperty_sql
oncluster_sql
clusteredbyproperty_sql
anyvalue_sql
querytransform_sql
indexconstraintoption_sql
indexcolumnconstraint_sql
nvl2_sql
comprehension_sql
columnprefix_sql
opclass_sql
predict_sql
forin_sql
refresh_sql
operator_sql
toarray_sql
tsordstotime_sql
tsordstodate_sql
unixdate_sql
lastday_sql