sqlglot.dialects.tsql
1from __future__ import annotations 2 3import datetime 4import re 5import typing as t 6from functools import partial 7 8from sqlglot import exp, generator, parser, tokens, transforms 9from sqlglot.dialects.dialect import ( 10 Dialect, 11 NormalizationStrategy, 12 any_value_to_max_sql, 13 date_delta_sql, 14 datestrtodate_sql, 15 generatedasidentitycolumnconstraint_sql, 16 max_or_greatest, 17 min_or_least, 18 build_date_delta, 19 rename_func, 20 trim_sql, 21) 22from sqlglot.helper import seq_get 23from sqlglot.time import format_time 24from sqlglot.tokens import TokenType 25 26if t.TYPE_CHECKING: 27 from sqlglot._typing import E 28 29FULL_FORMAT_TIME_MAPPING = { 30 "weekday": "%A", 31 "dw": "%A", 32 "w": "%A", 33 "month": "%B", 34 "mm": "%B", 35 "m": "%B", 36} 37 38DATE_DELTA_INTERVAL = { 39 "year": "year", 40 "yyyy": "year", 41 "yy": "year", 42 "quarter": "quarter", 43 "qq": "quarter", 44 "q": "quarter", 45 "month": "month", 46 "mm": "month", 47 "m": "month", 48 "week": "week", 49 "ww": "week", 50 "wk": "week", 51 "day": "day", 52 "dd": "day", 53 "d": "day", 54} 55 56 57DATE_FMT_RE = re.compile("([dD]{1,2})|([mM]{1,2})|([yY]{1,4})|([hH]{1,2})|([sS]{1,2})") 58 59# N = Numeric, C=Currency 60TRANSPILE_SAFE_NUMBER_FMT = {"N", "C"} 61 62DEFAULT_START_DATE = datetime.date(1900, 1, 1) 63 64BIT_TYPES = {exp.EQ, exp.NEQ, exp.Is, exp.In, exp.Select, exp.Alias} 65 66# Unsupported options: 67# - OPTIMIZE FOR ( @variable_name { UNKNOWN | = <literal_constant> } [ , ...n ] ) 68# - TABLE HINT 69OPTIONS: parser.OPTIONS_TYPE = { 70 **dict.fromkeys( 71 ( 72 "DISABLE_OPTIMIZED_PLAN_FORCING", 73 "FAST", 74 "IGNORE_NONCLUSTERED_COLUMNSTORE_INDEX", 75 "LABEL", 76 "MAXDOP", 77 "MAXRECURSION", 78 "MAX_GRANT_PERCENT", 79 "MIN_GRANT_PERCENT", 80 "NO_PERFORMANCE_SPOOL", 81 "QUERYTRACEON", 82 "RECOMPILE", 83 ), 84 tuple(), 85 ), 86 "CONCAT": ("UNION",), 87 "DISABLE": ("EXTERNALPUSHDOWN", "SCALEOUTEXECUTION"), 88 "EXPAND": ("VIEWS",), 89 "FORCE": ("EXTERNALPUSHDOWN", "ORDER", "SCALEOUTEXECUTION"), 90 "HASH": ("GROUP", "JOIN", "UNION"), 91 "KEEP": ("PLAN",), 92 "KEEPFIXED": ("PLAN",), 93 "LOOP": ("JOIN",), 94 "MERGE": ("JOIN", "UNION"), 95 "OPTIMIZE": (("FOR", "UNKNOWN"),), 96 "ORDER": ("GROUP",), 97 "PARAMETERIZATION": ("FORCED", "SIMPLE"), 98 "ROBUST": ("PLAN",), 99 "USE": ("PLAN",), 100} 101 102OPTIONS_THAT_REQUIRE_EQUAL = ("MAX_GRANT_PERCENT", "MIN_GRANT_PERCENT", "LABEL") 103 104 105def _build_formatted_time( 106 exp_class: t.Type[E], full_format_mapping: t.Optional[bool] = None 107) -> t.Callable[[t.List], E]: 108 def _builder(args: t.List) -> E: 109 assert len(args) == 2 110 111 return exp_class( 112 this=exp.cast(args[1], exp.DataType.Type.DATETIME), 113 format=exp.Literal.string( 114 format_time( 115 args[0].name.lower(), 116 ( 117 {**TSQL.TIME_MAPPING, **FULL_FORMAT_TIME_MAPPING} 118 if full_format_mapping 119 else TSQL.TIME_MAPPING 120 ), 121 ) 122 ), 123 ) 124 125 return _builder 126 127 128def _build_format(args: t.List) -> exp.NumberToStr | exp.TimeToStr: 129 this = seq_get(args, 0) 130 fmt = seq_get(args, 1) 131 culture = seq_get(args, 2) 132 133 number_fmt = fmt and (fmt.name in TRANSPILE_SAFE_NUMBER_FMT or not DATE_FMT_RE.search(fmt.name)) 134 135 if number_fmt: 136 return exp.NumberToStr(this=this, format=fmt, culture=culture) 137 138 if fmt: 139 fmt = exp.Literal.string( 140 format_time(fmt.name, TSQL.FORMAT_TIME_MAPPING) 141 if len(fmt.name) == 1 142 else format_time(fmt.name, TSQL.TIME_MAPPING) 143 ) 144 145 return exp.TimeToStr(this=this, format=fmt, culture=culture) 146 147 148def _build_eomonth(args: t.List) -> exp.LastDay: 149 date = exp.TsOrDsToDate(this=seq_get(args, 0)) 150 month_lag = seq_get(args, 1) 151 152 if month_lag is None: 153 this: exp.Expression = date 154 else: 155 unit = DATE_DELTA_INTERVAL.get("month") 156 this = exp.DateAdd(this=date, expression=month_lag, unit=unit and exp.var(unit)) 157 158 return exp.LastDay(this=this) 159 160 161def _build_hashbytes(args: t.List) -> exp.Expression: 162 kind, data = args 163 kind = kind.name.upper() if kind.is_string else "" 164 165 if kind == "MD5": 166 args.pop(0) 167 return exp.MD5(this=data) 168 if kind in ("SHA", "SHA1"): 169 args.pop(0) 170 return exp.SHA(this=data) 171 if kind == "SHA2_256": 172 return exp.SHA2(this=data, length=exp.Literal.number(256)) 173 if kind == "SHA2_512": 174 return exp.SHA2(this=data, length=exp.Literal.number(512)) 175 176 return exp.func("HASHBYTES", *args) 177 178 179DATEPART_ONLY_FORMATS = {"DW", "HOUR", "QUARTER"} 180 181 182def _format_sql(self: TSQL.Generator, expression: exp.NumberToStr | exp.TimeToStr) -> str: 183 fmt = expression.args["format"] 184 185 if not isinstance(expression, exp.NumberToStr): 186 if fmt.is_string: 187 mapped_fmt = format_time(fmt.name, TSQL.INVERSE_TIME_MAPPING) 188 189 name = (mapped_fmt or "").upper() 190 if name in DATEPART_ONLY_FORMATS: 191 return self.func("DATEPART", name, expression.this) 192 193 fmt_sql = self.sql(exp.Literal.string(mapped_fmt)) 194 else: 195 fmt_sql = self.format_time(expression) or self.sql(fmt) 196 else: 197 fmt_sql = self.sql(fmt) 198 199 return self.func("FORMAT", expression.this, fmt_sql, expression.args.get("culture")) 200 201 202def _string_agg_sql(self: TSQL.Generator, expression: exp.GroupConcat) -> str: 203 this = expression.this 204 distinct = expression.find(exp.Distinct) 205 if distinct: 206 # exp.Distinct can appear below an exp.Order or an exp.GroupConcat expression 207 self.unsupported("T-SQL STRING_AGG doesn't support DISTINCT.") 208 this = distinct.pop().expressions[0] 209 210 order = "" 211 if isinstance(expression.this, exp.Order): 212 if expression.this.this: 213 this = expression.this.this.pop() 214 # Order has a leading space 215 order = f" WITHIN GROUP ({self.sql(expression.this)[1:]})" 216 217 separator = expression.args.get("separator") or exp.Literal.string(",") 218 return f"STRING_AGG({self.format_args(this, separator)}){order}" 219 220 221def _build_date_delta( 222 exp_class: t.Type[E], unit_mapping: t.Optional[t.Dict[str, str]] = None 223) -> t.Callable[[t.List], E]: 224 def _builder(args: t.List) -> E: 225 unit = seq_get(args, 0) 226 if unit and unit_mapping: 227 unit = exp.var(unit_mapping.get(unit.name.lower(), unit.name)) 228 229 start_date = seq_get(args, 1) 230 if start_date and start_date.is_number: 231 # Numeric types are valid DATETIME values 232 if start_date.is_int: 233 adds = DEFAULT_START_DATE + datetime.timedelta(days=int(start_date.this)) 234 start_date = exp.Literal.string(adds.strftime("%F")) 235 else: 236 # We currently don't handle float values, i.e. they're not converted to equivalent DATETIMEs. 237 # This is not a problem when generating T-SQL code, it is when transpiling to other dialects. 238 return exp_class(this=seq_get(args, 2), expression=start_date, unit=unit) 239 240 return exp_class( 241 this=exp.TimeStrToTime(this=seq_get(args, 2)), 242 expression=exp.TimeStrToTime(this=start_date), 243 unit=unit, 244 ) 245 246 return _builder 247 248 249def qualify_derived_table_outputs(expression: exp.Expression) -> exp.Expression: 250 """Ensures all (unnamed) output columns are aliased for CTEs and Subqueries.""" 251 alias = expression.args.get("alias") 252 253 if ( 254 isinstance(expression, (exp.CTE, exp.Subquery)) 255 and isinstance(alias, exp.TableAlias) 256 and not alias.columns 257 ): 258 from sqlglot.optimizer.qualify_columns import qualify_outputs 259 260 # We keep track of the unaliased column projection indexes instead of the expressions 261 # themselves, because the latter are going to be replaced by new nodes when the aliases 262 # are added and hence we won't be able to reach these newly added Alias parents 263 query = expression.this 264 unaliased_column_indexes = ( 265 i for i, c in enumerate(query.selects) if isinstance(c, exp.Column) and not c.alias 266 ) 267 268 qualify_outputs(query) 269 270 # Preserve the quoting information of columns for newly added Alias nodes 271 query_selects = query.selects 272 for select_index in unaliased_column_indexes: 273 alias = query_selects[select_index] 274 column = alias.this 275 if isinstance(column.this, exp.Identifier): 276 alias.args["alias"].set("quoted", column.this.quoted) 277 278 return expression 279 280 281# https://learn.microsoft.com/en-us/sql/t-sql/functions/datetimefromparts-transact-sql?view=sql-server-ver16#syntax 282def _build_datetimefromparts(args: t.List) -> exp.TimestampFromParts: 283 return exp.TimestampFromParts( 284 year=seq_get(args, 0), 285 month=seq_get(args, 1), 286 day=seq_get(args, 2), 287 hour=seq_get(args, 3), 288 min=seq_get(args, 4), 289 sec=seq_get(args, 5), 290 milli=seq_get(args, 6), 291 ) 292 293 294# https://learn.microsoft.com/en-us/sql/t-sql/functions/timefromparts-transact-sql?view=sql-server-ver16#syntax 295def _build_timefromparts(args: t.List) -> exp.TimeFromParts: 296 return exp.TimeFromParts( 297 hour=seq_get(args, 0), 298 min=seq_get(args, 1), 299 sec=seq_get(args, 2), 300 fractions=seq_get(args, 3), 301 precision=seq_get(args, 4), 302 ) 303 304 305def _build_with_arg_as_text( 306 klass: t.Type[exp.Expression], 307) -> t.Callable[[t.List[exp.Expression]], exp.Expression]: 308 def _parse(args: t.List[exp.Expression]) -> exp.Expression: 309 this = seq_get(args, 0) 310 311 if this and not this.is_string: 312 this = exp.cast(this, exp.DataType.Type.TEXT) 313 314 expression = seq_get(args, 1) 315 kwargs = {"this": this} 316 317 if expression: 318 kwargs["expression"] = expression 319 320 return klass(**kwargs) 321 322 return _parse 323 324 325def _json_extract_sql( 326 self: TSQL.Generator, expression: exp.JSONExtract | exp.JSONExtractScalar 327) -> str: 328 json_query = self.func("JSON_QUERY", expression.this, expression.expression) 329 json_value = self.func("JSON_VALUE", expression.this, expression.expression) 330 return self.func("ISNULL", json_query, json_value) 331 332 333class TSQL(Dialect): 334 NORMALIZATION_STRATEGY = NormalizationStrategy.CASE_INSENSITIVE 335 TIME_FORMAT = "'yyyy-mm-dd hh:mm:ss'" 336 SUPPORTS_SEMI_ANTI_JOIN = False 337 LOG_BASE_FIRST = False 338 TYPED_DIVISION = True 339 CONCAT_COALESCE = True 340 341 TIME_MAPPING = { 342 "year": "%Y", 343 "dayofyear": "%j", 344 "day": "%d", 345 "dy": "%d", 346 "y": "%Y", 347 "week": "%W", 348 "ww": "%W", 349 "wk": "%W", 350 "hour": "%h", 351 "hh": "%I", 352 "minute": "%M", 353 "mi": "%M", 354 "n": "%M", 355 "second": "%S", 356 "ss": "%S", 357 "s": "%-S", 358 "millisecond": "%f", 359 "ms": "%f", 360 "weekday": "%W", 361 "dw": "%W", 362 "month": "%m", 363 "mm": "%M", 364 "m": "%-M", 365 "Y": "%Y", 366 "YYYY": "%Y", 367 "YY": "%y", 368 "MMMM": "%B", 369 "MMM": "%b", 370 "MM": "%m", 371 "M": "%-m", 372 "dddd": "%A", 373 "dd": "%d", 374 "d": "%-d", 375 "HH": "%H", 376 "H": "%-H", 377 "h": "%-I", 378 "S": "%f", 379 "yyyy": "%Y", 380 "yy": "%y", 381 } 382 383 CONVERT_FORMAT_MAPPING = { 384 "0": "%b %d %Y %-I:%M%p", 385 "1": "%m/%d/%y", 386 "2": "%y.%m.%d", 387 "3": "%d/%m/%y", 388 "4": "%d.%m.%y", 389 "5": "%d-%m-%y", 390 "6": "%d %b %y", 391 "7": "%b %d, %y", 392 "8": "%H:%M:%S", 393 "9": "%b %d %Y %-I:%M:%S:%f%p", 394 "10": "mm-dd-yy", 395 "11": "yy/mm/dd", 396 "12": "yymmdd", 397 "13": "%d %b %Y %H:%M:ss:%f", 398 "14": "%H:%M:%S:%f", 399 "20": "%Y-%m-%d %H:%M:%S", 400 "21": "%Y-%m-%d %H:%M:%S.%f", 401 "22": "%m/%d/%y %-I:%M:%S %p", 402 "23": "%Y-%m-%d", 403 "24": "%H:%M:%S", 404 "25": "%Y-%m-%d %H:%M:%S.%f", 405 "100": "%b %d %Y %-I:%M%p", 406 "101": "%m/%d/%Y", 407 "102": "%Y.%m.%d", 408 "103": "%d/%m/%Y", 409 "104": "%d.%m.%Y", 410 "105": "%d-%m-%Y", 411 "106": "%d %b %Y", 412 "107": "%b %d, %Y", 413 "108": "%H:%M:%S", 414 "109": "%b %d %Y %-I:%M:%S:%f%p", 415 "110": "%m-%d-%Y", 416 "111": "%Y/%m/%d", 417 "112": "%Y%m%d", 418 "113": "%d %b %Y %H:%M:%S:%f", 419 "114": "%H:%M:%S:%f", 420 "120": "%Y-%m-%d %H:%M:%S", 421 "121": "%Y-%m-%d %H:%M:%S.%f", 422 } 423 424 FORMAT_TIME_MAPPING = { 425 "y": "%B %Y", 426 "d": "%m/%d/%Y", 427 "H": "%-H", 428 "h": "%-I", 429 "s": "%Y-%m-%d %H:%M:%S", 430 "D": "%A,%B,%Y", 431 "f": "%A,%B,%Y %-I:%M %p", 432 "F": "%A,%B,%Y %-I:%M:%S %p", 433 "g": "%m/%d/%Y %-I:%M %p", 434 "G": "%m/%d/%Y %-I:%M:%S %p", 435 "M": "%B %-d", 436 "m": "%B %-d", 437 "O": "%Y-%m-%dT%H:%M:%S", 438 "u": "%Y-%M-%D %H:%M:%S%z", 439 "U": "%A, %B %D, %Y %H:%M:%S%z", 440 "T": "%-I:%M:%S %p", 441 "t": "%-I:%M", 442 "Y": "%a %Y", 443 } 444 445 class Tokenizer(tokens.Tokenizer): 446 IDENTIFIERS = [("[", "]"), '"'] 447 QUOTES = ["'", '"'] 448 HEX_STRINGS = [("0x", ""), ("0X", "")] 449 VAR_SINGLE_TOKENS = {"@", "$", "#"} 450 451 KEYWORDS = { 452 **tokens.Tokenizer.KEYWORDS, 453 "CLUSTERED INDEX": TokenType.INDEX, 454 "DATETIME2": TokenType.DATETIME, 455 "DATETIMEOFFSET": TokenType.TIMESTAMPTZ, 456 "DECLARE": TokenType.DECLARE, 457 "EXEC": TokenType.COMMAND, 458 "FOR SYSTEM_TIME": TokenType.TIMESTAMP_SNAPSHOT, 459 "IMAGE": TokenType.IMAGE, 460 "MONEY": TokenType.MONEY, 461 "NONCLUSTERED INDEX": TokenType.INDEX, 462 "NTEXT": TokenType.TEXT, 463 "OPTION": TokenType.OPTION, 464 "OUTPUT": TokenType.RETURNING, 465 "PRINT": TokenType.COMMAND, 466 "PROC": TokenType.PROCEDURE, 467 "REAL": TokenType.FLOAT, 468 "ROWVERSION": TokenType.ROWVERSION, 469 "SMALLDATETIME": TokenType.DATETIME, 470 "SMALLMONEY": TokenType.SMALLMONEY, 471 "SQL_VARIANT": TokenType.VARIANT, 472 "SYSTEM_USER": TokenType.CURRENT_USER, 473 "TOP": TokenType.TOP, 474 "TIMESTAMP": TokenType.ROWVERSION, 475 "TINYINT": TokenType.UTINYINT, 476 "UNIQUEIDENTIFIER": TokenType.UNIQUEIDENTIFIER, 477 "UPDATE STATISTICS": TokenType.COMMAND, 478 "XML": TokenType.XML, 479 } 480 KEYWORDS.pop("/*+") 481 482 COMMANDS = {*tokens.Tokenizer.COMMANDS, TokenType.END} 483 484 class Parser(parser.Parser): 485 SET_REQUIRES_ASSIGNMENT_DELIMITER = False 486 LOG_DEFAULTS_TO_LN = True 487 ALTER_TABLE_ADD_REQUIRED_FOR_EACH_COLUMN = False 488 STRING_ALIASES = True 489 NO_PAREN_IF_COMMANDS = False 490 491 QUERY_MODIFIER_PARSERS = { 492 **parser.Parser.QUERY_MODIFIER_PARSERS, 493 TokenType.OPTION: lambda self: ("options", self._parse_options()), 494 } 495 496 FUNCTIONS = { 497 **parser.Parser.FUNCTIONS, 498 "CHARINDEX": lambda args: exp.StrPosition( 499 this=seq_get(args, 1), 500 substr=seq_get(args, 0), 501 position=seq_get(args, 2), 502 ), 503 "DATEADD": build_date_delta(exp.DateAdd, unit_mapping=DATE_DELTA_INTERVAL), 504 "DATEDIFF": _build_date_delta(exp.DateDiff, unit_mapping=DATE_DELTA_INTERVAL), 505 "DATENAME": _build_formatted_time(exp.TimeToStr, full_format_mapping=True), 506 "DATEPART": _build_formatted_time(exp.TimeToStr), 507 "DATETIMEFROMPARTS": _build_datetimefromparts, 508 "EOMONTH": _build_eomonth, 509 "FORMAT": _build_format, 510 "GETDATE": exp.CurrentTimestamp.from_arg_list, 511 "HASHBYTES": _build_hashbytes, 512 "ISNULL": exp.Coalesce.from_arg_list, 513 "JSON_QUERY": parser.build_extract_json_with_path(exp.JSONExtract), 514 "JSON_VALUE": parser.build_extract_json_with_path(exp.JSONExtractScalar), 515 "LEN": _build_with_arg_as_text(exp.Length), 516 "LEFT": _build_with_arg_as_text(exp.Left), 517 "RIGHT": _build_with_arg_as_text(exp.Right), 518 "REPLICATE": exp.Repeat.from_arg_list, 519 "SQUARE": lambda args: exp.Pow(this=seq_get(args, 0), expression=exp.Literal.number(2)), 520 "SYSDATETIME": exp.CurrentTimestamp.from_arg_list, 521 "SUSER_NAME": exp.CurrentUser.from_arg_list, 522 "SUSER_SNAME": exp.CurrentUser.from_arg_list, 523 "SYSTEM_USER": exp.CurrentUser.from_arg_list, 524 "TIMEFROMPARTS": _build_timefromparts, 525 } 526 527 JOIN_HINTS = {"LOOP", "HASH", "MERGE", "REMOTE"} 528 529 RETURNS_TABLE_TOKENS = parser.Parser.ID_VAR_TOKENS - { 530 TokenType.TABLE, 531 *parser.Parser.TYPE_TOKENS, 532 } 533 534 STATEMENT_PARSERS = { 535 **parser.Parser.STATEMENT_PARSERS, 536 TokenType.DECLARE: lambda self: self._parse_declare(), 537 } 538 539 RANGE_PARSERS = { 540 **parser.Parser.RANGE_PARSERS, 541 TokenType.DCOLON: lambda self, this: self.expression( 542 exp.ScopeResolution, 543 this=this, 544 expression=self._parse_function() or self._parse_var(any_token=True), 545 ), 546 } 547 548 # The DCOLON (::) operator serves as a scope resolution (exp.ScopeResolution) operator in T-SQL 549 COLUMN_OPERATORS = { 550 **parser.Parser.COLUMN_OPERATORS, 551 TokenType.DCOLON: lambda self, this, to: self.expression(exp.Cast, this=this, to=to) 552 if isinstance(to, exp.DataType) and to.this != exp.DataType.Type.USERDEFINED 553 else self.expression(exp.ScopeResolution, this=this, expression=to), 554 } 555 556 def _parse_dcolon(self) -> t.Optional[exp.Expression]: 557 # We want to use _parse_types() if the first token after :: is a known type, 558 # otherwise we could parse something like x::varchar(max) into a function 559 if self._match_set(self.TYPE_TOKENS, advance=False): 560 return self._parse_types() 561 562 return self._parse_function() or self._parse_types() 563 564 def _parse_options(self) -> t.Optional[t.List[exp.Expression]]: 565 if not self._match(TokenType.OPTION): 566 return None 567 568 def _parse_option() -> t.Optional[exp.Expression]: 569 option = self._parse_var_from_options(OPTIONS) 570 if not option: 571 return None 572 573 self._match(TokenType.EQ) 574 return self.expression( 575 exp.QueryOption, this=option, expression=self._parse_primary_or_var() 576 ) 577 578 return self._parse_wrapped_csv(_parse_option) 579 580 def _parse_projections(self) -> t.List[exp.Expression]: 581 """ 582 T-SQL supports the syntax alias = expression in the SELECT's projection list, 583 so we transform all parsed Selects to convert their EQ projections into Aliases. 584 585 See: https://learn.microsoft.com/en-us/sql/t-sql/queries/select-clause-transact-sql?view=sql-server-ver16#syntax 586 """ 587 return [ 588 ( 589 exp.alias_(projection.expression, projection.this.this, copy=False) 590 if isinstance(projection, exp.EQ) and isinstance(projection.this, exp.Column) 591 else projection 592 ) 593 for projection in super()._parse_projections() 594 ] 595 596 def _parse_commit_or_rollback(self) -> exp.Commit | exp.Rollback: 597 """Applies to SQL Server and Azure SQL Database 598 COMMIT [ { TRAN | TRANSACTION } 599 [ transaction_name | @tran_name_variable ] ] 600 [ WITH ( DELAYED_DURABILITY = { OFF | ON } ) ] 601 602 ROLLBACK { TRAN | TRANSACTION } 603 [ transaction_name | @tran_name_variable 604 | savepoint_name | @savepoint_variable ] 605 """ 606 rollback = self._prev.token_type == TokenType.ROLLBACK 607 608 self._match_texts(("TRAN", "TRANSACTION")) 609 this = self._parse_id_var() 610 611 if rollback: 612 return self.expression(exp.Rollback, this=this) 613 614 durability = None 615 if self._match_pair(TokenType.WITH, TokenType.L_PAREN): 616 self._match_text_seq("DELAYED_DURABILITY") 617 self._match(TokenType.EQ) 618 619 if self._match_text_seq("OFF"): 620 durability = False 621 else: 622 self._match(TokenType.ON) 623 durability = True 624 625 self._match_r_paren() 626 627 return self.expression(exp.Commit, this=this, durability=durability) 628 629 def _parse_transaction(self) -> exp.Transaction | exp.Command: 630 """Applies to SQL Server and Azure SQL Database 631 BEGIN { TRAN | TRANSACTION } 632 [ { transaction_name | @tran_name_variable } 633 [ WITH MARK [ 'description' ] ] 634 ] 635 """ 636 if self._match_texts(("TRAN", "TRANSACTION")): 637 transaction = self.expression(exp.Transaction, this=self._parse_id_var()) 638 if self._match_text_seq("WITH", "MARK"): 639 transaction.set("mark", self._parse_string()) 640 641 return transaction 642 643 return self._parse_as_command(self._prev) 644 645 def _parse_returns(self) -> exp.ReturnsProperty: 646 table = self._parse_id_var(any_token=False, tokens=self.RETURNS_TABLE_TOKENS) 647 returns = super()._parse_returns() 648 returns.set("table", table) 649 return returns 650 651 def _parse_convert( 652 self, strict: bool, safe: t.Optional[bool] = None 653 ) -> t.Optional[exp.Expression]: 654 this = self._parse_types() 655 self._match(TokenType.COMMA) 656 args = [this, *self._parse_csv(self._parse_assignment)] 657 convert = exp.Convert.from_arg_list(args) 658 convert.set("safe", safe) 659 convert.set("strict", strict) 660 return convert 661 662 def _parse_user_defined_function( 663 self, kind: t.Optional[TokenType] = None 664 ) -> t.Optional[exp.Expression]: 665 this = super()._parse_user_defined_function(kind=kind) 666 667 if ( 668 kind == TokenType.FUNCTION 669 or isinstance(this, exp.UserDefinedFunction) 670 or self._match(TokenType.ALIAS, advance=False) 671 ): 672 return this 673 674 expressions = self._parse_csv(self._parse_function_parameter) 675 return self.expression(exp.UserDefinedFunction, this=this, expressions=expressions) 676 677 def _parse_id_var( 678 self, 679 any_token: bool = True, 680 tokens: t.Optional[t.Collection[TokenType]] = None, 681 ) -> t.Optional[exp.Expression]: 682 is_temporary = self._match(TokenType.HASH) 683 is_global = is_temporary and self._match(TokenType.HASH) 684 685 this = super()._parse_id_var(any_token=any_token, tokens=tokens) 686 if this: 687 if is_global: 688 this.set("global", True) 689 elif is_temporary: 690 this.set("temporary", True) 691 692 return this 693 694 def _parse_create(self) -> exp.Create | exp.Command: 695 create = super()._parse_create() 696 697 if isinstance(create, exp.Create): 698 table = create.this.this if isinstance(create.this, exp.Schema) else create.this 699 if isinstance(table, exp.Table) and table.this.args.get("temporary"): 700 if not create.args.get("properties"): 701 create.set("properties", exp.Properties(expressions=[])) 702 703 create.args["properties"].append("expressions", exp.TemporaryProperty()) 704 705 return create 706 707 def _parse_if(self) -> t.Optional[exp.Expression]: 708 index = self._index 709 710 if self._match_text_seq("OBJECT_ID"): 711 self._parse_wrapped_csv(self._parse_string) 712 if self._match_text_seq("IS", "NOT", "NULL") and self._match(TokenType.DROP): 713 return self._parse_drop(exists=True) 714 self._retreat(index) 715 716 return super()._parse_if() 717 718 def _parse_unique(self) -> exp.UniqueColumnConstraint: 719 if self._match_texts(("CLUSTERED", "NONCLUSTERED")): 720 this = self.CONSTRAINT_PARSERS[self._prev.text.upper()](self) 721 else: 722 this = self._parse_schema(self._parse_id_var(any_token=False)) 723 724 return self.expression(exp.UniqueColumnConstraint, this=this) 725 726 def _parse_partition(self) -> t.Optional[exp.Partition]: 727 if not self._match_text_seq("WITH", "(", "PARTITIONS"): 728 return None 729 730 def parse_range(): 731 low = self._parse_bitwise() 732 high = self._parse_bitwise() if self._match_text_seq("TO") else None 733 734 return ( 735 self.expression(exp.PartitionRange, this=low, expression=high) if high else low 736 ) 737 738 partition = self.expression( 739 exp.Partition, expressions=self._parse_wrapped_csv(parse_range) 740 ) 741 742 self._match_r_paren() 743 744 return partition 745 746 def _parse_declare(self) -> exp.Declare | exp.Command: 747 index = self._index 748 expressions = self._try_parse(partial(self._parse_csv, self._parse_declareitem)) 749 750 if not expressions or self._curr: 751 self._retreat(index) 752 return self._parse_as_command(self._prev) 753 754 return self.expression(exp.Declare, expressions=expressions) 755 756 def _parse_declareitem(self) -> t.Optional[exp.DeclareItem]: 757 var = self._parse_id_var() 758 if not var: 759 return None 760 761 value = None 762 self._match(TokenType.ALIAS) 763 if self._match(TokenType.TABLE): 764 data_type = self._parse_schema() 765 else: 766 data_type = self._parse_types() 767 if self._match(TokenType.EQ): 768 value = self._parse_bitwise() 769 770 return self.expression(exp.DeclareItem, this=var, kind=data_type, default=value) 771 772 class Generator(generator.Generator): 773 LIMIT_IS_TOP = True 774 QUERY_HINTS = False 775 RETURNING_END = False 776 NVL2_SUPPORTED = False 777 ALTER_TABLE_INCLUDE_COLUMN_KEYWORD = False 778 LIMIT_FETCH = "FETCH" 779 COMPUTED_COLUMN_WITH_TYPE = False 780 CTE_RECURSIVE_KEYWORD_REQUIRED = False 781 ENSURE_BOOLS = True 782 NULL_ORDERING_SUPPORTED = None 783 SUPPORTS_SINGLE_ARG_CONCAT = False 784 TABLESAMPLE_SEED_KEYWORD = "REPEATABLE" 785 SUPPORTS_SELECT_INTO = True 786 JSON_PATH_BRACKETED_KEY_SUPPORTED = False 787 SUPPORTS_TO_NUMBER = False 788 SET_OP_MODIFIERS = False 789 COPY_PARAMS_EQ_REQUIRED = True 790 PARSE_JSON_NAME = None 791 792 EXPRESSIONS_WITHOUT_NESTED_CTES = { 793 exp.Delete, 794 exp.Insert, 795 exp.Intersect, 796 exp.Except, 797 exp.Merge, 798 exp.Select, 799 exp.Subquery, 800 exp.Union, 801 exp.Update, 802 } 803 804 SUPPORTED_JSON_PATH_PARTS = { 805 exp.JSONPathKey, 806 exp.JSONPathRoot, 807 exp.JSONPathSubscript, 808 } 809 810 TYPE_MAPPING = { 811 **generator.Generator.TYPE_MAPPING, 812 exp.DataType.Type.BOOLEAN: "BIT", 813 exp.DataType.Type.DECIMAL: "NUMERIC", 814 exp.DataType.Type.DATETIME: "DATETIME2", 815 exp.DataType.Type.DOUBLE: "FLOAT", 816 exp.DataType.Type.INT: "INTEGER", 817 exp.DataType.Type.ROWVERSION: "ROWVERSION", 818 exp.DataType.Type.TEXT: "VARCHAR(MAX)", 819 exp.DataType.Type.TIMESTAMP: "DATETIME2", 820 exp.DataType.Type.TIMESTAMPTZ: "DATETIMEOFFSET", 821 exp.DataType.Type.UTINYINT: "TINYINT", 822 exp.DataType.Type.VARIANT: "SQL_VARIANT", 823 } 824 825 TYPE_MAPPING.pop(exp.DataType.Type.NCHAR) 826 TYPE_MAPPING.pop(exp.DataType.Type.NVARCHAR) 827 828 TRANSFORMS = { 829 **generator.Generator.TRANSFORMS, 830 exp.AnyValue: any_value_to_max_sql, 831 exp.ArrayToString: rename_func("STRING_AGG"), 832 exp.AutoIncrementColumnConstraint: lambda *_: "IDENTITY", 833 exp.DateAdd: date_delta_sql("DATEADD"), 834 exp.DateDiff: date_delta_sql("DATEDIFF"), 835 exp.CTE: transforms.preprocess([qualify_derived_table_outputs]), 836 exp.CurrentDate: rename_func("GETDATE"), 837 exp.CurrentTimestamp: rename_func("GETDATE"), 838 exp.DateStrToDate: datestrtodate_sql, 839 exp.Extract: rename_func("DATEPART"), 840 exp.GeneratedAsIdentityColumnConstraint: generatedasidentitycolumnconstraint_sql, 841 exp.GroupConcat: _string_agg_sql, 842 exp.If: rename_func("IIF"), 843 exp.JSONExtract: _json_extract_sql, 844 exp.JSONExtractScalar: _json_extract_sql, 845 exp.LastDay: lambda self, e: self.func("EOMONTH", e.this), 846 exp.Max: max_or_greatest, 847 exp.MD5: lambda self, e: self.func("HASHBYTES", exp.Literal.string("MD5"), e.this), 848 exp.Min: min_or_least, 849 exp.NumberToStr: _format_sql, 850 exp.Repeat: rename_func("REPLICATE"), 851 exp.Select: transforms.preprocess( 852 [ 853 transforms.eliminate_distinct_on, 854 transforms.eliminate_semi_and_anti_joins, 855 transforms.eliminate_qualify, 856 ] 857 ), 858 exp.Stddev: rename_func("STDEV"), 859 exp.StrPosition: lambda self, e: self.func( 860 "CHARINDEX", e.args.get("substr"), e.this, e.args.get("position") 861 ), 862 exp.Subquery: transforms.preprocess([qualify_derived_table_outputs]), 863 exp.SHA: lambda self, e: self.func("HASHBYTES", exp.Literal.string("SHA1"), e.this), 864 exp.SHA2: lambda self, e: self.func( 865 "HASHBYTES", exp.Literal.string(f"SHA2_{e.args.get('length', 256)}"), e.this 866 ), 867 exp.TemporaryProperty: lambda self, e: "", 868 exp.TimeStrToTime: lambda self, e: self.sql( 869 exp.cast(e.this, exp.DataType.Type.DATETIME) 870 ), 871 exp.TimeToStr: _format_sql, 872 exp.Trim: trim_sql, 873 exp.TsOrDsAdd: date_delta_sql("DATEADD", cast=True), 874 exp.TsOrDsDiff: date_delta_sql("DATEDIFF"), 875 } 876 877 TRANSFORMS.pop(exp.ReturnsProperty) 878 879 PROPERTIES_LOCATION = { 880 **generator.Generator.PROPERTIES_LOCATION, 881 exp.VolatileProperty: exp.Properties.Location.UNSUPPORTED, 882 } 883 884 def scope_resolution(self, rhs: str, scope_name: str) -> str: 885 return f"{scope_name}::{rhs}" 886 887 def select_sql(self, expression: exp.Select) -> str: 888 if expression.args.get("offset"): 889 if not expression.args.get("order"): 890 # ORDER BY is required in order to use OFFSET in a query, so we use 891 # a noop order by, since we don't really care about the order. 892 # See: https://www.microsoftpressstore.com/articles/article.aspx?p=2314819 893 expression.order_by(exp.select(exp.null()).subquery(), copy=False) 894 895 limit = expression.args.get("limit") 896 if isinstance(limit, exp.Limit): 897 # TOP and OFFSET can't be combined, we need use FETCH instead of TOP 898 # we replace here because otherwise TOP would be generated in select_sql 899 limit.replace(exp.Fetch(direction="FIRST", count=limit.expression)) 900 901 return super().select_sql(expression) 902 903 def convert_sql(self, expression: exp.Convert) -> str: 904 name = "TRY_CONVERT" if expression.args.get("safe") else "CONVERT" 905 return self.func( 906 name, expression.this, expression.expression, expression.args.get("style") 907 ) 908 909 def queryoption_sql(self, expression: exp.QueryOption) -> str: 910 option = self.sql(expression, "this") 911 value = self.sql(expression, "expression") 912 if value: 913 optional_equal_sign = "= " if option in OPTIONS_THAT_REQUIRE_EQUAL else "" 914 return f"{option} {optional_equal_sign}{value}" 915 return option 916 917 def lateral_op(self, expression: exp.Lateral) -> str: 918 cross_apply = expression.args.get("cross_apply") 919 if cross_apply is True: 920 return "CROSS APPLY" 921 if cross_apply is False: 922 return "OUTER APPLY" 923 924 # TODO: perhaps we can check if the parent is a Join and transpile it appropriately 925 self.unsupported("LATERAL clause is not supported.") 926 return "LATERAL" 927 928 def timefromparts_sql(self, expression: exp.TimeFromParts) -> str: 929 nano = expression.args.get("nano") 930 if nano is not None: 931 nano.pop() 932 self.unsupported("Specifying nanoseconds is not supported in TIMEFROMPARTS.") 933 934 if expression.args.get("fractions") is None: 935 expression.set("fractions", exp.Literal.number(0)) 936 if expression.args.get("precision") is None: 937 expression.set("precision", exp.Literal.number(0)) 938 939 return rename_func("TIMEFROMPARTS")(self, expression) 940 941 def timestampfromparts_sql(self, expression: exp.TimestampFromParts) -> str: 942 zone = expression.args.get("zone") 943 if zone is not None: 944 zone.pop() 945 self.unsupported("Time zone is not supported in DATETIMEFROMPARTS.") 946 947 nano = expression.args.get("nano") 948 if nano is not None: 949 nano.pop() 950 self.unsupported("Specifying nanoseconds is not supported in DATETIMEFROMPARTS.") 951 952 if expression.args.get("milli") is None: 953 expression.set("milli", exp.Literal.number(0)) 954 955 return rename_func("DATETIMEFROMPARTS")(self, expression) 956 957 def setitem_sql(self, expression: exp.SetItem) -> str: 958 this = expression.this 959 if isinstance(this, exp.EQ) and not isinstance(this.left, exp.Parameter): 960 # T-SQL does not use '=' in SET command, except when the LHS is a variable. 961 return f"{self.sql(this.left)} {self.sql(this.right)}" 962 963 return super().setitem_sql(expression) 964 965 def boolean_sql(self, expression: exp.Boolean) -> str: 966 if type(expression.parent) in BIT_TYPES: 967 return "1" if expression.this else "0" 968 969 return "(1 = 1)" if expression.this else "(1 = 0)" 970 971 def is_sql(self, expression: exp.Is) -> str: 972 if isinstance(expression.expression, exp.Boolean): 973 return self.binary(expression, "=") 974 return self.binary(expression, "IS") 975 976 def createable_sql(self, expression: exp.Create, locations: t.DefaultDict) -> str: 977 sql = self.sql(expression, "this") 978 properties = expression.args.get("properties") 979 980 if sql[:1] != "#" and any( 981 isinstance(prop, exp.TemporaryProperty) 982 for prop in (properties.expressions if properties else []) 983 ): 984 sql = f"[#{sql[1:]}" if sql.startswith("[") else f"#{sql}" 985 986 return sql 987 988 def create_sql(self, expression: exp.Create) -> str: 989 kind = expression.kind 990 exists = expression.args.pop("exists", None) 991 992 if kind == "VIEW": 993 expression.this.set("catalog", None) 994 995 sql = super().create_sql(expression) 996 997 like_property = expression.find(exp.LikeProperty) 998 if like_property: 999 ctas_expression = like_property.this 1000 else: 1001 ctas_expression = expression.expression 1002 1003 table = expression.find(exp.Table) 1004 1005 # Convert CTAS statement to SELECT .. INTO .. 1006 if kind == "TABLE" and ctas_expression: 1007 ctas_with = ctas_expression.args.get("with") 1008 if ctas_with: 1009 ctas_with = ctas_with.pop() 1010 1011 if isinstance(ctas_expression, exp.UNWRAPPED_QUERIES): 1012 ctas_expression = ctas_expression.subquery() 1013 1014 select_into = exp.select("*").from_(exp.alias_(ctas_expression, "temp", table=True)) 1015 select_into.set("into", exp.Into(this=table)) 1016 select_into.set("with", ctas_with) 1017 1018 if like_property: 1019 select_into.limit(0, copy=False) 1020 1021 sql = self.sql(select_into) 1022 1023 if exists: 1024 identifier = self.sql(exp.Literal.string(exp.table_name(table) if table else "")) 1025 sql = self.sql(exp.Literal.string(sql)) 1026 if kind == "SCHEMA": 1027 sql = f"""IF NOT EXISTS (SELECT * FROM information_schema.schemata WHERE schema_name = {identifier}) EXEC({sql})""" 1028 elif kind == "TABLE": 1029 assert table 1030 where = exp.and_( 1031 exp.column("table_name").eq(table.name), 1032 exp.column("table_schema").eq(table.db) if table.db else None, 1033 exp.column("table_catalog").eq(table.catalog) if table.catalog else None, 1034 ) 1035 sql = f"""IF NOT EXISTS (SELECT * FROM information_schema.tables WHERE {where}) EXEC({sql})""" 1036 elif kind == "INDEX": 1037 index = self.sql(exp.Literal.string(expression.this.text("this"))) 1038 sql = f"""IF NOT EXISTS (SELECT * FROM sys.indexes WHERE object_id = object_id({identifier}) AND name = {index}) EXEC({sql})""" 1039 elif expression.args.get("replace"): 1040 sql = sql.replace("CREATE OR REPLACE ", "CREATE OR ALTER ", 1) 1041 1042 return self.prepend_ctes(expression, sql) 1043 1044 def offset_sql(self, expression: exp.Offset) -> str: 1045 return f"{super().offset_sql(expression)} ROWS" 1046 1047 def version_sql(self, expression: exp.Version) -> str: 1048 name = "SYSTEM_TIME" if expression.name == "TIMESTAMP" else expression.name 1049 this = f"FOR {name}" 1050 expr = expression.expression 1051 kind = expression.text("kind") 1052 if kind in ("FROM", "BETWEEN"): 1053 args = expr.expressions 1054 sep = "TO" if kind == "FROM" else "AND" 1055 expr_sql = f"{self.sql(seq_get(args, 0))} {sep} {self.sql(seq_get(args, 1))}" 1056 else: 1057 expr_sql = self.sql(expr) 1058 1059 expr_sql = f" {expr_sql}" if expr_sql else "" 1060 return f"{this} {kind}{expr_sql}" 1061 1062 def returnsproperty_sql(self, expression: exp.ReturnsProperty) -> str: 1063 table = expression.args.get("table") 1064 table = f"{table} " if table else "" 1065 return f"RETURNS {table}{self.sql(expression, 'this')}" 1066 1067 def returning_sql(self, expression: exp.Returning) -> str: 1068 into = self.sql(expression, "into") 1069 into = self.seg(f"INTO {into}") if into else "" 1070 return f"{self.seg('OUTPUT')} {self.expressions(expression, flat=True)}{into}" 1071 1072 def transaction_sql(self, expression: exp.Transaction) -> str: 1073 this = self.sql(expression, "this") 1074 this = f" {this}" if this else "" 1075 mark = self.sql(expression, "mark") 1076 mark = f" WITH MARK {mark}" if mark else "" 1077 return f"BEGIN TRANSACTION{this}{mark}" 1078 1079 def commit_sql(self, expression: exp.Commit) -> str: 1080 this = self.sql(expression, "this") 1081 this = f" {this}" if this else "" 1082 durability = expression.args.get("durability") 1083 durability = ( 1084 f" WITH (DELAYED_DURABILITY = {'ON' if durability else 'OFF'})" 1085 if durability is not None 1086 else "" 1087 ) 1088 return f"COMMIT TRANSACTION{this}{durability}" 1089 1090 def rollback_sql(self, expression: exp.Rollback) -> str: 1091 this = self.sql(expression, "this") 1092 this = f" {this}" if this else "" 1093 return f"ROLLBACK TRANSACTION{this}" 1094 1095 def identifier_sql(self, expression: exp.Identifier) -> str: 1096 identifier = super().identifier_sql(expression) 1097 1098 if expression.args.get("global"): 1099 identifier = f"##{identifier}" 1100 elif expression.args.get("temporary"): 1101 identifier = f"#{identifier}" 1102 1103 return identifier 1104 1105 def constraint_sql(self, expression: exp.Constraint) -> str: 1106 this = self.sql(expression, "this") 1107 expressions = self.expressions(expression, flat=True, sep=" ") 1108 return f"CONSTRAINT {this} {expressions}" 1109 1110 def length_sql(self, expression: exp.Length) -> str: 1111 return self._uncast_text(expression, "LEN") 1112 1113 def right_sql(self, expression: exp.Right) -> str: 1114 return self._uncast_text(expression, "RIGHT") 1115 1116 def left_sql(self, expression: exp.Left) -> str: 1117 return self._uncast_text(expression, "LEFT") 1118 1119 def _uncast_text(self, expression: exp.Expression, name: str) -> str: 1120 this = expression.this 1121 if isinstance(this, exp.Cast) and this.is_type(exp.DataType.Type.TEXT): 1122 this_sql = self.sql(this, "this") 1123 else: 1124 this_sql = self.sql(this) 1125 expression_sql = self.sql(expression, "expression") 1126 return self.func(name, this_sql, expression_sql if expression_sql else None) 1127 1128 def partition_sql(self, expression: exp.Partition) -> str: 1129 return f"WITH (PARTITIONS({self.expressions(expression, flat=True)}))" 1130 1131 def altertable_sql(self, expression: exp.AlterTable) -> str: 1132 action = seq_get(expression.args.get("actions") or [], 0) 1133 if isinstance(action, exp.RenameTable): 1134 return f"EXEC sp_rename '{self.sql(expression.this)}', '{action.this.name}'" 1135 return super().altertable_sql(expression) 1136 1137 def drop_sql(self, expression: exp.Drop) -> str: 1138 if expression.args["kind"] == "VIEW": 1139 expression.this.set("catalog", None) 1140 return super().drop_sql(expression) 1141 1142 def declare_sql(self, expression: exp.Declare) -> str: 1143 return f"DECLARE {self.expressions(expression, flat=True)}" 1144 1145 def declareitem_sql(self, expression: exp.DeclareItem) -> str: 1146 variable = self.sql(expression, "this") 1147 default = self.sql(expression, "default") 1148 default = f" = {default}" if default else "" 1149 1150 kind = self.sql(expression, "kind") 1151 if isinstance(expression.args.get("kind"), exp.Schema): 1152 kind = f"TABLE {kind}" 1153 1154 return f"{variable} AS {kind}{default}" 1155 1156 def options_modifier(self, expression: exp.Expression) -> str: 1157 options = self.expressions(expression, key="options") 1158 return f" OPTION{self.wrap(options)}" if options else ""
250def qualify_derived_table_outputs(expression: exp.Expression) -> exp.Expression: 251 """Ensures all (unnamed) output columns are aliased for CTEs and Subqueries.""" 252 alias = expression.args.get("alias") 253 254 if ( 255 isinstance(expression, (exp.CTE, exp.Subquery)) 256 and isinstance(alias, exp.TableAlias) 257 and not alias.columns 258 ): 259 from sqlglot.optimizer.qualify_columns import qualify_outputs 260 261 # We keep track of the unaliased column projection indexes instead of the expressions 262 # themselves, because the latter are going to be replaced by new nodes when the aliases 263 # are added and hence we won't be able to reach these newly added Alias parents 264 query = expression.this 265 unaliased_column_indexes = ( 266 i for i, c in enumerate(query.selects) if isinstance(c, exp.Column) and not c.alias 267 ) 268 269 qualify_outputs(query) 270 271 # Preserve the quoting information of columns for newly added Alias nodes 272 query_selects = query.selects 273 for select_index in unaliased_column_indexes: 274 alias = query_selects[select_index] 275 column = alias.this 276 if isinstance(column.this, exp.Identifier): 277 alias.args["alias"].set("quoted", column.this.quoted) 278 279 return expression
Ensures all (unnamed) output columns are aliased for CTEs and Subqueries.
334class TSQL(Dialect): 335 NORMALIZATION_STRATEGY = NormalizationStrategy.CASE_INSENSITIVE 336 TIME_FORMAT = "'yyyy-mm-dd hh:mm:ss'" 337 SUPPORTS_SEMI_ANTI_JOIN = False 338 LOG_BASE_FIRST = False 339 TYPED_DIVISION = True 340 CONCAT_COALESCE = True 341 342 TIME_MAPPING = { 343 "year": "%Y", 344 "dayofyear": "%j", 345 "day": "%d", 346 "dy": "%d", 347 "y": "%Y", 348 "week": "%W", 349 "ww": "%W", 350 "wk": "%W", 351 "hour": "%h", 352 "hh": "%I", 353 "minute": "%M", 354 "mi": "%M", 355 "n": "%M", 356 "second": "%S", 357 "ss": "%S", 358 "s": "%-S", 359 "millisecond": "%f", 360 "ms": "%f", 361 "weekday": "%W", 362 "dw": "%W", 363 "month": "%m", 364 "mm": "%M", 365 "m": "%-M", 366 "Y": "%Y", 367 "YYYY": "%Y", 368 "YY": "%y", 369 "MMMM": "%B", 370 "MMM": "%b", 371 "MM": "%m", 372 "M": "%-m", 373 "dddd": "%A", 374 "dd": "%d", 375 "d": "%-d", 376 "HH": "%H", 377 "H": "%-H", 378 "h": "%-I", 379 "S": "%f", 380 "yyyy": "%Y", 381 "yy": "%y", 382 } 383 384 CONVERT_FORMAT_MAPPING = { 385 "0": "%b %d %Y %-I:%M%p", 386 "1": "%m/%d/%y", 387 "2": "%y.%m.%d", 388 "3": "%d/%m/%y", 389 "4": "%d.%m.%y", 390 "5": "%d-%m-%y", 391 "6": "%d %b %y", 392 "7": "%b %d, %y", 393 "8": "%H:%M:%S", 394 "9": "%b %d %Y %-I:%M:%S:%f%p", 395 "10": "mm-dd-yy", 396 "11": "yy/mm/dd", 397 "12": "yymmdd", 398 "13": "%d %b %Y %H:%M:ss:%f", 399 "14": "%H:%M:%S:%f", 400 "20": "%Y-%m-%d %H:%M:%S", 401 "21": "%Y-%m-%d %H:%M:%S.%f", 402 "22": "%m/%d/%y %-I:%M:%S %p", 403 "23": "%Y-%m-%d", 404 "24": "%H:%M:%S", 405 "25": "%Y-%m-%d %H:%M:%S.%f", 406 "100": "%b %d %Y %-I:%M%p", 407 "101": "%m/%d/%Y", 408 "102": "%Y.%m.%d", 409 "103": "%d/%m/%Y", 410 "104": "%d.%m.%Y", 411 "105": "%d-%m-%Y", 412 "106": "%d %b %Y", 413 "107": "%b %d, %Y", 414 "108": "%H:%M:%S", 415 "109": "%b %d %Y %-I:%M:%S:%f%p", 416 "110": "%m-%d-%Y", 417 "111": "%Y/%m/%d", 418 "112": "%Y%m%d", 419 "113": "%d %b %Y %H:%M:%S:%f", 420 "114": "%H:%M:%S:%f", 421 "120": "%Y-%m-%d %H:%M:%S", 422 "121": "%Y-%m-%d %H:%M:%S.%f", 423 } 424 425 FORMAT_TIME_MAPPING = { 426 "y": "%B %Y", 427 "d": "%m/%d/%Y", 428 "H": "%-H", 429 "h": "%-I", 430 "s": "%Y-%m-%d %H:%M:%S", 431 "D": "%A,%B,%Y", 432 "f": "%A,%B,%Y %-I:%M %p", 433 "F": "%A,%B,%Y %-I:%M:%S %p", 434 "g": "%m/%d/%Y %-I:%M %p", 435 "G": "%m/%d/%Y %-I:%M:%S %p", 436 "M": "%B %-d", 437 "m": "%B %-d", 438 "O": "%Y-%m-%dT%H:%M:%S", 439 "u": "%Y-%M-%D %H:%M:%S%z", 440 "U": "%A, %B %D, %Y %H:%M:%S%z", 441 "T": "%-I:%M:%S %p", 442 "t": "%-I:%M", 443 "Y": "%a %Y", 444 } 445 446 class Tokenizer(tokens.Tokenizer): 447 IDENTIFIERS = [("[", "]"), '"'] 448 QUOTES = ["'", '"'] 449 HEX_STRINGS = [("0x", ""), ("0X", "")] 450 VAR_SINGLE_TOKENS = {"@", "$", "#"} 451 452 KEYWORDS = { 453 **tokens.Tokenizer.KEYWORDS, 454 "CLUSTERED INDEX": TokenType.INDEX, 455 "DATETIME2": TokenType.DATETIME, 456 "DATETIMEOFFSET": TokenType.TIMESTAMPTZ, 457 "DECLARE": TokenType.DECLARE, 458 "EXEC": TokenType.COMMAND, 459 "FOR SYSTEM_TIME": TokenType.TIMESTAMP_SNAPSHOT, 460 "IMAGE": TokenType.IMAGE, 461 "MONEY": TokenType.MONEY, 462 "NONCLUSTERED INDEX": TokenType.INDEX, 463 "NTEXT": TokenType.TEXT, 464 "OPTION": TokenType.OPTION, 465 "OUTPUT": TokenType.RETURNING, 466 "PRINT": TokenType.COMMAND, 467 "PROC": TokenType.PROCEDURE, 468 "REAL": TokenType.FLOAT, 469 "ROWVERSION": TokenType.ROWVERSION, 470 "SMALLDATETIME": TokenType.DATETIME, 471 "SMALLMONEY": TokenType.SMALLMONEY, 472 "SQL_VARIANT": TokenType.VARIANT, 473 "SYSTEM_USER": TokenType.CURRENT_USER, 474 "TOP": TokenType.TOP, 475 "TIMESTAMP": TokenType.ROWVERSION, 476 "TINYINT": TokenType.UTINYINT, 477 "UNIQUEIDENTIFIER": TokenType.UNIQUEIDENTIFIER, 478 "UPDATE STATISTICS": TokenType.COMMAND, 479 "XML": TokenType.XML, 480 } 481 KEYWORDS.pop("/*+") 482 483 COMMANDS = {*tokens.Tokenizer.COMMANDS, TokenType.END} 484 485 class Parser(parser.Parser): 486 SET_REQUIRES_ASSIGNMENT_DELIMITER = False 487 LOG_DEFAULTS_TO_LN = True 488 ALTER_TABLE_ADD_REQUIRED_FOR_EACH_COLUMN = False 489 STRING_ALIASES = True 490 NO_PAREN_IF_COMMANDS = False 491 492 QUERY_MODIFIER_PARSERS = { 493 **parser.Parser.QUERY_MODIFIER_PARSERS, 494 TokenType.OPTION: lambda self: ("options", self._parse_options()), 495 } 496 497 FUNCTIONS = { 498 **parser.Parser.FUNCTIONS, 499 "CHARINDEX": lambda args: exp.StrPosition( 500 this=seq_get(args, 1), 501 substr=seq_get(args, 0), 502 position=seq_get(args, 2), 503 ), 504 "DATEADD": build_date_delta(exp.DateAdd, unit_mapping=DATE_DELTA_INTERVAL), 505 "DATEDIFF": _build_date_delta(exp.DateDiff, unit_mapping=DATE_DELTA_INTERVAL), 506 "DATENAME": _build_formatted_time(exp.TimeToStr, full_format_mapping=True), 507 "DATEPART": _build_formatted_time(exp.TimeToStr), 508 "DATETIMEFROMPARTS": _build_datetimefromparts, 509 "EOMONTH": _build_eomonth, 510 "FORMAT": _build_format, 511 "GETDATE": exp.CurrentTimestamp.from_arg_list, 512 "HASHBYTES": _build_hashbytes, 513 "ISNULL": exp.Coalesce.from_arg_list, 514 "JSON_QUERY": parser.build_extract_json_with_path(exp.JSONExtract), 515 "JSON_VALUE": parser.build_extract_json_with_path(exp.JSONExtractScalar), 516 "LEN": _build_with_arg_as_text(exp.Length), 517 "LEFT": _build_with_arg_as_text(exp.Left), 518 "RIGHT": _build_with_arg_as_text(exp.Right), 519 "REPLICATE": exp.Repeat.from_arg_list, 520 "SQUARE": lambda args: exp.Pow(this=seq_get(args, 0), expression=exp.Literal.number(2)), 521 "SYSDATETIME": exp.CurrentTimestamp.from_arg_list, 522 "SUSER_NAME": exp.CurrentUser.from_arg_list, 523 "SUSER_SNAME": exp.CurrentUser.from_arg_list, 524 "SYSTEM_USER": exp.CurrentUser.from_arg_list, 525 "TIMEFROMPARTS": _build_timefromparts, 526 } 527 528 JOIN_HINTS = {"LOOP", "HASH", "MERGE", "REMOTE"} 529 530 RETURNS_TABLE_TOKENS = parser.Parser.ID_VAR_TOKENS - { 531 TokenType.TABLE, 532 *parser.Parser.TYPE_TOKENS, 533 } 534 535 STATEMENT_PARSERS = { 536 **parser.Parser.STATEMENT_PARSERS, 537 TokenType.DECLARE: lambda self: self._parse_declare(), 538 } 539 540 RANGE_PARSERS = { 541 **parser.Parser.RANGE_PARSERS, 542 TokenType.DCOLON: lambda self, this: self.expression( 543 exp.ScopeResolution, 544 this=this, 545 expression=self._parse_function() or self._parse_var(any_token=True), 546 ), 547 } 548 549 # The DCOLON (::) operator serves as a scope resolution (exp.ScopeResolution) operator in T-SQL 550 COLUMN_OPERATORS = { 551 **parser.Parser.COLUMN_OPERATORS, 552 TokenType.DCOLON: lambda self, this, to: self.expression(exp.Cast, this=this, to=to) 553 if isinstance(to, exp.DataType) and to.this != exp.DataType.Type.USERDEFINED 554 else self.expression(exp.ScopeResolution, this=this, expression=to), 555 } 556 557 def _parse_dcolon(self) -> t.Optional[exp.Expression]: 558 # We want to use _parse_types() if the first token after :: is a known type, 559 # otherwise we could parse something like x::varchar(max) into a function 560 if self._match_set(self.TYPE_TOKENS, advance=False): 561 return self._parse_types() 562 563 return self._parse_function() or self._parse_types() 564 565 def _parse_options(self) -> t.Optional[t.List[exp.Expression]]: 566 if not self._match(TokenType.OPTION): 567 return None 568 569 def _parse_option() -> t.Optional[exp.Expression]: 570 option = self._parse_var_from_options(OPTIONS) 571 if not option: 572 return None 573 574 self._match(TokenType.EQ) 575 return self.expression( 576 exp.QueryOption, this=option, expression=self._parse_primary_or_var() 577 ) 578 579 return self._parse_wrapped_csv(_parse_option) 580 581 def _parse_projections(self) -> t.List[exp.Expression]: 582 """ 583 T-SQL supports the syntax alias = expression in the SELECT's projection list, 584 so we transform all parsed Selects to convert their EQ projections into Aliases. 585 586 See: https://learn.microsoft.com/en-us/sql/t-sql/queries/select-clause-transact-sql?view=sql-server-ver16#syntax 587 """ 588 return [ 589 ( 590 exp.alias_(projection.expression, projection.this.this, copy=False) 591 if isinstance(projection, exp.EQ) and isinstance(projection.this, exp.Column) 592 else projection 593 ) 594 for projection in super()._parse_projections() 595 ] 596 597 def _parse_commit_or_rollback(self) -> exp.Commit | exp.Rollback: 598 """Applies to SQL Server and Azure SQL Database 599 COMMIT [ { TRAN | TRANSACTION } 600 [ transaction_name | @tran_name_variable ] ] 601 [ WITH ( DELAYED_DURABILITY = { OFF | ON } ) ] 602 603 ROLLBACK { TRAN | TRANSACTION } 604 [ transaction_name | @tran_name_variable 605 | savepoint_name | @savepoint_variable ] 606 """ 607 rollback = self._prev.token_type == TokenType.ROLLBACK 608 609 self._match_texts(("TRAN", "TRANSACTION")) 610 this = self._parse_id_var() 611 612 if rollback: 613 return self.expression(exp.Rollback, this=this) 614 615 durability = None 616 if self._match_pair(TokenType.WITH, TokenType.L_PAREN): 617 self._match_text_seq("DELAYED_DURABILITY") 618 self._match(TokenType.EQ) 619 620 if self._match_text_seq("OFF"): 621 durability = False 622 else: 623 self._match(TokenType.ON) 624 durability = True 625 626 self._match_r_paren() 627 628 return self.expression(exp.Commit, this=this, durability=durability) 629 630 def _parse_transaction(self) -> exp.Transaction | exp.Command: 631 """Applies to SQL Server and Azure SQL Database 632 BEGIN { TRAN | TRANSACTION } 633 [ { transaction_name | @tran_name_variable } 634 [ WITH MARK [ 'description' ] ] 635 ] 636 """ 637 if self._match_texts(("TRAN", "TRANSACTION")): 638 transaction = self.expression(exp.Transaction, this=self._parse_id_var()) 639 if self._match_text_seq("WITH", "MARK"): 640 transaction.set("mark", self._parse_string()) 641 642 return transaction 643 644 return self._parse_as_command(self._prev) 645 646 def _parse_returns(self) -> exp.ReturnsProperty: 647 table = self._parse_id_var(any_token=False, tokens=self.RETURNS_TABLE_TOKENS) 648 returns = super()._parse_returns() 649 returns.set("table", table) 650 return returns 651 652 def _parse_convert( 653 self, strict: bool, safe: t.Optional[bool] = None 654 ) -> t.Optional[exp.Expression]: 655 this = self._parse_types() 656 self._match(TokenType.COMMA) 657 args = [this, *self._parse_csv(self._parse_assignment)] 658 convert = exp.Convert.from_arg_list(args) 659 convert.set("safe", safe) 660 convert.set("strict", strict) 661 return convert 662 663 def _parse_user_defined_function( 664 self, kind: t.Optional[TokenType] = None 665 ) -> t.Optional[exp.Expression]: 666 this = super()._parse_user_defined_function(kind=kind) 667 668 if ( 669 kind == TokenType.FUNCTION 670 or isinstance(this, exp.UserDefinedFunction) 671 or self._match(TokenType.ALIAS, advance=False) 672 ): 673 return this 674 675 expressions = self._parse_csv(self._parse_function_parameter) 676 return self.expression(exp.UserDefinedFunction, this=this, expressions=expressions) 677 678 def _parse_id_var( 679 self, 680 any_token: bool = True, 681 tokens: t.Optional[t.Collection[TokenType]] = None, 682 ) -> t.Optional[exp.Expression]: 683 is_temporary = self._match(TokenType.HASH) 684 is_global = is_temporary and self._match(TokenType.HASH) 685 686 this = super()._parse_id_var(any_token=any_token, tokens=tokens) 687 if this: 688 if is_global: 689 this.set("global", True) 690 elif is_temporary: 691 this.set("temporary", True) 692 693 return this 694 695 def _parse_create(self) -> exp.Create | exp.Command: 696 create = super()._parse_create() 697 698 if isinstance(create, exp.Create): 699 table = create.this.this if isinstance(create.this, exp.Schema) else create.this 700 if isinstance(table, exp.Table) and table.this.args.get("temporary"): 701 if not create.args.get("properties"): 702 create.set("properties", exp.Properties(expressions=[])) 703 704 create.args["properties"].append("expressions", exp.TemporaryProperty()) 705 706 return create 707 708 def _parse_if(self) -> t.Optional[exp.Expression]: 709 index = self._index 710 711 if self._match_text_seq("OBJECT_ID"): 712 self._parse_wrapped_csv(self._parse_string) 713 if self._match_text_seq("IS", "NOT", "NULL") and self._match(TokenType.DROP): 714 return self._parse_drop(exists=True) 715 self._retreat(index) 716 717 return super()._parse_if() 718 719 def _parse_unique(self) -> exp.UniqueColumnConstraint: 720 if self._match_texts(("CLUSTERED", "NONCLUSTERED")): 721 this = self.CONSTRAINT_PARSERS[self._prev.text.upper()](self) 722 else: 723 this = self._parse_schema(self._parse_id_var(any_token=False)) 724 725 return self.expression(exp.UniqueColumnConstraint, this=this) 726 727 def _parse_partition(self) -> t.Optional[exp.Partition]: 728 if not self._match_text_seq("WITH", "(", "PARTITIONS"): 729 return None 730 731 def parse_range(): 732 low = self._parse_bitwise() 733 high = self._parse_bitwise() if self._match_text_seq("TO") else None 734 735 return ( 736 self.expression(exp.PartitionRange, this=low, expression=high) if high else low 737 ) 738 739 partition = self.expression( 740 exp.Partition, expressions=self._parse_wrapped_csv(parse_range) 741 ) 742 743 self._match_r_paren() 744 745 return partition 746 747 def _parse_declare(self) -> exp.Declare | exp.Command: 748 index = self._index 749 expressions = self._try_parse(partial(self._parse_csv, self._parse_declareitem)) 750 751 if not expressions or self._curr: 752 self._retreat(index) 753 return self._parse_as_command(self._prev) 754 755 return self.expression(exp.Declare, expressions=expressions) 756 757 def _parse_declareitem(self) -> t.Optional[exp.DeclareItem]: 758 var = self._parse_id_var() 759 if not var: 760 return None 761 762 value = None 763 self._match(TokenType.ALIAS) 764 if self._match(TokenType.TABLE): 765 data_type = self._parse_schema() 766 else: 767 data_type = self._parse_types() 768 if self._match(TokenType.EQ): 769 value = self._parse_bitwise() 770 771 return self.expression(exp.DeclareItem, this=var, kind=data_type, default=value) 772 773 class Generator(generator.Generator): 774 LIMIT_IS_TOP = True 775 QUERY_HINTS = False 776 RETURNING_END = False 777 NVL2_SUPPORTED = False 778 ALTER_TABLE_INCLUDE_COLUMN_KEYWORD = False 779 LIMIT_FETCH = "FETCH" 780 COMPUTED_COLUMN_WITH_TYPE = False 781 CTE_RECURSIVE_KEYWORD_REQUIRED = False 782 ENSURE_BOOLS = True 783 NULL_ORDERING_SUPPORTED = None 784 SUPPORTS_SINGLE_ARG_CONCAT = False 785 TABLESAMPLE_SEED_KEYWORD = "REPEATABLE" 786 SUPPORTS_SELECT_INTO = True 787 JSON_PATH_BRACKETED_KEY_SUPPORTED = False 788 SUPPORTS_TO_NUMBER = False 789 SET_OP_MODIFIERS = False 790 COPY_PARAMS_EQ_REQUIRED = True 791 PARSE_JSON_NAME = None 792 793 EXPRESSIONS_WITHOUT_NESTED_CTES = { 794 exp.Delete, 795 exp.Insert, 796 exp.Intersect, 797 exp.Except, 798 exp.Merge, 799 exp.Select, 800 exp.Subquery, 801 exp.Union, 802 exp.Update, 803 } 804 805 SUPPORTED_JSON_PATH_PARTS = { 806 exp.JSONPathKey, 807 exp.JSONPathRoot, 808 exp.JSONPathSubscript, 809 } 810 811 TYPE_MAPPING = { 812 **generator.Generator.TYPE_MAPPING, 813 exp.DataType.Type.BOOLEAN: "BIT", 814 exp.DataType.Type.DECIMAL: "NUMERIC", 815 exp.DataType.Type.DATETIME: "DATETIME2", 816 exp.DataType.Type.DOUBLE: "FLOAT", 817 exp.DataType.Type.INT: "INTEGER", 818 exp.DataType.Type.ROWVERSION: "ROWVERSION", 819 exp.DataType.Type.TEXT: "VARCHAR(MAX)", 820 exp.DataType.Type.TIMESTAMP: "DATETIME2", 821 exp.DataType.Type.TIMESTAMPTZ: "DATETIMEOFFSET", 822 exp.DataType.Type.UTINYINT: "TINYINT", 823 exp.DataType.Type.VARIANT: "SQL_VARIANT", 824 } 825 826 TYPE_MAPPING.pop(exp.DataType.Type.NCHAR) 827 TYPE_MAPPING.pop(exp.DataType.Type.NVARCHAR) 828 829 TRANSFORMS = { 830 **generator.Generator.TRANSFORMS, 831 exp.AnyValue: any_value_to_max_sql, 832 exp.ArrayToString: rename_func("STRING_AGG"), 833 exp.AutoIncrementColumnConstraint: lambda *_: "IDENTITY", 834 exp.DateAdd: date_delta_sql("DATEADD"), 835 exp.DateDiff: date_delta_sql("DATEDIFF"), 836 exp.CTE: transforms.preprocess([qualify_derived_table_outputs]), 837 exp.CurrentDate: rename_func("GETDATE"), 838 exp.CurrentTimestamp: rename_func("GETDATE"), 839 exp.DateStrToDate: datestrtodate_sql, 840 exp.Extract: rename_func("DATEPART"), 841 exp.GeneratedAsIdentityColumnConstraint: generatedasidentitycolumnconstraint_sql, 842 exp.GroupConcat: _string_agg_sql, 843 exp.If: rename_func("IIF"), 844 exp.JSONExtract: _json_extract_sql, 845 exp.JSONExtractScalar: _json_extract_sql, 846 exp.LastDay: lambda self, e: self.func("EOMONTH", e.this), 847 exp.Max: max_or_greatest, 848 exp.MD5: lambda self, e: self.func("HASHBYTES", exp.Literal.string("MD5"), e.this), 849 exp.Min: min_or_least, 850 exp.NumberToStr: _format_sql, 851 exp.Repeat: rename_func("REPLICATE"), 852 exp.Select: transforms.preprocess( 853 [ 854 transforms.eliminate_distinct_on, 855 transforms.eliminate_semi_and_anti_joins, 856 transforms.eliminate_qualify, 857 ] 858 ), 859 exp.Stddev: rename_func("STDEV"), 860 exp.StrPosition: lambda self, e: self.func( 861 "CHARINDEX", e.args.get("substr"), e.this, e.args.get("position") 862 ), 863 exp.Subquery: transforms.preprocess([qualify_derived_table_outputs]), 864 exp.SHA: lambda self, e: self.func("HASHBYTES", exp.Literal.string("SHA1"), e.this), 865 exp.SHA2: lambda self, e: self.func( 866 "HASHBYTES", exp.Literal.string(f"SHA2_{e.args.get('length', 256)}"), e.this 867 ), 868 exp.TemporaryProperty: lambda self, e: "", 869 exp.TimeStrToTime: lambda self, e: self.sql( 870 exp.cast(e.this, exp.DataType.Type.DATETIME) 871 ), 872 exp.TimeToStr: _format_sql, 873 exp.Trim: trim_sql, 874 exp.TsOrDsAdd: date_delta_sql("DATEADD", cast=True), 875 exp.TsOrDsDiff: date_delta_sql("DATEDIFF"), 876 } 877 878 TRANSFORMS.pop(exp.ReturnsProperty) 879 880 PROPERTIES_LOCATION = { 881 **generator.Generator.PROPERTIES_LOCATION, 882 exp.VolatileProperty: exp.Properties.Location.UNSUPPORTED, 883 } 884 885 def scope_resolution(self, rhs: str, scope_name: str) -> str: 886 return f"{scope_name}::{rhs}" 887 888 def select_sql(self, expression: exp.Select) -> str: 889 if expression.args.get("offset"): 890 if not expression.args.get("order"): 891 # ORDER BY is required in order to use OFFSET in a query, so we use 892 # a noop order by, since we don't really care about the order. 893 # See: https://www.microsoftpressstore.com/articles/article.aspx?p=2314819 894 expression.order_by(exp.select(exp.null()).subquery(), copy=False) 895 896 limit = expression.args.get("limit") 897 if isinstance(limit, exp.Limit): 898 # TOP and OFFSET can't be combined, we need use FETCH instead of TOP 899 # we replace here because otherwise TOP would be generated in select_sql 900 limit.replace(exp.Fetch(direction="FIRST", count=limit.expression)) 901 902 return super().select_sql(expression) 903 904 def convert_sql(self, expression: exp.Convert) -> str: 905 name = "TRY_CONVERT" if expression.args.get("safe") else "CONVERT" 906 return self.func( 907 name, expression.this, expression.expression, expression.args.get("style") 908 ) 909 910 def queryoption_sql(self, expression: exp.QueryOption) -> str: 911 option = self.sql(expression, "this") 912 value = self.sql(expression, "expression") 913 if value: 914 optional_equal_sign = "= " if option in OPTIONS_THAT_REQUIRE_EQUAL else "" 915 return f"{option} {optional_equal_sign}{value}" 916 return option 917 918 def lateral_op(self, expression: exp.Lateral) -> str: 919 cross_apply = expression.args.get("cross_apply") 920 if cross_apply is True: 921 return "CROSS APPLY" 922 if cross_apply is False: 923 return "OUTER APPLY" 924 925 # TODO: perhaps we can check if the parent is a Join and transpile it appropriately 926 self.unsupported("LATERAL clause is not supported.") 927 return "LATERAL" 928 929 def timefromparts_sql(self, expression: exp.TimeFromParts) -> str: 930 nano = expression.args.get("nano") 931 if nano is not None: 932 nano.pop() 933 self.unsupported("Specifying nanoseconds is not supported in TIMEFROMPARTS.") 934 935 if expression.args.get("fractions") is None: 936 expression.set("fractions", exp.Literal.number(0)) 937 if expression.args.get("precision") is None: 938 expression.set("precision", exp.Literal.number(0)) 939 940 return rename_func("TIMEFROMPARTS")(self, expression) 941 942 def timestampfromparts_sql(self, expression: exp.TimestampFromParts) -> str: 943 zone = expression.args.get("zone") 944 if zone is not None: 945 zone.pop() 946 self.unsupported("Time zone is not supported in DATETIMEFROMPARTS.") 947 948 nano = expression.args.get("nano") 949 if nano is not None: 950 nano.pop() 951 self.unsupported("Specifying nanoseconds is not supported in DATETIMEFROMPARTS.") 952 953 if expression.args.get("milli") is None: 954 expression.set("milli", exp.Literal.number(0)) 955 956 return rename_func("DATETIMEFROMPARTS")(self, expression) 957 958 def setitem_sql(self, expression: exp.SetItem) -> str: 959 this = expression.this 960 if isinstance(this, exp.EQ) and not isinstance(this.left, exp.Parameter): 961 # T-SQL does not use '=' in SET command, except when the LHS is a variable. 962 return f"{self.sql(this.left)} {self.sql(this.right)}" 963 964 return super().setitem_sql(expression) 965 966 def boolean_sql(self, expression: exp.Boolean) -> str: 967 if type(expression.parent) in BIT_TYPES: 968 return "1" if expression.this else "0" 969 970 return "(1 = 1)" if expression.this else "(1 = 0)" 971 972 def is_sql(self, expression: exp.Is) -> str: 973 if isinstance(expression.expression, exp.Boolean): 974 return self.binary(expression, "=") 975 return self.binary(expression, "IS") 976 977 def createable_sql(self, expression: exp.Create, locations: t.DefaultDict) -> str: 978 sql = self.sql(expression, "this") 979 properties = expression.args.get("properties") 980 981 if sql[:1] != "#" and any( 982 isinstance(prop, exp.TemporaryProperty) 983 for prop in (properties.expressions if properties else []) 984 ): 985 sql = f"[#{sql[1:]}" if sql.startswith("[") else f"#{sql}" 986 987 return sql 988 989 def create_sql(self, expression: exp.Create) -> str: 990 kind = expression.kind 991 exists = expression.args.pop("exists", None) 992 993 if kind == "VIEW": 994 expression.this.set("catalog", None) 995 996 sql = super().create_sql(expression) 997 998 like_property = expression.find(exp.LikeProperty) 999 if like_property: 1000 ctas_expression = like_property.this 1001 else: 1002 ctas_expression = expression.expression 1003 1004 table = expression.find(exp.Table) 1005 1006 # Convert CTAS statement to SELECT .. INTO .. 1007 if kind == "TABLE" and ctas_expression: 1008 ctas_with = ctas_expression.args.get("with") 1009 if ctas_with: 1010 ctas_with = ctas_with.pop() 1011 1012 if isinstance(ctas_expression, exp.UNWRAPPED_QUERIES): 1013 ctas_expression = ctas_expression.subquery() 1014 1015 select_into = exp.select("*").from_(exp.alias_(ctas_expression, "temp", table=True)) 1016 select_into.set("into", exp.Into(this=table)) 1017 select_into.set("with", ctas_with) 1018 1019 if like_property: 1020 select_into.limit(0, copy=False) 1021 1022 sql = self.sql(select_into) 1023 1024 if exists: 1025 identifier = self.sql(exp.Literal.string(exp.table_name(table) if table else "")) 1026 sql = self.sql(exp.Literal.string(sql)) 1027 if kind == "SCHEMA": 1028 sql = f"""IF NOT EXISTS (SELECT * FROM information_schema.schemata WHERE schema_name = {identifier}) EXEC({sql})""" 1029 elif kind == "TABLE": 1030 assert table 1031 where = exp.and_( 1032 exp.column("table_name").eq(table.name), 1033 exp.column("table_schema").eq(table.db) if table.db else None, 1034 exp.column("table_catalog").eq(table.catalog) if table.catalog else None, 1035 ) 1036 sql = f"""IF NOT EXISTS (SELECT * FROM information_schema.tables WHERE {where}) EXEC({sql})""" 1037 elif kind == "INDEX": 1038 index = self.sql(exp.Literal.string(expression.this.text("this"))) 1039 sql = f"""IF NOT EXISTS (SELECT * FROM sys.indexes WHERE object_id = object_id({identifier}) AND name = {index}) EXEC({sql})""" 1040 elif expression.args.get("replace"): 1041 sql = sql.replace("CREATE OR REPLACE ", "CREATE OR ALTER ", 1) 1042 1043 return self.prepend_ctes(expression, sql) 1044 1045 def offset_sql(self, expression: exp.Offset) -> str: 1046 return f"{super().offset_sql(expression)} ROWS" 1047 1048 def version_sql(self, expression: exp.Version) -> str: 1049 name = "SYSTEM_TIME" if expression.name == "TIMESTAMP" else expression.name 1050 this = f"FOR {name}" 1051 expr = expression.expression 1052 kind = expression.text("kind") 1053 if kind in ("FROM", "BETWEEN"): 1054 args = expr.expressions 1055 sep = "TO" if kind == "FROM" else "AND" 1056 expr_sql = f"{self.sql(seq_get(args, 0))} {sep} {self.sql(seq_get(args, 1))}" 1057 else: 1058 expr_sql = self.sql(expr) 1059 1060 expr_sql = f" {expr_sql}" if expr_sql else "" 1061 return f"{this} {kind}{expr_sql}" 1062 1063 def returnsproperty_sql(self, expression: exp.ReturnsProperty) -> str: 1064 table = expression.args.get("table") 1065 table = f"{table} " if table else "" 1066 return f"RETURNS {table}{self.sql(expression, 'this')}" 1067 1068 def returning_sql(self, expression: exp.Returning) -> str: 1069 into = self.sql(expression, "into") 1070 into = self.seg(f"INTO {into}") if into else "" 1071 return f"{self.seg('OUTPUT')} {self.expressions(expression, flat=True)}{into}" 1072 1073 def transaction_sql(self, expression: exp.Transaction) -> str: 1074 this = self.sql(expression, "this") 1075 this = f" {this}" if this else "" 1076 mark = self.sql(expression, "mark") 1077 mark = f" WITH MARK {mark}" if mark else "" 1078 return f"BEGIN TRANSACTION{this}{mark}" 1079 1080 def commit_sql(self, expression: exp.Commit) -> str: 1081 this = self.sql(expression, "this") 1082 this = f" {this}" if this else "" 1083 durability = expression.args.get("durability") 1084 durability = ( 1085 f" WITH (DELAYED_DURABILITY = {'ON' if durability else 'OFF'})" 1086 if durability is not None 1087 else "" 1088 ) 1089 return f"COMMIT TRANSACTION{this}{durability}" 1090 1091 def rollback_sql(self, expression: exp.Rollback) -> str: 1092 this = self.sql(expression, "this") 1093 this = f" {this}" if this else "" 1094 return f"ROLLBACK TRANSACTION{this}" 1095 1096 def identifier_sql(self, expression: exp.Identifier) -> str: 1097 identifier = super().identifier_sql(expression) 1098 1099 if expression.args.get("global"): 1100 identifier = f"##{identifier}" 1101 elif expression.args.get("temporary"): 1102 identifier = f"#{identifier}" 1103 1104 return identifier 1105 1106 def constraint_sql(self, expression: exp.Constraint) -> str: 1107 this = self.sql(expression, "this") 1108 expressions = self.expressions(expression, flat=True, sep=" ") 1109 return f"CONSTRAINT {this} {expressions}" 1110 1111 def length_sql(self, expression: exp.Length) -> str: 1112 return self._uncast_text(expression, "LEN") 1113 1114 def right_sql(self, expression: exp.Right) -> str: 1115 return self._uncast_text(expression, "RIGHT") 1116 1117 def left_sql(self, expression: exp.Left) -> str: 1118 return self._uncast_text(expression, "LEFT") 1119 1120 def _uncast_text(self, expression: exp.Expression, name: str) -> str: 1121 this = expression.this 1122 if isinstance(this, exp.Cast) and this.is_type(exp.DataType.Type.TEXT): 1123 this_sql = self.sql(this, "this") 1124 else: 1125 this_sql = self.sql(this) 1126 expression_sql = self.sql(expression, "expression") 1127 return self.func(name, this_sql, expression_sql if expression_sql else None) 1128 1129 def partition_sql(self, expression: exp.Partition) -> str: 1130 return f"WITH (PARTITIONS({self.expressions(expression, flat=True)}))" 1131 1132 def altertable_sql(self, expression: exp.AlterTable) -> str: 1133 action = seq_get(expression.args.get("actions") or [], 0) 1134 if isinstance(action, exp.RenameTable): 1135 return f"EXEC sp_rename '{self.sql(expression.this)}', '{action.this.name}'" 1136 return super().altertable_sql(expression) 1137 1138 def drop_sql(self, expression: exp.Drop) -> str: 1139 if expression.args["kind"] == "VIEW": 1140 expression.this.set("catalog", None) 1141 return super().drop_sql(expression) 1142 1143 def declare_sql(self, expression: exp.Declare) -> str: 1144 return f"DECLARE {self.expressions(expression, flat=True)}" 1145 1146 def declareitem_sql(self, expression: exp.DeclareItem) -> str: 1147 variable = self.sql(expression, "this") 1148 default = self.sql(expression, "default") 1149 default = f" = {default}" if default else "" 1150 1151 kind = self.sql(expression, "kind") 1152 if isinstance(expression.args.get("kind"), exp.Schema): 1153 kind = f"TABLE {kind}" 1154 1155 return f"{variable} AS {kind}{default}" 1156 1157 def options_modifier(self, expression: exp.Expression) -> str: 1158 options = self.expressions(expression, key="options") 1159 return f" OPTION{self.wrap(options)}" if options else ""
Specifies the strategy according to which identifiers should be normalized.
Whether the base comes first in the LOG
function.
Possible values: True
, False
, None
(two arguments are not supported by LOG
)
Whether the behavior of a / b
depends on the types of a
and b
.
False means a / b
is always float division.
True means a / b
is integer division if both a
and b
are integers.
A NULL
arg in CONCAT
yields NULL
by default, but in some dialects it yields an empty string.
Associates this dialect's time formats with their equivalent Python strftime
formats.
Inherited Members
- sqlglot.dialects.dialect.Dialect
- Dialect
- INDEX_OFFSET
- WEEK_OFFSET
- UNNEST_COLUMN_ONLY
- ALIAS_POST_TABLESAMPLE
- TABLESAMPLE_SIZE_IS_PERCENT
- IDENTIFIERS_CAN_START_WITH_DIGIT
- DPIPE_IS_STRING_CONCAT
- STRICT_STRING_CONCAT
- SUPPORTS_USER_DEFINED_TYPES
- COPY_PARAMS_ARE_CSV
- NORMALIZE_FUNCTIONS
- NULL_ORDERING
- SAFE_DIVISION
- HEX_LOWERCASE
- DATE_FORMAT
- DATEINT_FORMAT
- FORMAT_MAPPING
- UNESCAPED_SEQUENCES
- PSEUDOCOLUMNS
- PREFER_CTE_ALIAS_COLUMN
- FORCE_EARLY_ALIAS_REF_EXPANSION
- EXPAND_ALIAS_REFS_EARLY_ONLY_IN_GROUP_BY
- SUPPORTS_ORDER_BY_ALL
- DATE_PART_MAPPING
- TYPE_TO_EXPRESSIONS
- ANNOTATORS
- get_or_raise
- format_time
- settings
- normalize_identifier
- case_sensitive
- can_identify
- quote_identifier
- to_json_path
- parse
- parse_into
- generate
- transpile
- tokenize
- tokenizer
- jsonpath_tokenizer
- parser
- generator
446 class Tokenizer(tokens.Tokenizer): 447 IDENTIFIERS = [("[", "]"), '"'] 448 QUOTES = ["'", '"'] 449 HEX_STRINGS = [("0x", ""), ("0X", "")] 450 VAR_SINGLE_TOKENS = {"@", "$", "#"} 451 452 KEYWORDS = { 453 **tokens.Tokenizer.KEYWORDS, 454 "CLUSTERED INDEX": TokenType.INDEX, 455 "DATETIME2": TokenType.DATETIME, 456 "DATETIMEOFFSET": TokenType.TIMESTAMPTZ, 457 "DECLARE": TokenType.DECLARE, 458 "EXEC": TokenType.COMMAND, 459 "FOR SYSTEM_TIME": TokenType.TIMESTAMP_SNAPSHOT, 460 "IMAGE": TokenType.IMAGE, 461 "MONEY": TokenType.MONEY, 462 "NONCLUSTERED INDEX": TokenType.INDEX, 463 "NTEXT": TokenType.TEXT, 464 "OPTION": TokenType.OPTION, 465 "OUTPUT": TokenType.RETURNING, 466 "PRINT": TokenType.COMMAND, 467 "PROC": TokenType.PROCEDURE, 468 "REAL": TokenType.FLOAT, 469 "ROWVERSION": TokenType.ROWVERSION, 470 "SMALLDATETIME": TokenType.DATETIME, 471 "SMALLMONEY": TokenType.SMALLMONEY, 472 "SQL_VARIANT": TokenType.VARIANT, 473 "SYSTEM_USER": TokenType.CURRENT_USER, 474 "TOP": TokenType.TOP, 475 "TIMESTAMP": TokenType.ROWVERSION, 476 "TINYINT": TokenType.UTINYINT, 477 "UNIQUEIDENTIFIER": TokenType.UNIQUEIDENTIFIER, 478 "UPDATE STATISTICS": TokenType.COMMAND, 479 "XML": TokenType.XML, 480 } 481 KEYWORDS.pop("/*+") 482 483 COMMANDS = {*tokens.Tokenizer.COMMANDS, TokenType.END}
Inherited Members
- sqlglot.tokens.Tokenizer
- Tokenizer
- SINGLE_TOKENS
- BIT_STRINGS
- BYTE_STRINGS
- RAW_STRINGS
- HEREDOC_STRINGS
- UNICODE_STRINGS
- IDENTIFIER_ESCAPES
- STRING_ESCAPES
- HEREDOC_TAG_IS_IDENTIFIER
- HEREDOC_STRING_ALTERNATIVE
- STRING_ESCAPES_ALLOWED_IN_RAW_STRINGS
- WHITE_SPACE
- COMMAND_PREFIX_TOKENS
- NUMERIC_LITERALS
- COMMENTS
- dialect
- reset
- tokenize
- tokenize_rs
- size
- sql
- tokens
485 class Parser(parser.Parser): 486 SET_REQUIRES_ASSIGNMENT_DELIMITER = False 487 LOG_DEFAULTS_TO_LN = True 488 ALTER_TABLE_ADD_REQUIRED_FOR_EACH_COLUMN = False 489 STRING_ALIASES = True 490 NO_PAREN_IF_COMMANDS = False 491 492 QUERY_MODIFIER_PARSERS = { 493 **parser.Parser.QUERY_MODIFIER_PARSERS, 494 TokenType.OPTION: lambda self: ("options", self._parse_options()), 495 } 496 497 FUNCTIONS = { 498 **parser.Parser.FUNCTIONS, 499 "CHARINDEX": lambda args: exp.StrPosition( 500 this=seq_get(args, 1), 501 substr=seq_get(args, 0), 502 position=seq_get(args, 2), 503 ), 504 "DATEADD": build_date_delta(exp.DateAdd, unit_mapping=DATE_DELTA_INTERVAL), 505 "DATEDIFF": _build_date_delta(exp.DateDiff, unit_mapping=DATE_DELTA_INTERVAL), 506 "DATENAME": _build_formatted_time(exp.TimeToStr, full_format_mapping=True), 507 "DATEPART": _build_formatted_time(exp.TimeToStr), 508 "DATETIMEFROMPARTS": _build_datetimefromparts, 509 "EOMONTH": _build_eomonth, 510 "FORMAT": _build_format, 511 "GETDATE": exp.CurrentTimestamp.from_arg_list, 512 "HASHBYTES": _build_hashbytes, 513 "ISNULL": exp.Coalesce.from_arg_list, 514 "JSON_QUERY": parser.build_extract_json_with_path(exp.JSONExtract), 515 "JSON_VALUE": parser.build_extract_json_with_path(exp.JSONExtractScalar), 516 "LEN": _build_with_arg_as_text(exp.Length), 517 "LEFT": _build_with_arg_as_text(exp.Left), 518 "RIGHT": _build_with_arg_as_text(exp.Right), 519 "REPLICATE": exp.Repeat.from_arg_list, 520 "SQUARE": lambda args: exp.Pow(this=seq_get(args, 0), expression=exp.Literal.number(2)), 521 "SYSDATETIME": exp.CurrentTimestamp.from_arg_list, 522 "SUSER_NAME": exp.CurrentUser.from_arg_list, 523 "SUSER_SNAME": exp.CurrentUser.from_arg_list, 524 "SYSTEM_USER": exp.CurrentUser.from_arg_list, 525 "TIMEFROMPARTS": _build_timefromparts, 526 } 527 528 JOIN_HINTS = {"LOOP", "HASH", "MERGE", "REMOTE"} 529 530 RETURNS_TABLE_TOKENS = parser.Parser.ID_VAR_TOKENS - { 531 TokenType.TABLE, 532 *parser.Parser.TYPE_TOKENS, 533 } 534 535 STATEMENT_PARSERS = { 536 **parser.Parser.STATEMENT_PARSERS, 537 TokenType.DECLARE: lambda self: self._parse_declare(), 538 } 539 540 RANGE_PARSERS = { 541 **parser.Parser.RANGE_PARSERS, 542 TokenType.DCOLON: lambda self, this: self.expression( 543 exp.ScopeResolution, 544 this=this, 545 expression=self._parse_function() or self._parse_var(any_token=True), 546 ), 547 } 548 549 # The DCOLON (::) operator serves as a scope resolution (exp.ScopeResolution) operator in T-SQL 550 COLUMN_OPERATORS = { 551 **parser.Parser.COLUMN_OPERATORS, 552 TokenType.DCOLON: lambda self, this, to: self.expression(exp.Cast, this=this, to=to) 553 if isinstance(to, exp.DataType) and to.this != exp.DataType.Type.USERDEFINED 554 else self.expression(exp.ScopeResolution, this=this, expression=to), 555 } 556 557 def _parse_dcolon(self) -> t.Optional[exp.Expression]: 558 # We want to use _parse_types() if the first token after :: is a known type, 559 # otherwise we could parse something like x::varchar(max) into a function 560 if self._match_set(self.TYPE_TOKENS, advance=False): 561 return self._parse_types() 562 563 return self._parse_function() or self._parse_types() 564 565 def _parse_options(self) -> t.Optional[t.List[exp.Expression]]: 566 if not self._match(TokenType.OPTION): 567 return None 568 569 def _parse_option() -> t.Optional[exp.Expression]: 570 option = self._parse_var_from_options(OPTIONS) 571 if not option: 572 return None 573 574 self._match(TokenType.EQ) 575 return self.expression( 576 exp.QueryOption, this=option, expression=self._parse_primary_or_var() 577 ) 578 579 return self._parse_wrapped_csv(_parse_option) 580 581 def _parse_projections(self) -> t.List[exp.Expression]: 582 """ 583 T-SQL supports the syntax alias = expression in the SELECT's projection list, 584 so we transform all parsed Selects to convert their EQ projections into Aliases. 585 586 See: https://learn.microsoft.com/en-us/sql/t-sql/queries/select-clause-transact-sql?view=sql-server-ver16#syntax 587 """ 588 return [ 589 ( 590 exp.alias_(projection.expression, projection.this.this, copy=False) 591 if isinstance(projection, exp.EQ) and isinstance(projection.this, exp.Column) 592 else projection 593 ) 594 for projection in super()._parse_projections() 595 ] 596 597 def _parse_commit_or_rollback(self) -> exp.Commit | exp.Rollback: 598 """Applies to SQL Server and Azure SQL Database 599 COMMIT [ { TRAN | TRANSACTION } 600 [ transaction_name | @tran_name_variable ] ] 601 [ WITH ( DELAYED_DURABILITY = { OFF | ON } ) ] 602 603 ROLLBACK { TRAN | TRANSACTION } 604 [ transaction_name | @tran_name_variable 605 | savepoint_name | @savepoint_variable ] 606 """ 607 rollback = self._prev.token_type == TokenType.ROLLBACK 608 609 self._match_texts(("TRAN", "TRANSACTION")) 610 this = self._parse_id_var() 611 612 if rollback: 613 return self.expression(exp.Rollback, this=this) 614 615 durability = None 616 if self._match_pair(TokenType.WITH, TokenType.L_PAREN): 617 self._match_text_seq("DELAYED_DURABILITY") 618 self._match(TokenType.EQ) 619 620 if self._match_text_seq("OFF"): 621 durability = False 622 else: 623 self._match(TokenType.ON) 624 durability = True 625 626 self._match_r_paren() 627 628 return self.expression(exp.Commit, this=this, durability=durability) 629 630 def _parse_transaction(self) -> exp.Transaction | exp.Command: 631 """Applies to SQL Server and Azure SQL Database 632 BEGIN { TRAN | TRANSACTION } 633 [ { transaction_name | @tran_name_variable } 634 [ WITH MARK [ 'description' ] ] 635 ] 636 """ 637 if self._match_texts(("TRAN", "TRANSACTION")): 638 transaction = self.expression(exp.Transaction, this=self._parse_id_var()) 639 if self._match_text_seq("WITH", "MARK"): 640 transaction.set("mark", self._parse_string()) 641 642 return transaction 643 644 return self._parse_as_command(self._prev) 645 646 def _parse_returns(self) -> exp.ReturnsProperty: 647 table = self._parse_id_var(any_token=False, tokens=self.RETURNS_TABLE_TOKENS) 648 returns = super()._parse_returns() 649 returns.set("table", table) 650 return returns 651 652 def _parse_convert( 653 self, strict: bool, safe: t.Optional[bool] = None 654 ) -> t.Optional[exp.Expression]: 655 this = self._parse_types() 656 self._match(TokenType.COMMA) 657 args = [this, *self._parse_csv(self._parse_assignment)] 658 convert = exp.Convert.from_arg_list(args) 659 convert.set("safe", safe) 660 convert.set("strict", strict) 661 return convert 662 663 def _parse_user_defined_function( 664 self, kind: t.Optional[TokenType] = None 665 ) -> t.Optional[exp.Expression]: 666 this = super()._parse_user_defined_function(kind=kind) 667 668 if ( 669 kind == TokenType.FUNCTION 670 or isinstance(this, exp.UserDefinedFunction) 671 or self._match(TokenType.ALIAS, advance=False) 672 ): 673 return this 674 675 expressions = self._parse_csv(self._parse_function_parameter) 676 return self.expression(exp.UserDefinedFunction, this=this, expressions=expressions) 677 678 def _parse_id_var( 679 self, 680 any_token: bool = True, 681 tokens: t.Optional[t.Collection[TokenType]] = None, 682 ) -> t.Optional[exp.Expression]: 683 is_temporary = self._match(TokenType.HASH) 684 is_global = is_temporary and self._match(TokenType.HASH) 685 686 this = super()._parse_id_var(any_token=any_token, tokens=tokens) 687 if this: 688 if is_global: 689 this.set("global", True) 690 elif is_temporary: 691 this.set("temporary", True) 692 693 return this 694 695 def _parse_create(self) -> exp.Create | exp.Command: 696 create = super()._parse_create() 697 698 if isinstance(create, exp.Create): 699 table = create.this.this if isinstance(create.this, exp.Schema) else create.this 700 if isinstance(table, exp.Table) and table.this.args.get("temporary"): 701 if not create.args.get("properties"): 702 create.set("properties", exp.Properties(expressions=[])) 703 704 create.args["properties"].append("expressions", exp.TemporaryProperty()) 705 706 return create 707 708 def _parse_if(self) -> t.Optional[exp.Expression]: 709 index = self._index 710 711 if self._match_text_seq("OBJECT_ID"): 712 self._parse_wrapped_csv(self._parse_string) 713 if self._match_text_seq("IS", "NOT", "NULL") and self._match(TokenType.DROP): 714 return self._parse_drop(exists=True) 715 self._retreat(index) 716 717 return super()._parse_if() 718 719 def _parse_unique(self) -> exp.UniqueColumnConstraint: 720 if self._match_texts(("CLUSTERED", "NONCLUSTERED")): 721 this = self.CONSTRAINT_PARSERS[self._prev.text.upper()](self) 722 else: 723 this = self._parse_schema(self._parse_id_var(any_token=False)) 724 725 return self.expression(exp.UniqueColumnConstraint, this=this) 726 727 def _parse_partition(self) -> t.Optional[exp.Partition]: 728 if not self._match_text_seq("WITH", "(", "PARTITIONS"): 729 return None 730 731 def parse_range(): 732 low = self._parse_bitwise() 733 high = self._parse_bitwise() if self._match_text_seq("TO") else None 734 735 return ( 736 self.expression(exp.PartitionRange, this=low, expression=high) if high else low 737 ) 738 739 partition = self.expression( 740 exp.Partition, expressions=self._parse_wrapped_csv(parse_range) 741 ) 742 743 self._match_r_paren() 744 745 return partition 746 747 def _parse_declare(self) -> exp.Declare | exp.Command: 748 index = self._index 749 expressions = self._try_parse(partial(self._parse_csv, self._parse_declareitem)) 750 751 if not expressions or self._curr: 752 self._retreat(index) 753 return self._parse_as_command(self._prev) 754 755 return self.expression(exp.Declare, expressions=expressions) 756 757 def _parse_declareitem(self) -> t.Optional[exp.DeclareItem]: 758 var = self._parse_id_var() 759 if not var: 760 return None 761 762 value = None 763 self._match(TokenType.ALIAS) 764 if self._match(TokenType.TABLE): 765 data_type = self._parse_schema() 766 else: 767 data_type = self._parse_types() 768 if self._match(TokenType.EQ): 769 value = self._parse_bitwise() 770 771 return self.expression(exp.DeclareItem, this=var, kind=data_type, default=value)
Parser consumes a list of tokens produced by the Tokenizer and produces a parsed syntax tree.
Arguments:
- error_level: The desired error level. Default: ErrorLevel.IMMEDIATE
- error_message_context: The amount of context to capture from a query string when displaying the error message (in number of characters). Default: 100
- max_errors: Maximum number of error messages to include in a raised ParseError. This is only relevant if error_level is ErrorLevel.RAISE. Default: 3
Inherited Members
- sqlglot.parser.Parser
- Parser
- NO_PAREN_FUNCTIONS
- STRUCT_TYPE_TOKENS
- NESTED_TYPE_TOKENS
- ENUM_TYPE_TOKENS
- AGGREGATE_TYPE_TOKENS
- TYPE_TOKENS
- SIGNED_TO_UNSIGNED_TYPE_TOKEN
- SUBQUERY_PREDICATES
- RESERVED_TOKENS
- DB_CREATABLES
- CREATABLES
- INTERVAL_VARS
- ALIAS_TOKENS
- ARRAY_CONSTRUCTORS
- COMMENT_TABLE_ALIAS_TOKENS
- UPDATE_ALIAS_TOKENS
- TRIM_TYPES
- FUNC_TOKENS
- CONJUNCTION
- ASSIGNMENT
- DISJUNCTION
- EQUALITY
- COMPARISON
- BITWISE
- TERM
- FACTOR
- EXPONENT
- TIMES
- TIMESTAMPS
- SET_OPERATIONS
- JOIN_METHODS
- JOIN_SIDES
- JOIN_KINDS
- LAMBDAS
- EXPRESSION_PARSERS
- UNARY_PARSERS
- STRING_PARSERS
- NUMERIC_PARSERS
- PRIMARY_PARSERS
- PLACEHOLDER_PARSERS
- PROPERTY_PARSERS
- CONSTRAINT_PARSERS
- ALTER_PARSERS
- ALTER_ALTER_PARSERS
- SCHEMA_UNNAMED_CONSTRAINTS
- NO_PAREN_FUNCTION_PARSERS
- INVALID_FUNC_NAME_TOKENS
- FUNCTIONS_WITH_ALIASED_ARGS
- KEY_VALUE_DEFINITIONS
- FUNCTION_PARSERS
- SET_PARSERS
- SHOW_PARSERS
- TYPE_LITERAL_PARSERS
- TYPE_CONVERTERS
- DDL_SELECT_TOKENS
- PRE_VOLATILE_TOKENS
- TRANSACTION_KIND
- TRANSACTION_CHARACTERISTICS
- CONFLICT_ACTIONS
- CREATE_SEQUENCE
- ISOLATED_LOADING_OPTIONS
- USABLES
- CAST_ACTIONS
- SCHEMA_BINDING_OPTIONS
- KEY_CONSTRAINT_OPTIONS
- INSERT_ALTERNATIVES
- CLONE_KEYWORDS
- HISTORICAL_DATA_PREFIX
- HISTORICAL_DATA_KIND
- OPCLASS_FOLLOW_KEYWORDS
- OPTYPE_FOLLOW_TOKENS
- TABLE_INDEX_HINT_TOKENS
- VIEW_ATTRIBUTES
- WINDOW_ALIAS_TOKENS
- WINDOW_BEFORE_PAREN_TOKENS
- WINDOW_SIDES
- JSON_KEY_VALUE_SEPARATOR_TOKENS
- FETCH_TOKENS
- ADD_CONSTRAINT_TOKENS
- DISTINCT_TOKENS
- NULL_TOKENS
- UNNEST_OFFSET_ALIAS_TOKENS
- SELECT_START_TOKENS
- COPY_INTO_VARLEN_OPTIONS
- STRICT_CAST
- PREFIXED_PIVOT_COLUMNS
- IDENTIFY_PIVOT_STRINGS
- TABLESAMPLE_CSV
- DEFAULT_SAMPLING_METHOD
- TRIM_PATTERN_FIRST
- MODIFIERS_ATTACHED_TO_SET_OP
- SET_OP_MODIFIERS
- JSON_ARROWS_REQUIRE_JSON_TYPE
- COLON_IS_VARIANT_EXTRACT
- VALUES_FOLLOWED_BY_PAREN
- SUPPORTS_IMPLICIT_UNNEST
- INTERVAL_SPANS
- SUPPORTS_PARTITION_SELECTION
- error_level
- error_message_context
- max_errors
- dialect
- reset
- parse
- parse_into
- check_errors
- raise_error
- expression
- validate_expression
- errors
- sql
773 class Generator(generator.Generator): 774 LIMIT_IS_TOP = True 775 QUERY_HINTS = False 776 RETURNING_END = False 777 NVL2_SUPPORTED = False 778 ALTER_TABLE_INCLUDE_COLUMN_KEYWORD = False 779 LIMIT_FETCH = "FETCH" 780 COMPUTED_COLUMN_WITH_TYPE = False 781 CTE_RECURSIVE_KEYWORD_REQUIRED = False 782 ENSURE_BOOLS = True 783 NULL_ORDERING_SUPPORTED = None 784 SUPPORTS_SINGLE_ARG_CONCAT = False 785 TABLESAMPLE_SEED_KEYWORD = "REPEATABLE" 786 SUPPORTS_SELECT_INTO = True 787 JSON_PATH_BRACKETED_KEY_SUPPORTED = False 788 SUPPORTS_TO_NUMBER = False 789 SET_OP_MODIFIERS = False 790 COPY_PARAMS_EQ_REQUIRED = True 791 PARSE_JSON_NAME = None 792 793 EXPRESSIONS_WITHOUT_NESTED_CTES = { 794 exp.Delete, 795 exp.Insert, 796 exp.Intersect, 797 exp.Except, 798 exp.Merge, 799 exp.Select, 800 exp.Subquery, 801 exp.Union, 802 exp.Update, 803 } 804 805 SUPPORTED_JSON_PATH_PARTS = { 806 exp.JSONPathKey, 807 exp.JSONPathRoot, 808 exp.JSONPathSubscript, 809 } 810 811 TYPE_MAPPING = { 812 **generator.Generator.TYPE_MAPPING, 813 exp.DataType.Type.BOOLEAN: "BIT", 814 exp.DataType.Type.DECIMAL: "NUMERIC", 815 exp.DataType.Type.DATETIME: "DATETIME2", 816 exp.DataType.Type.DOUBLE: "FLOAT", 817 exp.DataType.Type.INT: "INTEGER", 818 exp.DataType.Type.ROWVERSION: "ROWVERSION", 819 exp.DataType.Type.TEXT: "VARCHAR(MAX)", 820 exp.DataType.Type.TIMESTAMP: "DATETIME2", 821 exp.DataType.Type.TIMESTAMPTZ: "DATETIMEOFFSET", 822 exp.DataType.Type.UTINYINT: "TINYINT", 823 exp.DataType.Type.VARIANT: "SQL_VARIANT", 824 } 825 826 TYPE_MAPPING.pop(exp.DataType.Type.NCHAR) 827 TYPE_MAPPING.pop(exp.DataType.Type.NVARCHAR) 828 829 TRANSFORMS = { 830 **generator.Generator.TRANSFORMS, 831 exp.AnyValue: any_value_to_max_sql, 832 exp.ArrayToString: rename_func("STRING_AGG"), 833 exp.AutoIncrementColumnConstraint: lambda *_: "IDENTITY", 834 exp.DateAdd: date_delta_sql("DATEADD"), 835 exp.DateDiff: date_delta_sql("DATEDIFF"), 836 exp.CTE: transforms.preprocess([qualify_derived_table_outputs]), 837 exp.CurrentDate: rename_func("GETDATE"), 838 exp.CurrentTimestamp: rename_func("GETDATE"), 839 exp.DateStrToDate: datestrtodate_sql, 840 exp.Extract: rename_func("DATEPART"), 841 exp.GeneratedAsIdentityColumnConstraint: generatedasidentitycolumnconstraint_sql, 842 exp.GroupConcat: _string_agg_sql, 843 exp.If: rename_func("IIF"), 844 exp.JSONExtract: _json_extract_sql, 845 exp.JSONExtractScalar: _json_extract_sql, 846 exp.LastDay: lambda self, e: self.func("EOMONTH", e.this), 847 exp.Max: max_or_greatest, 848 exp.MD5: lambda self, e: self.func("HASHBYTES", exp.Literal.string("MD5"), e.this), 849 exp.Min: min_or_least, 850 exp.NumberToStr: _format_sql, 851 exp.Repeat: rename_func("REPLICATE"), 852 exp.Select: transforms.preprocess( 853 [ 854 transforms.eliminate_distinct_on, 855 transforms.eliminate_semi_and_anti_joins, 856 transforms.eliminate_qualify, 857 ] 858 ), 859 exp.Stddev: rename_func("STDEV"), 860 exp.StrPosition: lambda self, e: self.func( 861 "CHARINDEX", e.args.get("substr"), e.this, e.args.get("position") 862 ), 863 exp.Subquery: transforms.preprocess([qualify_derived_table_outputs]), 864 exp.SHA: lambda self, e: self.func("HASHBYTES", exp.Literal.string("SHA1"), e.this), 865 exp.SHA2: lambda self, e: self.func( 866 "HASHBYTES", exp.Literal.string(f"SHA2_{e.args.get('length', 256)}"), e.this 867 ), 868 exp.TemporaryProperty: lambda self, e: "", 869 exp.TimeStrToTime: lambda self, e: self.sql( 870 exp.cast(e.this, exp.DataType.Type.DATETIME) 871 ), 872 exp.TimeToStr: _format_sql, 873 exp.Trim: trim_sql, 874 exp.TsOrDsAdd: date_delta_sql("DATEADD", cast=True), 875 exp.TsOrDsDiff: date_delta_sql("DATEDIFF"), 876 } 877 878 TRANSFORMS.pop(exp.ReturnsProperty) 879 880 PROPERTIES_LOCATION = { 881 **generator.Generator.PROPERTIES_LOCATION, 882 exp.VolatileProperty: exp.Properties.Location.UNSUPPORTED, 883 } 884 885 def scope_resolution(self, rhs: str, scope_name: str) -> str: 886 return f"{scope_name}::{rhs}" 887 888 def select_sql(self, expression: exp.Select) -> str: 889 if expression.args.get("offset"): 890 if not expression.args.get("order"): 891 # ORDER BY is required in order to use OFFSET in a query, so we use 892 # a noop order by, since we don't really care about the order. 893 # See: https://www.microsoftpressstore.com/articles/article.aspx?p=2314819 894 expression.order_by(exp.select(exp.null()).subquery(), copy=False) 895 896 limit = expression.args.get("limit") 897 if isinstance(limit, exp.Limit): 898 # TOP and OFFSET can't be combined, we need use FETCH instead of TOP 899 # we replace here because otherwise TOP would be generated in select_sql 900 limit.replace(exp.Fetch(direction="FIRST", count=limit.expression)) 901 902 return super().select_sql(expression) 903 904 def convert_sql(self, expression: exp.Convert) -> str: 905 name = "TRY_CONVERT" if expression.args.get("safe") else "CONVERT" 906 return self.func( 907 name, expression.this, expression.expression, expression.args.get("style") 908 ) 909 910 def queryoption_sql(self, expression: exp.QueryOption) -> str: 911 option = self.sql(expression, "this") 912 value = self.sql(expression, "expression") 913 if value: 914 optional_equal_sign = "= " if option in OPTIONS_THAT_REQUIRE_EQUAL else "" 915 return f"{option} {optional_equal_sign}{value}" 916 return option 917 918 def lateral_op(self, expression: exp.Lateral) -> str: 919 cross_apply = expression.args.get("cross_apply") 920 if cross_apply is True: 921 return "CROSS APPLY" 922 if cross_apply is False: 923 return "OUTER APPLY" 924 925 # TODO: perhaps we can check if the parent is a Join and transpile it appropriately 926 self.unsupported("LATERAL clause is not supported.") 927 return "LATERAL" 928 929 def timefromparts_sql(self, expression: exp.TimeFromParts) -> str: 930 nano = expression.args.get("nano") 931 if nano is not None: 932 nano.pop() 933 self.unsupported("Specifying nanoseconds is not supported in TIMEFROMPARTS.") 934 935 if expression.args.get("fractions") is None: 936 expression.set("fractions", exp.Literal.number(0)) 937 if expression.args.get("precision") is None: 938 expression.set("precision", exp.Literal.number(0)) 939 940 return rename_func("TIMEFROMPARTS")(self, expression) 941 942 def timestampfromparts_sql(self, expression: exp.TimestampFromParts) -> str: 943 zone = expression.args.get("zone") 944 if zone is not None: 945 zone.pop() 946 self.unsupported("Time zone is not supported in DATETIMEFROMPARTS.") 947 948 nano = expression.args.get("nano") 949 if nano is not None: 950 nano.pop() 951 self.unsupported("Specifying nanoseconds is not supported in DATETIMEFROMPARTS.") 952 953 if expression.args.get("milli") is None: 954 expression.set("milli", exp.Literal.number(0)) 955 956 return rename_func("DATETIMEFROMPARTS")(self, expression) 957 958 def setitem_sql(self, expression: exp.SetItem) -> str: 959 this = expression.this 960 if isinstance(this, exp.EQ) and not isinstance(this.left, exp.Parameter): 961 # T-SQL does not use '=' in SET command, except when the LHS is a variable. 962 return f"{self.sql(this.left)} {self.sql(this.right)}" 963 964 return super().setitem_sql(expression) 965 966 def boolean_sql(self, expression: exp.Boolean) -> str: 967 if type(expression.parent) in BIT_TYPES: 968 return "1" if expression.this else "0" 969 970 return "(1 = 1)" if expression.this else "(1 = 0)" 971 972 def is_sql(self, expression: exp.Is) -> str: 973 if isinstance(expression.expression, exp.Boolean): 974 return self.binary(expression, "=") 975 return self.binary(expression, "IS") 976 977 def createable_sql(self, expression: exp.Create, locations: t.DefaultDict) -> str: 978 sql = self.sql(expression, "this") 979 properties = expression.args.get("properties") 980 981 if sql[:1] != "#" and any( 982 isinstance(prop, exp.TemporaryProperty) 983 for prop in (properties.expressions if properties else []) 984 ): 985 sql = f"[#{sql[1:]}" if sql.startswith("[") else f"#{sql}" 986 987 return sql 988 989 def create_sql(self, expression: exp.Create) -> str: 990 kind = expression.kind 991 exists = expression.args.pop("exists", None) 992 993 if kind == "VIEW": 994 expression.this.set("catalog", None) 995 996 sql = super().create_sql(expression) 997 998 like_property = expression.find(exp.LikeProperty) 999 if like_property: 1000 ctas_expression = like_property.this 1001 else: 1002 ctas_expression = expression.expression 1003 1004 table = expression.find(exp.Table) 1005 1006 # Convert CTAS statement to SELECT .. INTO .. 1007 if kind == "TABLE" and ctas_expression: 1008 ctas_with = ctas_expression.args.get("with") 1009 if ctas_with: 1010 ctas_with = ctas_with.pop() 1011 1012 if isinstance(ctas_expression, exp.UNWRAPPED_QUERIES): 1013 ctas_expression = ctas_expression.subquery() 1014 1015 select_into = exp.select("*").from_(exp.alias_(ctas_expression, "temp", table=True)) 1016 select_into.set("into", exp.Into(this=table)) 1017 select_into.set("with", ctas_with) 1018 1019 if like_property: 1020 select_into.limit(0, copy=False) 1021 1022 sql = self.sql(select_into) 1023 1024 if exists: 1025 identifier = self.sql(exp.Literal.string(exp.table_name(table) if table else "")) 1026 sql = self.sql(exp.Literal.string(sql)) 1027 if kind == "SCHEMA": 1028 sql = f"""IF NOT EXISTS (SELECT * FROM information_schema.schemata WHERE schema_name = {identifier}) EXEC({sql})""" 1029 elif kind == "TABLE": 1030 assert table 1031 where = exp.and_( 1032 exp.column("table_name").eq(table.name), 1033 exp.column("table_schema").eq(table.db) if table.db else None, 1034 exp.column("table_catalog").eq(table.catalog) if table.catalog else None, 1035 ) 1036 sql = f"""IF NOT EXISTS (SELECT * FROM information_schema.tables WHERE {where}) EXEC({sql})""" 1037 elif kind == "INDEX": 1038 index = self.sql(exp.Literal.string(expression.this.text("this"))) 1039 sql = f"""IF NOT EXISTS (SELECT * FROM sys.indexes WHERE object_id = object_id({identifier}) AND name = {index}) EXEC({sql})""" 1040 elif expression.args.get("replace"): 1041 sql = sql.replace("CREATE OR REPLACE ", "CREATE OR ALTER ", 1) 1042 1043 return self.prepend_ctes(expression, sql) 1044 1045 def offset_sql(self, expression: exp.Offset) -> str: 1046 return f"{super().offset_sql(expression)} ROWS" 1047 1048 def version_sql(self, expression: exp.Version) -> str: 1049 name = "SYSTEM_TIME" if expression.name == "TIMESTAMP" else expression.name 1050 this = f"FOR {name}" 1051 expr = expression.expression 1052 kind = expression.text("kind") 1053 if kind in ("FROM", "BETWEEN"): 1054 args = expr.expressions 1055 sep = "TO" if kind == "FROM" else "AND" 1056 expr_sql = f"{self.sql(seq_get(args, 0))} {sep} {self.sql(seq_get(args, 1))}" 1057 else: 1058 expr_sql = self.sql(expr) 1059 1060 expr_sql = f" {expr_sql}" if expr_sql else "" 1061 return f"{this} {kind}{expr_sql}" 1062 1063 def returnsproperty_sql(self, expression: exp.ReturnsProperty) -> str: 1064 table = expression.args.get("table") 1065 table = f"{table} " if table else "" 1066 return f"RETURNS {table}{self.sql(expression, 'this')}" 1067 1068 def returning_sql(self, expression: exp.Returning) -> str: 1069 into = self.sql(expression, "into") 1070 into = self.seg(f"INTO {into}") if into else "" 1071 return f"{self.seg('OUTPUT')} {self.expressions(expression, flat=True)}{into}" 1072 1073 def transaction_sql(self, expression: exp.Transaction) -> str: 1074 this = self.sql(expression, "this") 1075 this = f" {this}" if this else "" 1076 mark = self.sql(expression, "mark") 1077 mark = f" WITH MARK {mark}" if mark else "" 1078 return f"BEGIN TRANSACTION{this}{mark}" 1079 1080 def commit_sql(self, expression: exp.Commit) -> str: 1081 this = self.sql(expression, "this") 1082 this = f" {this}" if this else "" 1083 durability = expression.args.get("durability") 1084 durability = ( 1085 f" WITH (DELAYED_DURABILITY = {'ON' if durability else 'OFF'})" 1086 if durability is not None 1087 else "" 1088 ) 1089 return f"COMMIT TRANSACTION{this}{durability}" 1090 1091 def rollback_sql(self, expression: exp.Rollback) -> str: 1092 this = self.sql(expression, "this") 1093 this = f" {this}" if this else "" 1094 return f"ROLLBACK TRANSACTION{this}" 1095 1096 def identifier_sql(self, expression: exp.Identifier) -> str: 1097 identifier = super().identifier_sql(expression) 1098 1099 if expression.args.get("global"): 1100 identifier = f"##{identifier}" 1101 elif expression.args.get("temporary"): 1102 identifier = f"#{identifier}" 1103 1104 return identifier 1105 1106 def constraint_sql(self, expression: exp.Constraint) -> str: 1107 this = self.sql(expression, "this") 1108 expressions = self.expressions(expression, flat=True, sep=" ") 1109 return f"CONSTRAINT {this} {expressions}" 1110 1111 def length_sql(self, expression: exp.Length) -> str: 1112 return self._uncast_text(expression, "LEN") 1113 1114 def right_sql(self, expression: exp.Right) -> str: 1115 return self._uncast_text(expression, "RIGHT") 1116 1117 def left_sql(self, expression: exp.Left) -> str: 1118 return self._uncast_text(expression, "LEFT") 1119 1120 def _uncast_text(self, expression: exp.Expression, name: str) -> str: 1121 this = expression.this 1122 if isinstance(this, exp.Cast) and this.is_type(exp.DataType.Type.TEXT): 1123 this_sql = self.sql(this, "this") 1124 else: 1125 this_sql = self.sql(this) 1126 expression_sql = self.sql(expression, "expression") 1127 return self.func(name, this_sql, expression_sql if expression_sql else None) 1128 1129 def partition_sql(self, expression: exp.Partition) -> str: 1130 return f"WITH (PARTITIONS({self.expressions(expression, flat=True)}))" 1131 1132 def altertable_sql(self, expression: exp.AlterTable) -> str: 1133 action = seq_get(expression.args.get("actions") or [], 0) 1134 if isinstance(action, exp.RenameTable): 1135 return f"EXEC sp_rename '{self.sql(expression.this)}', '{action.this.name}'" 1136 return super().altertable_sql(expression) 1137 1138 def drop_sql(self, expression: exp.Drop) -> str: 1139 if expression.args["kind"] == "VIEW": 1140 expression.this.set("catalog", None) 1141 return super().drop_sql(expression) 1142 1143 def declare_sql(self, expression: exp.Declare) -> str: 1144 return f"DECLARE {self.expressions(expression, flat=True)}" 1145 1146 def declareitem_sql(self, expression: exp.DeclareItem) -> str: 1147 variable = self.sql(expression, "this") 1148 default = self.sql(expression, "default") 1149 default = f" = {default}" if default else "" 1150 1151 kind = self.sql(expression, "kind") 1152 if isinstance(expression.args.get("kind"), exp.Schema): 1153 kind = f"TABLE {kind}" 1154 1155 return f"{variable} AS {kind}{default}" 1156 1157 def options_modifier(self, expression: exp.Expression) -> str: 1158 options = self.expressions(expression, key="options") 1159 return f" OPTION{self.wrap(options)}" if options else ""
Generator converts a given syntax tree to the corresponding SQL string.
Arguments:
- pretty: Whether to format the produced SQL string. Default: False.
- identify: Determines when an identifier should be quoted. Possible values are: False (default): Never quote, except in cases where it's mandatory by the dialect. True or 'always': Always quote. 'safe': Only quote identifiers that are case insensitive.
- normalize: Whether to normalize identifiers to lowercase. Default: False.
- pad: The pad size in a formatted string. For example, this affects the indentation of a projection in a query, relative to its nesting level. Default: 2.
- indent: The indentation size in a formatted string. For example, this affects the
indentation of subqueries and filters under a
WHERE
clause. Default: 2. - normalize_functions: How to normalize function names. Possible values are: "upper" or True (default): Convert names to uppercase. "lower": Convert names to lowercase. False: Disables function name normalization.
- unsupported_level: Determines the generator's behavior when it encounters unsupported expressions. Default ErrorLevel.WARN.
- max_unsupported: Maximum number of unsupported messages to include in a raised UnsupportedError. This is only relevant if unsupported_level is ErrorLevel.RAISE. Default: 3
- leading_comma: Whether the comma is leading or trailing in select expressions. This is only relevant when generating in pretty mode. Default: False
- max_text_width: The max number of characters in a segment before creating new lines in pretty mode. The default is on the smaller end because the length only represents a segment and not the true line length. Default: 80
- comments: Whether to preserve comments in the output SQL code. Default: True
888 def select_sql(self, expression: exp.Select) -> str: 889 if expression.args.get("offset"): 890 if not expression.args.get("order"): 891 # ORDER BY is required in order to use OFFSET in a query, so we use 892 # a noop order by, since we don't really care about the order. 893 # See: https://www.microsoftpressstore.com/articles/article.aspx?p=2314819 894 expression.order_by(exp.select(exp.null()).subquery(), copy=False) 895 896 limit = expression.args.get("limit") 897 if isinstance(limit, exp.Limit): 898 # TOP and OFFSET can't be combined, we need use FETCH instead of TOP 899 # we replace here because otherwise TOP would be generated in select_sql 900 limit.replace(exp.Fetch(direction="FIRST", count=limit.expression)) 901 902 return super().select_sql(expression)
910 def queryoption_sql(self, expression: exp.QueryOption) -> str: 911 option = self.sql(expression, "this") 912 value = self.sql(expression, "expression") 913 if value: 914 optional_equal_sign = "= " if option in OPTIONS_THAT_REQUIRE_EQUAL else "" 915 return f"{option} {optional_equal_sign}{value}" 916 return option
918 def lateral_op(self, expression: exp.Lateral) -> str: 919 cross_apply = expression.args.get("cross_apply") 920 if cross_apply is True: 921 return "CROSS APPLY" 922 if cross_apply is False: 923 return "OUTER APPLY" 924 925 # TODO: perhaps we can check if the parent is a Join and transpile it appropriately 926 self.unsupported("LATERAL clause is not supported.") 927 return "LATERAL"
929 def timefromparts_sql(self, expression: exp.TimeFromParts) -> str: 930 nano = expression.args.get("nano") 931 if nano is not None: 932 nano.pop() 933 self.unsupported("Specifying nanoseconds is not supported in TIMEFROMPARTS.") 934 935 if expression.args.get("fractions") is None: 936 expression.set("fractions", exp.Literal.number(0)) 937 if expression.args.get("precision") is None: 938 expression.set("precision", exp.Literal.number(0)) 939 940 return rename_func("TIMEFROMPARTS")(self, expression)
942 def timestampfromparts_sql(self, expression: exp.TimestampFromParts) -> str: 943 zone = expression.args.get("zone") 944 if zone is not None: 945 zone.pop() 946 self.unsupported("Time zone is not supported in DATETIMEFROMPARTS.") 947 948 nano = expression.args.get("nano") 949 if nano is not None: 950 nano.pop() 951 self.unsupported("Specifying nanoseconds is not supported in DATETIMEFROMPARTS.") 952 953 if expression.args.get("milli") is None: 954 expression.set("milli", exp.Literal.number(0)) 955 956 return rename_func("DATETIMEFROMPARTS")(self, expression)
958 def setitem_sql(self, expression: exp.SetItem) -> str: 959 this = expression.this 960 if isinstance(this, exp.EQ) and not isinstance(this.left, exp.Parameter): 961 # T-SQL does not use '=' in SET command, except when the LHS is a variable. 962 return f"{self.sql(this.left)} {self.sql(this.right)}" 963 964 return super().setitem_sql(expression)
977 def createable_sql(self, expression: exp.Create, locations: t.DefaultDict) -> str: 978 sql = self.sql(expression, "this") 979 properties = expression.args.get("properties") 980 981 if sql[:1] != "#" and any( 982 isinstance(prop, exp.TemporaryProperty) 983 for prop in (properties.expressions if properties else []) 984 ): 985 sql = f"[#{sql[1:]}" if sql.startswith("[") else f"#{sql}" 986 987 return sql
989 def create_sql(self, expression: exp.Create) -> str: 990 kind = expression.kind 991 exists = expression.args.pop("exists", None) 992 993 if kind == "VIEW": 994 expression.this.set("catalog", None) 995 996 sql = super().create_sql(expression) 997 998 like_property = expression.find(exp.LikeProperty) 999 if like_property: 1000 ctas_expression = like_property.this 1001 else: 1002 ctas_expression = expression.expression 1003 1004 table = expression.find(exp.Table) 1005 1006 # Convert CTAS statement to SELECT .. INTO .. 1007 if kind == "TABLE" and ctas_expression: 1008 ctas_with = ctas_expression.args.get("with") 1009 if ctas_with: 1010 ctas_with = ctas_with.pop() 1011 1012 if isinstance(ctas_expression, exp.UNWRAPPED_QUERIES): 1013 ctas_expression = ctas_expression.subquery() 1014 1015 select_into = exp.select("*").from_(exp.alias_(ctas_expression, "temp", table=True)) 1016 select_into.set("into", exp.Into(this=table)) 1017 select_into.set("with", ctas_with) 1018 1019 if like_property: 1020 select_into.limit(0, copy=False) 1021 1022 sql = self.sql(select_into) 1023 1024 if exists: 1025 identifier = self.sql(exp.Literal.string(exp.table_name(table) if table else "")) 1026 sql = self.sql(exp.Literal.string(sql)) 1027 if kind == "SCHEMA": 1028 sql = f"""IF NOT EXISTS (SELECT * FROM information_schema.schemata WHERE schema_name = {identifier}) EXEC({sql})""" 1029 elif kind == "TABLE": 1030 assert table 1031 where = exp.and_( 1032 exp.column("table_name").eq(table.name), 1033 exp.column("table_schema").eq(table.db) if table.db else None, 1034 exp.column("table_catalog").eq(table.catalog) if table.catalog else None, 1035 ) 1036 sql = f"""IF NOT EXISTS (SELECT * FROM information_schema.tables WHERE {where}) EXEC({sql})""" 1037 elif kind == "INDEX": 1038 index = self.sql(exp.Literal.string(expression.this.text("this"))) 1039 sql = f"""IF NOT EXISTS (SELECT * FROM sys.indexes WHERE object_id = object_id({identifier}) AND name = {index}) EXEC({sql})""" 1040 elif expression.args.get("replace"): 1041 sql = sql.replace("CREATE OR REPLACE ", "CREATE OR ALTER ", 1) 1042 1043 return self.prepend_ctes(expression, sql)
1048 def version_sql(self, expression: exp.Version) -> str: 1049 name = "SYSTEM_TIME" if expression.name == "TIMESTAMP" else expression.name 1050 this = f"FOR {name}" 1051 expr = expression.expression 1052 kind = expression.text("kind") 1053 if kind in ("FROM", "BETWEEN"): 1054 args = expr.expressions 1055 sep = "TO" if kind == "FROM" else "AND" 1056 expr_sql = f"{self.sql(seq_get(args, 0))} {sep} {self.sql(seq_get(args, 1))}" 1057 else: 1058 expr_sql = self.sql(expr) 1059 1060 expr_sql = f" {expr_sql}" if expr_sql else "" 1061 return f"{this} {kind}{expr_sql}"
1080 def commit_sql(self, expression: exp.Commit) -> str: 1081 this = self.sql(expression, "this") 1082 this = f" {this}" if this else "" 1083 durability = expression.args.get("durability") 1084 durability = ( 1085 f" WITH (DELAYED_DURABILITY = {'ON' if durability else 'OFF'})" 1086 if durability is not None 1087 else "" 1088 ) 1089 return f"COMMIT TRANSACTION{this}{durability}"
1096 def identifier_sql(self, expression: exp.Identifier) -> str: 1097 identifier = super().identifier_sql(expression) 1098 1099 if expression.args.get("global"): 1100 identifier = f"##{identifier}" 1101 elif expression.args.get("temporary"): 1102 identifier = f"#{identifier}" 1103 1104 return identifier
1132 def altertable_sql(self, expression: exp.AlterTable) -> str: 1133 action = seq_get(expression.args.get("actions") or [], 0) 1134 if isinstance(action, exp.RenameTable): 1135 return f"EXEC sp_rename '{self.sql(expression.this)}', '{action.this.name}'" 1136 return super().altertable_sql(expression)
1146 def declareitem_sql(self, expression: exp.DeclareItem) -> str: 1147 variable = self.sql(expression, "this") 1148 default = self.sql(expression, "default") 1149 default = f" = {default}" if default else "" 1150 1151 kind = self.sql(expression, "kind") 1152 if isinstance(expression.args.get("kind"), exp.Schema): 1153 kind = f"TABLE {kind}" 1154 1155 return f"{variable} AS {kind}{default}"
Inherited Members
- sqlglot.generator.Generator
- Generator
- IGNORE_NULLS_IN_FUNC
- LOCKING_READS_SUPPORTED
- EXPLICIT_SET_OP
- WRAP_DERIVED_VALUES
- CREATE_FUNCTION_RETURN_AS
- MATCHED_BY_SOURCE
- SINGLE_STRING_INTERVAL
- INTERVAL_ALLOWS_PLURAL_FORM
- LIMIT_ONLY_LITERALS
- RENAME_TABLE_WITH_DB
- GROUPINGS_SEP
- INDEX_ON
- JOIN_HINTS
- TABLE_HINTS
- QUERY_HINT_SEP
- IS_BOOL_ALLOWED
- DUPLICATE_KEY_UPDATE_WITH_SET
- EXTRACT_ALLOWS_QUOTES
- TZ_TO_WITH_TIME_ZONE
- VALUES_AS_TABLE
- UNNEST_WITH_ORDINALITY
- AGGREGATE_FILTER_SUPPORTED
- SEMI_ANTI_JOIN_WITH_SIDE
- SUPPORTS_TABLE_COPY
- TABLESAMPLE_REQUIRES_PARENS
- TABLESAMPLE_SIZE_IS_ROWS
- TABLESAMPLE_KEYWORDS
- TABLESAMPLE_WITH_METHOD
- COLLATE_IS_FUNC
- DATA_TYPE_SPECIFIERS_ALLOWED
- LAST_DAY_SUPPORTS_DATE_PART
- SUPPORTS_TABLE_ALIAS_COLUMNS
- UNPIVOT_ALIASES_ARE_IDENTIFIERS
- JSON_KEY_VALUE_PAIR_SEP
- INSERT_OVERWRITE
- SUPPORTS_UNLOGGED_TABLES
- SUPPORTS_CREATE_TABLE_LIKE
- LIKE_PROPERTY_INSIDE_SCHEMA
- MULTI_ARG_DISTINCT
- JSON_TYPE_REQUIRED_FOR_EXTRACTION
- JSON_PATH_SINGLE_QUOTE_ESCAPE
- CAN_IMPLEMENT_ARRAY_ANY
- COPY_PARAMS_ARE_WRAPPED
- COPY_HAS_INTO_KEYWORD
- STAR_EXCEPT
- HEX_FUNC
- WITH_PROPERTIES_PREFIX
- QUOTE_JSON_PATH
- PAD_FILL_PATTERN_IS_REQUIRED
- TIME_PART_SINGULARS
- TOKEN_MAPPING
- STRUCT_DELIMITER
- PARAMETER_TOKEN
- NAMED_PLACEHOLDER_TOKEN
- RESERVED_KEYWORDS
- WITH_SEPARATED_COMMENTS
- EXCLUDE_COMMENTS
- UNWRAPPED_INTERVAL_VALUES
- PARAMETERIZABLE_TEXT_TYPES
- SENTINEL_LINE_BREAK
- pretty
- identify
- normalize
- pad
- unsupported_level
- max_unsupported
- leading_comma
- max_text_width
- comments
- dialect
- normalize_functions
- unsupported_messages
- generate
- preprocess
- unsupported
- sep
- seg
- pad_comment
- maybe_comment
- wrap
- no_identify
- normalize_func
- indent
- sql
- uncache_sql
- cache_sql
- characterset_sql
- column_parts
- column_sql
- columnposition_sql
- columndef_sql
- columnconstraint_sql
- computedcolumnconstraint_sql
- autoincrementcolumnconstraint_sql
- compresscolumnconstraint_sql
- generatedasidentitycolumnconstraint_sql
- generatedasrowcolumnconstraint_sql
- periodforsystemtimeconstraint_sql
- notnullcolumnconstraint_sql
- transformcolumnconstraint_sql
- primarykeycolumnconstraint_sql
- uniquecolumnconstraint_sql
- sequenceproperties_sql
- clone_sql
- describe_sql
- heredoc_sql
- prepend_ctes
- with_sql
- cte_sql
- tablealias_sql
- bitstring_sql
- hexstring_sql
- bytestring_sql
- unicodestring_sql
- rawstring_sql
- datatypeparam_sql
- datatype_sql
- directory_sql
- delete_sql
- except_sql
- except_op
- fetch_sql
- filter_sql
- hint_sql
- indexparameters_sql
- index_sql
- hex_sql
- lowerhex_sql
- inputoutputformat_sql
- national_sql
- properties_sql
- root_properties
- properties
- with_properties
- locate_properties
- property_name
- property_sql
- likeproperty_sql
- fallbackproperty_sql
- journalproperty_sql
- freespaceproperty_sql
- checksumproperty_sql
- mergeblockratioproperty_sql
- datablocksizeproperty_sql
- blockcompressionproperty_sql
- isolatedloadingproperty_sql
- partitionboundspec_sql
- partitionedofproperty_sql
- lockingproperty_sql
- withdataproperty_sql
- withsystemversioningproperty_sql
- insert_sql
- intersect_sql
- intersect_op
- introducer_sql
- kill_sql
- pseudotype_sql
- objectidentifier_sql
- onconflict_sql
- rowformatdelimitedproperty_sql
- withtablehint_sql
- indextablehint_sql
- historicaldata_sql
- table_parts
- table_sql
- tablesample_sql
- pivot_sql
- tuple_sql
- update_sql
- values_sql
- var_sql
- into_sql
- from_sql
- group_sql
- having_sql
- connect_sql
- prior_sql
- join_sql
- lambda_sql
- lateral_sql
- limit_sql
- set_sql
- pragma_sql
- lock_sql
- literal_sql
- escape_str
- loaddata_sql
- null_sql
- order_sql
- withfill_sql
- cluster_sql
- distribute_sql
- sort_sql
- ordered_sql
- matchrecognizemeasure_sql
- matchrecognize_sql
- query_modifiers
- offset_limit_modifiers
- after_limit_modifiers
- schema_sql
- schema_columns_sql
- star_sql
- parameter_sql
- sessionparameter_sql
- placeholder_sql
- subquery_sql
- qualify_sql
- set_operations
- union_sql
- union_op
- unnest_sql
- prewhere_sql
- where_sql
- window_sql
- partition_by_sql
- windowspec_sql
- withingroup_sql
- between_sql
- bracket_offset_expressions
- bracket_sql
- all_sql
- any_sql
- exists_sql
- case_sql
- nextvaluefor_sql
- extract_sql
- trim_sql
- convert_concat_args
- concat_sql
- concatws_sql
- check_sql
- foreignkey_sql
- primarykey_sql
- if_sql
- matchagainst_sql
- jsonkeyvalue_sql
- jsonpath_sql
- json_path_part
- formatjson_sql
- jsonobject_sql
- jsonobjectagg_sql
- jsonarray_sql
- jsonarrayagg_sql
- jsoncolumndef_sql
- jsonschema_sql
- jsontable_sql
- openjsoncolumndef_sql
- openjson_sql
- in_sql
- in_unnest_op
- interval_sql
- return_sql
- reference_sql
- anonymous_sql
- paren_sql
- neg_sql
- not_sql
- alias_sql
- pivotalias_sql
- aliases_sql
- atindex_sql
- attimezone_sql
- fromtimezone_sql
- add_sql
- and_sql
- or_sql
- xor_sql
- connector_sql
- bitwiseand_sql
- bitwiseleftshift_sql
- bitwisenot_sql
- bitwiseor_sql
- bitwiserightshift_sql
- bitwisexor_sql
- cast_sql
- currentdate_sql
- currenttimestamp_sql
- collate_sql
- command_sql
- comment_sql
- mergetreettlaction_sql
- mergetreettl_sql
- altercolumn_sql
- alterdiststyle_sql
- altersortkey_sql
- renametable_sql
- renamecolumn_sql
- alterset_sql
- add_column_sql
- droppartition_sql
- addconstraint_sql
- distinct_sql
- ignorenulls_sql
- respectnulls_sql
- havingmax_sql
- intdiv_sql
- dpipe_sql
- div_sql
- overlaps_sql
- distance_sql
- dot_sql
- eq_sql
- propertyeq_sql
- escape_sql
- glob_sql
- gt_sql
- gte_sql
- ilike_sql
- ilikeany_sql
- like_sql
- likeany_sql
- similarto_sql
- lt_sql
- lte_sql
- mod_sql
- mul_sql
- neq_sql
- nullsafeeq_sql
- nullsafeneq_sql
- slice_sql
- sub_sql
- trycast_sql
- try_sql
- log_sql
- use_sql
- binary
- function_fallback_sql
- func
- format_args
- too_wide
- format_time
- expressions
- op_expressions
- naked_property
- tag_sql
- token_sql
- userdefinedfunction_sql
- joinhint_sql
- kwarg_sql
- when_sql
- merge_sql
- tochar_sql
- tonumber_sql
- dictproperty_sql
- dictrange_sql
- dictsubproperty_sql
- oncluster_sql
- clusteredbyproperty_sql
- anyvalue_sql
- querytransform_sql
- indexconstraintoption_sql
- checkcolumnconstraint_sql
- indexcolumnconstraint_sql
- nvl2_sql
- comprehension_sql
- columnprefix_sql
- opclass_sql
- predict_sql
- forin_sql
- refresh_sql
- operator_sql
- toarray_sql
- tsordstotime_sql
- tsordstotimestamp_sql
- tsordstodate_sql
- unixdate_sql
- lastday_sql
- dateadd_sql
- arrayany_sql
- generateseries_sql
- struct_sql
- partitionrange_sql
- truncatetable_sql
- copyparameter_sql
- credentials_sql
- copy_sql
- semicolon_sql
- datadeletionproperty_sql
- maskingpolicycolumnconstraint_sql
- gapfill_sql
- scoperesolution_sql
- parsejson_sql
- rand_sql
- strtodate_sql
- strtotime_sql
- changes_sql
- pad_sql