sqlglot.generators.clickhouse
from __future__ import annotations

import datetime
import typing as t

from sqlglot import exp, generator
from sqlglot.dialects.dialect import (
    arg_max_or_min_no_count,
    inline_array_sql,
    jarowinkler_similarity,
    json_extract_segments,
    json_path_key_only_name,
    length_or_char_length_sql,
    no_pivot_sql,
    rename_func,
    remove_from_array_using_filter,
    sha256_sql,
    strposition_sql,
    var_map_sql,
    unit_to_str,
    unit_to_var,
    trim_sql,
    sha2_digest_sql,
)
from sqlglot.generator import unsupported_args
from sqlglot.helper import is_int
from collections import defaultdict

# Expression types rendered by the shared date/time delta generator.
DATETIME_DELTA = t.Union[exp.DateAdd, exp.DateDiff, exp.DateSub, exp.TimestampSub, exp.TimestampAdd]


def _unix_to_time_sql(self: ClickHouseGenerator, expression: exp.UnixToTime) -> str:
    """Render `UnixToTime` as one of ClickHouse's `fromUnixTimestamp*` functions.

    The function name is chosen from the expression's `scale` argument; the
    timestamp operand is always cast to BIGINT first. A scale that is none of
    the predefined constants divides the timestamp by `POW(10, scale)` and
    uses the plain seconds-based function.
    """
    operand = expression.this
    scale = expression.args.get("scale")

    if scale is None or scale == exp.UnixToTime.SECONDS:
        func_name = "fromUnixTimestamp"
    elif scale == exp.UnixToTime.MILLIS:
        func_name = "fromUnixTimestamp64Milli"
    elif scale == exp.UnixToTime.MICROS:
        func_name = "fromUnixTimestamp64Micro"
    elif scale == exp.UnixToTime.NANOS:
        func_name = "fromUnixTimestamp64Nano"
    else:
        # Arbitrary scale: bring the value down to seconds before converting.
        operand = exp.Div(this=operand, expression=exp.func("POW", 10, scale))
        func_name = "fromUnixTimestamp"

    return self.func(func_name, exp.cast(operand, exp.DType.BIGINT))


def _lower_func(sql: str) -> str:
    """Lower-case everything before the first `(` in `sql`, leaving the rest as is.

    Raises:
        ValueError: if `sql` contains no opening parenthesis.
    """
    paren_at = sql.index("(")
    head, tail = sql[:paren_at], sql[paren_at:]
    return f"{head.lower()}{tail}"


def _quantile_sql(self: ClickHouseGenerator, expression: exp.Quantile) -> str:
    """Render `Quantile` in parametric form: `quantile(level)(x)` or `quantiles(l1, ...)(x)`.

    An array-valued `quantile` argument selects the plural `quantiles` function
    with the array's items spread as its parameters.
    """
    level = expression.args["quantile"]
    operand_sql = f"({self.sql(expression, 'this')})"

    call_sql = (
        self.func("quantiles", *level)
        if isinstance(level, exp.Array)
        else self.func("quantile", level)
    )

    return call_sql + operand_sql


def _datetime_delta_sql(name: str) -> t.Callable[[generator.Generator, DATETIME_DELTA], str]:
    """Build a generator callback that renders a date/time delta expression as `name(...)`.

    When the expression carries no unit, rendering is delegated to
    `rename_func(name)`. Otherwise the call is emitted with its arguments in
    the order: unit, `expression.expression`, `expression.this`, `zone`.
    """

    def _delta_sql(self: generator.Generator, expression: DATETIME_DELTA) -> str:
        if not expression.unit:
            return rename_func(name)(self, expression)

        return self.func(
            name,
            unit_to_var(expression),
            expression.expression,
            expression.this,
            expression.args.get("zone"),
        )

    return _delta_sql


def _timestrtotime_sql(self: ClickHouseGenerator, expression: exp.TimeStrToTime) -> str:
    """Render `TimeStrToTime` as a cast to a non-nullable `DateTime64(6[, zone])`.

    When a zone is given and the operand is a string literal, the literal is
    re-parsed and its UTC offset is dropped, so the zone is only expressed
    through the data type parameter.
    """
    ts = expression.this

    tz = expression.args.get("zone")
    if tz and isinstance(ts, exp.Literal):
        # Clickhouse will not accept timestamps that include a UTC offset, so we must remove them.
        # The first step to removing is parsing the string with `datetime.datetime.fromisoformat`.
        #
        # In python <3.11, `fromisoformat()` can only parse timestamps of millisecond (3 digit)
        # or microsecond (6 digit) precision. It will error if passed any other number of fractional
        # digits, so we extract the fractional seconds and pad to 6 digits before parsing.
        ts_string = ts.name.strip()

        # separate [date and time] from [fractional seconds and UTC offset]
        ts_parts = ts_string.split(".")
        if len(ts_parts) == 2:
            # separate fractional seconds and UTC offset
            offset_sep = "+" if "+" in ts_parts[1] else "-"
            ts_frac_parts = ts_parts[1].split(offset_sep)
            num_frac_parts = len(ts_frac_parts)

            # pad to 6 digits if fractional seconds present
            ts_frac_parts[0] = ts_frac_parts[0].ljust(6, "0")
            ts_string = "".join(
                [
                    ts_parts[0],  # date and time
                    ".",
                    ts_frac_parts[0],  # fractional seconds
                    offset_sep if num_frac_parts > 1 else "",
                    ts_frac_parts[1] if num_frac_parts > 1 else "",  # utc offset (if present)
                ]
            )

        # return literal with no timezone, eg turn '2020-01-01 12:13:14-08:00' into '2020-01-01 12:13:14'
        # this is because Clickhouse encodes the timezone as a data type parameter and throws an error if
        # it's part of the timestamp string
        ts_without_tz = (
            datetime.datetime.fromisoformat(ts_string).replace(tzinfo=None).isoformat(sep=" ")
        )
        ts = exp.Literal.string(ts_without_tz)

    # Non-nullable DateTime64 with microsecond precision
    expressions = [exp.DataTypeParam(this=tz)] if tz else []
    datatype = exp.DType.DATETIME64.into_expr(
        expressions=[exp.DataTypeParam(this=exp.Literal.number(6)), *expressions],
        nullable=False,
    )

    return self.sql(exp.cast(ts, datatype, dialect=self.dialect))


def _map_sql(self: ClickHouseGenerator, expression: exp.Map | exp.VarMap) -> str:
    """Render a map expression.

    Outside of a `settings` argument the map is rendered through `var_map_sql`
    with its function name lower-cased. Inside `settings` it is rendered as a
    brace literal `{key: value, ...}`, which requires both keys and values to
    be array expressions; otherwise it is reported as unsupported and an empty
    string is returned.
    """
    if not (expression.parent and expression.parent.arg_key == "settings"):
        return _lower_func(var_map_sql(self, expression))

    keys = expression.args.get("keys")
    values = expression.args.get("values")

    if not isinstance(keys, exp.Array) or not isinstance(values, exp.Array):
        self.unsupported("Cannot convert array columns into map.")
        return ""

    args = []
    for key, value in zip(keys.expressions, values.expressions):
        args.append(f"{self.sql(key)}: {self.sql(value)}")

    csv_args = ", ".join(args)

    return f"{{{csv_args}}}"


def _json_cast_sql(self: ClickHouseGenerator, expression: exp.JSONCast) -> str:
    """Render `JSONCast` as `<this>.:<type>`.

    A target type that has nested expressions is rendered and then passed
    through `exp.to_identifier` before being appended.
    """
    this = self.sql(expression, "this")
    to = expression.to
    to_sql = self.sql(to)

    if to.expressions:
        to_sql = self.sql(exp.to_identifier(to_sql))

    return f"{this}.:{to_sql}"


class ClickHouseGenerator(generator.Generator):
    """SQL generator for the ClickHouse dialect.

    Overrides the base generator's feature flags, type names, per-expression
    transforms and property placement, and adds ClickHouse-specific rendering
    methods.
    """

    SELECT_KINDS: tuple[str, ...] = ()
    TRY_SUPPORTED = False
    SUPPORTS_UESCAPE = False
    SUPPORTS_DECODE_CASE = False

    AFTER_HAVING_MODIFIER_TRANSFORMS = generator.AFTER_HAVING_MODIFIER_TRANSFORMS

    QUERY_HINTS = False
    STRUCT_DELIMITER = ("(", ")")
    NVL2_SUPPORTED = False
    TABLESAMPLE_REQUIRES_PARENS = False
    TABLESAMPLE_SIZE_IS_ROWS = False
    TABLESAMPLE_KEYWORDS = "SAMPLE"
    LAST_DAY_SUPPORTS_DATE_PART = False
    CAN_IMPLEMENT_ARRAY_ANY = True
    SUPPORTS_TO_NUMBER = False
    JOIN_HINTS = False
    TABLE_HINTS = False
    GROUPINGS_SEP = ""
    SET_OP_MODIFIERS = False
    ARRAY_SIZE_NAME = "LENGTH"
    WRAP_DERIVED_VALUES = False

    # Types that `datatype_sql` renders as plain "String".
    STRING_TYPE_MAPPING: t.ClassVar = {
        exp.DType.BLOB: "String",
        exp.DType.CHAR: "String",
        exp.DType.LONGBLOB: "String",
        exp.DType.LONGTEXT: "String",
        exp.DType.MEDIUMBLOB: "String",
        exp.DType.MEDIUMTEXT: "String",
        exp.DType.TINYBLOB: "String",
        exp.DType.TINYTEXT: "String",
        exp.DType.TEXT: "String",
        exp.DType.VARBINARY: "String",
        exp.DType.VARCHAR: "String",
    }

    SUPPORTED_JSON_PATH_PARTS = {
        exp.JSONPathKey,
        exp.JSONPathRoot,
        exp.JSONPathSubscript,
    }

    # Type names layered on top of the base generator's mapping.
    TYPE_MAPPING = {
        **generator.Generator.TYPE_MAPPING,
        exp.DType.BLOB: "String",
        exp.DType.CHAR: "String",
        exp.DType.LONGBLOB: "String",
        exp.DType.LONGTEXT: "String",
        exp.DType.MEDIUMBLOB: "String",
        exp.DType.MEDIUMTEXT: "String",
        exp.DType.TINYBLOB: "String",
        exp.DType.TINYTEXT: "String",
        exp.DType.TEXT: "String",
        exp.DType.VARBINARY: "String",
        exp.DType.VARCHAR: "String",
        exp.DType.ARRAY: "Array",
        exp.DType.BOOLEAN: "Bool",
        exp.DType.BIGINT: "Int64",
        exp.DType.DATE32: "Date32",
        exp.DType.DATETIME: "DateTime",
        exp.DType.DATETIME2: "DateTime",
        exp.DType.SMALLDATETIME: "DateTime",
        exp.DType.DATETIME64: "DateTime64",
        exp.DType.DECIMAL: "Decimal",
        exp.DType.DECIMAL32: "Decimal32",
        exp.DType.DECIMAL64: "Decimal64",
        exp.DType.DECIMAL128: "Decimal128",
        exp.DType.DECIMAL256: "Decimal256",
        exp.DType.TIMESTAMP: "DateTime",
        exp.DType.TIMESTAMPNTZ: "DateTime",
        exp.DType.TIMESTAMPTZ: "DateTime",
        exp.DType.DOUBLE: "Float64",
        exp.DType.ENUM: "Enum",
        exp.DType.ENUM8: "Enum8",
        exp.DType.ENUM16: "Enum16",
        exp.DType.FIXEDSTRING: "FixedString",
        exp.DType.FLOAT: "Float32",
        exp.DType.INT: "Int32",
        exp.DType.MEDIUMINT: "Int32",
        exp.DType.INT128: "Int128",
        exp.DType.INT256: "Int256",
        exp.DType.LOWCARDINALITY: "LowCardinality",
        exp.DType.MAP: "Map",
        exp.DType.NESTED: "Nested",
        exp.DType.NOTHING: "Nothing",
        exp.DType.SMALLINT: "Int16",
        exp.DType.STRUCT: "Tuple",
        exp.DType.TINYINT: "Int8",
        exp.DType.UBIGINT: "UInt64",
        exp.DType.UINT: "UInt32",
        exp.DType.UINT128: "UInt128",
        exp.DType.UINT256: "UInt256",
        exp.DType.USMALLINT: "UInt16",
        exp.DType.UTINYINT: "UInt8",
        exp.DType.IPV4: "IPv4",
        exp.DType.IPV6: "IPv6",
        exp.DType.POINT: "Point",
        exp.DType.RING: "Ring",
        exp.DType.LINESTRING: "LineString",
        exp.DType.MULTILINESTRING: "MultiLineString",
        exp.DType.POLYGON: "Polygon",
        exp.DType.MULTIPOLYGON: "MultiPolygon",
        exp.DType.AGGREGATEFUNCTION: "AggregateFunction",
        exp.DType.SIMPLEAGGREGATEFUNCTION: "SimpleAggregateFunction",
        exp.DType.DYNAMIC: "Dynamic",
    }

    # Per-expression renderers layered on top of the base generator's transforms.
    TRANSFORMS = {
        **generator.Generator.TRANSFORMS,
        exp.AnyValue: rename_func("any"),
        exp.ApproxDistinct: rename_func("uniq"),
        exp.ArrayDistinct: rename_func("arrayDistinct"),
        exp.ArrayConcat: rename_func("arrayConcat"),
        exp.ArrayContains: rename_func("has"),
        exp.ArrayFilter: lambda self, e: self.func("arrayFilter", e.expression, e.this),
        exp.ArrayRemove: remove_from_array_using_filter,
        exp.ArrayReverse: rename_func("arrayReverse"),
        exp.ArraySlice: rename_func("arraySlice"),
        exp.ArraySum: rename_func("arraySum"),
        exp.ArrayMax: rename_func("arrayMax"),
        exp.ArrayMin: rename_func("arrayMin"),
        exp.ArgMax: arg_max_or_min_no_count("argMax"),
        exp.ArgMin: arg_max_or_min_no_count("argMin"),
        exp.Array: inline_array_sql,
        exp.CityHash64: rename_func("cityHash64"),
        exp.CastToStrType: rename_func("CAST"),
        exp.CurrentDatabase: rename_func("CURRENT_DATABASE"),
        exp.CurrentSchemas: rename_func("CURRENT_SCHEMAS"),
        exp.CountIf: rename_func("countIf"),
        exp.CosineDistance: rename_func("cosineDistance"),
        exp.CompressColumnConstraint: lambda self, e: (
            f"CODEC({self.expressions(e, key='this', flat=True)})"
        ),
        exp.ComputedColumnConstraint: lambda self, e: (
            f"{'MATERIALIZED' if e.args.get('persisted') else 'ALIAS'} {self.sql(e, 'this')}"
        ),
        exp.CurrentDate: lambda self, e: self.func("CURRENT_DATE"),
        exp.CurrentVersion: rename_func("VERSION"),
        exp.DateAdd: _datetime_delta_sql("DATE_ADD"),
        exp.DateDiff: _datetime_delta_sql("DATE_DIFF"),
        exp.DateStrToDate: rename_func("toDate"),
        exp.DateSub: _datetime_delta_sql("DATE_SUB"),
        exp.Explode: rename_func("arrayJoin"),
        exp.FarmFingerprint: rename_func("farmFingerprint64"),
        exp.Final: lambda self, e: f"{self.sql(e, 'this')} FINAL",
        exp.IsNan: rename_func("isNaN"),
        exp.JarowinklerSimilarity: jarowinkler_similarity("jaroWinklerSimilarity"),
        exp.JSONCast: _json_cast_sql,
        exp.JSONExtract: json_extract_segments("JSONExtractString", quoted_index=False),
        exp.JSONExtractScalar: json_extract_segments("JSONExtractString", quoted_index=False),
        exp.JSONPathKey: json_path_key_only_name,
        exp.JSONPathRoot: lambda *_: "",
        exp.Length: length_or_char_length_sql,
        exp.Map: _map_sql,
        exp.Median: rename_func("median"),
        exp.Nullif: rename_func("nullIf"),
        exp.PartitionedByProperty: lambda self, e: f"PARTITION BY {self.sql(e, 'this')}",
        exp.Pivot: no_pivot_sql,
        exp.Quantile: _quantile_sql,
        exp.RegexpLike: lambda self, e: self.func("match", e.this, e.expression),
        exp.Rand: rename_func("randCanonical"),
        exp.StartsWith: rename_func("startsWith"),
        exp.Struct: rename_func("tuple"),
        exp.Trunc: rename_func("trunc"),
        exp.EndsWith: rename_func("endsWith"),
        exp.EuclideanDistance: rename_func("L2Distance"),
        exp.StrPosition: lambda self, e: strposition_sql(
            self,
            e,
            func_name="POSITION",
            supports_position=True,
            use_ansi_position=False,
        ),
        exp.TimeToStr: lambda self, e: self.func(
            "formatDateTime",
            e.this.this if isinstance(e.this, exp.TsOrDsToTimestamp) else e.this,
            self.format_time(e),
            e.args.get("zone"),
        ),
        exp.TimeStrToTime: _timestrtotime_sql,
        exp.TimestampAdd: _datetime_delta_sql("TIMESTAMP_ADD"),
        exp.TimestampSub: _datetime_delta_sql("TIMESTAMP_SUB"),
        exp.Typeof: rename_func("toTypeName"),
        exp.VarMap: _map_sql,
        exp.Xor: lambda self, e: self.func("xor", e.this, e.expression, *e.expressions),
        exp.MD5Digest: rename_func("MD5"),
        exp.MD5: lambda self, e: self.func("LOWER", self.func("HEX", self.func("MD5", e.this))),
        exp.SHA: rename_func("SHA1"),
        exp.SHA1Digest: rename_func("SHA1"),
        exp.SHA2: sha256_sql,
        exp.SHA2Digest: sha2_digest_sql,
        exp.Split: lambda self, e: self.func(
            "splitByString", e.args.get("expression"), e.this, e.args.get("limit")
        ),
        exp.RegexpSplit: lambda self, e: self.func(
            "splitByRegexp", e.args.get("expression"), e.this, e.args.get("limit")
        ),
        exp.UnixToTime: _unix_to_time_sql,
        exp.Trim: lambda self, e: trim_sql(self, e, default_trim_type="BOTH"),
        exp.Variance: rename_func("varSamp"),
        exp.SchemaCommentProperty: lambda self, e: self.naked_property(e),
        exp.Stddev: rename_func("stddevSamp"),
        exp.Chr: rename_func("CHAR"),
        exp.Lag: lambda self, e: self.func(
            "lagInFrame", e.this, e.args.get("offset"), e.args.get("default")
        ),
        exp.Lead: lambda self, e: self.func(
            "leadInFrame", e.this, e.args.get("offset"), e.args.get("default")
        ),
        exp.Levenshtein: unsupported_args("ins_cost", "del_cost", "sub_cost", "max_dist")(
            rename_func("editDistance")
        ),
        exp.ParseDatetime: rename_func("parseDateTime"),
    }

    PROPERTIES_LOCATION = {
        **generator.Generator.PROPERTIES_LOCATION,
        exp.DefinerProperty: exp.Properties.Location.POST_SCHEMA,
        exp.OnCluster: exp.Properties.Location.POST_NAME,
        exp.PartitionedByProperty: exp.Properties.Location.POST_SCHEMA,
        exp.ToTableProperty: exp.Properties.Location.POST_NAME,
        exp.UuidProperty: exp.Properties.Location.POST_NAME,
        exp.VolatileProperty: exp.Properties.Location.UNSUPPORTED,
    }

    # There's no list in docs, but it can be found in Clickhouse code
    # see `ClickHouse/src/Parsers/ParserCreate*.cpp`
    ON_CLUSTER_TARGETS = {
        "SCHEMA",  # Transpiled CREATE SCHEMA may have OnCluster property set
        "DATABASE",
        "TABLE",
        "VIEW",
        "DICTIONARY",
        "INDEX",
        "FUNCTION",
        "NAMED COLLECTION",
    }

    # https://clickhouse.com/docs/en/sql-reference/data-types/nullable
    NON_NULLABLE_TYPES = {
        exp.DType.ARRAY,
        exp.DType.MAP,
        exp.DType.STRUCT,
        exp.DType.POINT,
        exp.DType.RING,
        exp.DType.LINESTRING,
        exp.DType.MULTILINESTRING,
        exp.DType.POLYGON,
        exp.DType.MULTIPOLYGON,
    }

    def groupconcat_sql(self, expression: exp.GroupConcat) -> str:
        """Render `GroupConcat` as ClickHouse `groupConcat`.

        When the operand is a `Limit` wrapping an expression, the wrapped
        expression is popped out of it and a parameterized aggregate is built
        from the separator and the limit. With only a separator, a
        parameterized aggregate is built from the separator alone. Otherwise
        a plain `groupConcat(...)` call is emitted.
        """
        this = expression.this
        separator = expression.args.get("separator")

        if isinstance(this, exp.Limit) and this.this:
            limit = this
            # NOTE: `pop()` detaches the operand from the Limit node (mutates the tree).
            this = limit.this.pop()
            return self.sql(
                exp.ParameterizedAgg(
                    this="groupConcat",
                    params=[this],
                    expressions=[separator, limit.expression],
                )
            )

        if separator:
            return self.sql(
                exp.ParameterizedAgg(
                    this="groupConcat",
                    params=[this],
                    expressions=[separator],
                )
            )

        return self.func("groupConcat", this)

    def offset_sql(self, expression: exp.Offset) -> str:
        """Render OFFSET, appending `ROWS` when the parent SELECT's limit is a FETCH clause."""
        offset = super().offset_sql(expression)

        # OFFSET ... FETCH syntax requires a "ROW" or "ROWS" keyword
        # https://clickhouse.com/docs/sql-reference/statements/select/offset
        parent = expression.parent
        if isinstance(parent, exp.Select) and isinstance(parent.args.get("limit"), exp.Fetch):
            offset = f"{offset} ROWS"

        return offset

    def strtodate_sql(self, expression: exp.StrToDate) -> str:
        """Render `StrToDate`, wrapping it in a cast to DATE unless its parent is already a cast."""
        strtodate_sql = self.function_fallback_sql(expression)

        if not isinstance(expression.parent, exp.Cast):
            # StrToDate returns DATEs in other dialects (eg. postgres), so
            # this branch aims to improve the transpilation to clickhouse
            return self.cast_sql(exp.cast(expression, "DATE"))

        return strtodate_sql

    def cast_sql(self, expression: exp.Cast, safe_prefix: str | None = None) -> str:
        """Render a cast; a `StrToDate` operand cast to DATETIME is emitted without the cast."""
        this = expression.this

        if isinstance(this, exp.StrToDate) and expression.to == exp.DType.DATETIME.into_expr():
            return self.sql(this)

        return super().cast_sql(expression, safe_prefix=safe_prefix)

    def trycast_sql(self, expression: exp.TryCast) -> str:
        """Render `TryCast` as a regular cast to a nullable target type.

        The target type is flagged nullable in place unless it is one of
        `NON_NULLABLE_TYPES`. Rendering goes through the base class's
        `cast_sql`, bypassing this class's override.
        """
        dtype = expression.to
        if not dtype.is_type(*self.NON_NULLABLE_TYPES, check_nullable=True):
            # Casting x into Nullable(T) appears to behave similarly to TRY_CAST(x AS T)
            dtype.set("nullable", True)

        return super().cast_sql(expression)

    def _jsonpathsubscript_sql(self, expression: exp.JSONPathSubscript) -> str:
        """Render a JSON path subscript, incrementing integer subscripts by one.

        NOTE(review): presumably this converts 0-based indices to ClickHouse's
        1-based JSON indexing - confirm.
        """
        this = self.json_path_part(expression.this)
        return str(int(this) + 1) if is_int(this) else this

    def likeproperty_sql(self, expression: exp.LikeProperty) -> str:
        """Render `LikeProperty` as `AS <this>`."""
        return f"AS {self.sql(expression, 'this')}"

    def _any_to_has(
        self,
        expression: exp.EQ | exp.NEQ,
        default: t.Callable[[t.Any], str],
        prefix: str = "",
    ) -> str:
        """Rewrite a comparison against `ANY(arr)` into `has(arr, value)`.

        Either side of the comparison may be the `Any` node. When neither is,
        `default` renders the expression. `prefix` is prepended to the
        generated `has(...)` call.
        """
        if isinstance(expression.left, exp.Any):
            arr = expression.left
            this = expression.right
        elif isinstance(expression.right, exp.Any):
            arr = expression.right
            this = expression.left
        else:
            return default(expression)

        return prefix + self.func("has", arr.this.unnest(), this)

    def eq_sql(self, expression: exp.EQ) -> str:
        """Render `=`, mapping `x = ANY(arr)` to `has(arr, x)`."""
        return self._any_to_has(expression, super().eq_sql)

    def neq_sql(self, expression: exp.NEQ) -> str:
        """Render `<>`, mapping `x <> ANY(arr)` to `NOT has(arr, x)`."""
        return self._any_to_has(expression, super().neq_sql, "NOT ")

    def regexpilike_sql(self, expression: exp.RegexpILike) -> str:
        """Render a case-insensitive regex match as `match(this, CONCAT('(?i)', pattern))`."""
        # Manually add a flag to make the search case-insensitive
        regex = self.func("CONCAT", "'(?i)'", expression.expression)
        return self.func("match", expression.this, regex)

    def datatype_sql(self, expression: exp.DataType) -> str:
        """Render a data type, wrapping it in `Nullable(...)` where applicable."""
        # String is the standard ClickHouse type, every other variant is just an alias.
        # Additionally, any supplied length parameter will be ignored.
        #
        # https://clickhouse.com/docs/en/sql-reference/data-types/string
        if expression.this in self.STRING_TYPE_MAPPING:
            dtype = "String"
        else:
            dtype = super().datatype_sql(expression)

        # This section changes the type to `Nullable(...)` if the following conditions hold:
        # - It's marked as nullable - this ensures we won't wrap ClickHouse types with `Nullable`
        #   and change their semantics
        # - It's not the key type of a `Map`. This is because ClickHouse enforces the following
        #   constraint: "Type of Map key must be a type, that can be represented by integer or
        #   String or FixedString (possibly LowCardinality) or UUID or IPv6"
        # - It's not a composite type, e.g. `Nullable(Array(...))` is not a valid type
        parent = expression.parent
        nullable = expression.args.get("nullable")
        if nullable is True or (
            nullable is None
            and not (
                isinstance(parent, exp.DataType)
                and parent.is_type(exp.DType.MAP, check_nullable=True)
                and expression.index in (None, 0)
            )
            and not expression.is_type(*self.NON_NULLABLE_TYPES, check_nullable=True)
        ):
            dtype = f"Nullable({dtype})"

        return dtype

    def cte_sql(self, expression: exp.CTE) -> str:
        """Render a CTE; a CTE flagged `scalar` is emitted as `<expr> AS <alias>`."""
        if expression.args.get("scalar"):
            this = self.sql(expression, "this")
            alias = self.sql(expression, "alias")
            return f"{this} AS {alias}"

        return super().cte_sql(expression)

    def after_limit_modifiers(self, expression: exp.Expr) -> list[str]:
        """Extend the base after-LIMIT modifiers with `SETTINGS` and `FORMAT` segments.

        Each segment is an empty string when the matching argument is absent.
        """
        return super().after_limit_modifiers(expression) + [
            (
                self.seg("SETTINGS ") + self.expressions(expression, key="settings", flat=True)
                if expression.args.get("settings")
                else ""
            ),
            (
                self.seg("FORMAT ") + self.sql(expression, "format")
                if expression.args.get("format")
                else ""
            ),
        ]

    def placeholder_sql(self, expression: exp.Placeholder) -> str:
        """Render a placeholder as `{name: kind}`."""
        return f"{{{expression.name}: {self.sql(expression, 'kind')}}}"

    def oncluster_sql(self, expression: exp.OnCluster) -> str:
        """Render `ON CLUSTER <this>`."""
        return f"ON CLUSTER {self.sql(expression, 'this')}"

    def createable_sql(self, expression: exp.Create, locations: defaultdict) -> str:
        """Render the created object, placing POST_NAME properties right after its name.

        Applies only when the created kind is in `ON_CLUSTER_TARGETS` and
        POST_NAME properties exist; the schema columns, if any, follow the
        properties. Otherwise the base implementation is used.
        """
        if expression.kind in self.ON_CLUSTER_TARGETS and locations.get(
            exp.Properties.Location.POST_NAME
        ):
            this_name = self.sql(
                expression.this if isinstance(expression.this, exp.Schema) else expression,
                "this",
            )
            this_properties = " ".join(
                [self.sql(prop) for prop in locations[exp.Properties.Location.POST_NAME]]
            )
            this_schema = self.schema_columns_sql(expression.this)
            this_schema = f"{self.sep()}{this_schema}" if this_schema else ""

            return f"{this_name}{self.sep()}{this_properties}{this_schema}"

        return super().createable_sql(expression, locations)

    def create_sql(self, expression: exp.Create) -> str:
        """Render CREATE, moving a schema comment property after the query when there is one.

        For a query-backed CREATE the comment property is detached from the
        tree and the query is wrapped in parentheses (both mutate
        `expression`); the comment is then appended after the generated SQL.
        """
        # The comment property comes last in CTAS statements, i.e. after the query
        query = expression.expression
        if isinstance(query, exp.Query):
            comment_prop = expression.find(exp.SchemaCommentProperty)
            if comment_prop:
                comment_prop.pop()
                query.replace(exp.paren(query))
        else:
            comment_prop = None

        create_sql = super().create_sql(expression)

        comment_sql = self.sql(comment_prop)
        comment_sql = f" {comment_sql}" if comment_sql else ""

        return f"{create_sql}{comment_sql}"

    def prewhere_sql(self, expression: exp.PreWhere) -> str:
        """Render a `PREWHERE` clause with its condition indented."""
        this = self.indent(self.sql(expression, "this"))
        return f"{self.seg('PREWHERE')}{self.sep()}{this}"

    def indexcolumnconstraint_sql(self, expression: exp.IndexColumnConstraint) -> str:
        """Render `INDEX [name] [expr] [TYPE index_type] [GRANULARITY granularity]`.

        Every part after `INDEX` is omitted when it renders to an empty string.
        """
        this = self.sql(expression, "this")
        this = f" {this}" if this else ""
        expr = self.sql(expression, "expression")
        expr = f" {expr}" if expr else ""
        index_type = self.sql(expression, "index_type")
        index_type = f" TYPE {index_type}" if index_type else ""
        granularity = self.sql(expression, "granularity")
        granularity = f" GRANULARITY {granularity}" if granularity else ""

        return f"INDEX{this}{expr}{index_type}{granularity}"

    def partition_sql(self, expression: exp.Partition) -> str:
        """Render `PARTITION <expressions>`."""
        return f"PARTITION {self.expressions(expression, flat=True)}"

    def partitionid_sql(self, expression: exp.PartitionId) -> str:
        """Render `ID <this>`."""
        return f"ID {self.sql(expression.this)}"

    def replacepartition_sql(self, expression: exp.ReplacePartition) -> str:
        """Render `REPLACE <expression> FROM <source>`."""
        return f"REPLACE {self.sql(expression.expression)} FROM {self.sql(expression, 'source')}"

    def projectiondef_sql(self, expression: exp.ProjectionDef) -> str:
        """Render `PROJECTION <name> <wrapped expression>`."""
        return f"PROJECTION {self.sql(expression.this)} {self.wrap(expression.expression)}"

    def nestedjsonselect_sql(self, expression: exp.NestedJSONSelect) -> str:
        """Render `<this>.^<expression>`."""
        return f"{self.sql(expression, 'this')}.^{self.sql(expression, 'expression')}"

    def is_sql(self, expression: exp.Is) -> str:
        """Render `IS`, wrapping the result when the parent node is a `Not`."""
        is_sql = super().is_sql(expression)

        if isinstance(expression.parent, exp.Not):
            # value IS NOT NULL -> NOT (value IS NULL)
            is_sql = self.wrap(is_sql)

        return is_sql

    def in_sql(self, expression: exp.In) -> str:
        """Render `IN`, turning the first `GLOBAL IN` into `GLOBAL NOT IN` for a negated global IN."""
        in_sql = super().in_sql(expression)

        if isinstance(expression.parent, exp.Not) and expression.args.get("is_global"):
            in_sql = in_sql.replace("GLOBAL IN", "GLOBAL NOT IN", 1)

        return in_sql

    def not_sql(self, expression: exp.Not) -> str:
        """Render `NOT`, with special handling for an `In` operand.

        A global IN is rendered by the child alone, which inserts the `NOT`
        itself. Any other IN operand is wrapped in parentheses in place
        before the base rendering runs.
        """
        if isinstance(expression.this, exp.In):
            if expression.this.args.get("is_global"):
                # let `GLOBAL IN` child interpose `NOT`
                return self.sql(expression, "this")

            expression.set("this", exp.paren(expression.this, copy=False))

        return super().not_sql(expression)

    def values_sql(self, expression: exp.Values, values_as_table: bool = True) -> str:
        """Render VALUES, deciding here whether it is treated as a table.

        NOTE(review): the incoming `values_as_table` argument is overwritten
        in both branches below, so callers cannot influence it - confirm this
        is intended.
        """
        # If the VALUES clause contains tuples of expressions, we need to treat it
        # as a table since Clickhouse will automatically alias it as such.
        alias = expression.args.get("alias")

        if alias and alias.args.get("columns") and expression.expressions:
            values = expression.expressions[0].expressions
            values_as_table = any(isinstance(value, exp.Tuple) for value in values)
        else:
            values_as_table = True

        return super().values_sql(expression, values_as_table=values_as_table)

    def timestamptrunc_sql(self, expression: exp.TimestampTrunc) -> str:
        """Render `TimestampTrunc` as `dateTrunc(unit, this[, zone])`.

        For dialect versions below (23, 12), a string unit is lower-cased.
        """
        unit = unit_to_str(expression)
        # https://clickhouse.com/docs/whats-new/changelog/2023#improvement
        if self.dialect.version < (23, 12) and unit and unit.is_string:
            unit = exp.Literal.string(unit.name.lower())
        return self.func("dateTrunc", unit, expression.this, expression.args.get("zone"))
167class ClickHouseGenerator(generator.Generator): 168 SELECT_KINDS: tuple[str, ...] = () 169 TRY_SUPPORTED = False 170 SUPPORTS_UESCAPE = False 171 SUPPORTS_DECODE_CASE = False 172 173 AFTER_HAVING_MODIFIER_TRANSFORMS = generator.AFTER_HAVING_MODIFIER_TRANSFORMS 174 175 QUERY_HINTS = False 176 STRUCT_DELIMITER = ("(", ")") 177 NVL2_SUPPORTED = False 178 TABLESAMPLE_REQUIRES_PARENS = False 179 TABLESAMPLE_SIZE_IS_ROWS = False 180 TABLESAMPLE_KEYWORDS = "SAMPLE" 181 LAST_DAY_SUPPORTS_DATE_PART = False 182 CAN_IMPLEMENT_ARRAY_ANY = True 183 SUPPORTS_TO_NUMBER = False 184 JOIN_HINTS = False 185 TABLE_HINTS = False 186 GROUPINGS_SEP = "" 187 SET_OP_MODIFIERS = False 188 ARRAY_SIZE_NAME = "LENGTH" 189 WRAP_DERIVED_VALUES = False 190 191 STRING_TYPE_MAPPING: t.ClassVar = { 192 exp.DType.BLOB: "String", 193 exp.DType.CHAR: "String", 194 exp.DType.LONGBLOB: "String", 195 exp.DType.LONGTEXT: "String", 196 exp.DType.MEDIUMBLOB: "String", 197 exp.DType.MEDIUMTEXT: "String", 198 exp.DType.TINYBLOB: "String", 199 exp.DType.TINYTEXT: "String", 200 exp.DType.TEXT: "String", 201 exp.DType.VARBINARY: "String", 202 exp.DType.VARCHAR: "String", 203 } 204 205 SUPPORTED_JSON_PATH_PARTS = { 206 exp.JSONPathKey, 207 exp.JSONPathRoot, 208 exp.JSONPathSubscript, 209 } 210 211 TYPE_MAPPING = { 212 **generator.Generator.TYPE_MAPPING, 213 exp.DType.BLOB: "String", 214 exp.DType.CHAR: "String", 215 exp.DType.LONGBLOB: "String", 216 exp.DType.LONGTEXT: "String", 217 exp.DType.MEDIUMBLOB: "String", 218 exp.DType.MEDIUMTEXT: "String", 219 exp.DType.TINYBLOB: "String", 220 exp.DType.TINYTEXT: "String", 221 exp.DType.TEXT: "String", 222 exp.DType.VARBINARY: "String", 223 exp.DType.VARCHAR: "String", 224 exp.DType.ARRAY: "Array", 225 exp.DType.BOOLEAN: "Bool", 226 exp.DType.BIGINT: "Int64", 227 exp.DType.DATE32: "Date32", 228 exp.DType.DATETIME: "DateTime", 229 exp.DType.DATETIME2: "DateTime", 230 exp.DType.SMALLDATETIME: "DateTime", 231 exp.DType.DATETIME64: "DateTime64", 232 exp.DType.DECIMAL: 
"Decimal", 233 exp.DType.DECIMAL32: "Decimal32", 234 exp.DType.DECIMAL64: "Decimal64", 235 exp.DType.DECIMAL128: "Decimal128", 236 exp.DType.DECIMAL256: "Decimal256", 237 exp.DType.TIMESTAMP: "DateTime", 238 exp.DType.TIMESTAMPNTZ: "DateTime", 239 exp.DType.TIMESTAMPTZ: "DateTime", 240 exp.DType.DOUBLE: "Float64", 241 exp.DType.ENUM: "Enum", 242 exp.DType.ENUM8: "Enum8", 243 exp.DType.ENUM16: "Enum16", 244 exp.DType.FIXEDSTRING: "FixedString", 245 exp.DType.FLOAT: "Float32", 246 exp.DType.INT: "Int32", 247 exp.DType.MEDIUMINT: "Int32", 248 exp.DType.INT128: "Int128", 249 exp.DType.INT256: "Int256", 250 exp.DType.LOWCARDINALITY: "LowCardinality", 251 exp.DType.MAP: "Map", 252 exp.DType.NESTED: "Nested", 253 exp.DType.NOTHING: "Nothing", 254 exp.DType.SMALLINT: "Int16", 255 exp.DType.STRUCT: "Tuple", 256 exp.DType.TINYINT: "Int8", 257 exp.DType.UBIGINT: "UInt64", 258 exp.DType.UINT: "UInt32", 259 exp.DType.UINT128: "UInt128", 260 exp.DType.UINT256: "UInt256", 261 exp.DType.USMALLINT: "UInt16", 262 exp.DType.UTINYINT: "UInt8", 263 exp.DType.IPV4: "IPv4", 264 exp.DType.IPV6: "IPv6", 265 exp.DType.POINT: "Point", 266 exp.DType.RING: "Ring", 267 exp.DType.LINESTRING: "LineString", 268 exp.DType.MULTILINESTRING: "MultiLineString", 269 exp.DType.POLYGON: "Polygon", 270 exp.DType.MULTIPOLYGON: "MultiPolygon", 271 exp.DType.AGGREGATEFUNCTION: "AggregateFunction", 272 exp.DType.SIMPLEAGGREGATEFUNCTION: "SimpleAggregateFunction", 273 exp.DType.DYNAMIC: "Dynamic", 274 } 275 276 TRANSFORMS = { 277 **generator.Generator.TRANSFORMS, 278 exp.AnyValue: rename_func("any"), 279 exp.ApproxDistinct: rename_func("uniq"), 280 exp.ArrayDistinct: rename_func("arrayDistinct"), 281 exp.ArrayConcat: rename_func("arrayConcat"), 282 exp.ArrayContains: rename_func("has"), 283 exp.ArrayFilter: lambda self, e: self.func("arrayFilter", e.expression, e.this), 284 exp.ArrayRemove: remove_from_array_using_filter, 285 exp.ArrayReverse: rename_func("arrayReverse"), 286 exp.ArraySlice: 
rename_func("arraySlice"), 287 exp.ArraySum: rename_func("arraySum"), 288 exp.ArrayMax: rename_func("arrayMax"), 289 exp.ArrayMin: rename_func("arrayMin"), 290 exp.ArgMax: arg_max_or_min_no_count("argMax"), 291 exp.ArgMin: arg_max_or_min_no_count("argMin"), 292 exp.Array: inline_array_sql, 293 exp.CityHash64: rename_func("cityHash64"), 294 exp.CastToStrType: rename_func("CAST"), 295 exp.CurrentDatabase: rename_func("CURRENT_DATABASE"), 296 exp.CurrentSchemas: rename_func("CURRENT_SCHEMAS"), 297 exp.CountIf: rename_func("countIf"), 298 exp.CosineDistance: rename_func("cosineDistance"), 299 exp.CompressColumnConstraint: lambda self, e: ( 300 f"CODEC({self.expressions(e, key='this', flat=True)})" 301 ), 302 exp.ComputedColumnConstraint: lambda self, e: ( 303 f"{'MATERIALIZED' if e.args.get('persisted') else 'ALIAS'} {self.sql(e, 'this')}" 304 ), 305 exp.CurrentDate: lambda self, e: self.func("CURRENT_DATE"), 306 exp.CurrentVersion: rename_func("VERSION"), 307 exp.DateAdd: _datetime_delta_sql("DATE_ADD"), 308 exp.DateDiff: _datetime_delta_sql("DATE_DIFF"), 309 exp.DateStrToDate: rename_func("toDate"), 310 exp.DateSub: _datetime_delta_sql("DATE_SUB"), 311 exp.Explode: rename_func("arrayJoin"), 312 exp.FarmFingerprint: rename_func("farmFingerprint64"), 313 exp.Final: lambda self, e: f"{self.sql(e, 'this')} FINAL", 314 exp.IsNan: rename_func("isNaN"), 315 exp.JarowinklerSimilarity: jarowinkler_similarity("jaroWinklerSimilarity"), 316 exp.JSONCast: _json_cast_sql, 317 exp.JSONExtract: json_extract_segments("JSONExtractString", quoted_index=False), 318 exp.JSONExtractScalar: json_extract_segments("JSONExtractString", quoted_index=False), 319 exp.JSONPathKey: json_path_key_only_name, 320 exp.JSONPathRoot: lambda *_: "", 321 exp.Length: length_or_char_length_sql, 322 exp.Map: _map_sql, 323 exp.Median: rename_func("median"), 324 exp.Nullif: rename_func("nullIf"), 325 exp.PartitionedByProperty: lambda self, e: f"PARTITION BY {self.sql(e, 'this')}", 326 exp.Pivot: no_pivot_sql, 
327 exp.Quantile: _quantile_sql, 328 exp.RegexpLike: lambda self, e: self.func("match", e.this, e.expression), 329 exp.Rand: rename_func("randCanonical"), 330 exp.StartsWith: rename_func("startsWith"), 331 exp.Struct: rename_func("tuple"), 332 exp.Trunc: rename_func("trunc"), 333 exp.EndsWith: rename_func("endsWith"), 334 exp.EuclideanDistance: rename_func("L2Distance"), 335 exp.StrPosition: lambda self, e: strposition_sql( 336 self, 337 e, 338 func_name="POSITION", 339 supports_position=True, 340 use_ansi_position=False, 341 ), 342 exp.TimeToStr: lambda self, e: self.func( 343 "formatDateTime", 344 e.this.this if isinstance(e.this, exp.TsOrDsToTimestamp) else e.this, 345 self.format_time(e), 346 e.args.get("zone"), 347 ), 348 exp.TimeStrToTime: _timestrtotime_sql, 349 exp.TimestampAdd: _datetime_delta_sql("TIMESTAMP_ADD"), 350 exp.TimestampSub: _datetime_delta_sql("TIMESTAMP_SUB"), 351 exp.Typeof: rename_func("toTypeName"), 352 exp.VarMap: _map_sql, 353 exp.Xor: lambda self, e: self.func("xor", e.this, e.expression, *e.expressions), 354 exp.MD5Digest: rename_func("MD5"), 355 exp.MD5: lambda self, e: self.func("LOWER", self.func("HEX", self.func("MD5", e.this))), 356 exp.SHA: rename_func("SHA1"), 357 exp.SHA1Digest: rename_func("SHA1"), 358 exp.SHA2: sha256_sql, 359 exp.SHA2Digest: sha2_digest_sql, 360 exp.Split: lambda self, e: self.func( 361 "splitByString", e.args.get("expression"), e.this, e.args.get("limit") 362 ), 363 exp.RegexpSplit: lambda self, e: self.func( 364 "splitByRegexp", e.args.get("expression"), e.this, e.args.get("limit") 365 ), 366 exp.UnixToTime: _unix_to_time_sql, 367 exp.Trim: lambda self, e: trim_sql(self, e, default_trim_type="BOTH"), 368 exp.Variance: rename_func("varSamp"), 369 exp.SchemaCommentProperty: lambda self, e: self.naked_property(e), 370 exp.Stddev: rename_func("stddevSamp"), 371 exp.Chr: rename_func("CHAR"), 372 exp.Lag: lambda self, e: self.func( 373 "lagInFrame", e.this, e.args.get("offset"), e.args.get("default") 374 ), 375 
exp.Lead: lambda self, e: self.func( 376 "leadInFrame", e.this, e.args.get("offset"), e.args.get("default") 377 ), 378 exp.Levenshtein: unsupported_args("ins_cost", "del_cost", "sub_cost", "max_dist")( 379 rename_func("editDistance") 380 ), 381 exp.ParseDatetime: rename_func("parseDateTime"), 382 } 383 384 PROPERTIES_LOCATION = { 385 **generator.Generator.PROPERTIES_LOCATION, 386 exp.DefinerProperty: exp.Properties.Location.POST_SCHEMA, 387 exp.OnCluster: exp.Properties.Location.POST_NAME, 388 exp.PartitionedByProperty: exp.Properties.Location.POST_SCHEMA, 389 exp.ToTableProperty: exp.Properties.Location.POST_NAME, 390 exp.UuidProperty: exp.Properties.Location.POST_NAME, 391 exp.VolatileProperty: exp.Properties.Location.UNSUPPORTED, 392 } 393 394 # There's no list in docs, but it can be found in Clickhouse code 395 # see `ClickHouse/src/Parsers/ParserCreate*.cpp` 396 ON_CLUSTER_TARGETS = { 397 "SCHEMA", # Transpiled CREATE SCHEMA may have OnCluster property set 398 "DATABASE", 399 "TABLE", 400 "VIEW", 401 "DICTIONARY", 402 "INDEX", 403 "FUNCTION", 404 "NAMED COLLECTION", 405 } 406 407 # https://clickhouse.com/docs/en/sql-reference/data-types/nullable 408 NON_NULLABLE_TYPES = { 409 exp.DType.ARRAY, 410 exp.DType.MAP, 411 exp.DType.STRUCT, 412 exp.DType.POINT, 413 exp.DType.RING, 414 exp.DType.LINESTRING, 415 exp.DType.MULTILINESTRING, 416 exp.DType.POLYGON, 417 exp.DType.MULTIPOLYGON, 418 } 419 420 def groupconcat_sql(self, expression: exp.GroupConcat) -> str: 421 this = expression.this 422 separator = expression.args.get("separator") 423 424 if isinstance(this, exp.Limit) and this.this: 425 limit = this 426 this = limit.this.pop() 427 return self.sql( 428 exp.ParameterizedAgg( 429 this="groupConcat", 430 params=[this], 431 expressions=[separator, limit.expression], 432 ) 433 ) 434 435 if separator: 436 return self.sql( 437 exp.ParameterizedAgg( 438 this="groupConcat", 439 params=[this], 440 expressions=[separator], 441 ) 442 ) 443 444 return 
self.func("groupConcat", this) 445 446 def offset_sql(self, expression: exp.Offset) -> str: 447 offset = super().offset_sql(expression) 448 449 # OFFSET ... FETCH syntax requires a "ROW" or "ROWS" keyword 450 # https://clickhouse.com/docs/sql-reference/statements/select/offset 451 parent = expression.parent 452 if isinstance(parent, exp.Select) and isinstance(parent.args.get("limit"), exp.Fetch): 453 offset = f"{offset} ROWS" 454 455 return offset 456 457 def strtodate_sql(self, expression: exp.StrToDate) -> str: 458 strtodate_sql = self.function_fallback_sql(expression) 459 460 if not isinstance(expression.parent, exp.Cast): 461 # StrToDate returns DATEs in other dialects (eg. postgres), so 462 # this branch aims to improve the transpilation to clickhouse 463 return self.cast_sql(exp.cast(expression, "DATE")) 464 465 return strtodate_sql 466 467 def cast_sql(self, expression: exp.Cast, safe_prefix: str | None = None) -> str: 468 this = expression.this 469 470 if isinstance(this, exp.StrToDate) and expression.to == exp.DType.DATETIME.into_expr(): 471 return self.sql(this) 472 473 return super().cast_sql(expression, safe_prefix=safe_prefix) 474 475 def trycast_sql(self, expression: exp.TryCast) -> str: 476 dtype = expression.to 477 if not dtype.is_type(*self.NON_NULLABLE_TYPES, check_nullable=True): 478 # Casting x into Nullable(T) appears to behave similarly to TRY_CAST(x AS T) 479 dtype.set("nullable", True) 480 481 return super().cast_sql(expression) 482 483 def _jsonpathsubscript_sql(self, expression: exp.JSONPathSubscript) -> str: 484 this = self.json_path_part(expression.this) 485 return str(int(this) + 1) if is_int(this) else this 486 487 def likeproperty_sql(self, expression: exp.LikeProperty) -> str: 488 return f"AS {self.sql(expression, 'this')}" 489 490 def _any_to_has( 491 self, 492 expression: exp.EQ | exp.NEQ, 493 default: t.Callable[[t.Any], str], 494 prefix: str = "", 495 ) -> str: 496 if isinstance(expression.left, exp.Any): 497 arr = 
expression.left 498 this = expression.right 499 elif isinstance(expression.right, exp.Any): 500 arr = expression.right 501 this = expression.left 502 else: 503 return default(expression) 504 505 return prefix + self.func("has", arr.this.unnest(), this) 506 507 def eq_sql(self, expression: exp.EQ) -> str: 508 return self._any_to_has(expression, super().eq_sql) 509 510 def neq_sql(self, expression: exp.NEQ) -> str: 511 return self._any_to_has(expression, super().neq_sql, "NOT ") 512 513 def regexpilike_sql(self, expression: exp.RegexpILike) -> str: 514 # Manually add a flag to make the search case-insensitive 515 regex = self.func("CONCAT", "'(?i)'", expression.expression) 516 return self.func("match", expression.this, regex) 517 518 def datatype_sql(self, expression: exp.DataType) -> str: 519 # String is the standard ClickHouse type, every other variant is just an alias. 520 # Additionally, any supplied length parameter will be ignored. 521 # 522 # https://clickhouse.com/docs/en/sql-reference/data-types/string 523 if expression.this in self.STRING_TYPE_MAPPING: 524 dtype = "String" 525 else: 526 dtype = super().datatype_sql(expression) 527 528 # This section changes the type to `Nullable(...)` if the following conditions hold: 529 # - It's marked as nullable - this ensures we won't wrap ClickHouse types with `Nullable` 530 # and change their semantics 531 # - It's not the key type of a `Map`. This is because ClickHouse enforces the following 532 # constraint: "Type of Map key must be a type, that can be represented by integer or 533 # String or FixedString (possibly LowCardinality) or UUID or IPv6" 534 # - It's not a composite type, e.g. 
`Nullable(Array(...))` is not a valid type 535 parent = expression.parent 536 nullable = expression.args.get("nullable") 537 if nullable is True or ( 538 nullable is None 539 and not ( 540 isinstance(parent, exp.DataType) 541 and parent.is_type(exp.DType.MAP, check_nullable=True) 542 and expression.index in (None, 0) 543 ) 544 and not expression.is_type(*self.NON_NULLABLE_TYPES, check_nullable=True) 545 ): 546 dtype = f"Nullable({dtype})" 547 548 return dtype 549 550 def cte_sql(self, expression: exp.CTE) -> str: 551 if expression.args.get("scalar"): 552 this = self.sql(expression, "this") 553 alias = self.sql(expression, "alias") 554 return f"{this} AS {alias}" 555 556 return super().cte_sql(expression) 557 558 def after_limit_modifiers(self, expression: exp.Expr) -> list[str]: 559 return super().after_limit_modifiers(expression) + [ 560 ( 561 self.seg("SETTINGS ") + self.expressions(expression, key="settings", flat=True) 562 if expression.args.get("settings") 563 else "" 564 ), 565 ( 566 self.seg("FORMAT ") + self.sql(expression, "format") 567 if expression.args.get("format") 568 else "" 569 ), 570 ] 571 572 def placeholder_sql(self, expression: exp.Placeholder) -> str: 573 return f"{{{expression.name}: {self.sql(expression, 'kind')}}}" 574 575 def oncluster_sql(self, expression: exp.OnCluster) -> str: 576 return f"ON CLUSTER {self.sql(expression, 'this')}" 577 578 def createable_sql(self, expression: exp.Create, locations: defaultdict) -> str: 579 if expression.kind in self.ON_CLUSTER_TARGETS and locations.get( 580 exp.Properties.Location.POST_NAME 581 ): 582 this_name = self.sql( 583 expression.this if isinstance(expression.this, exp.Schema) else expression, 584 "this", 585 ) 586 this_properties = " ".join( 587 [self.sql(prop) for prop in locations[exp.Properties.Location.POST_NAME]] 588 ) 589 this_schema = self.schema_columns_sql(expression.this) 590 this_schema = f"{self.sep()}{this_schema}" if this_schema else "" 591 592 return 
f"{this_name}{self.sep()}{this_properties}{this_schema}" 593 594 return super().createable_sql(expression, locations) 595 596 def create_sql(self, expression: exp.Create) -> str: 597 # The comment property comes last in CTAS statements, i.e. after the query 598 query = expression.expression 599 if isinstance(query, exp.Query): 600 comment_prop = expression.find(exp.SchemaCommentProperty) 601 if comment_prop: 602 comment_prop.pop() 603 query.replace(exp.paren(query)) 604 else: 605 comment_prop = None 606 607 create_sql = super().create_sql(expression) 608 609 comment_sql = self.sql(comment_prop) 610 comment_sql = f" {comment_sql}" if comment_sql else "" 611 612 return f"{create_sql}{comment_sql}" 613 614 def prewhere_sql(self, expression: exp.PreWhere) -> str: 615 this = self.indent(self.sql(expression, "this")) 616 return f"{self.seg('PREWHERE')}{self.sep()}{this}" 617 618 def indexcolumnconstraint_sql(self, expression: exp.IndexColumnConstraint) -> str: 619 this = self.sql(expression, "this") 620 this = f" {this}" if this else "" 621 expr = self.sql(expression, "expression") 622 expr = f" {expr}" if expr else "" 623 index_type = self.sql(expression, "index_type") 624 index_type = f" TYPE {index_type}" if index_type else "" 625 granularity = self.sql(expression, "granularity") 626 granularity = f" GRANULARITY {granularity}" if granularity else "" 627 628 return f"INDEX{this}{expr}{index_type}{granularity}" 629 630 def partition_sql(self, expression: exp.Partition) -> str: 631 return f"PARTITION {self.expressions(expression, flat=True)}" 632 633 def partitionid_sql(self, expression: exp.PartitionId) -> str: 634 return f"ID {self.sql(expression.this)}" 635 636 def replacepartition_sql(self, expression: exp.ReplacePartition) -> str: 637 return f"REPLACE {self.sql(expression.expression)} FROM {self.sql(expression, 'source')}" 638 639 def projectiondef_sql(self, expression: exp.ProjectionDef) -> str: 640 return f"PROJECTION {self.sql(expression.this)} 
{self.wrap(expression.expression)}" 641 642 def nestedjsonselect_sql(self, expression: exp.NestedJSONSelect) -> str: 643 return f"{self.sql(expression, 'this')}.^{self.sql(expression, 'expression')}" 644 645 def is_sql(self, expression: exp.Is) -> str: 646 is_sql = super().is_sql(expression) 647 648 if isinstance(expression.parent, exp.Not): 649 # value IS NOT NULL -> NOT (value IS NULL) 650 is_sql = self.wrap(is_sql) 651 652 return is_sql 653 654 def in_sql(self, expression: exp.In) -> str: 655 in_sql = super().in_sql(expression) 656 657 if isinstance(expression.parent, exp.Not) and expression.args.get("is_global"): 658 in_sql = in_sql.replace("GLOBAL IN", "GLOBAL NOT IN", 1) 659 660 return in_sql 661 662 def not_sql(self, expression: exp.Not) -> str: 663 if isinstance(expression.this, exp.In): 664 if expression.this.args.get("is_global"): 665 # let `GLOBAL IN` child interpose `NOT` 666 return self.sql(expression, "this") 667 668 expression.set("this", exp.paren(expression.this, copy=False)) 669 670 return super().not_sql(expression) 671 672 def values_sql(self, expression: exp.Values, values_as_table: bool = True) -> str: 673 # If the VALUES clause contains tuples of expressions, we need to treat it 674 # as a table since Clickhouse will automatically alias it as such. 
675 alias = expression.args.get("alias") 676 677 if alias and alias.args.get("columns") and expression.expressions: 678 values = expression.expressions[0].expressions 679 values_as_table = any(isinstance(value, exp.Tuple) for value in values) 680 else: 681 values_as_table = True 682 683 return super().values_sql(expression, values_as_table=values_as_table) 684 685 def timestamptrunc_sql(self, expression: exp.TimestampTrunc) -> str: 686 unit = unit_to_str(expression) 687 # https://clickhouse.com/docs/whats-new/changelog/2023#improvement 688 if self.dialect.version < (23, 12) and unit and unit.is_string: 689 unit = exp.Literal.string(unit.name.lower()) 690 return self.func("dateTrunc", unit, expression.this, expression.args.get("zone"))
Generator converts a given syntax tree to the corresponding SQL string.
Arguments:
- pretty: Whether to format the produced SQL string. Default: False.
- identify: Determines when an identifier should be quoted. Possible values are: False (default): Never quote, except in cases where it's mandatory by the dialect. True: Always quote except for special cases. 'safe': Only quote identifiers that are case insensitive.
- normalize: Whether to normalize identifiers to lowercase. Default: False.
- pad: The pad size in a formatted string. For example, this affects the indentation of a projection in a query, relative to its nesting level. Default: 2.
- indent: The indentation size in a formatted string. For example, this affects the indentation of subqueries and filters under a `WHERE` clause. Default: 2.
- normalize_functions: How to normalize function names. Possible values are: "upper" or True (default): Convert names to uppercase. "lower": Convert names to lowercase. False: Disables function name normalization.
- unsupported_level: Determines the generator's behavior when it encounters unsupported expressions. Default: ErrorLevel.WARN.
- max_unsupported: Maximum number of unsupported messages to include in a raised UnsupportedError. This is only relevant if unsupported_level is ErrorLevel.RAISE. Default: 3
- leading_comma: Whether the comma is leading or trailing in select expressions. This is only relevant when generating in pretty mode. Default: False
- max_text_width: The max number of characters in a segment before creating new lines in pretty mode. The default is on the smaller end because the length only represents a segment and not the true line length. Default: 80
- comments: Whether to preserve comments in the output SQL code. Default: True
STRING_TYPE_MAPPING: ClassVar =
{<DType.BLOB: 'BLOB'>: 'String', <DType.CHAR: 'CHAR'>: 'String', <DType.LONGBLOB: 'LONGBLOB'>: 'String', <DType.LONGTEXT: 'LONGTEXT'>: 'String', <DType.MEDIUMBLOB: 'MEDIUMBLOB'>: 'String', <DType.MEDIUMTEXT: 'MEDIUMTEXT'>: 'String', <DType.TINYBLOB: 'TINYBLOB'>: 'String', <DType.TINYTEXT: 'TINYTEXT'>: 'String', <DType.TEXT: 'TEXT'>: 'String', <DType.VARBINARY: 'VARBINARY'>: 'String', <DType.VARCHAR: 'VARCHAR'>: 'String'}
SUPPORTED_JSON_PATH_PARTS =
{<class 'sqlglot.expressions.query.JSONPathRoot'>, <class 'sqlglot.expressions.query.JSONPathSubscript'>, <class 'sqlglot.expressions.query.JSONPathKey'>}
TYPE_MAPPING =
{<DType.DATETIME2: 'DATETIME2'>: 'DateTime', <DType.NCHAR: 'NCHAR'>: 'CHAR', <DType.NVARCHAR: 'NVARCHAR'>: 'VARCHAR', <DType.MEDIUMTEXT: 'MEDIUMTEXT'>: 'String', <DType.LONGTEXT: 'LONGTEXT'>: 'String', <DType.TINYTEXT: 'TINYTEXT'>: 'String', <DType.BLOB: 'BLOB'>: 'String', <DType.MEDIUMBLOB: 'MEDIUMBLOB'>: 'String', <DType.LONGBLOB: 'LONGBLOB'>: 'String', <DType.TINYBLOB: 'TINYBLOB'>: 'String', <DType.INET: 'INET'>: 'INET', <DType.ROWVERSION: 'ROWVERSION'>: 'VARBINARY', <DType.SMALLDATETIME: 'SMALLDATETIME'>: 'DateTime', <DType.CHAR: 'CHAR'>: 'String', <DType.TEXT: 'TEXT'>: 'String', <DType.VARBINARY: 'VARBINARY'>: 'String', <DType.VARCHAR: 'VARCHAR'>: 'String', <DType.ARRAY: 'ARRAY'>: 'Array', <DType.BOOLEAN: 'BOOLEAN'>: 'Bool', <DType.BIGINT: 'BIGINT'>: 'Int64', <DType.DATE32: 'DATE32'>: 'Date32', <DType.DATETIME: 'DATETIME'>: 'DateTime', <DType.DATETIME64: 'DATETIME64'>: 'DateTime64', <DType.DECIMAL: 'DECIMAL'>: 'Decimal', <DType.DECIMAL32: 'DECIMAL32'>: 'Decimal32', <DType.DECIMAL64: 'DECIMAL64'>: 'Decimal64', <DType.DECIMAL128: 'DECIMAL128'>: 'Decimal128', <DType.DECIMAL256: 'DECIMAL256'>: 'Decimal256', <DType.TIMESTAMP: 'TIMESTAMP'>: 'DateTime', <DType.TIMESTAMPNTZ: 'TIMESTAMPNTZ'>: 'DateTime', <DType.TIMESTAMPTZ: 'TIMESTAMPTZ'>: 'DateTime', <DType.DOUBLE: 'DOUBLE'>: 'Float64', <DType.ENUM: 'ENUM'>: 'Enum', <DType.ENUM8: 'ENUM8'>: 'Enum8', <DType.ENUM16: 'ENUM16'>: 'Enum16', <DType.FIXEDSTRING: 'FIXEDSTRING'>: 'FixedString', <DType.FLOAT: 'FLOAT'>: 'Float32', <DType.INT: 'INT'>: 'Int32', <DType.MEDIUMINT: 'MEDIUMINT'>: 'Int32', <DType.INT128: 'INT128'>: 'Int128', <DType.INT256: 'INT256'>: 'Int256', <DType.LOWCARDINALITY: 'LOWCARDINALITY'>: 'LowCardinality', <DType.MAP: 'MAP'>: 'Map', <DType.NESTED: 'NESTED'>: 'Nested', <DType.NOTHING: 'NOTHING'>: 'Nothing', <DType.SMALLINT: 'SMALLINT'>: 'Int16', <DType.STRUCT: 'STRUCT'>: 'Tuple', <DType.TINYINT: 'TINYINT'>: 'Int8', <DType.UBIGINT: 'UBIGINT'>: 'UInt64', <DType.UINT: 'UINT'>: 'UInt32', <DType.UINT128: 
'UINT128'>: 'UInt128', <DType.UINT256: 'UINT256'>: 'UInt256', <DType.USMALLINT: 'USMALLINT'>: 'UInt16', <DType.UTINYINT: 'UTINYINT'>: 'UInt8', <DType.IPV4: 'IPV4'>: 'IPv4', <DType.IPV6: 'IPV6'>: 'IPv6', <DType.POINT: 'POINT'>: 'Point', <DType.RING: 'RING'>: 'Ring', <DType.LINESTRING: 'LINESTRING'>: 'LineString', <DType.MULTILINESTRING: 'MULTILINESTRING'>: 'MultiLineString', <DType.POLYGON: 'POLYGON'>: 'Polygon', <DType.MULTIPOLYGON: 'MULTIPOLYGON'>: 'MultiPolygon', <DType.AGGREGATEFUNCTION: 'AGGREGATEFUNCTION'>: 'AggregateFunction', <DType.SIMPLEAGGREGATEFUNCTION: 'SIMPLEAGGREGATEFUNCTION'>: 'SimpleAggregateFunction', <DType.DYNAMIC: 'DYNAMIC'>: 'Dynamic'}
TRANSFORMS =
{<class 'sqlglot.expressions.query.JSONPathKey'>: <function json_path_key_only_name>, <class 'sqlglot.expressions.query.JSONPathRoot'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.query.JSONPathSubscript'>: <function <lambda>>, <class 'sqlglot.expressions.core.Adjacent'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.AllowedValuesProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.AnalyzeColumns'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.AnalyzeWith'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.array.ArrayContainsAll'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.array.ArrayOverlaps'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.AssumeColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.AutoRefreshProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.BackupProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.CaseSpecificColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.math.Ceil'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.CharacterSetColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.CharacterSetProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.ClusteredColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.CollateColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.CommentColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.functions.ConnectByRoot'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.string.ConvertToCharset'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.CopyGrantsProperty'>: <function Generator.<lambda>>, <class 
'sqlglot.expressions.properties.CredentialsProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.functions.CurrentCatalog'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.functions.SessionUser'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.DateFormatColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.DefaultColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.ApiProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.ApplicationProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.CatalogProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.ComputeProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.DatabaseProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.DynamicProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.EmptyProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.EncodeColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.EndStatement'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.EnviromentProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.HandlerProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.ParameterStyleProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.EphemeralColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.ExcludeColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.ExecuteAsProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.Except'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.ExternalProperty'>: <function Generator.<lambda>>, <class 
'sqlglot.expressions.math.Floor'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.Get'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.GlobalProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.HeapProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.HybridProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.IcebergProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.InheritsProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.InlineLengthColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.InputModelProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.Intersect'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.datatypes.IntervalSpan'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.functions.Int64'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.json.JSONBContainsAnyTopKeys'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.json.JSONBContainsAllTopKeys'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.json.JSONBDeleteAtPath'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.json.JSONObject'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.json.JSONObjectAgg'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.LanguageProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.LocationProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.LogProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.MaskingProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.MaterializedProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.functions.NetFunc'>: <function Generator.<lambda>>, <class 
'sqlglot.expressions.properties.NetworkProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.NonClusteredColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.NoPrimaryIndexProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.NotForReplicationColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.OnCommitProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.OnProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.OnUpdateColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.core.Operator'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.OutputModelProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.core.ExtendsLeft'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.core.ExtendsRight'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.PathColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.PartitionedByBucket'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.PartitionByTruncate'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.core.PivotAny'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.array.PositionalColumn'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.ProjectionPolicyColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.InvisibleColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.ZeroFillColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.Put'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.RemoteWithConnectionModelProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.ReturnsProperty'>: <function 
Generator.<lambda>>, <class 'sqlglot.expressions.properties.RowAccessProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.core.SafeFunc'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.SampleProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.SecureProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.SecurityIntegrationProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.SetConfigProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.SetProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.SettingsProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.SharingProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.SqlReadWriteProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.SqlSecurityProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.StabilityProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.Stream'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.StreamingTableProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.StrictProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.ddl.SwapTable'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.TableColumn'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.Tags'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.TemporaryProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.TitleColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.array.ToMap'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.ToTableProperty'>: <function Generator.<lambda>>, <class 
'sqlglot.expressions.properties.TransformModelProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.TransientProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.VirtualProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.ddl.TriggerExecute'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.Union'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.UnloggedProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.UsingTemplateProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.UsingData'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.UppercaseColumnConstraint'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.temporal.UtcDate'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.temporal.UtcTime'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.temporal.UtcTimestamp'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.query.Variadic'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.array.VarMap'>: <function _map_sql>, <class 'sqlglot.expressions.properties.ViewAttributeProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.VolatileProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.WithJournalTableProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.WithProcedureOptions'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.WithSchemaBindingProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.constraints.WithOperator'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.properties.ForceProperty'>: <function Generator.<lambda>>, <class 'sqlglot.expressions.aggregate.AnyValue'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.core.ApproxDistinct'>: <function 
rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.array.ArrayDistinct'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.array.ArrayConcat'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.array.ArrayContains'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.array.ArrayFilter'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.array.ArrayRemove'>: <function remove_from_array_using_filter>, <class 'sqlglot.expressions.array.ArrayReverse'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.array.ArraySlice'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.array.ArraySum'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.array.ArrayMax'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.array.ArrayMin'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.aggregate.ArgMax'>: <function arg_max_or_min_no_count.<locals>._arg_max_or_min_sql>, <class 'sqlglot.expressions.aggregate.ArgMin'>: <function arg_max_or_min_no_count.<locals>._arg_max_or_min_sql>, <class 'sqlglot.expressions.array.Array'>: <function inline_array_sql>, <class 'sqlglot.expressions.string.CityHash64'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.functions.CastToStrType'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.functions.CurrentDatabase'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.functions.CurrentSchemas'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.aggregate.CountIf'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.math.CosineDistance'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.constraints.CompressColumnConstraint'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.constraints.ComputedColumnConstraint'>: <function 
ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.temporal.CurrentDate'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.functions.CurrentVersion'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.temporal.DateAdd'>: <function _datetime_delta_sql.<locals>._delta_sql>, <class 'sqlglot.expressions.temporal.DateDiff'>: <function _datetime_delta_sql.<locals>._delta_sql>, <class 'sqlglot.expressions.temporal.DateStrToDate'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.temporal.DateSub'>: <function _datetime_delta_sql.<locals>._delta_sql>, <class 'sqlglot.expressions.array.Explode'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.string.FarmFingerprint'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.query.Final'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.math.IsNan'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.math.JarowinklerSimilarity'>: <function jarowinkler_similarity.<locals>.jarowinklersimilarity_sql>, <class 'sqlglot.expressions.functions.JSONCast'>: <function _json_cast_sql>, <class 'sqlglot.expressions.json.JSONExtract'>: <function json_extract_segments.<locals>._json_extract_segments>, <class 'sqlglot.expressions.json.JSONExtractScalar'>: <function json_extract_segments.<locals>._json_extract_segments>, <class 'sqlglot.expressions.string.Length'>: <function length_or_char_length_sql>, <class 'sqlglot.expressions.array.Map'>: <function _map_sql>, <class 'sqlglot.expressions.aggregate.Median'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.functions.Nullif'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.properties.PartitionedByProperty'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.query.Pivot'>: <function no_pivot_sql>, <class 'sqlglot.expressions.aggregate.Quantile'>: <function _quantile_sql>, <class 
'sqlglot.expressions.core.RegexpLike'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.functions.Rand'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.string.StartsWith'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.array.Struct'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.math.Trunc'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.string.EndsWith'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.math.EuclideanDistance'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.string.StrPosition'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.temporal.TimeToStr'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.temporal.TimeStrToTime'>: <function _timestrtotime_sql>, <class 'sqlglot.expressions.temporal.TimestampAdd'>: <function _datetime_delta_sql.<locals>._delta_sql>, <class 'sqlglot.expressions.temporal.TimestampSub'>: <function _datetime_delta_sql.<locals>._delta_sql>, <class 'sqlglot.expressions.core.Typeof'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.core.Xor'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.string.MD5Digest'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.string.MD5'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.string.SHA'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.string.SHA1Digest'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.string.SHA2'>: <function sha256_sql>, <class 'sqlglot.expressions.string.SHA2Digest'>: <function sha2_digest_sql>, <class 'sqlglot.expressions.string.Split'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.string.RegexpSplit'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.temporal.UnixToTime'>: <function 
_unix_to_time_sql>, <class 'sqlglot.expressions.string.Trim'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.aggregate.Variance'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.properties.SchemaCommentProperty'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.aggregate.Stddev'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.string.Chr'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.aggregate.Lag'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.aggregate.Lead'>: <function ClickHouseGenerator.<lambda>>, <class 'sqlglot.expressions.string.Levenshtein'>: <function rename_func.<locals>.<lambda>>, <class 'sqlglot.expressions.temporal.ParseDatetime'>: <function rename_func.<locals>.<lambda>>}
PROPERTIES_LOCATION =
{<class 'sqlglot.expressions.properties.AllowedValuesProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.AlgorithmProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.ApiProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.ApplicationProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.AutoIncrementProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.AutoRefreshProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.BackupProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.BlockCompressionProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.CatalogProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.CharacterSetProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.ChecksumProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.CollateProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.ComputeProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.CopyGrantsProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.query.Cluster'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.ClusteredByProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.DistributedByProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.DuplicateKeyProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 
'sqlglot.expressions.properties.DataBlocksizeProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.DatabaseProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.DataDeletionProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.DefinerProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.DictRange'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.DictProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.DynamicProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.DistKeyProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.DistStyleProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.EmptyProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.EncodeProperty'>: <PropertiesLocation.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.properties.EngineProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.EnviromentProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.HandlerProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.ParameterStyleProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.ExecuteAsProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.ExternalProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.FallbackProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.FileFormatProperty'>: 
<PropertiesLocation.POST_WITH: 'POST_WITH'>, <class 'sqlglot.expressions.properties.FreespaceProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.GlobalProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.HeapProperty'>: <PropertiesLocation.POST_WITH: 'POST_WITH'>, <class 'sqlglot.expressions.properties.HybridProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.InheritsProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.IcebergProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.IncludeProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.InputModelProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.IsolatedLoadingProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.JournalProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.LanguageProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.LikeProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.LocationProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.LockProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.LockingProperty'>: <PropertiesLocation.POST_ALIAS: 'POST_ALIAS'>, <class 'sqlglot.expressions.properties.LogProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.MaskingProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.MaterializedProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 
'sqlglot.expressions.properties.MergeBlockRatioProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.ModuleProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.NetworkProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.NoPrimaryIndexProperty'>: <PropertiesLocation.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.properties.OnProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.OnCommitProperty'>: <PropertiesLocation.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.query.Order'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.OutputModelProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.PartitionedByProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.PartitionedOfProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.constraints.PrimaryKey'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.Property'>: <PropertiesLocation.POST_WITH: 'POST_WITH'>, <class 'sqlglot.expressions.properties.RefreshTriggerProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.RemoteWithConnectionModelProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.ReturnsProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.RollupProperty'>: <PropertiesLocation.UNSUPPORTED: 'UNSUPPORTED'>, <class 'sqlglot.expressions.properties.RowAccessProperty'>: <PropertiesLocation.UNSUPPORTED: 'UNSUPPORTED'>, <class 'sqlglot.expressions.properties.RowFormatProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 
'sqlglot.expressions.properties.RowFormatDelimitedProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.RowFormatSerdeProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.SampleProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.SchemaCommentProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.SecureProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.SecurityIntegrationProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.SerdeProperties'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.ddl.Set'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.SettingsProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.SetProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.SetConfigProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.SharingProperty'>: <PropertiesLocation.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.ddl.SequenceProperties'>: <PropertiesLocation.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.ddl.TriggerProperties'>: <PropertiesLocation.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.properties.SortKeyProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.SqlReadWriteProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.SqlSecurityProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.StabilityProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 
'sqlglot.expressions.properties.StorageHandlerProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.StreamingTableProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.StrictProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.Tags'>: <PropertiesLocation.POST_WITH: 'POST_WITH'>, <class 'sqlglot.expressions.properties.TemporaryProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.ToTableProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.TransientProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.TransformModelProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.ddl.MergeTreeTTL'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.UnloggedProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.UsingProperty'>: <PropertiesLocation.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.properties.UsingTemplateProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.ViewAttributeProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.VirtualProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.VolatileProperty'>: <PropertiesLocation.UNSUPPORTED: 'UNSUPPORTED'>, <class 'sqlglot.expressions.properties.WithDataProperty'>: <PropertiesLocation.POST_EXPRESSION: 'POST_EXPRESSION'>, <class 'sqlglot.expressions.properties.WithJournalTableProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.WithProcedureOptions'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 
'sqlglot.expressions.properties.WithSchemaBindingProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.WithSystemVersioningProperty'>: <PropertiesLocation.POST_SCHEMA: 'POST_SCHEMA'>, <class 'sqlglot.expressions.properties.ForceProperty'>: <PropertiesLocation.POST_CREATE: 'POST_CREATE'>, <class 'sqlglot.expressions.properties.OnCluster'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>, <class 'sqlglot.expressions.properties.UuidProperty'>: <PropertiesLocation.POST_NAME: 'POST_NAME'>}
ON_CLUSTER_TARGETS =
{'DICTIONARY', 'INDEX', 'TABLE', 'FUNCTION', 'DATABASE', 'SCHEMA', 'NAMED COLLECTION', 'VIEW'}
NON_NULLABLE_TYPES =
{<DType.RING: 'RING'>, <DType.ARRAY: 'ARRAY'>, <DType.POLYGON: 'POLYGON'>, <DType.MAP: 'MAP'>, <DType.LINESTRING: 'LINESTRING'>, <DType.MULTIPOLYGON: 'MULTIPOLYGON'>, <DType.POINT: 'POINT'>, <DType.STRUCT: 'STRUCT'>, <DType.MULTILINESTRING: 'MULTILINESTRING'>}
def groupconcat_sql(self, expression: exp.GroupConcat) -> str:
    """Generate SQL for a GROUP_CONCAT expression using `groupConcat`.

    Three shapes are produced:
    - operand wrapped in a LIMIT: a parameterized aggregate whose expressions
      are the separator and the limit value, and whose params are the
      limited operand;
    - separator only: a parameterized aggregate carrying just the separator;
    - neither: a plain `groupConcat(...)` function call.
    """
    operand = expression.this
    separator = expression.args.get("separator")

    if isinstance(operand, exp.Limit) and operand.this:
        limit_node = operand
        # Detach the aggregated expression from its LIMIT wrapper so it can
        # be re-attached as the aggregate's parameter.
        aggregated = limit_node.this.pop()
        limited_agg = exp.ParameterizedAgg(
            this="groupConcat",
            params=[aggregated],
            expressions=[separator, limit_node.expression],
        )
        return self.sql(limited_agg)

    if not separator:
        return self.func("groupConcat", operand)

    separated_agg = exp.ParameterizedAgg(
        this="groupConcat",
        params=[operand],
        expressions=[separator],
    )
    return self.sql(separated_agg)
def offset_sql(self, expression: exp.Offset) -> str:
    """Generate the OFFSET clause, appending `ROWS` when paired with FETCH.

    The OFFSET ... FETCH syntax requires a "ROW" or "ROWS" keyword:
    https://clickhouse.com/docs/sql-reference/statements/select/offset
    """
    rendered = super().offset_sql(expression)

    select = expression.parent
    if not isinstance(select, exp.Select):
        return rendered

    # Only a SELECT whose "limit" arg is a FETCH node needs the suffix.
    if not isinstance(select.args.get("limit"), exp.Fetch):
        return rendered

    return f"{rendered} ROWS"
def strtodate_sql(self, expression: exp.StrToDate) -> str:
    """Generate SQL for StrToDate, casting to DATE unless already under a cast.

    StrToDate returns DATEs in other dialects (e.g. postgres), so when the
    node is not already the operand of a Cast it is wrapped in a cast to
    DATE to improve transpilation to ClickHouse.
    """
    # Rendered up front, exactly as before, regardless of which branch is taken.
    fallback = self.function_fallback_sql(expression)

    if isinstance(expression.parent, exp.Cast):
        return fallback

    return self.cast_sql(exp.cast(expression, "DATE"))
def
cast_sql( self, expression: sqlglot.expressions.functions.Cast, safe_prefix: str | None = None) -> str:
def cast_sql(self, expression: exp.Cast, safe_prefix: str | None = None) -> str:
    """Generate SQL for a cast, eliding a DATETIME cast around StrToDate.

    When the operand is a StrToDate node and the target type equals the
    DATETIME type expression, only the operand is rendered; every other
    cast is delegated to the base generator.
    """
    operand = expression.this

    drops_cast = (
        isinstance(operand, exp.StrToDate)
        and expression.to == exp.DType.DATETIME.into_expr()
    )
    if not drops_cast:
        return super().cast_sql(expression, safe_prefix=safe_prefix)

    return self.sql(operand)
def trycast_sql(self, expression: exp.TryCast) -> str:
    """Generate SQL for TRY_CAST as a regular cast to a nullable type.

    Casting x into Nullable(T) appears to behave similarly to
    TRY_CAST(x AS T), so the target type is flagged as nullable unless it
    matches one of `NON_NULLABLE_TYPES`. The target type node is mutated
    in place before the cast is rendered by the base generator.
    """
    target = expression.to
    in_non_nullable_set = target.is_type(*self.NON_NULLABLE_TYPES, check_nullable=True)

    if not in_non_nullable_set:
        target.set("nullable", True)

    return super().cast_sql(expression)
def datatype_sql(self, expression: exp.DataType) -> str:
    """Generate SQL for a data type, wrapping it in `Nullable(...)` when due.

    String is the standard ClickHouse type, every other variant is just an
    alias, and any supplied length parameter is ignored:
    https://clickhouse.com/docs/en/sql-reference/data-types/string

    The type is wrapped in `Nullable(...)` when its "nullable" arg is
    exactly True, or when that arg is unset (None) and both hold:
    - it is not the key type of a `Map` (ClickHouse enforces: "Type of Map
      key must be a type, that can be represented by integer or String or
      FixedString (possibly LowCardinality) or UUID or IPv6");
    - it is not one of `NON_NULLABLE_TYPES`, e.g. `Nullable(Array(...))`
      is not a valid type.
    Any other explicit "nullable" value leaves the type unwrapped, so that
    ClickHouse types are not wrapped and their semantics changed.
    """
    if expression.this in self.STRING_TYPE_MAPPING:
        type_sql = "String"
    else:
        type_sql = super().datatype_sql(expression)

    nullable_flag = expression.args.get("nullable")

    if nullable_flag is True:
        return f"Nullable({type_sql})"

    if nullable_flag is not None:
        # Explicitly marked with something other than True: never wrap.
        return type_sql

    enclosing = expression.parent
    is_map_key = (
        isinstance(enclosing, exp.DataType)
        and enclosing.is_type(exp.DType.MAP, check_nullable=True)
        and expression.index in (None, 0)
    )
    if is_map_key:
        return type_sql

    if expression.is_type(*self.NON_NULLABLE_TYPES, check_nullable=True):
        return type_sql

    return f"Nullable({type_sql})"
def after_limit_modifiers(self, expression: exp.Expr) -> list[str]:
    """Return the post-LIMIT modifiers, extended with SETTINGS and FORMAT.

    The base generator's modifiers come first, followed by two entries that
    are always present: the SETTINGS segment and the FORMAT segment, each
    an empty string when the corresponding arg is not set.
    """
    base_modifiers = super().after_limit_modifiers(expression)

    settings_sql = ""
    if expression.args.get("settings"):
        settings_sql = self.seg("SETTINGS ") + self.expressions(
            expression, key="settings", flat=True
        )

    format_sql = ""
    if expression.args.get("format"):
        format_sql = self.seg("FORMAT ") + self.sql(expression, "format")

    return base_modifiers + [settings_sql, format_sql]
def
createable_sql( self, expression: sqlglot.expressions.ddl.Create, locations: collections.defaultdict) -> str:
def createable_sql(self, expression: exp.Create, locations: defaultdict) -> str:
    """Generate the creatable part of CREATE, placing POST_NAME properties.

    When the created kind is one of `ON_CLUSTER_TARGETS` and there are
    properties located at POST_NAME, the output is the object name, then
    those properties, then the schema columns (if any), each separated by
    `self.sep()`. Otherwise the base generator handles it.
    """
    post_name = exp.Properties.Location.POST_NAME

    if not (expression.kind in self.ON_CLUSTER_TARGETS and locations.get(post_name)):
        return super().createable_sql(expression, locations)

    target = expression.this
    # For a Schema target the name lives on the schema's own "this" arg.
    name_holder = target if isinstance(target, exp.Schema) else expression
    name_sql = self.sql(name_holder, "this")

    properties_sql = " ".join(self.sql(prop) for prop in locations[post_name])

    columns_sql = self.schema_columns_sql(target)
    if columns_sql:
        columns_sql = f"{self.sep()}{columns_sql}"
    else:
        columns_sql = ""

    return f"{name_sql}{self.sep()}{properties_sql}{columns_sql}"
def create_sql(self, expression: exp.Create) -> str:
    """Generate CREATE, moving the comment property after a CTAS query.

    The comment property comes last in CTAS statements, i.e. after the
    query. When the CREATE has a query and a SchemaCommentProperty is
    found, that property is detached from the tree, the query is replaced
    by a parenthesized version of itself, and the comment is appended to
    the SQL produced by the base generator.
    """
    comment_prop = None
    query = expression.expression

    if isinstance(query, exp.Query):
        comment_prop = expression.find(exp.SchemaCommentProperty)
        if comment_prop:
            comment_prop.pop()
            query.replace(exp.paren(query))

    base_sql = super().create_sql(expression)

    trailing_comment = self.sql(comment_prop)
    if trailing_comment:
        return f"{base_sql} {trailing_comment}"

    return f"{base_sql}"
def
indexcolumnconstraint_sql( self, expression: sqlglot.expressions.constraints.IndexColumnConstraint) -> str:
def indexcolumnconstraint_sql(self, expression: exp.IndexColumnConstraint) -> str:
    """Generate `INDEX [name] [expr] [TYPE t] [GRANULARITY g]`.

    Each part is emitted, prefixed by a single space, only when its
    rendered SQL is non-empty.
    """
    name_sql = self.sql(expression, "this")
    expr_sql = self.sql(expression, "expression")
    type_sql = self.sql(expression, "index_type")
    granularity_sql = self.sql(expression, "granularity")

    pieces = ["INDEX"]
    if name_sql:
        pieces.append(f" {name_sql}")
    if expr_sql:
        pieces.append(f" {expr_sql}")
    if type_sql:
        pieces.append(f" TYPE {type_sql}")
    if granularity_sql:
        pieces.append(f" GRANULARITY {granularity_sql}")

    return "".join(pieces)
def not_sql(self, expression: exp.Not) -> str:
    """Generate SQL for NOT, with special handling of a negated IN.

    A negated IN flagged `is_global` is rendered through the child alone,
    letting the `GLOBAL IN` child interpose the `NOT`. Any other negated IN
    is wrapped in parentheses (in place) before the base generator runs.
    """
    operand = expression.this

    if isinstance(operand, exp.In):
        if operand.args.get("is_global"):
            return self.sql(expression, "this")

        expression.set("this", exp.paren(operand, copy=False))

    return super().not_sql(expression)
def
values_sql( self, expression: sqlglot.expressions.query.Values, values_as_table: bool = True) -> str:
def values_sql(self, expression: exp.Values, values_as_table: bool = True) -> str:
    """Generate SQL for VALUES, deciding whether to treat it as a table.

    If the VALUES clause contains tuples of expressions, it needs to be
    treated as a table since ClickHouse will automatically alias it as
    such. The decision is recomputed here from the expression itself: with
    an alias that has columns and at least one row, it is a table only if
    the first row contains a Tuple; in every other case it is a table.
    The incoming `values_as_table` argument does not influence the result.
    """
    as_table = True

    alias = expression.args.get("alias")
    if alias and alias.args.get("columns") and expression.expressions:
        first_row = expression.expressions[0]
        as_table = any(isinstance(item, exp.Tuple) for item in first_row.expressions)

    return super().values_sql(expression, values_as_table=as_table)
def timestamptrunc_sql(self, expression: exp.TimestampTrunc) -> str:
    """Generate `dateTrunc(unit, this, zone)` for a timestamp truncation.

    For dialect versions below (23, 12), a string unit is replaced by a
    lowercased string literal; see
    https://clickhouse.com/docs/whats-new/changelog/2023#improvement
    """
    unit = unit_to_str(expression)

    lowercase_unit = self.dialect.version < (23, 12) and unit and unit.is_string
    if lowercase_unit:
        unit = exp.Literal.string(unit.name.lower())

    zone = expression.args.get("zone")
    return self.func("dateTrunc", unit, expression.this, zone)
Inherited Members
- sqlglot.generator.Generator
- Generator
- NULL_ORDERING_SUPPORTED
- WINDOW_FUNCS_WITH_NULL_ORDERING
- IGNORE_NULLS_IN_FUNC
- IGNORE_NULLS_BEFORE_ORDER
- LOCKING_READS_SUPPORTED
- EXCEPT_INTERSECT_SUPPORT_ALL_CLAUSE
- CREATE_FUNCTION_RETURN_AS
- MATCHED_BY_SOURCE
- SUPPORTS_MERGE_WHERE
- SINGLE_STRING_INTERVAL
- INTERVAL_ALLOWS_PLURAL_FORM
- LIMIT_FETCH
- LIMIT_ONLY_LITERALS
- RENAME_TABLE_WITH_DB
- INDEX_ON
- INOUT_SEPARATOR
- DIRECTED_JOINS
- QUERY_HINT_SEP
- IS_BOOL_ALLOWED
- DUPLICATE_KEY_UPDATE_WITH_SET
- LIMIT_IS_TOP
- RETURNING_END
- EXTRACT_ALLOWS_QUOTES
- TZ_TO_WITH_TIME_ZONE
- VALUES_AS_TABLE
- ALTER_TABLE_INCLUDE_COLUMN_KEYWORD
- UNNEST_WITH_ORDINALITY
- AGGREGATE_FILTER_SUPPORTED
- SEMI_ANTI_JOIN_WITH_SIDE
- COMPUTED_COLUMN_WITH_TYPE
- SUPPORTS_TABLE_COPY
- TABLESAMPLE_WITH_METHOD
- TABLESAMPLE_SEED_KEYWORD
- COLLATE_IS_FUNC
- DATA_TYPE_SPECIFIERS_ALLOWED
- ENSURE_BOOLS
- CTE_RECURSIVE_KEYWORD_REQUIRED
- SUPPORTS_SINGLE_ARG_CONCAT
- SUPPORTS_TABLE_ALIAS_COLUMNS
- UNPIVOT_ALIASES_ARE_IDENTIFIERS
- JSON_KEY_VALUE_PAIR_SEP
- INSERT_OVERWRITE
- SUPPORTS_SELECT_INTO
- SUPPORTS_UNLOGGED_TABLES
- SUPPORTS_CREATE_TABLE_LIKE
- LIKE_PROPERTY_INSIDE_SCHEMA
- MULTI_ARG_DISTINCT
- JSON_TYPE_REQUIRED_FOR_EXTRACTION
- JSON_PATH_BRACKETED_KEY_SUPPORTED
- JSON_PATH_SINGLE_QUOTE_ESCAPE
- SUPPORTS_WINDOW_EXCLUDE
- COPY_PARAMS_ARE_WRAPPED
- COPY_PARAMS_EQ_REQUIRED
- COPY_HAS_INTO_KEYWORD
- UNICODE_SUBSTITUTE
- STAR_EXCEPT
- HEX_FUNC
- WITH_PROPERTIES_PREFIX
- QUOTE_JSON_PATH
- PAD_FILL_PATTERN_IS_REQUIRED
- SUPPORTS_EXPLODING_PROJECTIONS
- ARRAY_CONCAT_IS_VAR_LEN
- SUPPORTS_CONVERT_TIMEZONE
- SUPPORTS_MEDIAN
- SUPPORTS_UNIX_SECONDS
- ALTER_SET_WRAPPED
- NORMALIZE_EXTRACT_DATE_PARTS
- PARSE_JSON_NAME
- ALTER_SET_TYPE
- ARRAY_SIZE_DIM_REQUIRED
- SUPPORTS_BETWEEN_FLAGS
- SUPPORTS_LIKE_QUANTIFIERS
- MATCH_AGAINST_TABLE_PREFIX
- SET_ASSIGNMENT_REQUIRES_VARIABLE_KEYWORD
- DECLARE_DEFAULT_ASSIGNMENT
- UPDATE_STATEMENT_SUPPORTS_FROM
- STAR_EXCLUDE_REQUIRES_DERIVED_TABLE
- SUPPORTS_DROP_ALTER_ICEBERG_PROPERTY
- UNSUPPORTED_TYPES
- TIME_PART_SINGULARS
- TOKEN_MAPPING
- PARAMETER_TOKEN
- NAMED_PLACEHOLDER_TOKEN
- EXPRESSION_PRECEDES_PROPERTIES_CREATABLES
- RESERVED_KEYWORDS
- WITH_SEPARATED_COMMENTS
- EXCLUDE_COMMENTS
- UNWRAPPED_INTERVAL_VALUES
- PARAMETERIZABLE_TEXT_TYPES
- EXPRESSIONS_WITHOUT_NESTED_CTES
- RESPECT_IGNORE_NULLS_UNSUPPORTED_EXPRESSIONS
- SAFE_JSON_PATH_KEY_RE
- SENTINEL_LINE_BREAK
- pretty
- identify
- normalize
- pad
- unsupported_level
- max_unsupported
- leading_comma
- max_text_width
- comments
- dialect
- normalize_functions
- unsupported_messages
- generate
- preprocess
- unsupported
- sep
- seg
- sanitize_comment
- maybe_comment
- wrap
- no_identify
- normalize_func
- indent
- sql
- uncache_sql
- cache_sql
- characterset_sql
- column_parts
- column_sql
- pseudocolumn_sql
- columnposition_sql
- columndef_sql
- columnconstraint_sql
- computedcolumnconstraint_sql
- autoincrementcolumnconstraint_sql
- compresscolumnconstraint_sql
- generatedasidentitycolumnconstraint_sql
- generatedasrowcolumnconstraint_sql
- periodforsystemtimeconstraint_sql
- notnullcolumnconstraint_sql
- primarykeycolumnconstraint_sql
- uniquecolumnconstraint_sql
- inoutcolumnconstraint_sql
- sequenceproperties_sql
- triggerproperties_sql
- triggerreferencing_sql
- triggerevent_sql
- clone_sql
- describe_sql
- heredoc_sql
- prepend_ctes
- with_sql
- tablealias_sql
- bitstring_sql
- hexstring_sql
- bytestring_sql
- unicodestring_sql
- rawstring_sql
- datatypeparam_sql
- directory_sql
- delete_sql
- drop_sql
- set_operation
- set_operations
- fetch_sql
- limitoptions_sql
- filter_sql
- hint_sql
- indexparameters_sql
- index_sql
- identifier_sql
- hex_sql
- lowerhex_sql
- inputoutputformat_sql
- national_sql
- properties_sql
- root_properties
- properties
- with_properties
- locate_properties
- property_name
- property_sql
- uuidproperty_sql
- fallbackproperty_sql
- journalproperty_sql
- freespaceproperty_sql
- checksumproperty_sql
- mergeblockratioproperty_sql
- moduleproperty_sql
- datablocksizeproperty_sql
- blockcompressionproperty_sql
- isolatedloadingproperty_sql
- partitionboundspec_sql
- partitionedofproperty_sql
- lockingproperty_sql
- withdataproperty_sql
- withsystemversioningproperty_sql
- insert_sql
- introducer_sql
- kill_sql
- pseudotype_sql
- objectidentifier_sql
- onconflict_sql
- returning_sql
- rowformatdelimitedproperty_sql
- withtablehint_sql
- indextablehint_sql
- historicaldata_sql
- table_parts
- table_sql
- tablefromrows_sql
- tablesample_sql
- pivot_sql
- version_sql
- tuple_sql
- update_sql
- var_sql
- into_sql
- from_sql
- groupingsets_sql
- rollup_sql
- rollupindex_sql
- rollupproperty_sql
- cube_sql
- group_sql
- having_sql
- connect_sql
- prior_sql
- join_sql
- lambda_sql
- lateral_op
- lateral_sql
- limit_sql
- setitem_sql
- set_sql
- queryband_sql
- pragma_sql
- lock_sql
- literal_sql
- escape_str
- loaddata_sql
- null_sql
- boolean_sql
- booland_sql
- boolor_sql
- order_sql
- withfill_sql
- cluster_sql
- distribute_sql
- sort_sql
- ordered_sql
- matchrecognizemeasure_sql
- matchrecognize_sql
- query_modifiers
- options_modifier
- for_modifiers
- queryoption_sql
- offset_limit_modifiers
- select_sql
- schema_sql
- schema_columns_sql
- star_sql
- parameter_sql
- sessionparameter_sql
- subquery_sql
- qualify_sql
- unnest_sql
- where_sql
- window_sql
- partition_by_sql
- windowspec_sql
- withingroup_sql
- between_sql
- bracket_offset_expressions
- bracket_sql
- all_sql
- any_sql
- exists_sql
- case_sql
- constraint_sql
- nextvaluefor_sql
- extract_sql
- trim_sql
- convert_concat_args
- concat_sql
- concatws_sql
- check_sql
- foreignkey_sql
- primarykey_sql
- if_sql
- matchagainst_sql
- jsonkeyvalue_sql
- jsonpath_sql
- json_path_part
- formatjson_sql
- formatphrase_sql
- jsonarray_sql
- jsonarrayagg_sql
- jsoncolumndef_sql
- jsonschema_sql
- jsontable_sql
- openjsoncolumndef_sql
- openjson_sql
- in_unnest_op
- interval_sql
- return_sql
- reference_sql
- anonymous_sql
- paren_sql
- neg_sql
- alias_sql
- pivotalias_sql
- aliases_sql
- atindex_sql
- attimezone_sql
- fromtimezone_sql
- add_sql
- and_sql
- or_sql
- xor_sql
- connector_sql
- bitwiseand_sql
- bitwiseleftshift_sql
- bitwisenot_sql
- bitwiseor_sql
- bitwiserightshift_sql
- bitwisexor_sql
- strtotime_sql
- currentdate_sql
- collate_sql
- command_sql
- comment_sql
- mergetreettlaction_sql
- mergetreettl_sql
- transaction_sql
- commit_sql
- rollback_sql
- altercolumn_sql
- alterindex_sql
- alterdiststyle_sql
- altersortkey_sql
- alterrename_sql
- renamecolumn_sql
- alterset_sql
- alter_sql
- altersession_sql
- add_column_sql
- droppartition_sql
- addconstraint_sql
- addpartition_sql
- distinct_sql
- ignorenulls_sql
- respectnulls_sql
- havingmax_sql
- intdiv_sql
- dpipe_sql
- div_sql
- safedivide_sql
- overlaps_sql
- distance_sql
- dot_sql
- propertyeq_sql
- escape_sql
- glob_sql
- gt_sql
- gte_sql
- like_sql
- ilike_sql
- match_sql
- similarto_sql
- lt_sql
- lte_sql
- mod_sql
- mul_sql
- nullsafeeq_sql
- nullsafeneq_sql
- sub_sql
- jsoncast_sql
- try_sql
- log_sql
- use_sql
- binary
- ceil_floor
- function_fallback_sql
- func
- format_args
- too_wide
- format_time
- expressions
- op_expressions
- naked_property
- tag_sql
- token_sql
- userdefinedfunction_sql
- joinhint_sql
- kwarg_sql
- when_sql
- whens_sql
- merge_sql
- tochar_sql
- tonumber_sql
- dictproperty_sql
- dictrange_sql
- dictsubproperty_sql
- duplicatekeyproperty_sql
- uniquekeyproperty_sql
- distributedbyproperty_sql
- clusteredbyproperty_sql
- anyvalue_sql
- querytransform_sql
- indexconstraintoption_sql
- checkcolumnconstraint_sql
- nvl2_sql
- comprehension_sql
- columnprefix_sql
- opclass_sql
- predict_sql
- generateembedding_sql
- generatetext_sql
- generatetable_sql
- generatebool_sql
- generateint_sql
- generatedouble_sql
- mltranslate_sql
- mlforecast_sql
- aiforecast_sql
- featuresattime_sql
- vectorsearch_sql
- forin_sql
- refresh_sql
- toarray_sql
- tsordstotime_sql
- tsordstotimestamp_sql
- tsordstodatetime_sql
- tsordstodate_sql
- unixdate_sql
- lastday_sql
- dateadd_sql
- arrayany_sql
- struct_sql
- partitionrange_sql
- truncatetable_sql
- convert_sql
- copyparameter_sql
- credentials_sql
- copy_sql
- semicolon_sql
- datadeletionproperty_sql
- maskingpolicycolumnconstraint_sql
- gapfill_sql
- scope_resolution
- scoperesolution_sql
- parsejson_sql
- rand_sql
- changes_sql
- pad_sql
- summarize_sql
- explodinggenerateseries_sql
- converttimezone_sql
- json_sql
- jsonvalue_sql
- skipjsoncolumn_sql
- conditionalinsert_sql
- multitableinserts_sql
- oncondition_sql
- jsonextractquote_sql
- jsonexists_sql
- arrayagg_sql
- slice_sql
- apply_sql
- grant_sql
- revoke_sql
- grantprivilege_sql
- grantprincipal_sql
- columns_sql
- overlay_sql
- todouble_sql
- string_sql
- median_sql
- overflowtruncatebehavior_sql
- unixseconds_sql
- arraysize_sql
- attach_sql
- detach_sql
- attachoption_sql
- watermarkcolumnconstraint_sql
- encodeproperty_sql
- includeproperty_sql
- xmlelement_sql
- xmlkeyvalueoption_sql
- partitionbyrangeproperty_sql
- partitionbyrangepropertydynamic_sql
- unpivotcolumns_sql
- analyzesample_sql
- analyzestatistics_sql
- analyzehistogram_sql
- analyzedelete_sql
- analyzelistchainedrows_sql
- analyzevalidate_sql
- analyze_sql
- xmltable_sql
- xmlnamespace_sql
- export_sql
- declare_sql
- declareitem_sql
- recursivewithsearch_sql
- parameterizedagg_sql
- anonymousaggfunc_sql
- combinedaggfunc_sql
- combinedparameterizedagg_sql
- show_sql
- install_sql
- get_put_sql
- translatecharacters_sql
- decodecase_sql
- semanticview_sql
- getextract_sql
- datefromunixdate_sql
- space_sql
- buildproperty_sql
- refreshtriggerproperty_sql
- modelattribute_sql
- directorystage_sql
- uuid_sql
- initcap_sql
- localtime_sql
- localtimestamp_sql
- weekstart_sql
- chr_sql
- block_sql
- storedprocedure_sql
- ifblock_sql
- whileblock_sql
- execute_sql
- executesql_sql
- altermodifysqlsecurity_sql
- usingproperty_sql
- renameindex_sql