sqlglot/sqlglot/__init__.py

"""
.. include:: ../README.md

----
"""

from __future__ import annotations

import logging
import typing as t

from sqlglot import expressions as exp
from sqlglot.dialects.dialect import Dialect as Dialect, Dialects as Dialects
from sqlglot.diff import diff as diff
from sqlglot.errors import (
    ErrorLevel as ErrorLevel,
    ParseError as ParseError,
    TokenError as TokenError,
    UnsupportedError as UnsupportedError,
)
from sqlglot.expressions import (
    Expression as Expression,
    alias_ as alias,
    and_ as and_,
    cast as cast,
    column as column,
    condition as condition,
    except_ as except_,
    from_ as from_,
    func as func,
    intersect as intersect,
    maybe_parse as maybe_parse,
    not_ as not_,
    or_ as or_,
    select as select,
    subquery as subquery,
    table_ as table,
    to_column as to_column,
    to_identifier as to_identifier,
    to_table as to_table,
    union as union,
)
from sqlglot.generator import Generator as Generator
from sqlglot.parser import Parser as Parser
from sqlglot.schema import MappingSchema as MappingSchema, Schema as Schema
from sqlglot.tokens import Tokenizer as Tokenizer, TokenType as TokenType

if t.TYPE_CHECKING:
    from sqlglot._typing import E
    from sqlglot.dialects.dialect import DialectType as DialectType

# Package-wide logger, registered under the fixed name "sqlglot".
logger = logging.getLogger("sqlglot")


# Version metadata lives in the separate `sqlglot._version` module. If that module
# cannot be imported, the failure is logged rather than propagated, so importing the
# package still succeeds. In that case `__version__` and `__version_tuple__` are NOT
# bound in this namespace.
# NOTE(review): the error message suggests `_version` is produced by installing the
# package (e.g. `pip install -e .`) — confirm against the build configuration.
try:
    from sqlglot._version import __version__, __version_tuple__
except ImportError:
    logger.error(
        "Unable to set __version__, run `pip install -e .` or `python setup.py develop` first."
    )


# Module-level default for pretty-printing generated SQL; off unless changed.
pretty = False
"""Whether to format generated SQL by default."""

# Module-level schema instance, created empty at import time.
schema = MappingSchema()
"""The default schema used by SQLGlot (e.g. in the optimizer)."""


def parse(sql: str, read: DialectType = None, **opts) -> t.List[t.Optional[Expression]]:
    """
    Turn a SQL string into syntax trees, one entry per parsed SQL statement.

    Args:
        sql: the SQL text to parse.
        read: the dialect used to interpret `sql` (e.g. "spark", "hive", "presto", "mysql").
            It is resolved via `Dialect.get_or_raise`.
        **opts: other `sqlglot.parser.Parser` options, forwarded unchanged.

    Returns:
        The list of resulting syntax trees; per the return annotation an entry may be `None`.
    """
    return Dialect.get_or_raise(read)().parse(sql, **opts)


@t.overload
def parse_one(sql: str, *, into: t.Type[E], **opts) -> E: ...


@t.overload
def parse_one(sql: str, **opts) -> Expression: ...


def parse_one(
    sql: str, read: DialectType = None, into: t.Optional[exp.IntoType] = None, **opts
) -> Expression:
    """
    Parse a SQL string and hand back the syntax tree of its first statement only.

    Args:
        sql: the SQL text to parse.
        read: the dialect used to interpret `sql` (e.g. "spark", "hive", "presto", "mysql").
        into: the SQLGlot Expression to parse into. When truthy, the dialect's
            `parse_into` is used instead of `parse`.
        **opts: other `sqlglot.parser.Parser` options, forwarded unchanged.

    Returns:
        The syntax tree for the first parsed statement.

    Raises:
        ParseError: if parsing produced no statements at all, or if the first
            statement is falsy (e.g. `None`).
    """
    dialect = Dialect.get_or_raise(read)()
    parsed = dialect.parse_into(into, sql, **opts) if into else dialect.parse(sql, **opts)

    # Only the first statement is of interest. `None` doubles as the "nothing was
    # parsed" marker, so an empty result and a falsy first entry share one error path.
    first = next(iter(parsed), None)
    if not first:
        raise ParseError(f"No expression was parsed from '{sql}'")
    return first


def transpile(
    sql: str,
    read: DialectType = None,
    write: DialectType = None,
    identity: bool = True,
    error_level: t.Optional[ErrorLevel] = None,
    **opts,
) -> t.List[str]:
    """
    Parses the given SQL string in accordance with the source dialect and returns a list of SQL strings
    transformed to conform to the target dialect. Each string in the returned list represents a single
    transformed SQL statement.

    Args:
        sql: the SQL code string to transpile.
        read: the source dialect used to parse the input string (e.g. "spark", "hive", "presto", "mysql").
        write: the target dialect into which the input should be transformed
            (e.g. "spark", "hive", "presto", "mysql").
        identity: if `True` and `write` is `None`, the source dialect is used as both the source
            and the target dialect. If `False`, `write` is used exactly as given.
        error_level: the desired error level of the parser.
        **opts: other `sqlglot.generator.Generator` options.

    Returns:
        The list of transpiled SQL statements, in the order the statements were parsed.
    """
    if identity and write is None:
        write = read

    # Parse first so that problems with the input SQL surface before the target dialect is resolved.
    expressions = parse(sql, read, error_level=error_level)

    # The target dialect is the same for every statement: resolve and instantiate it once
    # rather than once per statement.
    target = Dialect.get_or_raise(write)()
    return [target.generate(expression, **opts) for expression in expressions]
Merging upstream version 10.4.2. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:01:55 +01:00			`"""`
			`.. include:: ../README.md`
Merging upstream version 11.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:23:26 +01:00
Merging upstream version 10.5.10. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:07:05 +01:00			`----`
Merging upstream version 10.4.2. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:01:55 +01:00			`"""`
Merging upstream version 9.0.6. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:51:47 +01:00
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`from __future__ import annotations`

Merging upstream version 15.0.0. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:57:23 +01:00			`import logging`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`import typing as t`

Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00			`from sqlglot import expressions as exp`
Merging upstream version 11.2.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:40:23 +01:00			`from sqlglot.dialects.dialect import Dialect as Dialect, Dialects as Dialects`
			`from sqlglot.diff import diff as diff`
			`from sqlglot.errors import (`
			`ErrorLevel as ErrorLevel,`
			`ParseError as ParseError,`
			`TokenError as TokenError,`
			`UnsupportedError as UnsupportedError,`
			`)`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00			`from sqlglot.expressions import (`
Merging upstream version 11.2.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:40:23 +01:00			`Expression as Expression,`
			`alias_ as alias,`
			`and_ as and_,`
Merging upstream version 11.7.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:52:09 +01:00			`cast as cast,`
Merging upstream version 11.2.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:40:23 +01:00			`column as column,`
			`condition as condition,`
			`except_ as except_,`
			`from_ as from_,`
Merging upstream version 11.7.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:52:09 +01:00			`func as func,`
Merging upstream version 11.2.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:40:23 +01:00			`intersect as intersect,`
			`maybe_parse as maybe_parse,`
			`not_ as not_,`
			`or_ as or_,`
			`select as select,`
			`subquery as subquery,`
			`table_ as table,`
			`to_column as to_column,`
Merging upstream version 11.7.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:52:09 +01:00			`to_identifier as to_identifier,`
Merging upstream version 11.2.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:40:23 +01:00			`to_table as to_table,`
			`union as union,`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00			`)`
Merging upstream version 11.2.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:40:23 +01:00			`from sqlglot.generator import Generator as Generator`
			`from sqlglot.parser import Parser as Parser`
			`from sqlglot.schema import MappingSchema as MappingSchema, Schema as Schema`
			`from sqlglot.tokens import Tokenizer as Tokenizer, TokenType as TokenType`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00
Merging upstream version 10.6.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:09:58 +01:00			`if t.TYPE_CHECKING:`
Merging upstream version 15.0.0. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:57:23 +01:00			`from sqlglot._typing import E`
Merging upstream version 11.2.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:40:23 +01:00			`from sqlglot.dialects.dialect import DialectType as DialectType`
Merging upstream version 10.6.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:09:58 +01:00
Merging upstream version 15.0.0. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:57:23 +01:00			`logger = logging.getLogger("sqlglot")`
Merging upstream version 10.6.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:09:58 +01:00

Merging upstream version 15.0.0. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:57:23 +01:00			`try:`
			`from sqlglot._version import __version__, __version_tuple__`
			`except ImportError:`
			`logger.error(`
			"Unable to set __version__, run `pip install -e .` or `python setup.py develop` first."
			`)`

Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00
			`pretty = False`
Merging upstream version 10.5.10. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:07:05 +01:00			`"""Whether to format generated SQL by default."""`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00
Merging upstream version 9.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:48:46 +01:00			`schema = MappingSchema()`
Merging upstream version 10.5.10. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:07:05 +01:00			`"""The default schema used by SQLGlot (e.g. in the optimizer)."""`
Merging upstream version 9.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:48:46 +01:00
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00
Merging upstream version 10.6.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:09:58 +01:00			`def parse(sql: str, read: DialectType = None, **opts) -> t.List[t.Optional[Expression]]:`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00			`"""`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`Parses the given SQL string into a collection of syntax trees, one per parsed SQL statement.`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00
			`Args:`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`sql: the SQL code string to parse.`
			`read: the SQL dialect to apply during parsing (eg. "spark", "hive", "presto", "mysql").`
Merging upstream version 10.5.10. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:07:05 +01:00			**opts: other `sqlglot.parser.Parser` options.
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00
			`Returns:`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`The resulting syntax tree collection.`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00			`"""`
			`dialect = Dialect.get_or_raise(read)()`
			`return dialect.parse(sql, **opts)`


Merging upstream version 10.6.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:09:58 +01:00			`@t.overload`
Merging upstream version 16.4.0. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 20:04:59 +01:00			`def parse_one(sql: str, , into: t.Type[E], *opts) -> E:`
Merging upstream version 10.6.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:09:58 +01:00			`...`


			`@t.overload`
Merging upstream version 16.4.0. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 20:04:59 +01:00			`def parse_one(sql: str, **opts) -> Expression:`
Merging upstream version 10.6.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:09:58 +01:00			`...`


Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`def parse_one(`
Merging upstream version 16.4.0. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 20:04:59 +01:00			`sql: str, read: DialectType = None, into: t.Optional[exp.IntoType] = None, **opts`
Merging upstream version 10.5.2. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:03:38 +01:00			`) -> Expression:`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00			`"""`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`Parses the given SQL string and returns a syntax tree for the first parsed SQL statement.`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00
			`Args:`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`sql: the SQL code string to parse.`
			`read: the SQL dialect to apply during parsing (eg. "spark", "hive", "presto", "mysql").`
			`into: the SQLGlot Expression to parse into.`
Merging upstream version 10.5.10. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:07:05 +01:00			**opts: other `sqlglot.parser.Parser` options.
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00
			`Returns:`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`The syntax tree for the first parsed statement.`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00			`"""`

			`dialect = Dialect.get_or_raise(read)()`

			`if into:`
			`result = dialect.parse_into(into, sql, **opts)`
			`else:`
			`result = dialect.parse(sql, **opts)`

Merging upstream version 10.5.2. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:03:38 +01:00			`for expression in result:`
			`if not expression:`
			`raise ParseError(f"No expression was parsed from '{sql}'")`
			`return expression`
			`else:`
			`raise ParseError(f"No expression was parsed from '{sql}'")`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00

Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`def transpile(`
			`sql: str,`
Merging upstream version 10.6.3. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:09:58 +01:00			`read: DialectType = None,`
			`write: DialectType = None,`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`identity: bool = True,`
			`error_level: t.Optional[ErrorLevel] = None,`
			`**opts,`
			`) -> t.List[str]:`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00			`"""`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`Parses the given SQL string in accordance with the source dialect and returns a list of SQL strings transformed`
			`to conform to the target dialect. Each string in the returned list represents a single transformed SQL statement.`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00
			`Args:`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`sql: the SQL code string to transpile.`
			`read: the source dialect used to parse the input string (eg. "spark", "hive", "presto", "mysql").`
			`write: the target dialect into which the input should be transformed (eg. "spark", "hive", "presto", "mysql").`
			identity: if set to `True` and if the target dialect is not specified the source dialect will be used as both:
			`the source and the target dialect.`
			`error_level: the desired error level of the parser.`
Merging upstream version 10.5.10. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:07:05 +01:00			**opts: other `sqlglot.generator.Generator` options.
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00
			`Returns:`
Merging upstream version 10.0.1. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 14:53:05 +01:00			`The list of transpiled SQL statements.`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00			`"""`
Merging upstream version 12.2.0. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 15:53:39 +01:00			`write = (read if write is None else write) if identity else write`
Adding upstream version 6.0.4. Signed-off-by: Daniel Baumann <daniel@debian.org> 2025-02-13 06:15:54 +01:00			`return [`
			`Dialect.get_or_raise(write)().generate(expression, **opts)`
			`for expression in parse(sql, read, error_level=error_level)`
			`]`