Skip to content

Commit afba0ab

Browse files
OutSquareCapital and evertlammerts
authored and committed
Typing: added ParquetCompression and ProfilerFormat literals
1 parent 1c610f6 commit afba0ab

File tree

2 files changed

+29
-18
lines changed

2 files changed

+29
-18
lines changed

_duckdb-stubs/__init__.pyi

Lines changed: 16 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -38,6 +38,8 @@ if typing.TYPE_CHECKING:
3838
CsvCompression,
3939
HiveTypes,
4040
ColumnsTypes,
41+
ProfilerFormat,
42+
ParquetCompression,
4143
)
4244
from ._enums import ExplainTypeLiteral, CSVLineTerminatorLiteral, RenderModeLiteral
4345
from duckdb import sqltypes, func
@@ -302,7 +304,7 @@ class DuckDBPyConnection:
302304
filename: bool = False,
303305
hive_partitioning: bool = False,
304306
union_by_name: bool = False,
305-
compression: str | None = None,
307+
compression: ParquetCompression | None = None,
306308
) -> DuckDBPyRelation: ...
307309
@typing.overload
308310
def from_parquet(
@@ -314,7 +316,7 @@ class DuckDBPyConnection:
314316
filename: bool = False,
315317
hive_partitioning: bool = False,
316318
union_by_name: bool = False,
317-
compression: str | None = None,
319+
compression: ParquetCompression | None = None,
318320
) -> DuckDBPyRelation: ...
319321
def from_query(self, query: str, *, alias: str = "", params: object = None) -> DuckDBPyRelation: ...
320322
def get_table_names(self, query: str, *, qualified: bool = False) -> set[str]: ...
@@ -327,7 +329,7 @@ class DuckDBPyConnection:
327329
repository_url: str | None = None,
328330
version: str | None = None,
329331
) -> None: ...
330-
def get_profiling_information(self, format: str = "json") -> str: ...
332+
def get_profiling_information(self, format: ProfilerFormat = "json") -> str: ...
331333
def enable_profiling(self) -> None: ...
332334
def disable_profiling(self) -> None: ...
333335
def interrupt(self) -> None: ...
@@ -426,7 +428,7 @@ class DuckDBPyConnection:
426428
filename: bool = False,
427429
hive_partitioning: bool = False,
428430
union_by_name: bool = False,
429-
compression: str | None = None,
431+
compression: ParquetCompression | None = None,
430432
) -> DuckDBPyRelation: ...
431433
@typing.overload
432434
def read_parquet(
@@ -438,7 +440,7 @@ class DuckDBPyConnection:
438440
filename: bool = False,
439441
hive_partitioning: bool = False,
440442
union_by_name: bool = False,
441-
compression: typing.Any = None,
443+
compression: ParquetCompression | None = None,
442444
) -> DuckDBPyRelation: ...
443445
def register(self, view_name: str, python_object: object) -> DuckDBPyConnection: ...
444446
def register_filesystem(self, filesystem: fsspec.AbstractFileSystem) -> None: ...
@@ -725,7 +727,7 @@ class DuckDBPyRelation:
725727
self,
726728
file_name: str,
727729
*,
728-
compression: str | None = None,
730+
compression: ParquetCompression | None = None,
729731
field_ids: ParquetFieldsOptions | None = None,
730732
row_group_size_bytes: int | str | None = None,
731733
row_group_size: int | None = None,
@@ -781,7 +783,7 @@ class DuckDBPyRelation:
781783
self,
782784
file_name: str,
783785
*,
784-
compression: str | None = None,
786+
compression: ParquetCompression | None = None,
785787
field_ids: ParquetFieldsOptions | None = None,
786788
row_group_size_bytes: str | int | None = None,
787789
row_group_size: int | None = None,
@@ -1039,7 +1041,7 @@ def from_parquet(
10391041
filename: bool = False,
10401042
hive_partitioning: bool = False,
10411043
union_by_name: bool = False,
1042-
compression: str | None = None,
1044+
compression: ParquetCompression | None = None,
10431045
connection: DuckDBPyConnection | None = None,
10441046
) -> DuckDBPyRelation: ...
10451047
@typing.overload
@@ -1051,7 +1053,7 @@ def from_parquet(
10511053
filename: bool = False,
10521054
hive_partitioning: bool = False,
10531055
union_by_name: bool = False,
1054-
compression: typing.Any = None,
1056+
compression: ParquetCompression | None = None,
10551057
connection: DuckDBPyConnection | None = None,
10561058
) -> DuckDBPyRelation: ...
10571059
def from_query(
@@ -1081,7 +1083,9 @@ def limit(
10811083
*,
10821084
connection: DuckDBPyConnection | None = None,
10831085
) -> DuckDBPyRelation: ...
1084-
def get_profiling_information(*, connection: DuckDBPyConnection | None = None, format: str = "json") -> str: ...
1086+
def get_profiling_information(
1087+
*, connection: DuckDBPyConnection | None = None, format: ProfilerFormat = "json"
1088+
) -> str: ...
10851089
def enable_profiling(*, connection: DuckDBPyConnection | None = None) -> None: ...
10861090
def disable_profiling(*, connection: DuckDBPyConnection | None = None) -> None: ...
10871091
def list_filesystems(*, connection: DuckDBPyConnection | None = None) -> list[str]: ...
@@ -1208,7 +1212,7 @@ def read_parquet(
12081212
filename: bool = False,
12091213
hive_partitioning: bool = False,
12101214
union_by_name: bool = False,
1211-
compression: str | None = None,
1215+
compression: ParquetCompression | None = None,
12121216
connection: DuckDBPyConnection | None = None,
12131217
) -> DuckDBPyRelation: ...
12141218
@typing.overload
@@ -1220,7 +1224,7 @@ def read_parquet(
12201224
filename: bool = False,
12211225
hive_partitioning: bool = False,
12221226
union_by_name: bool = False,
1223-
compression: typing.Any = None,
1227+
compression: ParquetCompression | None = None,
12241228
connection: DuckDBPyConnection | None = None,
12251229
) -> DuckDBPyRelation: ...
12261230
def register(

_duckdb-stubs/_typing.pyi

Lines changed: 13 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -138,7 +138,7 @@ PyTypeIds: TypeAlias = Builtins | NestedIds
138138
StrIntoPyType: TypeAlias = Builtins | Literal["json"] | str
139139
"""Any `str` that can be converted into a `DuckDBPyType`.
140140
141-
The pytypes not present in the literal values are the composed ones, like `STRUCT` or `DECIMAL`.
141+
The `DuckDBPyType` values not present in the literal options are the composed ones, like `STRUCT` or `DECIMAL`.
142142
143143
Note:
144144
A `StrEnum` will be handled the same way as a `str`."""
@@ -186,21 +186,28 @@ _Auto: TypeAlias = Literal["auto"]
186186
ParquetFieldsOptions: TypeAlias = _Auto | ParquetFieldIdsType
187187
"""Types accepted for the `field_ids` parameter in parquet writing methods."""
188188

189-
_CompressionOptions: TypeAlias = Literal["none", "gzip", "zstd"]
190-
"""Generally available compression options."""
191-
192-
CsvCompression: TypeAlias = _Auto | _CompressionOptions
193189
CsvEncoding: TypeAlias = Literal["utf-8", "utf-16", "latin-1"] | str
194190
"""Encoding options.
195191
196192
All available options not in the literal values can be seen here:
197193
https://duckdb.org/docs/stable/core_extensions/encodings
198194
"""
199-
JsonCompression: TypeAlias = Literal["auto_detect"] | _CompressionOptions
200195
JsonFormat: TypeAlias = _Auto | Literal["unstructured", "newline_delimited", "array"]
201196
JsonRecordOptions: TypeAlias = _Auto | Literal["true", "false"]
202197

198+
# compression kinds
199+
200+
_CompressionOptions: TypeAlias = Literal["gzip", "zstd"]
201+
"""Generally available compression options."""
202+
_None: TypeAlias = Literal["none"]
203+
CsvCompression: TypeAlias = _Auto | _None | _CompressionOptions
204+
JsonCompression: TypeAlias = Literal["auto_detect"] | _None | _CompressionOptions
205+
ParquetCompression: TypeAlias = Literal["uncompressed", "brotli", "snappy", "lz4", "lz4_raw"] | _CompressionOptions
206+
203207
# Other
204208

205209
JoinType: TypeAlias = Literal["inner", "left", "right", "outer", "semi", "anti"]
206210
"""Types of join accepted by `DuckDBPyRelation.join` method."""
211+
212+
ProfilerFormat: TypeAlias = Literal["json", "query_tree", "query_tree_optimizer", "no_output", "html", "graphviz"]
213+
"""Formats available in `get_profiling_information` method/function."""

0 commit comments

Comments
 (0)