-
Notifications
You must be signed in to change notification settings - Fork 330
chore: Add envvars to override writer configs and cometConf minor clean up #3540
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 2 commits
7b341d9
4e8a773
7e04d58
e954bc9
0202a09
cdcf5f7
08e5914
d4595b6
ffe088f
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -54,9 +54,6 @@ object CometConf extends ShimCometConf { | |
| private val TRACING_GUIDE = "For more information, refer to the Comet Tracing " + | ||
| "Guide (https://datafusion.apache.org/comet/contributor-guide/tracing.html)" | ||
|
|
||
| private val DEBUGGING_GUIDE = "For more information, refer to the Comet Debugging " + | ||
| "Guide (https://datafusion.apache.org/comet/contributor-guide/debugging.html)" | ||
|
|
||
| /** List of all configs that is used for generating documentation */ | ||
| val allConfs = new ListBuffer[ConfigEntry[_]] | ||
|
|
||
|
|
@@ -112,7 +109,7 @@ object CometConf extends ShimCometConf { | |
| "feature is highly experimental and only partially implemented. It should not " + | ||
| "be used in production.") | ||
| .booleanConf | ||
| .createWithDefault(false) | ||
| .createWithEnvVarOrDefault("ENABLE_COMET_WRITE", false) | ||
|
|
||
| // Deprecated: native_comet uses mutable buffers incompatible with Arrow FFI best practices | ||
| // and does not support complex types. Use native_iceberg_compat or auto instead. | ||
|
|
@@ -552,13 +549,6 @@ object CometConf extends ShimCometConf { | |
| .booleanConf | ||
| .createWithDefault(false) | ||
|
|
||
| val COMET_DEBUG_MEMORY_ENABLED: ConfigEntry[Boolean] = | ||
| conf(s"$COMET_PREFIX.debug.memory") | ||
| .category(CATEGORY_TESTING) | ||
| .doc(s"When enabled, log all native memory pool interactions. $DEBUGGING_GUIDE.") | ||
| .booleanConf | ||
| .createWithDefault(false) | ||
|
|
||
| val COMET_EXTENDED_EXPLAIN_FORMAT_VERBOSE = "verbose" | ||
| val COMET_EXTENDED_EXPLAIN_FORMAT_FALLBACK = "fallback" | ||
|
|
||
|
|
@@ -795,14 +785,6 @@ object CometConf extends ShimCometConf { | |
| .booleanConf | ||
| .createWithDefault(false) | ||
|
|
||
| val COMET_REGEXP_ALLOW_INCOMPATIBLE: ConfigEntry[Boolean] = | ||
| conf("spark.comet.regexp.allowIncompatible") | ||
| .category(CATEGORY_EXEC) | ||
| .doc("Comet is not currently fully compatible with Spark for all regular expressions. " + | ||
| s"Set this config to true to allow them anyway. $COMPAT_GUIDE.") | ||
| .booleanConf | ||
| .createWithDefault(false) | ||
|
|
||
| val COMET_METRICS_UPDATE_INTERVAL: ConfigEntry[Long] = | ||
| conf("spark.comet.metrics.updateInterval") | ||
| .category(CATEGORY_EXEC) | ||
|
|
@@ -821,13 +803,6 @@ object CometConf extends ShimCometConf { | |
| .stringConf | ||
| .createOptional | ||
|
|
||
| val COMET_MAX_TEMP_DIRECTORY_SIZE: ConfigEntry[Long] = | ||
|
Member
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Some of these configs are used directly from native code. We add them here so that they get documented.
Member
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. in pub(crate) const COMET_TRACING_ENABLED: &str = "spark.comet.tracing.enabled";
pub(crate) const COMET_DEBUG_ENABLED: &str = "spark.comet.debug.enabled";
pub(crate) const COMET_EXPLAIN_NATIVE_ENABLED: &str = "spark.comet.explain.native.enabled";
pub(crate) const COMET_MAX_TEMP_DIRECTORY_SIZE: &str = "spark.comet.maxTempDirectorySize";
pub(crate) const COMET_DEBUG_MEMORY: &str = "spark.comet.debug.memory";
Contributor
Author
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Ic, I'll add comments! |
||
| conf("spark.comet.maxTempDirectorySize") | ||
| .category(CATEGORY_EXEC) | ||
| .doc("The maximum amount of data (in bytes) stored inside the temporary directories.") | ||
| .bytesConf(ByteUnit.BYTE) | ||
| .createWithDefault(100L * 1024 * 1024 * 1024) // 100 GB | ||
|
|
||
| val COMET_RESPECT_DATAFUSION_CONFIGS: ConfigEntry[Boolean] = | ||
| conf(s"$COMET_EXEC_CONFIG_PREFIX.respectDataFusionConfigs") | ||
| .category(CATEGORY_TESTING) | ||
|
|
||
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Removing the config here will remove it from the configuration guide, but maybe that is fine, so long as we are explaining it in the compatibility guide.