Struct datafusion::execution::context::ExecutionConfig [−][src]
pub struct ExecutionConfig {
pub target_partitions: usize,
pub batch_size: usize,
pub physical_optimizers: Vec<Arc<dyn PhysicalOptimizerRule + Send + Sync>>,
pub repartition_joins: bool,
pub repartition_aggregations: bool,
pub repartition_windows: bool,
// some fields omitted
}
Expand description
Configuration options for execution context
Fields
target_partitions: usize
Number of partitions for query execution. Increasing partitions can increase concurrency.
batch_size: usize
Default batch size when reading data sources
physical_optimizers: Vec<Arc<dyn PhysicalOptimizerRule + Send + Sync>>
Responsible for optimizing a physical execution plan
repartition_joins: bool
Should DataFusion repartition data using the join keys to execute joins in parallel
using the provided target_partitions
level
repartition_aggregations: bool
Should DataFusion repartition data using the aggregate keys to execute aggregates in parallel
using the provided target_partitions
level
repartition_windows: bool
Should DataFusion repartition data using the partition keys to execute window functions in
parallel using the provided target_partitions
level
Implementations
Customize target_partitions
Customize batch size
Replace the default query planner
pub fn with_optimizer_rules(
self,
optimizers: Vec<Arc<dyn OptimizerRule + Send + Sync>>
) -> Self
pub fn with_optimizer_rules(
self,
optimizers: Vec<Arc<dyn OptimizerRule + Send + Sync>>
) -> Self
Replace the optimizer rules
pub fn with_physical_optimizer_rules(
self,
physical_optimizers: Vec<Arc<dyn PhysicalOptimizerRule + Send + Sync>>
) -> Self
pub fn with_physical_optimizer_rules(
self,
physical_optimizers: Vec<Arc<dyn PhysicalOptimizerRule + Send + Sync>>
) -> Self
Replace the physical optimizer rules
Adds a new OptimizerRule
pub fn add_physical_optimizer_rule(
self,
optimizer_rule: Arc<dyn PhysicalOptimizerRule + Send + Sync>
) -> Self
pub fn add_physical_optimizer_rule(
self,
optimizer_rule: Arc<dyn PhysicalOptimizerRule + Send + Sync>
) -> Self
Adds a new PhysicalOptimizerRule
Selects a name for the default catalog and schema
Controls whether the default catalog and schema will be automatically created
Enables or disables the inclusion of information_schema
virtual tables
Enables or disables the use of repartitioning for joins to improve parallelism
Enables or disables the use of repartitioning for aggregations to improve parallelism
Enables or disables the use of repartitioning for window functions to improve parallelism
Enables or disables the use of pruning predicate for parquet readers to skip row groups
Trait Implementations
Auto Trait Implementations
impl !RefUnwindSafe for ExecutionConfig
impl Send for ExecutionConfig
impl Sync for ExecutionConfig
impl Unpin for ExecutionConfig
impl !UnwindSafe for ExecutionConfig
Blanket Implementations
Mutably borrows from an owned value. Read more