Class: DeltaLake::TableOptimizer
- Inherits: Object
  - Object
    - DeltaLake::TableOptimizer
- Defined in:
- lib/deltalake/table_optimizer.rb
Instance Method Summary
- #compact(partition_filters: nil, target_size: nil, max_concurrent_tasks: nil, min_commit_interval: nil, writer_properties: nil, post_commithook_properties: nil, commit_properties: nil) ⇒ Object
- #initialize(table) ⇒ TableOptimizer (constructor): A new instance of TableOptimizer.
- #z_order(columns, partition_filters: nil, target_size: nil, max_concurrent_tasks: nil, max_spill_size: 20 * 1024 * 1024 * 1024, min_commit_interval: nil, writer_properties: nil, post_commithook_properties: nil, commit_properties: nil) ⇒ Object
Constructor Details
#initialize(table) ⇒ TableOptimizer
Returns a new instance of TableOptimizer.
3 4 5 |
# File 'lib/deltalake/table_optimizer.rb', line 3
#
# Creates an optimizer bound to the given table.
#
# The table is kept in `@table`; nothing else happens at construction time.
#
# @param table [Object] the table this optimizer operates on
#   (presumably a DeltaLake::Table — confirm against the caller)
def initialize(table)
  @table = table
end
Instance Method Details
#compact(partition_filters: nil, target_size: nil, max_concurrent_tasks: nil, min_commit_interval: nil, writer_properties: nil, post_commithook_properties: nil, commit_properties: nil) ⇒ Object
7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 |
# File 'lib/deltalake/table_optimizer.rb', line 7
#
# Runs `compact_optimize` on the underlying `@table._table`, refreshes the
# table with `update_incremental`, and returns the parsed metrics.
#
# Every keyword argument is forwarded positionally and unchanged, except
# `partition_filters`, which is first passed through
# `@table._stringify_partition_values`.
#
# @param partition_filters [Object, nil] filters handed to
#   `_stringify_partition_values` before being forwarded
# @param target_size [Object, nil] forwarded as-is
# @param max_concurrent_tasks [Object, nil] forwarded as-is
# @param min_commit_interval [Object, nil] forwarded as-is
# @param writer_properties [Object, nil] forwarded as-is
# @param post_commithook_properties [Object, nil] forwarded as-is
# @param commit_properties [Object, nil] forwarded as-is
# @return [Object] the value of `JSON.parse` applied to the string returned by
#   `compact_optimize`; its "filesAdded" and "filesRemoved" entries are parsed
#   a second time when they are themselves Strings
def compact(
  partition_filters: nil,
  target_size: nil,
  max_concurrent_tasks: nil,
  min_commit_interval: nil,
  writer_properties: nil,
  post_commithook_properties: nil,
  commit_properties: nil
)
  native_table = @table._table
  filters = @table._stringify_partition_values(partition_filters)

  raw_metrics = native_table.compact_optimize(
    filters,
    target_size,
    max_concurrent_tasks,
    min_commit_interval,
    writer_properties,
    post_commithook_properties,
    commit_properties
  )

  # Reload table state only after the optimize call has returned.
  @table.update_incremental

  # TODO return underscore symbols like delete
  JSON.parse(raw_metrics).tap do |parsed|
    # These two entries can arrive as JSON encoded inside a string.
    %w[filesAdded filesRemoved].each do |field|
      nested = parsed[field]
      parsed[field] = JSON.parse(nested) if nested.is_a?(String)
    end
  end
end
#z_order(columns, partition_filters: nil, target_size: nil, max_concurrent_tasks: nil, max_spill_size: 20 * 1024 * 1024 * 1024, min_commit_interval: nil, writer_properties: nil, post_commithook_properties: nil, commit_properties: nil) ⇒ Object
35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 |
# File 'lib/deltalake/table_optimizer.rb', line 35
#
# Runs `z_order_optimize` on the underlying `@table._table`, refreshes the
# table with `update_incremental`, and returns the parsed metrics.
#
# `columns` is wrapped with `Array(...)`, so a single value or a list are both
# accepted. `partition_filters` is first passed through
# `@table._stringify_partition_values`. All other keyword arguments are
# forwarded positionally and unchanged.
#
# @param columns [Object] one column or a list of columns, coerced with `Array()`
# @param partition_filters [Object, nil] filters handed to
#   `_stringify_partition_values` before being forwarded
# @param target_size [Object, nil] forwarded as-is
# @param max_concurrent_tasks [Object, nil] forwarded as-is
# @param max_spill_size [Integer] forwarded as-is; defaults to
#   20 * 1024 * 1024 * 1024 (20 GiB if the unit is bytes — TODO confirm)
# @param min_commit_interval [Object, nil] forwarded as-is
# @param writer_properties [Object, nil] forwarded as-is
# @param post_commithook_properties [Object, nil] forwarded as-is
# @param commit_properties [Object, nil] forwarded as-is
# @return [Object] the value of `JSON.parse` applied to the string returned by
#   `z_order_optimize`; its "filesAdded" and "filesRemoved" entries are parsed
#   a second time when they are themselves Strings
def z_order(
  columns,
  partition_filters: nil,
  target_size: nil,
  max_concurrent_tasks: nil,
  max_spill_size: 20 * 1024 * 1024 * 1024,
  min_commit_interval: nil,
  writer_properties: nil,
  post_commithook_properties: nil,
  commit_properties: nil
)
  native_table = @table._table
  column_list = Array(columns)
  filters = @table._stringify_partition_values(partition_filters)

  raw_metrics = native_table.z_order_optimize(
    column_list,
    filters,
    target_size,
    max_concurrent_tasks,
    max_spill_size,
    min_commit_interval,
    writer_properties,
    post_commithook_properties,
    commit_properties
  )

  # Reload table state only after the optimize call has returned.
  @table.update_incremental

  # TODO return underscore symbols like delete
  JSON.parse(raw_metrics).tap do |parsed|
    # These two entries can arrive as JSON encoded inside a string.
    %w[filesAdded filesRemoved].each do |field|
      nested = parsed[field]
      parsed[field] = JSON.parse(nested) if nested.is_a?(String)
    end
  end
end