Class: DeltaLake::TableOptimizer

Inherits:
Object
  • Object
  • DeltaLake::TableOptimizer
Defined in:
lib/deltalake/table_optimizer.rb

Instance Method Summary collapse

Constructor Details

#initialize(table) ⇒ TableOptimizer

Returns a new instance of TableOptimizer.



3
4
5
# File 'lib/deltalake/table_optimizer.rb', line 3

# Builds an optimizer bound to +table+.
#
# The object is stored as-is in +@table+; the other methods of this class
# call +_table+, +_stringify_partition_values+ and +update_incremental+ on it.
#
# @param table [Object] the table wrapper to operate on
#   (presumably a DeltaLake::Table -- confirm against callers)
def initialize(table)
  @table = table
end

Instance Method Details

#compact(partition_filters: nil, target_size: nil, max_concurrent_tasks: nil, min_commit_interval: nil, writer_properties: nil, post_commithook_properties: nil, commit_properties: nil) ⇒ Object



7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
# File 'lib/deltalake/table_optimizer.rb', line 7

# Runs the native +compact_optimize+ operation on the wrapped table and
# returns the metrics it reports.
#
# +partition_filters+ is first passed through
# +@table._stringify_partition_values+; every other keyword argument is
# handed to the native call unchanged, in the order they are declared here.
# After the native call returns, the table is refreshed with
# +update_incremental+.
#
# @param partition_filters [Object, nil] filters forwarded after
#   stringification (exact shape is defined by +_stringify_partition_values+,
#   which is not visible here)
# @param target_size [Object, nil] forwarded as-is
# @param max_concurrent_tasks [Object, nil] forwarded as-is
# @param min_commit_interval [Object, nil] forwarded as-is
# @param writer_properties [Object, nil] forwarded as-is
# @param post_commithook_properties [Object, nil] forwarded as-is
# @param commit_properties [Object, nil] forwarded as-is
# @return [Object] the metrics parsed from the JSON returned by the native
#   call; the "filesAdded" and "filesRemoved" entries are decoded a second
#   time when they arrive as JSON-encoded strings
def compact(
  partition_filters: nil,
  target_size: nil,
  max_concurrent_tasks: nil,
  min_commit_interval: nil,
  writer_properties: nil,
  post_commithook_properties: nil,
  commit_properties: nil
)
  # Resolve the native handle before preparing the filters so the calls on
  # @table happen in the same order as a single inline expression would.
  native_table = @table._table
  string_filters = @table._stringify_partition_values(partition_filters)

  raw_metrics = native_table.compact_optimize(
    string_filters,
    target_size,
    max_concurrent_tasks,
    min_commit_interval,
    writer_properties,
    post_commithook_properties,
    commit_properties
  )

  # Refresh the table only after the native operation has completed.
  @table.update_incremental

  # TODO: return underscore symbols like delete
  JSON.parse(raw_metrics).tap do |parsed|
    %w[filesAdded filesRemoved].each do |field|
      detail = parsed[field]
      # These entries may themselves be JSON text; decode them when so.
      parsed[field] = JSON.parse(detail) if detail.is_a?(String)
    end
  end
end

#z_order(columns, partition_filters: nil, target_size: nil, max_concurrent_tasks: nil, max_spill_size: 20 * 1024 * 1024 * 1024, min_commit_interval: nil, writer_properties: nil, post_commithook_properties: nil, commit_properties: nil) ⇒ Object



35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# File 'lib/deltalake/table_optimizer.rb', line 35

# Runs the native +z_order_optimize+ operation on the wrapped table and
# returns the metrics it reports.
#
# +columns+ is coerced with +Array()+, so a single column or a list are both
# accepted. +partition_filters+ is passed through
# +@table._stringify_partition_values+; the remaining keyword arguments are
# handed to the native call unchanged. After the native call returns, the
# table is refreshed with +update_incremental+.
#
# @param columns [Object, Array] column(s) to order by; wrapped with +Array()+
# @param partition_filters [Object, nil] filters forwarded after
#   stringification (exact shape is defined by +_stringify_partition_values+,
#   which is not visible here)
# @param target_size [Object, nil] forwarded as-is
# @param max_concurrent_tasks [Object, nil] forwarded as-is
# @param max_spill_size [Integer] forwarded as-is; defaults to
#   20 * 1024 * 1024 * 1024 (presumably bytes, i.e. 20 GiB -- confirm
#   against the native layer)
# @param min_commit_interval [Object, nil] forwarded as-is
# @param writer_properties [Object, nil] forwarded as-is
# @param post_commithook_properties [Object, nil] forwarded as-is
# @param commit_properties [Object, nil] forwarded as-is
# @return [Object] the metrics parsed from the JSON returned by the native
#   call; the "filesAdded" and "filesRemoved" entries are decoded a second
#   time when they arrive as JSON-encoded strings
def z_order(
  columns,
  partition_filters: nil,
  target_size: nil,
  max_concurrent_tasks: nil,
  max_spill_size: 20 * 1024 * 1024 * 1024,
  min_commit_interval: nil,
  writer_properties: nil,
  post_commithook_properties: nil,
  commit_properties: nil
)
  # Resolve the native handle first, then prepare the arguments, keeping the
  # same evaluation order as a single inline call expression.
  native_table = @table._table
  column_list = Array(columns)
  string_filters = @table._stringify_partition_values(partition_filters)

  raw_metrics = native_table.z_order_optimize(
    column_list,
    string_filters,
    target_size,
    max_concurrent_tasks,
    max_spill_size,
    min_commit_interval,
    writer_properties,
    post_commithook_properties,
    commit_properties
  )

  # Refresh the table only after the native operation has completed.
  @table.update_incremental

  # TODO: return underscore symbols like delete
  JSON.parse(raw_metrics).tap do |parsed|
    %w[filesAdded filesRemoved].each do |field|
      detail = parsed[field]
      # These entries may themselves be JSON text; decode them when so.
      parsed[field] = JSON.parse(detail) if detail.is_a?(String)
    end
  end
end