forked from apache/datafusion-comet
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathMetadataColumnReader.java
More file actions
111 lines (92 loc) · 3.33 KB
/
MetadataColumnReader.java
File metadata and controls
111 lines (92 loc) · 3.33 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.comet.parquet;
import org.apache.arrow.c.ArrowArray;
import org.apache.arrow.c.ArrowSchema;
import org.apache.arrow.c.Data;
import org.apache.arrow.memory.BufferAllocator;
import org.apache.arrow.memory.RootAllocator;
import org.apache.arrow.vector.FieldVector;
import org.apache.parquet.column.ColumnDescriptor;
import org.apache.spark.sql.types.DataType;
import org.apache.comet.IcebergApi;
import org.apache.comet.vector.CometPlainVector;
import org.apache.comet.vector.CometVector;
/**
 * A metadata column reader that can be extended by {@link RowIndexColumnReader} etc.
 *
 * <p>The vector backing the current batch is imported from the native reader on the first {@link
 * #readBatch(int)} call and reused by later calls until {@link #close()} discards it. {@link
 * #setBatchSize(int)} closes the reader first, so the vector is re-imported on the next read.
 */
@IcebergApi
public class MetadataColumnReader extends AbstractColumnReader {
  private final BufferAllocator allocator = new RootAllocator();

  /** Vector for the current batch; {@code null} until the first read and again after close. */
  private CometVector vector;

  /** C Data Interface structs used to receive the batch exported by the native reader. */
  private ArrowArray array = null;

  private ArrowSchema schema = null;

  /** Forwarded unchanged to the {@link CometPlainVector} created in {@link #readBatch(int)}. */
  private final boolean isConstant;

  /**
   * Creates a reader for the column described by {@code descriptor}.
   *
   * @param type Spark data type, forwarded to the superclass
   * @param descriptor Parquet column descriptor, forwarded to the superclass
   * @param useDecimal128 forwarded to the superclass
   * @param isConstant passed to the {@link CometPlainVector} that wraps the imported batch
   * @see <a href="https://github.com/apache/datafusion-comet/issues/2079">Comet Issue #2079</a>
   */
  @IcebergApi
  public MetadataColumnReader(
      DataType type, ColumnDescriptor descriptor, boolean useDecimal128, boolean isConstant) {
    // TODO: should we handle legacy dates & timestamps for metadata columns?
    // NOTE(review): the trailing `false` is presumably the legacy date/timestamp switch that the
    // TODO above refers to - confirm against AbstractColumnReader.
    super(type, descriptor, useDecimal128, false);
    this.isConstant = isConstant;
  }

  /**
   * Used by Iceberg. Same as the {@link ColumnDescriptor} constructor, except that the descriptor
   * is built from {@code spec} via {@link Utils#buildColumnDescriptor}.
   *
   * @param type Spark data type, forwarded to the superclass
   * @param spec column specification converted into a Parquet column descriptor
   * @param useDecimal128 forwarded to the superclass
   * @param isConstant passed to the {@link CometPlainVector} that wraps the imported batch
   */
  @IcebergApi
  public MetadataColumnReader(
      DataType type, ParquetColumnSpec spec, boolean useDecimal128, boolean isConstant) {
    // TODO: should we handle legacy dates & timestamps for metadata columns?
    super(type, Utils.buildColumnDescriptor(spec), useDecimal128, false);
    this.isConstant = isConstant;
  }

  /**
   * Closes this reader, dropping any cached vector, and then delegates to the superclass.
   *
   * @param batchSize the new batch size, forwarded to the superclass
   */
  @Override
  public void setBatchSize(int batchSize) {
    close();
    super.setBatchSize(batchSize);
  }

  /**
   * Makes the current batch available through {@link #currentBatch()} and sets its value count.
   *
   * <p>The vector is imported from the native reader only when none is cached; otherwise only the
   * value count of the cached vector is updated.
   *
   * @param total number of values to report for the batch
   */
  @IcebergApi
  @Override
  public void readBatch(int total) {
    if (vector == null) {
      vector = importCurrentBatch();
    }
    vector.setNumValues(total);
  }

  /**
   * Sets the null count on the current vector.
   *
   * <p>Requires that {@link #readBatch(int)} has already created the vector; calling this while
   * no vector is cached throws {@link NullPointerException}.
   *
   * @param total number of null values to report
   */
  void setNumNulls(int total) {
    vector.setNumNulls(total);
  }

  /**
   * Returns the vector for the current batch.
   *
   * @return the cached vector, or {@code null} if no batch has been read since construction or
   *     since the last {@link #close()}
   */
  @IcebergApi
  @Override
  public CometVector currentBatch() {
    return vector;
  }

  /** Closes and forgets the cached vector, if any, and then closes the superclass. */
  @Override
  public void close() {
    if (vector != null) {
      vector.close();
      vector = null;
    }
    super.close();
  }

  /**
   * Asks the native reader to export its current batch and wraps the result in a {@link
   * CometPlainVector}. Everything allocated along the way is released if any step fails.
   */
  private CometVector importCurrentBatch() {
    FieldVector fieldVector = null;
    boolean imported = false;
    try {
      array = ArrowArray.allocateNew(allocator);
      schema = ArrowSchema.allocateNew(allocator);
      long arrayAddr = array.memoryAddress();
      long schemaAddr = schema.memoryAddress();
      Native.currentBatch(nativeHandle, arrayAddr, schemaAddr);
      fieldVector = Data.importVector(allocator, array, schema, null);
      CometVector result = new CometPlainVector(fieldVector, useDecimal128, false, isConstant);
      imported = true;
      return result;
    } finally {
      if (!imported) {
        // Without this the structs (and possibly the imported vector) stay allocated from
        // `allocator` with nothing left that would ever close them.
        if (fieldVector != null) {
          fieldVector.close();
        }
        releaseCDataStructs();
      }
    }
  }

  /**
   * Closes and forgets the C Data Interface structs.
   *
   * <p>NOTE(review): this may run after the Arrow importer has already closed one or both
   * structs; it relies on their {@code close()} being safe to call again - confirm for the Arrow
   * version in use.
   */
  private void releaseCDataStructs() {
    if (array != null) {
      array.close();
      array = null;
    }
    if (schema != null) {
      schema.close();
      schema = null;
    }
  }
}