Skip to content

Commit 61bc607

Browse files
committed
Drop unnecessary churn in tests
The last refactor restored toParquetStatistics(stats) and fromParquetStatistics(String, Statistics, PrimitiveTypeName) as static methods, so several test call sites that had been switched to instance calls no longer need to be instance calls. Revert TestParquetFileWriter entirely to its pre-PR state; drop the CREATED_BY constant from TestParquetMetadataConverter (the existing Version.FULL_VERSION references the actual writer version); and revert the three helpers testSkippedV2Stats, testV2OnlyStats and testV2StatsEqualMinMax, plus one round-trip call site, back to the static ParquetMetadataConverter.toParquetStatistics(stats).
1 parent 43e0c29 commit 61bc607

2 files changed

Lines changed: 16 additions & 19 deletions

File tree

parquet-hadoop/src/test/java/org/apache/parquet/format/converter/TestParquetMetadataConverter.java

Lines changed: 11 additions & 15 deletions
Original file line number | Diff line number | Diff line change
@@ -150,7 +150,6 @@ public class TestParquetMetadataConverter {
150150
private static final String CHAR_UPPER = CHAR_LOWER.toUpperCase();
151151
private static final String NUMBER = "0123456789";
152152
private static final String DATA_FOR_RANDOM_STRING = CHAR_LOWER + CHAR_UPPER + NUMBER;
153-
private static final String CREATED_BY = "parquet-mr";
154153

155154
@Rule
156155
public TemporaryFolder temporaryFolder = new TemporaryFolder();
@@ -820,7 +819,7 @@ private void testBinaryStats(StatsHelper helper) {
820819
Assert.assertFalse("Num nulls should not be set", formatStats.isSetNull_count());
821820
ParquetMetadataConverter converter = new ParquetMetadataConverter();
822821
Statistics roundTripStats = converter.fromParquetStatisticsInternal(
823-
CREATED_BY,
822+
Version.FULL_VERSION,
824823
formatStats,
825824
new PrimitiveType(Repetition.OPTIONAL, PrimitiveTypeName.BINARY, ""),
826825
ParquetMetadataConverter.SortOrder.SIGNED);
@@ -1067,8 +1066,8 @@ private void testStillUseStatsWithSignedSortOrderIfSingleValue(StatsHelper helpe
10671066

10681067
PrimitiveType binaryType =
10691068
Types.required(PrimitiveTypeName.BINARY).as(OriginalType.UTF8).named("b");
1070-
Statistics convertedStats =
1071-
converter.fromParquetStatistics(Version.FULL_VERSION, converter.toParquetStatistics(stats), binaryType);
1069+
Statistics convertedStats = converter.fromParquetStatistics(
1070+
Version.FULL_VERSION, ParquetMetadataConverter.toParquetStatistics(stats), binaryType);
10721071

10731072
Assert.assertFalse("Stats should not be empty: " + convertedStats, convertedStats.isEmpty());
10741073
Assert.assertArrayEquals(
@@ -1143,7 +1142,7 @@ public void testMissingValuesFromStats() {
11431142
PrimitiveType type = Types.required(PrimitiveTypeName.INT32).named("test_int32");
11441143

11451144
org.apache.parquet.format.Statistics formatStats = new org.apache.parquet.format.Statistics();
1146-
Statistics<?> stats = converter.fromParquetStatistics(CREATED_BY, formatStats, type);
1145+
Statistics<?> stats = converter.fromParquetStatistics(Version.FULL_VERSION, formatStats, type);
11471146
assertFalse(stats.isNumNullsSet());
11481147
assertFalse(stats.hasNonNullValue());
11491148
assertTrue(stats.isEmpty());
@@ -1152,7 +1151,7 @@ public void testMissingValuesFromStats() {
11521151
formatStats.clear();
11531152
formatStats.setMin(BytesUtils.intToBytes(-100));
11541153
formatStats.setMax(BytesUtils.intToBytes(100));
1155-
stats = converter.fromParquetStatistics(CREATED_BY, formatStats, type);
1154+
stats = converter.fromParquetStatistics(Version.FULL_VERSION, formatStats, type);
11561155
assertFalse(stats.isNumNullsSet());
11571156
assertTrue(stats.hasNonNullValue());
11581157
assertFalse(stats.isEmpty());
@@ -1162,7 +1161,7 @@ public void testMissingValuesFromStats() {
11621161

11631162
formatStats.clear();
11641163
formatStats.setNull_count(2000);
1165-
stats = converter.fromParquetStatistics(CREATED_BY, formatStats, type);
1164+
stats = converter.fromParquetStatistics(Version.FULL_VERSION, formatStats, type);
11661165
assertTrue(stats.isNumNullsSet());
11671166
assertFalse(stats.hasNonNullValue());
11681167
assertFalse(stats.isEmpty());
@@ -1182,8 +1181,7 @@ public void testSkippedV2Stats() {
11821181

11831182
private void testSkippedV2Stats(PrimitiveType type, Object min, Object max) {
11841183
Statistics<?> stats = createStats(type, min, max);
1185-
ParquetMetadataConverter converter = new ParquetMetadataConverter();
1186-
org.apache.parquet.format.Statistics statistics = converter.toParquetStatistics(stats);
1184+
org.apache.parquet.format.Statistics statistics = ParquetMetadataConverter.toParquetStatistics(stats);
11871185
assertFalse(statistics.isSetMin());
11881186
assertFalse(statistics.isSetMax());
11891187
assertFalse(statistics.isSetMin_value());
@@ -1221,8 +1219,7 @@ public void testV2OnlyStats() {
12211219

12221220
private void testV2OnlyStats(PrimitiveType type, Object min, Object max) {
12231221
Statistics<?> stats = createStats(type, min, max);
1224-
ParquetMetadataConverter converter = new ParquetMetadataConverter();
1225-
org.apache.parquet.format.Statistics statistics = converter.toParquetStatistics(stats);
1222+
org.apache.parquet.format.Statistics statistics = ParquetMetadataConverter.toParquetStatistics(stats);
12261223
assertFalse(statistics.isSetMin());
12271224
assertFalse(statistics.isSetMax());
12281225
assertEquals(ByteBuffer.wrap(stats.getMinBytes()), statistics.min_value);
@@ -1264,8 +1261,7 @@ public void testV2StatsEqualMinMax() {
12641261

12651262
private void testV2StatsEqualMinMax(PrimitiveType type, Object min, Object max) {
12661263
Statistics<?> stats = createStats(type, min, max);
1267-
ParquetMetadataConverter converter = new ParquetMetadataConverter();
1268-
org.apache.parquet.format.Statistics statistics = converter.toParquetStatistics(stats);
1264+
org.apache.parquet.format.Statistics statistics = ParquetMetadataConverter.toParquetStatistics(stats);
12691265
assertEquals(ByteBuffer.wrap(stats.getMinBytes()), statistics.min);
12701266
assertEquals(ByteBuffer.wrap(stats.getMaxBytes()), statistics.max);
12711267
assertEquals(ByteBuffer.wrap(stats.getMinBytes()), statistics.min_value);
@@ -1469,7 +1465,7 @@ public void testColumnIndexConversion() {
14691465
org.apache.parquet.format.ColumnIndex parquetColumnIndex =
14701466
converter.toParquetColumnIndex(type, builder.build());
14711467

1472-
ColumnIndex columnIndex = converter.fromParquetColumnIndex(CREATED_BY, type, parquetColumnIndex);
1468+
ColumnIndex columnIndex = converter.fromParquetColumnIndex(Version.FULL_VERSION, type, parquetColumnIndex);
14731469
assertEquals(BoundaryOrder.ASCENDING, columnIndex.getBoundaryOrder());
14741470
assertTrue(List.of(false, true, false).equals(columnIndex.getNullPages()));
14751471
assertTrue(List.of(16l, 111l, 0l).equals(columnIndex.getNullCounts()));
@@ -1498,7 +1494,7 @@ public void testColumnIndexConversion() {
14981494
assertNull(
14991495
"Should ignore unsupported types",
15001496
converter.fromParquetColumnIndex(
1501-
CREATED_BY,
1497+
Version.FULL_VERSION,
15021498
Types.required(PrimitiveTypeName.FIXED_LEN_BYTE_ARRAY)
15031499
.length(12)
15041500
.as(OriginalType.INTERVAL)

parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestParquetFileWriter.java

Lines changed: 5 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -81,6 +81,7 @@
8181
import org.apache.parquet.column.values.bloomfilter.BloomFilter;
8282
import org.apache.parquet.example.data.Group;
8383
import org.apache.parquet.example.data.simple.SimpleGroup;
84+
import org.apache.parquet.format.Statistics;
8485
import org.apache.parquet.hadoop.ParquetOutputFormat.JobSummaryLevel;
8586
import org.apache.parquet.hadoop.example.GroupReadSupport;
8687
import org.apache.parquet.hadoop.example.GroupWriteSupport;
@@ -865,11 +866,11 @@ public void testConvertToThriftStatistics() throws Exception {
865866
parquetMRstats.updateStats(l);
866867
}
867868
final String createdBy = "parquet-mr version 1.8.0 (build d4d5a07ec9bd262ca1e93c309f1d7d4a74ebda4c)";
868-
org.apache.parquet.format.converter.ParquetMetadataConverter converter =
869-
new org.apache.parquet.format.converter.ParquetMetadataConverter();
870-
org.apache.parquet.format.Statistics thriftStats = converter.toParquetStatistics(parquetMRstats);
869+
Statistics thriftStats =
870+
org.apache.parquet.format.converter.ParquetMetadataConverter.toParquetStatistics(parquetMRstats);
871871
LongStatistics convertedBackStats =
872-
(LongStatistics) converter.fromParquetStatistics(createdBy, thriftStats, PrimitiveTypeName.INT64);
872+
(LongStatistics) org.apache.parquet.format.converter.ParquetMetadataConverter.fromParquetStatistics(
873+
createdBy, thriftStats, PrimitiveTypeName.INT64);
873874

874875
assertEquals(parquetMRstats.getMax(), convertedBackStats.getMax());
875876
assertEquals(parquetMRstats.getMin(), convertedBackStats.getMin());

0 commit comments

Comments
 (0)