|
53 | 53 |
|
54 | 54 | import static org.apache.paimon.data.BinaryString.fromString; |
55 | 55 | import static org.assertj.core.api.Assertions.assertThat; |
| 56 | +import static org.assertj.core.api.Assertions.assertThatThrownBy; |
56 | 57 |
|
57 | 58 | /** Test for {@link CsvFileFormat}. */ |
58 | 59 | public class CsvFileFormatTest extends FormatReadWriteTest { |
@@ -444,6 +445,71 @@ public void testCsvOptionsCombinationWriteRead() throws IOException { |
444 | 445 | assertThat(result.get(3).isNullAt(3)).isTrue(); |
445 | 446 | } |
446 | 447 |
|
| 448 | + @Test |
| 449 | + public void testCsvModeWriteRead() throws IOException { |
| 450 | + RowType rowType = |
| 451 | + DataTypes.ROW(DataTypes.INT().notNull(), DataTypes.STRING(), DataTypes.DOUBLE()); |
| 452 | + |
| 453 | + // Test PERMISSIVE mode |
| 454 | + Options permissiveOptions = new Options(); |
| 455 | + permissiveOptions.set(CsvOptions.MODE, CsvOptions.Mode.PERMISSIVE); |
| 456 | + FileFormat format = |
| 457 | + new CsvFileFormatFactory().create(new FormatContext(permissiveOptions, 1024, 1024)); |
| 458 | + Path testFile = new Path(parent, "test_mode_" + UUID.randomUUID() + ".csv"); |
| 459 | + |
| 460 | + fileIO.writeFile(testFile, "1,Alice,aaaa,100.23\n2,Bob,200.75", false); |
| 461 | + List<InternalRow> permissiveResult = read(format, rowType, rowType, testFile); |
| 462 | + assertThat(permissiveResult).hasSize(2); |
| 463 | + assertThat(permissiveResult.get(0).getInt(0)).isEqualTo(1); |
| 464 | + assertThat(permissiveResult.get(0).getString(1).toString()).isEqualTo("Alice"); |
| 465 | + assertThat(permissiveResult.get(0).isNullAt(2)).isTrue(); |
| 466 | + assertThat(permissiveResult.get(1).getInt(0)).isEqualTo(2); |
| 467 | + assertThat(permissiveResult.get(1).getString(1).toString()).isEqualTo("Bob"); |
| 468 | + assertThat(permissiveResult.get(1).getDouble(2)).isEqualTo(200.75); |
| 469 | + |
| 470 | + // Test DROPMALFORMED mode |
| 471 | + Options dropMalformedOptions = new Options(); |
| 472 | + dropMalformedOptions.set(CsvOptions.MODE, CsvOptions.Mode.DROPMALFORMED); |
| 473 | + format = |
| 474 | + new CsvFileFormatFactory() |
| 475 | + .create(new FormatContext(dropMalformedOptions, 1024, 1024)); |
| 476 | + List<InternalRow> dropMalformedResult = read(format, rowType, rowType, testFile); |
| 477 | + assertThat(dropMalformedResult).hasSize(1); |
| 478 | + assertThat(dropMalformedResult.get(0).getInt(0)).isEqualTo(2); |
| 479 | + assertThat(dropMalformedResult.get(0).getString(1).toString()).isEqualTo("Bob"); |
| 480 | + assertThat(dropMalformedResult.get(0).getDouble(2)).isEqualTo(200.75); |
| 481 | + |
| 482 | + // Test FAILFAST mode |
| 483 | + Options failFastOptions = new Options(); |
| 484 | + failFastOptions.set(CsvOptions.MODE, CsvOptions.Mode.FAILFAST); |
| 485 | + assertThatThrownBy( |
| 486 | + () -> { |
| 487 | + read( |
| 488 | + new CsvFileFormatFactory() |
| 489 | + .create(new FormatContext(failFastOptions, 1024, 1024)), |
| 490 | + rowType, |
| 491 | + rowType, |
| 492 | + testFile); |
| 493 | + }) |
| 494 | + .isInstanceOf(IllegalArgumentException.class); |
| 495 | + } |
| 496 | + |
| 497 | + private List<InternalRow> read( |
| 498 | + FileFormat format, RowType fullRowType, RowType readRowType, Path testFile) |
| 499 | + throws IOException { |
| 500 | + try (RecordReader<InternalRow> reader = |
| 501 | + format.createReaderFactory(fullRowType, readRowType, new ArrayList<>()) |
| 502 | + .createReader( |
| 503 | + new FormatReaderContext( |
| 504 | + fileIO, testFile, fileIO.getFileSize(testFile)))) { |
| 505 | + |
| 506 | + InternalRowSerializer serializer = new InternalRowSerializer(readRowType); |
| 507 | + List<InternalRow> result = new ArrayList<>(); |
| 508 | + reader.forEachRemaining(row -> result.add(serializer.copy(row))); |
| 509 | + return result; |
| 510 | + } |
| 511 | + } |
| 512 | + |
447 | 513 | @Override |
448 | 514 | protected RowType rowTypeForFullTypesTest() { |
449 | 515 | RowType.Builder builder = |
@@ -581,16 +647,6 @@ private List<InternalRow> writeThenRead( |
581 | 647 | writer.addElement(row); |
582 | 648 | } |
583 | 649 | } |
584 | | - try (RecordReader<InternalRow> reader = |
585 | | - format.createReaderFactory(fullRowType, rowType, new ArrayList<>()) |
586 | | - .createReader( |
587 | | - new FormatReaderContext( |
588 | | - fileIO, testFile, fileIO.getFileSize(testFile)))) { |
589 | | - |
590 | | - InternalRowSerializer serializer = new InternalRowSerializer(rowType); |
591 | | - List<InternalRow> result = new ArrayList<>(); |
592 | | - reader.forEachRemaining(row -> result.add(serializer.copy(row))); |
593 | | - return result; |
594 | | - } |
| 650 | + return read(format, fullRowType, rowType, testFile); |
595 | 651 | } |
596 | 652 | } |
0 commit comments