|
434 | 434 | { |
435 | 435 | "data": { |
436 | 436 | "document_key": "sample.pdf", |
437 | | - "content": "# Hello World", |
| 437 | + "_ab_source_file_parse_error": "Error parsing record. This could be due to a mismatch between the config's file type and the actual file type, or because the file or record is not parseable. Contact Support if you need assistance.\nfilename=sample.pdf message=PDF parsing requires the 'unstructured_inference' package. Install it with: pip install unstructured-inference", |
438 | 438 | "_ab_source_file_last_modified": "2023-06-05T03:54:07.000000Z", |
439 | 439 | "_ab_source_file_url": "sample.pdf", |
440 | 440 | }, |
|
443 | 443 | { |
444 | 444 | "data": { |
445 | 445 | "document_key": "sample.docx", |
446 | | - "content": "# Content", |
| 446 | + "content": "Content", |
447 | 447 | "_ab_source_file_last_modified": "2023-06-06T03:54:07.000000Z", |
448 | 448 | "_ab_source_file_url": "sample.docx", |
449 | 449 | }, |
|
510 | 510 | { |
511 | 511 | "data": { |
512 | 512 | "document_key": "sample.pdf", |
513 | | - "_ab_source_file_parse_error": "Error parsing record. This could be due to a mismatch between the config's file type and the actual file type, or because the file or record is not parseable. Contact Support if you need assistance.\nfilename=sample.pdf message=No /Root object! - Is this really a PDF?", |
| 513 | + "_ab_source_file_parse_error": "Error parsing record. This could be due to a mismatch between the config's file type and the actual file type, or because the file or record is not parseable. Contact Support if you need assistance.\nfilename=sample.pdf message=PDF parsing requires the 'unstructured_inference' package. Install it with: pip install unstructured-inference", |
514 | 514 | "_ab_source_file_last_modified": "2023-06-05T03:54:07.000000Z", |
515 | 515 | "_ab_source_file_url": "sample.pdf", |
516 | 516 | }, |
|
578 | 578 | { |
579 | 579 | "data": { |
580 | 580 | "document_key": "pdf_without_extension", |
581 | | - "content": "# Hello World", |
| 581 | + "_ab_source_file_parse_error": "Error parsing record. This could be due to a mismatch between the config's file type and the actual file type, or because the file or record is not parseable. Contact Support if you need assistance.\nfilename=pdf_without_extension message=PDF parsing requires the 'unstructured_inference' package. Install it with: pip install unstructured-inference", |
582 | 582 | "_ab_source_file_last_modified": "2023-06-05T03:54:07.000000Z", |
583 | 583 | "_ab_source_file_url": "pdf_without_extension", |
584 | 584 | }, |
|
587 | 587 | { |
588 | 588 | "data": { |
589 | 589 | "document_key": "docx_without_extension", |
590 | | - "content": "# Content", |
| 590 | + "content": "Content", |
591 | 591 | "_ab_source_file_last_modified": "2023-06-06T03:54:07.000000Z", |
592 | 592 | "_ab_source_file_url": "docx_without_extension", |
593 | 593 | }, |
|
0 commit comments