feat: New command: bundle: Bundle multiple files into one PDF

MPCodeWriter21 · MPCodeWriter21 · commit 46a7f70d40cf · 2026-04-30T12:08:44.000+03:30
+ It replaces `merge` and `image-to-pdf`
+ Upgraded log21: CLI has changed a bit
diff --git a/README.md b/README.md
@@ -6,6 +6,10 @@ A simple python package that helps with doing simple stuff with PDFs.
 Features
 --------
 
++ [x] **Bundle**: Bundle multiple files into one PDF
+  + [x] PDF inputs
+  + [x] Image inputs (e.g. PNG, JPG, etc.)
+  + [ ] Markdown inputs
 + [x] **Merge PDFs**: Merge multiple PDFs into one PDF
 + [x] **Split PDFs**: Split a PDF into multiple PDFs, each containing a range of pages from
       the original PDF
@@ -17,7 +21,6 @@ Features
 + [ ] Extract images from a PDF
 + [x] **Extract text**: Export text from a PDF file and optionally save it to a text file
 + [ ] Extract links from a PDF
-+ [x] **Image to PDF**: Export one or multiple images as a PDF file
 
 If you want any other feature to be added, feel free to open an [issue](https://github.com/MPCodeWriter21/PDF-To-Image/issues)
 or fork the repo and make a [pull request](https://github.com/MPCodeWriter21/PDF-To-Image/pulls)
@@ -57,79 +60,74 @@ cd PDF-Helper
 uv run pdf-helper <command> [options]
 ```
 
-### Merge PDFs
+### Bundle files into a PDF
 
 Merge multiple PDFs into one PDF:
 
 ```bash
-pdf-helper merge -i <input_file_1> <input_file_2>... <input_file_n> -o <output_file>
+pdf-helper bundle <input_file_1> <input_file_2>... <input_file_n> <output_file>
 
 # E.g. Merge PDFs 1, 2 and 3 into a new PDF
-pdf-helper merge -i 1.pdf 2.pdf 3.pdf -o new.pdf
+pdf-helper bundle 1.pdf 2.pdf 3.pdf new.pdf
+
+# E.g. Take 1.png, 2.jpg, and 3.png and create a PDF named 123.pdf, overwriting it
+# if it already exists
+pdf-helper bundle 1.png 2.jpg 3.png 123.pdf -f
+
+# E.g. Take part1.pdf, image1.png, ending.pdf and bundle them into a PDF named final.pdf
+pdf-helper bundle part1.pdf image1.png ending.pdf final.pdf -v
 ```
 
 ### Split PDFs
 
 Split a PDF into multiple PDFs, each containing a range of pages:
 
 ```bash
-pdf-helper split -i <input_file> -o <output_folder> -s <split_point_1>,<split_point_2>
+pdf-helper split <input_file> <output_folder> -s <split_point_1>,<split_point_2>
 
 # E.g. Split a PDF into three PDFs, one with pages 1-10, the second with pages 11-20 and
 # the third with pages 21-end
-pdf-helper split -i my-pdf.pdf -o my-split-pdfs -s 10,20
+pdf-helper split my-pdf.pdf my-split-pdfs -s 10,20
 
 # E.g. Split a PDF into PDFs each containing one page
-pdf-helper split -i my-pdf.pdf -o my-split-pdfs  # No need to specify split points
+pdf-helper split my-pdf.pdf my-split-pdfs  # No need to specify split points
 ```
 
 ### Export PDF pages as image files
 
 Export PDF pages as image files:
 
 ```bash
-pdf-helper to-image -i <input_file> -o <output_folder> \
+pdf-helper to-image <input_file> <output_folder> \
         -p <page_number_1>,<page_number_2>,...,<page_number_n> -s <scale_factor>
 
 # E.g. Export pages 1, 2, 3 and 6 from a PDF with scale factor 1
-pdf-helper to-image -i 1.pdf -o images -p 1-3,6 -s 1
+pdf-helper to-image 1.pdf images -p 1-3,6 -s 1
 
 # E.g. Export all pages from a PDF with scale 2
-pdf-helper to-image -i my-pdf.pdf -o my-images
+pdf-helper to-image my-pdf.pdf my-images
 ```
 
 ### Remove pages from a PDF
 
 Remove pages from a PDF:
 
 ```bash
-pdf-helper remove-pages -i <input_file> -o <output_file> -p <page_number_1>,<page_number_2>,...,<page_number_n>
+pdf-helper remove-pages <input_file> <output_file> <page_number_1>,<page_number_2>,...,<page_number_n>
 
 # E.g. Remove pages 1, 2, 3 and 6 from a PDF
-pdf-helper remove-pages -i 1.pdf -o new.pdf -p 1-3,6
+pdf-helper remove-pages 1.pdf new.pdf 1-3,6
 ```
 
 ### Export text from a PDF
 
 To extract text from a PDF file and export them to text files you can do as follows:
 
 ```bash
-pdf-helper extract-text -i <input_file> -o <output_file_name>
+pdf-helper extract-text <input_file> -o <output_file_name>
 
 # E.g. Extract text from a PDF named my-pdf.pdf and save it to my-text.txt
-pdf-helper extract-text -i my-pdf.pdf -o my-text.txt
-```
-
-### Export one or multiple images as a PDF file
-
-You simply provide the script with your images, and it will create a PDF file with them:
-
-```bash
-pdf-helper image-to-pdf -i <image_1> <image_2> <image_3> ... -o <output_file>
-
-# E.g. Take 1.png, 2.jpg, and 3.png and create a PDF named 123.pdf and override
-# if already exists
-pdf-helper image-to-pdf -i 1.png 2.jpg 3.png -o 123.pdf -f
+pdf-helper extract-text my-pdf.pdf -o my-text.txt
 ```
 
 About
diff --git a/pyproject.toml b/pyproject.toml
@@ -1,15 +1,15 @@
 [project]
 name = "PDF-Helper"
-version = "0.1.0"
+version = "0.2.0"
 authors = [
   {name = "CodeWriter21(Mehrad Pooryoussof)", email = "CodeWriter21@gmail.com"}
 ]
 description = "A simple python script that helps with doing simple stuff with PDFs."
 readme = {file = "README.md", content-type = "text/markdown"}
 license = {text = "MIT", file = "LICENSE"}
-requires-python = ">=3.9"
+requires-python = ">=3.10"
 dependencies = [
-    "log21>=3.0.0",
+    "log21>=3.3.1",
     "pypdfium2>=4.30.0",
     "Pillow>=11.0.0"
 ]
@@ -41,7 +41,7 @@ wrap-descriptions = 88
 [tool.ruff]
 show-fixes = true
 exclude = ["migrations"]
-target-version = "py39"
+target-version = "py310"
 line-length = 88
 
 [tool.ruff.lint]
diff --git a/src/pdf_helper/__init__.py b/src/pdf_helper/__init__.py
@@ -11,12 +11,70 @@
 from PIL import Image
 from pypdfium2 import PdfImage, PdfBitmap, PdfDocument
 
+__version__ = '0.2.0'
+
 __all__ = [
-    'merge_pdfs', 'remove_pages', 'pdf_to_image', 'extract_text', 'image_to_pdf',
-    'split_pdf', 'watermark_pdf'
+    'bundle', 'merge_pdfs', 'remove_pages', 'pdf_to_image', 'extract_text',
+    'image_to_pdf', 'split_pdf', 'watermark_pdf'
 ]
 
 
+def bundle(
+    input_files: Sequence[str | bytes | Path | os.PathLike[str] | io.BytesIO],
+    output_stream: str | Path | io.BytesIO | io.BufferedWriter
+) -> int:
+    """Bundle multiple files together.
+
+    :param input_files: List of files to bundle together. Each file can be a PDF or an
+        image. Supported image formats are those supported by Pillow.
+    :param output_stream: Output stream to write to.
+    :return: Number of pages in the bundled PDF.
+    """
+    writer = PdfDocument.new()
+    for input_file in input_files:
+        log21.info(f'Adding {input_file}...')
+        if isinstance(input_file, (str, bytes, Path, os.PathLike)):
+            if str(input_file).lower().endswith('.pdf'):
+                reader = PdfDocument(input_file)
+                writer.import_pages(reader)
+            else:
+                image = Image.open(input_file)
+                bitmap = PdfBitmap.from_pil(image)
+                pdf_image = PdfImage.new(writer)
+                pdf_image.set_bitmap(bitmap)
+                matrix = pdfium.PdfMatrix().scale(bitmap.width, bitmap.height)
+                pdf_image.set_matrix(matrix)
+                page = writer.new_page(bitmap.width, bitmap.height)
+                page.insert_obj(pdf_image)
+                page.gen_content()
+                page.close()
+                pdf_image.close()
+                bitmap.close()
+                image.close()
+        elif isinstance(input_file, io.BytesIO):
+            try:
+                reader = PdfDocument(input_file)
+                writer.import_pages(reader)
+            except Exception:
+                image = Image.open(input_file)
+                bitmap = PdfBitmap.from_pil(image)
+                pdf_image = PdfImage.new(writer)
+                pdf_image.set_bitmap(bitmap)
+                matrix = pdfium.PdfMatrix().scale(bitmap.width, bitmap.height)
+                pdf_image.set_matrix(matrix)
+                page = writer.new_page(bitmap.width, bitmap.height)
+                page.insert_obj(pdf_image)
+                page.gen_content()
+                page.close()
+                pdf_image.close()
+                bitmap.close()
+                image.close()
+        else:
+            raise ValueError(f'Unsupported input file type: {type(input_file)}')
+    writer.save(output_stream)
+    return len(writer)
+
+
 def merge_pdfs(
     input_files: Sequence[str | Path | io.TextIOWrapper],
     output_stream: str | Path | io.BytesIO | io.BufferedWriter
@@ -36,6 +94,41 @@ def merge_pdfs(
     return len(writer)
 
 
+def image_to_pdf(
+    input_files: Sequence[str | bytes | Path | os.PathLike[str] | io.BytesIO],
+    output_stream: str | Path | io.BytesIO | io.BufferedWriter
+) -> int:
+    """Convert images to a PDF file.
+
+    :param input_files: List of images to convert.
+    :param output_stream: Output stream to write to.
+    :return: Number of pages in the output PDF
+    """
+    writer = PdfDocument.new()
+    for input_file in input_files:
+        log21.info(f'Adding {input_file}...')
+        # Open the image file
+        image = Image.open(input_file)
+        # Create a bitmap from the image
+        bitmap = PdfBitmap.from_pil(image)
+        # Create a PdfImage object from the bitmap
+        pdf_image = PdfImage.new(writer)
+        pdf_image.set_bitmap(bitmap)
+        matrix = pdfium.PdfMatrix().scale(bitmap.width, bitmap.height)
+        pdf_image.set_matrix(matrix)
+        # Create a new page and insert the PdfImage object
+        page = writer.new_page(bitmap.width, bitmap.height)
+        page.insert_obj(pdf_image)
+        page.gen_content()
+        # Close the objects
+        page.close()
+        pdf_image.close()
+        bitmap.close()
+        image.close()
+    writer.save(output_stream)
+    return len(writer)
+
+
 def remove_pages(
     input_file: str | Path | io.BytesIO | io.TextIOWrapper,
     pages_to_remove: Collection[int],
@@ -160,41 +253,6 @@ def extract_text(
     return text
 
 
-def image_to_pdf(
-    input_files: Sequence[str | bytes | Path | os.PathLike[str] | io.BytesIO],
-    output_stream: str | Path | io.BytesIO | io.BufferedWriter
-) -> int:
-    """Convert images to a PDF file.
-
-    :param input_files: List of images to convert.
-    :param output_stream: Output stream to write to.
-    :return: Number of pages in the output PDF
-    """
-    writer = PdfDocument.new()
-    for input_file in input_files:
-        log21.info(f'Adding {input_file}...')
-        # Open the image file
-        image = Image.open(input_file)
-        # Create a bitmap from the image
-        bitmap = PdfBitmap.from_pil(image)
-        # Create a PdfImage object from the bitmap
-        pdf_image = PdfImage.new(writer)
-        pdf_image.set_bitmap(bitmap)
-        matrix = pdfium.PdfMatrix().scale(bitmap.width, bitmap.height)
-        pdf_image.set_matrix(matrix)
-        # Create a new page and insert the PdfImage object
-        page = writer.new_page(bitmap.width, bitmap.height)
-        page.insert_obj(pdf_image)
-        page.gen_content()
-        # Close the objects
-        page.close()
-        pdf_image.close()
-        bitmap.close()
-        image.close()
-    writer.save(output_stream)
-    return len(writer)
-
-
 def split_pdf(
     input_file: str | Path,
     output_directory: str | Path,
diff --git a/src/pdf_helper/__main__.py b/src/pdf_helper/__main__.py