Skip to content

Commit 6ea9247

Browse files
committed
progress
1 parent f9afdd7 commit 6ea9247

27 files changed

Lines changed: 418 additions & 84 deletions

File tree

Makefile

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -166,6 +166,9 @@ class-leak:
166166
docker-build:
167167
docker build -t lychee-frankenphp .
168168

169+
docker-build-legacy:
170+
docker build -t lychee-frankenphp -f Dockerfile-legacy .
171+
169172
docker-build-no-cache:
170173
docker build -t lychee-frankenphp . --no-cache
171174

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,2 @@
1+
*
2+
!.gitignore

ai-vision-service/face-recognition/README.md

Lines changed: 29 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -80,22 +80,49 @@ All variables are prefixed `VISION_FACE_`.
8080

8181
## Development
8282

83+
### Setup
84+
8385
```bash
8486
# Install uv (https://docs.astral.sh/uv/getting-started/installation/)
8587
curl -LsSf https://astral.sh/uv/install.sh | sh
8688

8789
# Install all dependencies (including dev)
8890
uv sync
8991

92+
# Configure .env file (create or edit .env in this directory)
93+
# Minimum required variables:
94+
# VISION_FACE_LYCHEE_API_URL=https://lychee.test
95+
# VISION_FACE_API_KEY=changeme
96+
# VISION_FACE_VERIFY_SSL=false
97+
# VISION_FACE_PHOTOS_PATH=../../public/uploads
98+
```
99+
100+
### Running locally
101+
102+
```bash
103+
# Using uv run (recommended)
104+
uv run python -m uvicorn app.main:app --host 0.0.0.0 --port 8000 --reload
105+
```
106+
107+
The service will be available at http://localhost:8000
108+
- API docs: http://localhost:8000/docs
109+
- Health check: http://localhost:8000/health
110+
111+
### Linting and testing
112+
113+
```bash
90114
# Lint and format
91-
uv run ruff format --check
92-
uv run ruff check
115+
uv run ruff format
116+
uv run ruff check --fix
93117

94118
# Type check
95119
uv run ty check
96120

97121
# Run tests
98122
uv run pytest
123+
124+
# Run tests with coverage
125+
uv run pytest --cov=app --cov-report=html
99126
```
100127

101128
## Docker

ai-vision-service/face-recognition/app/api/routes.py

Lines changed: 34 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -118,15 +118,25 @@ async def match(
118118
store: EmbeddingStore = get_store(request)
119119
executor: Executor = request.app.state.executor
120120

121+
logger.info("Processing selfie match request (%d bytes)", len(image_bytes))
122+
121123
loop = asyncio.get_running_loop()
122124
raw_faces: list[DetectedFace] = await loop.run_in_executor(executor, detector.detect_bytes, image_bytes)
123125

124126
if not raw_faces:
127+
logger.warning("No face detected in uploaded selfie image")
125128
raise HTTPException(status_code=422, detail="No face detected in the uploaded image")
126129

127130
best = raw_faces[0] # highest confidence (sorted descending)
128131
matches = store.similarity_search(best.embedding, settings.match_threshold, limit=10)
129132

133+
logger.info(
134+
"Selfie match found %d match(es) above threshold %.2f (detected face confidence: %.3f)",
135+
len(matches),
136+
settings.match_threshold,
137+
best.confidence,
138+
)
139+
130140
return MatchResponse(matches=[MatchResult(lychee_face_id=face_id, confidence=conf) for face_id, conf in matches])
131141

132142

@@ -221,13 +231,24 @@ async def _run_detection_job(
221231
returned 202. All CPU-bound work is offloaded to ``executor`` via
222232
``run_in_executor`` so the event loop remains responsive.
223233
"""
234+
logger.info("Starting detection job for photo_id=%s, path=%s", photo_id, image_path)
224235
try:
225236
loop = asyncio.get_running_loop()
226237

227238
# --- 1. Detect faces (CPU-bound, runs in thread pool) ---
228239
raw_faces: list[DetectedFace] = await loop.run_in_executor(executor, detector.detect, image_path)
240+
241+
if len(raw_faces) > settings.max_faces_per_photo:
242+
logger.info(
243+
"Limiting faces from %d to %d (max_faces_per_photo setting)",
244+
len(raw_faces),
245+
settings.max_faces_per_photo,
246+
)
229247
raw_faces = raw_faces[: settings.max_faces_per_photo]
230248

249+
if not raw_faces:
250+
logger.info("No faces detected in photo_id=%s, sending empty results", photo_id)
251+
231252
# --- 2. For each face: generate crop + search suggestions ---
232253
face_data: list[tuple[str, list[float], FaceResult]] = []
233254

@@ -246,6 +267,13 @@ async def _run_detection_job(
246267

247268
suggestions = store.similarity_search(raw_face.embedding, settings.match_threshold, limit=10)
248269

270+
if suggestions:
271+
logger.debug(
272+
"Found %d suggestion(s) for face with confidence=%.3f",
273+
len(suggestions),
274+
raw_face.confidence,
275+
)
276+
249277
result = FaceResult(
250278
x=raw_face.x,
251279
y=raw_face.y,
@@ -279,6 +307,12 @@ async def _run_detection_job(
279307
response.raise_for_status()
280308
callback_resp = DetectCallbackResponse.model_validate(response.json())
281309

310+
logger.info(
311+
"Successfully sent detection results to Lychee for photo_id=%s (%d face(s))",
312+
photo_id,
313+
len(face_data),
314+
)
315+
282316
# --- 4. Persist embeddings now that we have stable lychee_face_ids ---
283317
id_to_vector: dict[str, list[float]] = {eid: vec for eid, vec, _ in face_data}
284318
for mapping in callback_resp.faces:

ai-vision-service/face-recognition/app/config.py

Lines changed: 12 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@
55
"""
66

77
from functools import lru_cache
8+
from pathlib import Path
89

910
from pydantic_settings import BaseSettings, SettingsConfigDict
1011

@@ -94,16 +95,25 @@ class AppSettings(BaseSettings):
9495
Lower values produce tighter, more homogeneous clusters."""
9596

9697
# --- Quality filtering ---
97-
blur_threshold: float = 100.0
98+
blur_threshold: float = 0.5
9899
"""Laplacian variance threshold for blur detection.
99100
Face crops with a variance below this value are discarded before embedding."""
100101

102+
model_root: str = "/root/.insightface"
103+
"""Root directory for InsightFace model packs. Defaults to the library's default (``~/.insightface``)
104+
but can be overridden to point to a shared Docker volume if desired."""
105+
101106
model_config = SettingsConfigDict(
102107
env_prefix="VISION_FACE_",
103108
# Support .env files in development but never require them in production.
104-
env_file=".env",
109+
# Load project root .env first (fallback), then working directory .env (override)
110+
env_file=(
111+
Path(__file__).parent.parent / ".env", # Project root (fallback)
112+
".env", # Current working directory (takes precedence)
113+
),
105114
env_file_encoding="utf-8",
106115
case_sensitive=False,
116+
extra="ignore", # Ignore extra fields (e.g., from Lychee's .env when running from main project)
107117
)
108118

109119

ai-vision-service/face-recognition/app/detection/cropper.py

Lines changed: 111 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -21,38 +21,129 @@
2121
"""Fractional padding added around each bounding box side before cropping."""
2222

2323

24-
def generate_crop(image_path: Path, x: float, y: float, width: float, height: float) -> str:
25-
"""Generate a base64-encoded 150 x 150 JPEG face crop.
24+
def _calculate_square_crop_coords(
25+
x: float, y: float, width: float, height: float, img_w: int, img_h: int, padding_factor: float
26+
) -> tuple[int, int, int, int]:
27+
"""Calculate square crop coordinates centered on the face bounding box.
28+
29+
Attempts to create a square crop centered on the face. If the square would
30+
extend beyond image boundaries, it shifts the crop to fit. If the square is
31+
larger than the image dimensions, the crop will be the maximum square that
32+
fits within the image.
2633
2734
Args:
28-
image_path: Absolute path to the source image.
2935
x: Normalised left edge of the bounding box (0.0-1.0).
3036
y: Normalised top edge of the bounding box (0.0-1.0).
3137
width: Normalised bounding-box width (0.0-1.0).
3238
height: Normalised bounding-box height (0.0-1.0).
39+
img_w: Image width in pixels.
40+
img_h: Image height in pixels.
41+
padding_factor: Fractional padding to add around the bounding box.
3342
3443
Returns:
35-
Base64-encoded JPEG bytes (ASCII string).
44+
Tuple of (x1, y1, x2, y2) defining a square crop region in absolute pixels.
3645
"""
37-
img = Image.open(image_path).convert("RGB")
38-
img_w, img_h = img.size
39-
40-
# Absolute pixel coordinates
46+
# Convert to absolute pixels
4147
abs_x = x * img_w
4248
abs_y = y * img_h
4349
abs_w = width * img_w
4450
abs_h = height * img_h
4551

4652
# Add padding
47-
pad_x = abs_w * _PADDING_FACTOR
48-
pad_y = abs_h * _PADDING_FACTOR
53+
pad_x = abs_w * padding_factor
54+
pad_y = abs_h * padding_factor
55+
56+
padded_x = abs_x - pad_x
57+
padded_y = abs_y - pad_y
58+
padded_w = abs_w + 2 * pad_x
59+
padded_h = abs_h + 2 * pad_y
60+
61+
# Determine square size (use the larger dimension)
62+
square_size = max(padded_w, padded_h)
63+
64+
# Cap square size to image dimensions (can't crop larger than the image)
65+
max_possible_size = min(img_w, img_h)
66+
square_size = min(square_size, max_possible_size)
67+
68+
# Calculate center point of the padded bounding box
69+
center_x = padded_x + padded_w / 2
70+
center_y = padded_y + padded_h / 2
71+
72+
# Calculate square crop coordinates centered on the face
73+
x1 = center_x - square_size / 2
74+
y1 = center_y - square_size / 2
75+
x2 = center_x + square_size / 2
76+
y2 = center_y + square_size / 2
77+
78+
# Adjust to keep square within image boundaries
79+
# If the square extends beyond the left edge, shift it right
80+
if x1 < 0:
81+
shift = -x1
82+
x1 = 0
83+
x2 = min(float(img_w), x2 + shift)
84+
# If the square extends beyond the right edge, shift it left
85+
if x2 > img_w:
86+
shift = x2 - img_w
87+
x2 = img_w
88+
x1 = max(0.0, x1 - shift)
89+
90+
# If the square extends beyond the top edge, shift it down
91+
if y1 < 0:
92+
shift = -y1
93+
y1 = 0
94+
y2 = min(float(img_h), y2 + shift)
95+
# If the square extends beyond the bottom edge, shift it up
96+
if y2 > img_h:
97+
shift = y2 - img_h
98+
y2 = img_h
99+
y1 = max(0.0, y1 - shift)
100+
101+
return int(x1), int(y1), int(x2), int(y2)
102+
103+
104+
def _pad_to_square(img: Image.Image) -> Image.Image:
    """Return *img* embedded in a square canvas, letterboxed with black.

    Args:
        img: Input PIL Image.

    Returns:
        The original image unchanged when it is already square, otherwise a
        new square RGB image with the input centred on a black background.
    """
    w, h = img.size
    if w == h:
        # Already square — avoid an unnecessary copy.
        return img

    side = max(w, h)
    canvas = Image.new("RGB", (side, side), (0, 0, 0))
    # Centre the original; integer division leaves the odd spare pixel of an
    # odd size difference on the right/bottom edge.
    canvas.paste(img, ((side - w) // 2, (side - h) // 2))
    return canvas
123+
124+
125+
def generate_crop(image_path: Path, x: float, y: float, width: float, height: float) -> str:
126+
"""Generate a base64-encoded 150 x 150 JPEG face crop.
127+
128+
Args:
129+
image_path: Absolute path to the source image.
130+
x: Normalised left edge of the bounding box (0.0-1.0).
131+
y: Normalised top edge of the bounding box (0.0-1.0).
132+
width: Normalised bounding-box width (0.0-1.0).
133+
height: Normalised bounding-box height (0.0-1.0).
134+
135+
Returns:
136+
Base64-encoded JPEG bytes (ASCII string).
137+
"""
138+
img = Image.open(image_path).convert("RGB")
139+
img_w, img_h = img.size
140+
141+
# Calculate square crop coordinates
142+
x1, y1, x2, y2 = _calculate_square_crop_coords(x, y, width, height, img_w, img_h, _PADDING_FACTOR)
143+
144+
# Crop and ensure it's square (pad if needed due to edge constraints)
145+
crop = img.crop((x1, y1, x2, y2))
146+
crop = _pad_to_square(crop)
56147
crop = crop.resize((CROP_SIZE, CROP_SIZE), Image.Resampling.LANCZOS)
57148

58149
buf = io.BytesIO()
@@ -76,20 +167,12 @@ def generate_crop_from_bytes(image_bytes: bytes, x: float, y: float, width: floa
76167
img = Image.open(io.BytesIO(image_bytes)).convert("RGB")
77168
img_w, img_h = img.size
78169

79-
abs_x = x * img_w
80-
abs_y = y * img_h
81-
abs_w = width * img_w
82-
abs_h = height * img_h
83-
84-
pad_x = abs_w * _PADDING_FACTOR
85-
pad_y = abs_h * _PADDING_FACTOR
86-
87-
x1 = max(0.0, abs_x - pad_x)
88-
y1 = max(0.0, abs_y - pad_y)
89-
x2 = min(float(img_w), abs_x + abs_w + pad_x)
90-
y2 = min(float(img_h), abs_y + abs_h + pad_y)
170+
# Calculate square crop coordinates
171+
x1, y1, x2, y2 = _calculate_square_crop_coords(x, y, width, height, img_w, img_h, _PADDING_FACTOR)
91172

92-
crop = img.crop((int(x1), int(y1), int(x2), int(y2)))
173+
# Crop and ensure it's square (pad if needed due to edge constraints)
174+
crop = img.crop((x1, y1, x2, y2))
175+
crop = _pad_to_square(crop)
93176
crop = crop.resize((CROP_SIZE, CROP_SIZE), Image.Resampling.LANCZOS)
94177

95178
buf = io.BytesIO()

0 commit comments

Comments
 (0)