Merge pull request 'fix: VIN OCR scanning fails with "No VIN Pattern found" on all images (#113)' (#114) from issue-113-fix-vin-ocr-scanning into main

Reviewed-on: #114
chore: Change crop to remove locked aspect ratio
2026-02-07 15:47:35 +00:00 · 2026-02-06 22:15:39 -06:00 · 2026-02-06 22:00:07 -06:00 · 2026-02-06 21:52:08 -06:00 · 2026-02-06 21:39:48 -06:00 · 2026-02-06 21:32:52 -06:00
11 changed files with 736 additions and 173 deletions
--- a/.ai/context.json
+++ b/.ai/context.json
@@ -5,7 +5,8 @@
    "host": "gitea",
    "owner": "egullickson",
    "repo": "motovaultpro",
-    "url": "https://git.motovaultpro.com"
+    "url": "https://git.motovaultpro.com",
+    "default_branch": "main"
  },
  "ai_quick_start": {
    "load_order": [
--- a/config/traefik/traefik.yml
+++ b/config/traefik/traefik.yml
@@ -52,7 +52,7 @@ global:

 # Logging
 log:
-  level: INFO
+  level: DEBUG
  format: json

 # Access logs
--- a/docker-compose.prod.yml
+++ b/docker-compose.prod.yml
@@ -9,16 +9,13 @@
 #   - Development-specific settings

 services:
-  # PostgreSQL - Remove development port exposure
-  mvp-postgres:
-    ports: []
-
-  # Redis - Remove development port exposure
-  mvp-redis:
-    ports: []
-
-  # Traefik - Ensure dashboard authentication is enforced
+  # Traefik - Production log level and dashboard auth
+  # NOTE(review): Traefik documents its static-configuration sources (file,
+  # CLI flags, environment variables) as mutually exclusive. Confirm that
+  # --log.level=ERROR is honored together with --configFile; if it is not,
+  # the level from traefik.yml stays in effect in production.
  mvp-traefik:
+    environment:
+      # NOTE(review): Traefik's own variable is TRAEFIK_LOG_LEVEL; presumably
+      # LOG_LEVEL is set only for consistency with the other services - confirm.
+      LOG_LEVEL: error
+    command:
+      - --configFile=/etc/traefik/traefik.yml
+      - --log.level=ERROR
    labels:
      - "traefik.enable=true"
      - "traefik.http.routers.traefik-dashboard.rule=Host(`traefik.motovaultpro.local`)"
@@ -26,3 +23,45 @@ services:
      - "traefik.http.routers.traefik-dashboard.middlewares=dashboard-auth"
      - "traefik.http.services.traefik-dashboard.loadbalancer.server.port=8080"
      - "traefik.http.middlewares.dashboard-auth.basicauth.users=admin:$$2y$$10$$foobar"
+
+  # Backend - Production log level
+  mvp-backend:
+    environment:
+      NODE_ENV: production
+      CONFIG_PATH: /app/config/production.yml
+      SECRETS_DIR: /run/secrets
+      LOG_LEVEL: error
+      DATABASE_HOST: mvp-postgres
+      REDIS_HOST: mvp-redis
+      # NOTE(review): these variables are named *_PRICE_ID but the values carry
+      # the "prod_" prefix, which Stripe uses for Product IDs (Price IDs start
+      # with "price_"). Confirm the backend really expects Product IDs here.
+      STRIPE_PRO_MONTHLY_PRICE_ID: prod_Toj6BG9Z9JwREl
+      STRIPE_PRO_YEARLY_PRICE_ID: prod_Toj8oo0RpVBQmB
+      STRIPE_ENTERPRISE_MONTHLY_PRICE_ID: prod_Toj8xGEui9jl6j
+      STRIPE_ENTERPRISE_YEARLY_PRICE_ID: prod_Toj9A7A773xrdn
+
+  # OCR - Production log level
+  mvp-ocr:
+    environment:
+      LOG_LEVEL: error
+      REDIS_HOST: mvp-redis
+      REDIS_PORT: 6379
+      REDIS_DB: 1
+
+  # PostgreSQL - Remove dev ports, production log level
+  mvp-postgres:
+    # NOTE(review): Compose concatenates `ports` from merged files, so an empty
+    # list here may leave ports published by the base file in place - confirm
+    # (newer Compose versions offer `ports: !reset []`).
+    ports: []
+    environment:
+      POSTGRES_DB: motovaultpro
+      POSTGRES_USER: postgres
+      POSTGRES_PASSWORD_FILE: /run/secrets/postgres-password
+      POSTGRES_INITDB_ARGS: --encoding=UTF8
+      # NOTE(review): LOG_LEVEL, POSTGRES_LOG_STATEMENT and
+      # POSTGRES_LOG_MIN_DURATION_STATEMENT are not variables documented for the
+      # official postgres image; presumably a custom entrypoint or config reads
+      # them - confirm they actually take effect.
+      LOG_LEVEL: error
+      POSTGRES_LOG_STATEMENT: none
+      POSTGRES_LOG_MIN_DURATION_STATEMENT: -1
+      PGDATA: /var/lib/postgresql/data
+
+  # Redis - Remove dev ports, production log level
+  # NOTE(review): Compose concatenates `ports` across merged files, so an empty
+  # list may not drop ports published by the base file - confirm, and consider
+  # `ports: !reset []` if the deployed Compose version supports it.
+  mvp-redis:
+    ports: []
+    # The log level is a literal on purpose: Compose resolves ${...} from the
+    # shell/.env at parse time, not from this service's `environment:`, and
+    # redis-server only accepts debug, verbose, notice, warning or nothing
+    # ("info" and "error" are rejected at startup).
+    command: redis-server --appendonly yes --loglevel warning
+    environment:
+      LOG_LEVEL: error
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -11,6 +11,7 @@ services:
    command:
      - --configFile=/etc/traefik/traefik.yml
    environment:
+      LOG_LEVEL: debug
      CLOUDFLARE_DNS_API_TOKEN_FILE: /run/secrets/cloudflare-dns-token
    ports:
      - "80:80"
@@ -112,6 +113,7 @@ services:
      NODE_ENV: production
      CONFIG_PATH: /app/config/production.yml
      SECRETS_DIR: /run/secrets
+      LOG_LEVEL: debug
      # Service references
      DATABASE_HOST: mvp-postgres
      REDIS_HOST: mvp-redis
@@ -187,10 +189,12 @@ services:
    container_name: mvp-ocr
    restart: unless-stopped
    environment:
-      LOG_LEVEL: info
+      LOG_LEVEL: debug
      REDIS_HOST: mvp-redis
      REDIS_PORT: 6379
      REDIS_DB: 1
+    volumes:
+      - /tmp/vin-debug:/tmp/vin-debug
    networks:
      - backend
      - database
@@ -218,8 +222,10 @@ services:
      POSTGRES_USER: postgres
      POSTGRES_PASSWORD_FILE: /run/secrets/postgres-password
      POSTGRES_INITDB_ARGS: --encoding=UTF8
-      POSTGRES_LOG_STATEMENT: ${POSTGRES_LOG_STATEMENT:-ddl}
-      POSTGRES_LOG_MIN_DURATION_STATEMENT: ${POSTGRES_LOG_MIN_DURATION:-500}
+      LOG_LEVEL: debug
+      POSTGRES_LOG_STATEMENT: all
+      POSTGRES_LOG_MIN_DURATION_STATEMENT: 0
+      PGDATA: /var/lib/postgresql/data
    volumes:
      - mvp_postgres_data:/var/lib/postgresql/data
      # Secrets (K8s Secrets equivalent)
@@ -245,7 +251,9 @@ services:
    image: ${REGISTRY_MIRRORS:-git.motovaultpro.com/egullickson/mirrors}/redis:8.4-alpine
    container_name: mvp-redis
    restart: unless-stopped
-    command: redis-server --appendonly yes --loglevel ${REDIS_LOGLEVEL:-notice}
+    # Compose resolves ${...} from the shell/.env, not from `environment:` below.
+    # The fallback must be a level redis-server accepts (debug, verbose, notice,
+    # warning, nothing); "info" is not one of them and aborts startup.
+    command: redis-server --appendonly yes --loglevel ${REDIS_LOGLEVEL:-debug}
+    environment:
+      LOG_LEVEL: debug
    volumes:
      - mvp_redis_data:/data
    networks:
--- a/frontend/src/shared/components/CameraCapture/CropTool.tsx
+++ b/frontend/src/shared/components/CameraCapture/CropTool.tsx
@@ -3,7 +3,7 @@
 * @ai-context Allows user to adjust crop area with touch/mouse, confirm or retake
 */

-import React, { useCallback, useState } from 'react';
+import React, { useCallback, useState, useRef, useEffect } from 'react';
 import { Box, IconButton, Button, Typography, CircularProgress } from '@mui/material';
 import CheckIcon from '@mui/icons-material/Check';
 import RefreshIcon from '@mui/icons-material/Refresh';
@@ -22,12 +22,30 @@ export const CropTool: React.FC<CropToolProps> = ({
  onSkip,
 }) => {
  const [isProcessing, setIsProcessing] = useState(false);
+  const imageAreaRef = useRef<HTMLDivElement>(null);
+  const [imageMaxHeight, setImageMaxHeight] = useState(0);

-  const { cropArea, isDragging, resetCrop, executeCrop, handleDragStart } =
+  const { cropArea, cropDrawn, isDragging, resetCrop, executeCrop, handleDragStart, handleDrawStart } =
    useImageCrop({
      aspectRatio: lockAspectRatio ? aspectRatio : undefined,
    });

+  const showCropArea = cropDrawn || (isDragging && cropArea.width > 1 && cropArea.height > 1);
+
+  // Measure available height for the image so the crop container
+  // matches the rendered image exactly (fixes mobile crop offset)
+  useEffect(() => {
+    const updateMaxHeight = () => {
+      if (imageAreaRef.current) {
+        const rect = imageAreaRef.current.getBoundingClientRect();
+        setImageMaxHeight(rect.height - 32); // subtract p:2 padding (16px * 2)
+      }
+    };
+    updateMaxHeight();
+    window.addEventListener('resize', updateMaxHeight);
+    return () => window.removeEventListener('resize', updateMaxHeight);
+  }, []);
+
  const handleConfirm = useCallback(async () => {
    setIsProcessing(true);
    try {
@@ -61,6 +79,7 @@ export const CropTool: React.FC<CropToolProps> = ({
    >
      {/* Image with crop overlay */}
      <Box
+        ref={imageAreaRef}
        sx={{
          flex: 1,
          position: 'relative',
@@ -75,8 +94,6 @@ export const CropTool: React.FC<CropToolProps> = ({
          data-crop-container
          sx={{
            position: 'relative',
-            maxWidth: '100%',
-            maxHeight: '100%',
            userSelect: 'none',
            touchAction: isDragging ? 'none' : 'auto',
          }}
@@ -87,132 +104,156 @@ export const CropTool: React.FC<CropToolProps> = ({
            alt="Captured"
            style={{
              maxWidth: '100%',
-              maxHeight: '100%',
+              maxHeight: imageMaxHeight > 0 ? `${imageMaxHeight}px` : '70vh',
              display: 'block',
            }}
            draggable={false}
          />

+          {/* Draw surface for free-form rectangle drawing */}
+          {!cropDrawn && (
+            <Box
+              onMouseDown={handleDrawStart}
+              onTouchStart={handleDrawStart}
+              sx={{
+                position: 'absolute',
+                inset: 0,
+                cursor: 'crosshair',
+                zIndex: 5,
+                touchAction: 'none',
+              }}
+            />
+          )}
+
          {/* Dark overlay outside crop area */}
-          <Box
-            sx={{
-              position: 'absolute',
-              inset: 0,
-              pointerEvents: 'none',
-            }}
-          >
-            {/* Top overlay */}
-            <Box
-              sx={{
-                position: 'absolute',
-                top: 0,
-                left: 0,
-                right: 0,
-                height: `${cropArea.y}%`,
-                backgroundColor: 'rgba(0, 0, 0, 0.6)',
-              }}
-            />
-            {/* Bottom overlay */}
-            <Box
-              sx={{
-                position: 'absolute',
-                bottom: 0,
-                left: 0,
-                right: 0,
-                height: `${100 - cropArea.y - cropArea.height}%`,
-                backgroundColor: 'rgba(0, 0, 0, 0.6)',
-              }}
-            />
-            {/* Left overlay */}
-            <Box
-              sx={{
-                position: 'absolute',
-                top: `${cropArea.y}%`,
-                left: 0,
-                width: `${cropArea.x}%`,
-                height: `${cropArea.height}%`,
-                backgroundColor: 'rgba(0, 0, 0, 0.6)',
-              }}
-            />
-            {/* Right overlay */}
-            <Box
-              sx={{
-                position: 'absolute',
-                top: `${cropArea.y}%`,
-                right: 0,
-                width: `${100 - cropArea.x - cropArea.width}%`,
-                height: `${cropArea.height}%`,
-                backgroundColor: 'rgba(0, 0, 0, 0.6)',
-              }}
-            />
-          </Box>
-
-          {/* Crop area with handles */}
-          <Box
-            sx={{
-              position: 'absolute',
-              top: `${cropArea.y}%`,
-              left: `${cropArea.x}%`,
-              width: `${cropArea.width}%`,
-              height: `${cropArea.height}%`,
-              border: '2px solid white',
-              boxSizing: 'border-box',
-            }}
-          >
-            {/* Move handle (center area) */}
-            <CropHandleArea
-              handle="move"
-              onDragStart={handleDragStart}
-              sx={{
-                position: 'absolute',
-                inset: 8,
-                cursor: 'move',
-              }}
-            />
-
-            {/* Corner handles */}
-            <CropHandle handle="nw" onDragStart={handleDragStart} position="top-left" />
-            <CropHandle handle="ne" onDragStart={handleDragStart} position="top-right" />
-            <CropHandle handle="sw" onDragStart={handleDragStart} position="bottom-left" />
-            <CropHandle handle="se" onDragStart={handleDragStart} position="bottom-right" />
-
-            {/* Edge handles */}
-            <CropHandle handle="n" onDragStart={handleDragStart} position="top" />
-            <CropHandle handle="s" onDragStart={handleDragStart} position="bottom" />
-            <CropHandle handle="w" onDragStart={handleDragStart} position="left" />
-            <CropHandle handle="e" onDragStart={handleDragStart} position="right" />
-
-            {/* Grid lines for alignment */}
+          {showCropArea && (
            <Box
              sx={{
                position: 'absolute',
                inset: 0,
-                display: 'grid',
-                gridTemplateColumns: '1fr 1fr 1fr',
-                gridTemplateRows: '1fr 1fr 1fr',
                pointerEvents: 'none',
-                opacity: isDragging ? 1 : 0.5,
-                transition: 'opacity 0.2s',
              }}
            >
-              {Array.from({ length: 9 }).map((_, i) => (
-                <Box
-                  key={i}
-                  sx={{
-                    borderRight: i % 3 !== 2 ? '1px solid rgba(255,255,255,0.3)' : 'none',
-                    borderBottom: i < 6 ? '1px solid rgba(255,255,255,0.3)' : 'none',
-                  }}
-                />
-              ))}
+              {/* Top overlay */}
+              <Box
+                sx={{
+                  position: 'absolute',
+                  top: 0,
+                  left: 0,
+                  right: 0,
+                  height: `${cropArea.y}%`,
+                  backgroundColor: 'rgba(0, 0, 0, 0.6)',
+                }}
+              />
+              {/* Bottom overlay */}
+              <Box
+                sx={{
+                  position: 'absolute',
+                  bottom: 0,
+                  left: 0,
+                  right: 0,
+                  height: `${100 - cropArea.y - cropArea.height}%`,
+                  backgroundColor: 'rgba(0, 0, 0, 0.6)',
+                }}
+              />
+              {/* Left overlay */}
+              <Box
+                sx={{
+                  position: 'absolute',
+                  top: `${cropArea.y}%`,
+                  left: 0,
+                  width: `${cropArea.x}%`,
+                  height: `${cropArea.height}%`,
+                  backgroundColor: 'rgba(0, 0, 0, 0.6)',
+                }}
+              />
+              {/* Right overlay */}
+              <Box
+                sx={{
+                  position: 'absolute',
+                  top: `${cropArea.y}%`,
+                  right: 0,
+                  width: `${100 - cropArea.x - cropArea.width}%`,
+                  height: `${cropArea.height}%`,
+                  backgroundColor: 'rgba(0, 0, 0, 0.6)',
+                }}
+              />
            </Box>
-          </Box>
+          )}
+
+          {/* Crop area border and handles */}
+          {showCropArea && (
+            <Box
+              sx={{
+                position: 'absolute',
+                top: `${cropArea.y}%`,
+                left: `${cropArea.x}%`,
+                width: `${cropArea.width}%`,
+                height: `${cropArea.height}%`,
+                border: '2px solid white',
+                boxSizing: 'border-box',
+              }}
+            >
+              {/* Handles only appear after drawing is complete */}
+              {cropDrawn && (
+                <>
+                  {/* Move handle (center area) */}
+                  <CropHandleArea
+                    handle="move"
+                    onDragStart={handleDragStart}
+                    sx={{
+                      position: 'absolute',
+                      inset: 8,
+                      cursor: 'move',
+                    }}
+                  />
+
+                  {/* Corner handles */}
+                  <CropHandle handle="nw" onDragStart={handleDragStart} position="top-left" />
+                  <CropHandle handle="ne" onDragStart={handleDragStart} position="top-right" />
+                  <CropHandle handle="sw" onDragStart={handleDragStart} position="bottom-left" />
+                  <CropHandle handle="se" onDragStart={handleDragStart} position="bottom-right" />
+
+                  {/* Edge handles */}
+                  <CropHandle handle="n" onDragStart={handleDragStart} position="top" />
+                  <CropHandle handle="s" onDragStart={handleDragStart} position="bottom" />
+                  <CropHandle handle="w" onDragStart={handleDragStart} position="left" />
+                  <CropHandle handle="e" onDragStart={handleDragStart} position="right" />
+                </>
+              )}
+
+              {/* Grid lines for alignment */}
+              <Box
+                sx={{
+                  position: 'absolute',
+                  inset: 0,
+                  display: 'grid',
+                  gridTemplateColumns: '1fr 1fr 1fr',
+                  gridTemplateRows: '1fr 1fr 1fr',
+                  pointerEvents: 'none',
+                  opacity: isDragging ? 1 : 0.5,
+                  transition: 'opacity 0.2s',
+                }}
+              >
+                {Array.from({ length: 9 }).map((_, i) => (
+                  <Box
+                    key={i}
+                    sx={{
+                      borderRight: i % 3 !== 2 ? '1px solid rgba(255,255,255,0.3)' : 'none',
+                      borderBottom: i < 6 ? '1px solid rgba(255,255,255,0.3)' : 'none',
+                    }}
+                  />
+                ))}
+              </Box>
+            </Box>
+          )}
        </Box>
      </Box>

      {/* Instructions */}
      <Box sx={{ px: 2, py: 1, textAlign: 'center' }}>
        <Typography variant="body2" sx={{ color: 'rgba(255, 255, 255, 0.7)' }}>
-          Drag to adjust crop area
+          {cropDrawn ? 'Drag handles to adjust crop area' : 'Tap and drag to select crop area'}
        </Typography>
      </Box>

@@ -240,7 +281,7 @@ export const CropTool: React.FC<CropToolProps> = ({
          onClick={handleReset}
          startIcon={<RefreshIcon />}
          sx={{ color: 'white' }}
-          disabled={isProcessing}
+          disabled={isProcessing || !cropDrawn}
        >
          Reset
        </Button>
@@ -256,7 +297,7 @@ export const CropTool: React.FC<CropToolProps> = ({

        <IconButton
          onClick={handleConfirm}
-          disabled={isProcessing}
+          disabled={isProcessing || !cropDrawn}
          aria-label="Confirm crop"
          sx={{
            width: 56,
--- a/frontend/src/shared/components/CameraCapture/useImageCrop.ts
+++ b/frontend/src/shared/components/CameraCapture/useImageCrop.ts
@@ -18,16 +18,20 @@ interface UseImageCropOptions {
 interface UseImageCropReturn {
  /** Current crop area */
  cropArea: CropArea;
+  /** Whether user has drawn a crop rectangle */
+  cropDrawn: boolean;
  /** Whether user is actively dragging */
  isDragging: boolean;
  /** Set crop area */
  setCropArea: (area: CropArea) => void;
-  /** Reset crop to initial/default */
+  /** Reset crop to drawing mode */
  resetCrop: () => void;
  /** Execute crop and return cropped blob */
  executeCrop: (imageSrc: string, mimeType?: string) => Promise<Blob>;
  /** Handle drag start for crop handles */
  handleDragStart: (handle: CropHandle, event: React.MouseEvent | React.TouchEvent) => void;
+  /** Handle draw start for free-form rectangle drawing */
+  handleDrawStart: (event: React.MouseEvent | React.TouchEvent) => void;
  /** Handle move during drag */
  handleMove: (event: MouseEvent | TouchEvent) => void;
  /** Handle drag end */
@@ -78,12 +82,22 @@ export function useImageCrop(options: UseImageCropOptions = {}): UseImageCropRet
  const [cropArea, setCropAreaState] = useState<CropArea>(
    getAspectRatioAdjustedCrop(initialCrop)
  );
+  const [cropDrawn, setCropDrawn] = useState(false);
  const [isDragging, setIsDragging] = useState(false);

  const activeHandleRef = useRef<CropHandle | null>(null);
  const startPosRef = useRef({ x: 0, y: 0 });
  const startCropRef = useRef<CropArea>(cropArea);
-  const containerRef = useRef<{ width: number; height: number }>({ width: 100, height: 100 });
+  const containerRef = useRef<{ width: number; height: number; left: number; top: number }>({
+    width: 100, height: 100, left: 0, top: 0,
+  });
+  const isDrawingRef = useRef(false);
+  const drawOriginRef = useRef({ x: 0, y: 0 });
+  const cropAreaRef = useRef(cropArea);
+
+  useEffect(() => {
+    cropAreaRef.current = cropArea;
+  }, [cropArea]);

  const setCropArea = useCallback(
    (area: CropArea) => {
@@ -94,6 +108,7 @@ export function useImageCrop(options: UseImageCropOptions = {}): UseImageCropRet

  const resetCrop = useCallback(() => {
    setCropAreaState(getAspectRatioAdjustedCrop(initialCrop));
+    setCropDrawn(false);
  }, [initialCrop, getAspectRatioAdjustedCrop]);

  const constrainCrop = useCallback(
@@ -136,19 +151,75 @@ export function useImageCrop(options: UseImageCropOptions = {}): UseImageCropRet
      const container = target.closest('[data-crop-container]');
      if (container) {
        const rect = container.getBoundingClientRect();
-        containerRef.current = { width: rect.width, height: rect.height };
+        containerRef.current = { width: rect.width, height: rect.height, left: rect.left, top: rect.top };
      }
    },
    [cropArea]
  );

-  const handleMove = useCallback(
-    (event: MouseEvent | TouchEvent) => {
-      if (!activeHandleRef.current || !isDragging) return;
+  // Starts free-form drawing: anchors a new zero-size crop at the pointer position.
+  const handleDrawStart = useCallback(
+    (event: React.MouseEvent | React.TouchEvent) => {
+      event.preventDefault();
+
+      const target = event.currentTarget as HTMLElement;
+      const container = target.closest('[data-crop-container]');
+      if (!container) return;
+
+      // Cache the container's viewport box; handleMove converts pointer
+      // coordinates to percentages with these values while drawing.
+      const rect = container.getBoundingClientRect();
+      containerRef.current = { width: rect.width, height: rect.height, left: rect.left, top: rect.top };

      const clientX = 'touches' in event ? event.touches[0].clientX : event.clientX;
      const clientY = 'touches' in event ? event.touches[0].clientY : event.clientY;

+      // Pointer position as a percentage of the container, clamped to 0-100
+      const x = Math.max(0, Math.min(100, ((clientX - rect.left) / rect.width) * 100));
+      const y = Math.max(0, Math.min(100, ((clientY - rect.top) / rect.height) * 100));
+
+      startPosRef.current = { x: clientX, y: clientY };
+      drawOriginRef.current = { x, y };
+
+      setCropAreaState({ x, y, width: 0, height: 0 });
+
+      // Drawing mode: flag it and clear any active resize/move handle
+      isDrawingRef.current = true;
+      activeHandleRef.current = null;
+      setIsDragging(true);
+    },
+    []
+  );
+
+  const handleMove = useCallback(
+    (event: MouseEvent | TouchEvent) => {
+      if (!isDragging) return;
+
+      const clientX = 'touches' in event ? event.touches[0].clientX : event.clientX;
+      const clientY = 'touches' in event ? event.touches[0].clientY : event.clientY;
+
+      // Free-form drawing mode: compute rectangle from origin to current pointer
+      if (isDrawingRef.current) {
+        const currentX = Math.max(0, Math.min(100,
+          ((clientX - containerRef.current.left) / containerRef.current.width) * 100));
+        const currentY = Math.max(0, Math.min(100,
+          ((clientY - containerRef.current.top) / containerRef.current.height) * 100));
+
+        const originX = drawOriginRef.current.x;
+        const originY = drawOriginRef.current.y;
+
+        let newCrop: CropArea = {
+          x: Math.min(originX, currentX),
+          y: Math.min(originY, currentY),
+          width: Math.abs(currentX - originX),
+          height: Math.abs(currentY - originY),
+        };
+
+        if (aspectRatio) {
+          newCrop.height = newCrop.width / aspectRatio;
+        }
+
+        setCropAreaState(newCrop);
+        return;
+      }
+
+      if (!activeHandleRef.current) return;
+
      // Calculate delta as percentage of container
      const deltaX = ((clientX - startPosRef.current.x) / containerRef.current.width) * 100;
      const deltaY = ((clientY - startPosRef.current.y) / containerRef.current.height) * 100;
@@ -234,13 +305,20 @@ export function useImageCrop(options: UseImageCropOptions = {}): UseImageCropRet

      setCropAreaState(constrainCrop(newCrop));
    },
-    [isDragging, constrainCrop]
+    [isDragging, constrainCrop, aspectRatio]
  );

  const handleDragEnd = useCallback(() => {
+    if (isDrawingRef.current) {
+      // Finishing a free-form draw: read the latest crop from the ref (kept in
+      // sync with state by an effect) so this callback need not depend on cropArea
+      isDrawingRef.current = false;
+      const area = cropAreaRef.current;
+      // Accept the rectangle only when both sides reach minSize; otherwise
+      // cropDrawn is left unchanged
+      if (area.width >= minSize && area.height >= minSize) {
+        setCropDrawn(true);
+      }
+    }
    activeHandleRef.current = null;
    setIsDragging(false);
-  }, []);
+  }, [minSize]);

  // Add global event listeners for drag
  useEffect(() => {
@@ -304,7 +382,7 @@ export function useImageCrop(options: UseImageCropOptions = {}): UseImageCropRet
              }
            },
            mimeType,
-            0.92
+            0.95
          );
        };

@@ -320,11 +398,13 @@ export function useImageCrop(options: UseImageCropOptions = {}): UseImageCropRet

  return {
    cropArea,
+    cropDrawn,
    isDragging,
    setCropArea,
    resetCrop,
    executeCrop,
    handleDragStart,
+    handleDrawStart,
    handleMove,
    handleDragEnd,
  };
--- a/ocr/app/extractors/vin_extractor.py
+++ b/ocr/app/extractors/vin_extractor.py
@@ -1,8 +1,10 @@
 """VIN-specific OCR extractor with preprocessing and validation."""
 import io
 import logging
+import os
 import time
 from dataclasses import dataclass, field
+from datetime import datetime
 from typing import Optional

 import magic
@@ -57,9 +59,31 @@ class VinExtractor(BaseExtractor):
    # VIN character whitelist for Tesseract
    VIN_WHITELIST = "ABCDEFGHJKLMNPRSTUVWXYZ0123456789"

+    # Fixed debug output directory (inside container)
+    DEBUG_DIR = "/tmp/vin-debug"
+
    def __init__(self) -> None:
        """Initialize VIN extractor."""
        pytesseract.pytesseract.tesseract_cmd = settings.tesseract_cmd
+        self._debug = settings.log_level.upper() == "DEBUG"
+
+    def _save_debug_image(self, session_dir: str, name: str, data: bytes) -> None:
+        """Write one debug artifact into a debug session directory.
+
+        Does nothing unless debug mode is on (``self._debug``). Writing is
+        best-effort: an ``OSError`` is logged and swallowed so that a failed
+        debug dump cannot turn a VIN extraction into an error.
+
+        Args:
+            session_dir: Directory to write into.
+            name: File name of the artifact inside ``session_dir``.
+            data: Raw bytes to write.
+        """
+        if not self._debug:
+            return
+        path = os.path.join(session_dir, name)
+        try:
+            with open(path, "wb") as f:
+                f.write(data)
+        except OSError as exc:
+            logger.warning("Could not save debug image %s: %s", path, exc)
+            return
+        logger.debug("Saved debug image: %s (%d bytes)", name, len(data))
+
+    def _create_debug_session(self) -> Optional[str]:
+        """Create a timestamped directory under ``DEBUG_DIR`` for debug artifacts.
+
+        Returns:
+            The directory path, or ``None`` when debug mode is off or the
+            directory cannot be created.
+        """
+        if not self._debug:
+            return None
+        # Microsecond-resolution timestamp names the session directory
+        ts = datetime.now().strftime("%Y%m%d_%H%M%S_%f")
+        session_dir = os.path.join(self.DEBUG_DIR, ts)
+        try:
+            os.makedirs(session_dir, exist_ok=True)
+        except OSError as exc:
+            # Debug output is best-effort: an unwritable DEBUG_DIR must not
+            # abort the extraction that asked for a session.
+            logger.warning(
+                "Could not create debug directory %s: %s", session_dir, exc
+            )
+            return None
+        return session_dir

    def extract(
        self, image_bytes: bytes, content_type: Optional[str] = None
@@ -89,21 +113,91 @@ class VinExtractor(BaseExtractor):
            )

        try:
+            debug_session = self._create_debug_session()
+
+            logger.debug(
+                "VIN extraction input: %d bytes, content_type=%s",
+                len(image_bytes), content_type,
+            )
+            if debug_session:
+                self._save_debug_image(debug_session, "01_original.jpg", image_bytes)
+
            # Apply VIN-optimized preprocessing
            preprocessing_result = vin_preprocessor.preprocess(image_bytes)
            preprocessed_bytes = preprocessing_result.image_bytes
+            logger.debug(
+                "Preprocessing steps: %s", preprocessing_result.preprocessing_applied
+            )
+            if debug_session:
+                self._save_debug_image(
+                    debug_session, "02_preprocessed_adaptive.png", preprocessed_bytes
+                )

            # Perform OCR with VIN-optimized settings
            raw_text, word_confidences = self._perform_ocr(preprocessed_bytes)
+            logger.debug("PSM 6 raw text: '%s'", raw_text)
+            logger.debug("PSM 6 word confidences: %s", word_confidences)

            # Extract VIN candidates from raw text
            candidates = vin_validator.extract_candidates(raw_text)
+            logger.debug("PSM 6 candidates: %s", candidates)

            if not candidates:
                # No VIN candidates found - try with different PSM modes
                candidates = self._try_alternate_ocr(preprocessed_bytes)

            if not candidates:
+                # Try grayscale-only (no thresholding) — the Tesseract
+                # LSTM engine often performs better on non-binarized input
+                # because it does its own internal preprocessing.
+                gray_result = vin_preprocessor.preprocess(
+                    image_bytes, apply_threshold=False
+                )
+                logger.debug(
+                    "Grayscale preprocessing steps: %s",
+                    gray_result.preprocessing_applied,
+                )
+                if debug_session:
+                    self._save_debug_image(
+                        debug_session, "04_preprocessed_gray.png",
+                        gray_result.image_bytes,
+                    )
+
+                raw_text, word_confidences = self._perform_ocr(
+                    gray_result.image_bytes
+                )
+                logger.debug("Gray PSM 6 raw text: '%s'", raw_text)
+                candidates = vin_validator.extract_candidates(raw_text)
+                logger.debug("Gray PSM 6 candidates: %s", candidates)
+                if not candidates:
+                    candidates = self._try_alternate_ocr(
+                        gray_result.image_bytes, prefix="Gray"
+                    )
+
+            if not candidates:
+                # Try alternative preprocessing (Otsu's thresholding)
+                otsu_result = vin_preprocessor.preprocess_otsu(image_bytes)
+                logger.debug(
+                    "Otsu preprocessing steps: %s",
+                    otsu_result.preprocessing_applied,
+                )
+                if debug_session:
+                    self._save_debug_image(
+                        debug_session, "03_preprocessed_otsu.png",
+                        otsu_result.image_bytes,
+                    )
+
+                raw_text, word_confidences = self._perform_ocr(otsu_result.image_bytes)
+                logger.debug("Otsu PSM 6 raw text: '%s'", raw_text)
+                candidates = vin_validator.extract_candidates(raw_text)
+                logger.debug("Otsu PSM 6 candidates: %s", candidates)
+                if not candidates:
+                    candidates = self._try_alternate_ocr(
+                        otsu_result.image_bytes, prefix="Otsu"
+                    )
+
+            if not candidates:
+                logger.debug("No VIN pattern found in any OCR attempt")
                return VinExtractionResult(
                    success=False,
                    error="No VIN pattern found in image",
@@ -153,8 +247,12 @@ class VinExtractor(BaseExtractor):
            processing_time_ms = int((time.time() - start_time) * 1000)

            logger.info(
-                f"VIN extraction: {primary_vin}, confidence={primary_confidence:.2%}, "
-                f"time={processing_time_ms}ms"
+                "VIN extraction: %s, confidence=%.2f%%, time=%dms",
+                primary_vin, primary_confidence * 100, processing_time_ms,
+            )
+            logger.debug(
+                "VIN alternatives: %s",
+                [(a.vin, a.confidence) for a in alternatives],
            )

            return VinExtractionResult(
@@ -168,7 +266,7 @@ class VinExtractor(BaseExtractor):
            )

        except Exception as e:
-            logger.error(f"VIN extraction failed: {e}", exc_info=True)
+            logger.error("VIN extraction failed: %s", e, exc_info=True)
            return VinExtractionResult(
                success=False,
                error=str(e),
@@ -200,10 +298,15 @@ class VinExtractor(BaseExtractor):
        image = Image.open(io.BytesIO(image_bytes))

        # Configure Tesseract for VIN extraction
-        # Use character whitelist to exclude I, O, Q
+        # OEM 1 = LSTM neural network engine (best accuracy)
+        # NOTE: tessedit_char_whitelist does NOT work with OEM 1 (LSTM).
+        # Using it causes empty/erratic output.  Character filtering is
+        # handled post-OCR by vin_validator.correct_ocr_errors() instead.
        config = (
            f"--psm {psm} "
-            f"-c tessedit_char_whitelist={self.VIN_WHITELIST}"
+            f"--oem 1 "
+            f"-c load_system_dawg=false "
+            f"-c load_freq_dawg=false"
        )

        # Get detailed OCR data
@@ -224,24 +327,31 @@ class VinExtractor(BaseExtractor):
        raw_text = " ".join(words)
        return raw_text, confidences

-    def _try_alternate_ocr(self, image_bytes: bytes) -> list[tuple[str, int, int]]:
+    def _try_alternate_ocr(
+        self,
+        image_bytes: bytes,
+        prefix: str = "",
+    ) -> list[tuple[str, int, int]]:
        """
        Try alternate OCR configurations when initial extraction fails.

+        PSM modes tried in order:
+            7  - Single text line
+            8  - Single word
+            11 - Sparse text (finds text in any order, good for angled photos)
+            13 - Raw line (no Tesseract heuristics, good for clean VIN plates)
+
        Returns:
            List of VIN candidates
        """
-        # Try PSM 7 (single text line)
-        raw_text, _ = self._perform_ocr(image_bytes, psm=7)
-        candidates = vin_validator.extract_candidates(raw_text)
-        if candidates:
-            return candidates
-
-        # Try PSM 8 (single word)
-        raw_text, _ = self._perform_ocr(image_bytes, psm=8)
-        candidates = vin_validator.extract_candidates(raw_text)
-        if candidates:
-            return candidates
+        tag = f"{prefix} " if prefix else ""
+        for psm in (7, 8, 11, 13):
+            raw_text, _ = self._perform_ocr(image_bytes, psm=psm)
+            logger.debug("%sPSM %d raw text: '%s'", tag, psm, raw_text)
+            candidates = vin_validator.extract_candidates(raw_text)
+            logger.debug("%sPSM %d candidates: %s", tag, psm, candidates)
+            if candidates:
+                return candidates

        return []

--- a/ocr/app/preprocessors/vin_preprocessor.py
+++ b/ocr/app/preprocessors/vin_preprocessor.py
@@ -86,13 +86,17 @@ class VinPreprocessor:
        if len(cv_image.shape) == 3:
            cv_image = cv2.cvtColor(cv_image, cv2.COLOR_RGB2BGR)

-        # Convert to grayscale
+        # Convert to grayscale using best-contrast channel selection
        if len(cv_image.shape) == 3:
-            gray = cv2.cvtColor(cv_image, cv2.COLOR_BGR2GRAY)
+            gray = self._best_contrast_channel(cv_image)
        else:
            gray = cv_image
        steps_applied.append("grayscale")

+        # Upscale small images for better OCR (Tesseract needs ~300 DPI)
+        gray = self._ensure_minimum_resolution(gray)
+        steps_applied.append("resolution_check")
+
        # Apply deskew
        if apply_deskew:
            gray = self._deskew(gray)
@@ -111,6 +115,7 @@ class VinPreprocessor:
        # Apply adaptive thresholding
        if apply_threshold:
            gray = self._adaptive_threshold(gray)
+            gray = self._morphological_cleanup(gray)
            steps_applied.append("threshold")

        # Convert back to PNG bytes
@@ -123,6 +128,58 @@ class VinPreprocessor:
            preprocessing_applied=steps_applied,
        )

+    # Minimum width in pixels for reliable VIN OCR.
+    # A 17-char VIN needs ~30px per character for Tesseract accuracy.
+    MIN_WIDTH_FOR_VIN = 600
+
+    def _ensure_minimum_resolution(self, image: np.ndarray) -> np.ndarray:
+        """
+        Upscale an image whose width is below MIN_WIDTH_FOR_VIN.
+
+        Images at or above the minimum width are returned unchanged.
+        Narrower images are resized with bicubic interpolation so that the
+        width becomes exactly MIN_WIDTH_FOR_VIN and the height grows by the
+        same factor, preserving the aspect ratio.
+
+        Args:
+            image: Image array; its first two axes are read as (height, width).
+
+        Returns:
+            The input array itself, or an upscaled copy of it.
+        """
+        height, width = image.shape[:2]
+
+        # Wide-enough images need no work; an empty array cannot be scaled
+        # (and would otherwise divide by zero below).
+        if width <= 0 or height <= 0 or width >= self.MIN_WIDTH_FOR_VIN:
+            return image
+
+        scale = self.MIN_WIDTH_FOR_VIN / width
+        # Use the target width directly: int(width * scale) can truncate to
+        # MIN_WIDTH_FOR_VIN - 1 when the float product lands just below it.
+        new_width = self.MIN_WIDTH_FOR_VIN
+        new_height = max(1, round(height * scale))
+
+        resized = cv2.resize(
+            image, (new_width, new_height), interpolation=cv2.INTER_CUBIC
+        )
+        logger.debug(
+            "Upscaled image from %dx%d to %dx%d",
+            width, height, new_width, new_height,
+        )
+        return resized
+
+    def _best_contrast_channel(self, bgr_image: np.ndarray) -> np.ndarray:
+        """
+        Compute a grayscale image with dark text on light background.
+
+        Uses the inverted per-pixel minimum across the B, G, R channels.
+        White text has min(255,255,255) = 255 → inverted to 0 (black).
+        Colored backgrounds have a lower min value (e.g. green sticker:
+        min(130,230,150) = 130) → inverted to 125 (medium gray).
+
+        Args:
+            bgr_image: Three-channel image in B, G, R channel order.
+
+        Returns:
+            Single-channel array holding the inverted channel minimum.
+        """
+        import logging  # function-scope import: only used for the level check
+
+        b_channel, g_channel, r_channel = cv2.split(bgr_image)
+        min_channel = np.minimum(np.minimum(b_channel, g_channel), r_channel)
+
+        # Invert so white text (min=255) becomes black (0) and colored
+        # backgrounds (min~130) become lighter gray (~125).  Tesseract
+        # expects dark text on light background.
+        inverted = cv2.bitwise_not(min_channel)
+
+        # The standard grayscale conversion exists only to feed the debug
+        # comparison, so skip the extra full-image passes unless DEBUG
+        # logging is actually enabled.
+        if logger.isEnabledFor(logging.DEBUG):
+            gray = cv2.cvtColor(bgr_image, cv2.COLOR_BGR2GRAY)
+            logger.debug(
+                "Channel contrast: inverted-min std=%.1f, grayscale std=%.1f",
+                float(np.std(inverted)), float(np.std(gray)),
+            )
+
+        return inverted
+
    def _apply_clahe(self, image: np.ndarray) -> np.ndarray:
        """
        Apply CLAHE (Contrast Limited Adaptive Histogram Equalization).
@@ -242,6 +299,84 @@ class VinPreprocessor:
            logger.warning(f"Adaptive threshold failed: {e}")
            return image

+    def _morphological_cleanup(self, image: np.ndarray) -> np.ndarray:
+        """
+        Apply a 2x2 rectangular morphological opening to a thresholded image.
+
+        Opening is an erosion followed by a dilation.  If OpenCV raises an
+        error, a warning is logged and the input is returned unchanged.
+
+        NOTE(review): opening removes small *bright* features.  For color
+        input, _best_contrast_channel produces dark text on a light
+        background, so confirm that opening (rather than closing) matches
+        the polarity of the noise this step is meant to remove.
+        """
+        try:
+            structuring_element = cv2.getStructuringElement(
+                cv2.MORPH_RECT, (2, 2)
+            )
+            opened = cv2.morphologyEx(
+                image, cv2.MORPH_OPEN, structuring_element
+            )
+        except cv2.error as e:
+            logger.warning(f"Morphological cleanup failed: {e}")
+            return image
+        return opened
+
+    def _otsu_threshold(self, image: np.ndarray) -> np.ndarray:
+        """
+        Binarize an image with Otsu's automatically chosen threshold.
+
+        The threshold argument passed to OpenCV (0) is a placeholder; the
+        THRESH_OTSU flag makes OpenCV compute the threshold itself.  Pixels
+        above it become 255, the rest 0.  If OpenCV raises an error, a
+        warning is logged and the input is returned unchanged.
+        """
+        flags = cv2.THRESH_BINARY | cv2.THRESH_OTSU
+        try:
+            binarized = cv2.threshold(image, 0, 255, flags)[1]
+        except cv2.error as e:
+            logger.warning(f"Otsu threshold failed: {e}")
+            return image
+        return binarized
+
+    def preprocess_otsu(self, image_bytes: bytes) -> PreprocessingResult:
+        """
+        Alternative preprocessing pipeline built around Otsu's thresholding.
+
+        Steps, in order: load, optional RGB conversion, grayscale,
+        resolution check, CLAHE, denoise, Otsu threshold followed by
+        morphological cleanup.  The result is re-encoded as PNG.
+
+        Args:
+            image_bytes: Encoded source image.
+
+        Returns:
+            PreprocessingResult with the PNG bytes and the names of the
+            steps that were applied.
+        """
+        source = Image.open(io.BytesIO(image_bytes))
+        applied = ["loaded"]
+
+        if source.mode not in ("RGB", "L"):
+            source = source.convert("RGB")
+            applied.append("convert_rgb")
+
+        pixels = np.array(source)
+        if pixels.ndim == 3:
+            # PIL yields RGB; the channel helper expects OpenCV's BGR order.
+            gray = self._best_contrast_channel(
+                cv2.cvtColor(pixels, cv2.COLOR_RGB2BGR)
+            )
+        else:
+            gray = pixels
+        applied.append("grayscale")
+
+        # Single-image stages that each record one step name.
+        stages = (
+            ("resolution_check", self._ensure_minimum_resolution),
+            ("clahe", self._apply_clahe),
+            ("denoise", self._denoise),
+        )
+        for step_name, stage in stages:
+            gray = stage(gray)
+            applied.append(step_name)
+
+        # Thresholding and cleanup are recorded together as one step.
+        gray = self._morphological_cleanup(self._otsu_threshold(gray))
+        applied.append("otsu_threshold")
+
+        png_buffer = io.BytesIO()
+        Image.fromarray(gray).save(png_buffer, format="PNG")
+
+        return PreprocessingResult(
+            image_bytes=png_buffer.getvalue(),
+            preprocessing_applied=applied,
+        )
+
    def detect_vin_region(self, image_bytes: bytes) -> Optional[BoundingBox]:
        """
        Attempt to detect the VIN region in an image.
--- a/ocr/app/validators/vin_validator.py
+++ b/ocr/app/validators/vin_validator.py
@@ -20,7 +20,9 @@ class VinValidator:
    # VIN character set (excludes I, O, Q)
    VALID_CHARS = set("ABCDEFGHJKLMNPRSTUVWXYZ0123456789")

-    # Common OCR misreads and their corrections
+    # Common OCR misreads and their corrections.
+    # Only map characters that are INVALID in VINs to their likely correct values.
+    # B and S are valid VIN characters and must NOT be transliterated.
    TRANSLITERATION = {
        "I": "1",
        "O": "0",
@@ -29,9 +31,6 @@ class VinValidator:
        "o": "0",
        "q": "0",
        "l": "1",
-        "L": "1",
-        "B": "8",  # Sometimes confused
-        "S": "5",  # Sometimes confused
    }

    # Weights for check digit calculation (positions 1-17)
@@ -224,6 +223,11 @@ class VinValidator:
        """
        Extract VIN candidates from raw OCR text.

+        Uses two strategies:
+        1. Find continuous 11-20 char alphanumeric runs (handles intact VINs)
+        2. Concatenate adjacent short fragments separated by spaces/dashes
+           (handles Tesseract fragmenting VINs into multiple words)
+
        Args:
            text: Raw OCR text
            max_candidates: Maximum number of candidates to return
@@ -231,29 +235,104 @@ class VinValidator:
        Returns:
            List of (vin, start_pos, end_pos) tuples
        """
-        # Pattern to find potential VIN sequences
-        # Allow some flexibility for OCR errors (include I, O, Q for correction later)
-        potential_vin_pattern = re.compile(r"[A-Z0-9IOQ]{11,17}", re.IGNORECASE)
-
        candidates = []
-        for match in potential_vin_pattern.finditer(text.upper()):
-            candidate = match.group()
-            corrected = self.correct_ocr_errors(candidate)
+        seen_vins: set[str] = set()

-            # Only include if it could be a valid VIN after correction
-            if len(corrected) == 17 and self.MODERN_VIN_PATTERN.match(corrected):
-                candidates.append((corrected, match.start(), match.end()))
+        upper_text = text.upper()

-        # Sort by likelihood of being valid (check digit validation)
+        # Strategy 1: Find continuous runs of VIN-like characters
+        continuous_pattern = re.compile(r"[A-Z0-9IOQ]{11,20}", re.IGNORECASE)
+        for match in continuous_pattern.finditer(upper_text):
+            self._try_add_candidate(
+                match.group(), match.start(), match.end(), candidates, seen_vins
+            )
+
+        # Strategy 2: Concatenate adjacent alphanumeric fragments
+        # This handles OCR fragmentation like "1HGBH 41JXMN 109186"
+        # Only consider fragments >= 3 chars (filters out noise/short words)
+        fragment_pattern = re.compile(r"[A-Z0-9IOQ]{3,}", re.IGNORECASE)
+        fragments = [
+            (m.group(), m.start(), m.end())
+            for m in fragment_pattern.finditer(upper_text)
+        ]
+
+        # Try sliding windows of 2-4 adjacent fragments
+        for window_size in range(2, min(5, len(fragments) + 1)):
+            for i in range(len(fragments) - window_size + 1):
+                window = fragments[i : i + window_size]
+                combined = "".join(f[0] for f in window)
+                # Combined length must be close to 17 (allow +/- 2 for OCR noise)
+                # Must contain at least 2 digit characters (VINs always have digits;
+                # pure-alphabetic text is almost certainly not a VIN)
+                if 15 <= len(combined) <= 19 and sum(c.isdigit() for c in combined) >= 2:
+                    self._try_add_candidate(
+                        combined, window[0][1], window[-1][2], candidates, seen_vins
+                    )
+
+        # Sort by likelihood of being valid (check digit first, then position)
        def score_candidate(c: tuple[str, int, int]) -> int:
            vin = c[0]
            if self.validate_check_digit(vin):
-                return 0  # Best score
+                return 0
            return 1

        candidates.sort(key=score_candidate)
        return candidates[:max_candidates]

+    def _try_add_candidate(
+        self,
+        raw: str,
+        start: int,
+        end: int,
+        candidates: list[tuple[str, int, int]],
+        seen_vins: set[str],
+    ) -> None:
+        """
+        Correct OCR errors in ``raw`` and register the 17-char VINs it yields.
+
+        - Exactly 17 chars after correction: offered as-is.
+        - Shorter than 17: ignored.
+        - Longer than 17: every 17-char sliding window is offered, and for
+          18-19 char strings every way of deleting the 1-2 surplus
+          characters is offered as well.
+
+        Acceptance is decided by ``_add_if_valid``, which checks only the
+        length and MODERN_VIN_PATTERN.  The check digit is NOT verified
+        here; ``extract_candidates`` merely ranks check-digit-valid
+        candidates first.
+
+        Args:
+            raw: Uncorrected OCR text for one potential VIN.
+            start: Start offset of ``raw`` in the OCR text; recorded
+                unchanged for every derived candidate.
+            end: End offset of ``raw`` in the OCR text.
+            candidates: Output list, appended to in place.
+            seen_vins: VINs already recorded, used for de-duplication.
+        """
+        from itertools import combinations  # function-scope: only used here
+
+        corrected = self.correct_ocr_errors(raw)
+        length = len(corrected)
+
+        if length == 17:
+            self._add_if_valid(corrected, start, end, candidates, seen_vins)
+            return
+        if length < 17:
+            return
+
+        # Strategy A: try every 17-char sliding window
+        for offset in range(length - 16):
+            self._add_if_valid(
+                corrected[offset : offset + 17],
+                start, end, candidates, seen_vins,
+            )
+
+        # Strategy B: for 18-19 char strings, delete the surplus characters.
+        # OCR often inserts a spurious character (e.g. sticker border read
+        # as 'C') that breaks the VIN.  combinations() visits each set of
+        # deleted positions once, in the same first-seen order as nested
+        # single-character deletion, without re-testing mirrored pairs.
+        surplus = length - 17
+        if surplus <= 2:
+            for dropped in combinations(range(length), surplus):
+                reduced = "".join(
+                    ch for idx, ch in enumerate(corrected)
+                    if idx not in dropped
+                )
+                self._add_if_valid(
+                    reduced, start, end, candidates, seen_vins
+                )
+
+    def _add_if_valid(
+        self,
+        vin: str,
+        start: int,
+        end: int,
+        candidates: list[tuple[str, int, int]],
+        seen_vins: set[str],
+    ) -> None:
+        """
+        Record ``vin`` once if it is 17 chars and matches MODERN_VIN_PATTERN.
+
+        On acceptance the VIN is added to ``seen_vins`` and the tuple
+        ``(vin, start, end)`` is appended to ``candidates``; otherwise both
+        collections are left untouched.
+        """
+        # Guard clauses: wrong length or an already-recorded VIN.
+        if len(vin) != 17 or vin in seen_vins:
+            return
+        if not self.MODERN_VIN_PATTERN.match(vin):
+            return
+
+        seen_vins.add(vin)
+        candidates.append((vin, start, end))
+

 # Singleton instance
 vin_validator = VinValidator()
--- a/ocr/tests/test_vin_preprocessor.py
+++ b/ocr/tests/test_vin_preprocessor.py
@@ -53,6 +53,7 @@ class TestVinPreprocessor:
        )

        assert "grayscale" in result.preprocessing_applied
+        assert "resolution_check" in result.preprocessing_applied
        assert "clahe" in result.preprocessing_applied
        assert "deskew" in result.preprocessing_applied
        assert "denoise" in result.preprocessing_applied
@@ -185,6 +186,54 @@ class TestVinPreprocessorThreshold:
        assert len(unique_values) <= 2


+class TestVinPreprocessorOtsu:
+    """Tests for Otsu's thresholding preprocessing."""
+
+    def test_otsu_threshold_creates_binary_image(self) -> None:
+        """Test Otsu's thresholding splits a two-level image into 0 and 255."""
+        preprocessor = VinPreprocessor()
+        # A uniform image is trivially "binary"; use two distinct intensity
+        # regions so the assertion can actually fail.
+        image = np.full((100, 400), 50, dtype=np.uint8)
+        image[:, 200:] = 200
+
+        result = preprocessor._otsu_threshold(image)
+
+        assert result.shape == image.shape
+        assert set(np.unique(result).tolist()) == {0, 255}
+        # The darker half must map to black, the brighter half to white.
+        assert int(result[0, 0]) == 0
+        assert int(result[0, -1]) == 255
+
+    def test_preprocess_otsu_returns_result(self) -> None:
+        """Test Otsu preprocessing pipeline returns valid result."""
+        preprocessor = VinPreprocessor()
+        image_bytes = create_test_image()
+
+        result = preprocessor.preprocess_otsu(image_bytes)
+
+        assert result.image_bytes is not None
+        assert len(result.image_bytes) > 0
+        assert "otsu_threshold" in result.preprocessing_applied
+        assert "grayscale" in result.preprocessing_applied
+
+
+class TestVinPreprocessorResolution:
+    """Tests for resolution upscaling."""
+
+    def test_upscale_small_image(self) -> None:
+        """Test small images are upscaled with the aspect ratio preserved."""
+        preprocessor = VinPreprocessor()
+        small_image = np.full((50, 200), 128, dtype=np.uint8)
+
+        result = preprocessor._ensure_minimum_resolution(small_image)
+
+        assert result.shape[1] >= preprocessor.MIN_WIDTH_FOR_VIN
+        # Height must grow by the same factor as the width (50:200 == 1:4).
+        assert result.shape[0] * 4 == result.shape[1]
+
+    def test_no_upscale_large_image(self) -> None:
+        """Test large images are not upscaled."""
+        preprocessor = VinPreprocessor()
+        large_image = np.full((200, 800), 128, dtype=np.uint8)
+
+        result = preprocessor._ensure_minimum_resolution(large_image)
+
+        assert result.shape == large_image.shape
+        assert np.array_equal(result, large_image)
+
+
 class TestVinRegionDetection:
    """Tests for VIN region detection."""

--- a/ocr/tests/test_vin_validator.py
+++ b/ocr/tests/test_vin_validator.py
@@ -43,9 +43,9 @@ class TestVinValidator:
        result = validator.calculate_check_digit("1HGBH41JXMN109186")
        assert result == "X"

-        # 5YJSA1E28HF123456 has check digit 2 at position 9
+        # 5YJSA1E28HF123456 has check digit at position 9
        result = validator.calculate_check_digit("5YJSA1E28HF123456")
-        assert result == "8"  # Verify this is correct for this VIN
+        assert result == "5"

    def test_validate_check_digit_valid(self) -> None:
        """Test check digit validation with valid VIN."""
@@ -161,6 +161,27 @@ class TestVinValidator:
        assert len(candidates) >= 1
        assert candidates[0][0] == "1HGBH41JXMN109186"

+    def test_extract_candidates_fragmented_vin(self) -> None:
+        """A VIN split into space-separated OCR words is reassembled."""
+        # Tesseract often fragments VINs into multiple words
+        fragmented = "1HGBH 41JXMN 109186"
+
+        found = VinValidator().extract_candidates(fragmented)
+
+        assert len(found) >= 1
+        best_vin = found[0][0]
+        assert best_vin == "1HGBH41JXMN109186"
+
+    def test_extract_candidates_dash_fragmented_vin(self) -> None:
+        """A VIN split by a dash is reassembled into one candidate."""
+        dashed = "1HGBH41J-XMN109186"
+
+        found = VinValidator().extract_candidates(dashed)
+
+        assert len(found) >= 1
+        best_vin = found[0][0]
+        assert best_vin == "1HGBH41JXMN109186"
+
    def test_extract_candidates_no_vin(self) -> None:
        """Test candidate extraction with no VIN."""
        validator = VinValidator()
Author	SHA1	Message	Date
egullickson	6b0c18a41c	Merge pull request 'fix: VIN OCR scanning fails with "No VIN Pattern found" on all images (#113 )' (#114 ) from issue-113-fix-vin-ocr-scanning into main All checks were successful Deploy to Staging / Build Images (push) Successful in 35s Details Deploy to Staging / Deploy to Staging (push) Successful in 21s Details Deploy to Staging / Verify Staging (push) Successful in 8s Details Deploy to Staging / Notify Staging Ready (push) Successful in 7s Details Deploy to Staging / Notify Staging Failure (push) Has been skipped Details Reviewed-on: #114	2026-02-07 15:47:35 +00:00
Eric Gullickson	75ce316aa5	chore: Change crop to remove locked aspect ratio All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 3m21s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 22s Details Deploy to Staging / Verify Staging (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 7s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details	2026-02-06 22:15:39 -06:00
Eric Gullickson	e4336ce9da	fix: extract VIN from noisy OCR via sliding window + char deletion (refs #113 ) All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 37s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 51s Details Deploy to Staging / Verify Staging (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 7s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details When OCR reads extra characters (e.g. sticker border as 'C', spurious 'Z' insertion), the raw text exceeds 17 chars and the old first-17 trim produced wrong VINs. New strategy tries all 17-char sliding windows and single/double character deletions, validating each via check digit. For 'CWVGGNPE2Z4NP069500', this finds the correct VIN 'WVGGNPE24NP069500' (valid check digit) instead of 'CWVGGNPE2Z4NP0695' (invalid). Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-02-06 22:00:07 -06:00
Eric Gullickson	432b3bda36	fix: remove char whitelist incompatible with Tesseract LSTM (refs #113 ) All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 36s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 51s Details Deploy to Staging / Verify Staging (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details tessedit_char_whitelist does not work with OEM 1 (LSTM engine) and causes empty/erratic output. This was the root cause of Tesseract returning empty text despite clear, well-preprocessed images. Character filtering is already handled post-OCR by the VIN validator's correct_ocr_errors() method (I->1, O->0, Q->0, etc). Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-02-06 21:52:08 -06:00
Eric Gullickson	ae5221c759	fix: invert min-channel so Tesseract gets dark-on-light text (refs #113 ) All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 35s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 51s Details Deploy to Staging / Verify Staging (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 7s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details The min-channel correctly extracts contrast (white text=255 vs green sticker bg=130), but Tesseract expects dark text on light background. Without inversion, the grayscale-only path returned empty text for every PSM mode because Tesseract couldn't see bright-on-dark text. Invert via bitwise_not: text becomes 0 (black), sticker bg becomes 125 (gray). Fixes all three OCR paths (adaptive, grayscale, Otsu). Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-02-06 21:39:48 -06:00
Eric Gullickson	63c027a454	fix: always use min-channel and add grayscale-only OCR path (refs #113 ) All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 35s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 50s Details Deploy to Staging / Verify Staging (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 7s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details Two fixes: 1. Always use min-channel for color images instead of gated comparison that was falling back to standard grayscale (which has only 23% contrast for white-on-green VIN stickers). 2. Add grayscale-only OCR path (CLAHE + denoise, no thresholding) between adaptive and Otsu attempts. Tesseract's LSTM engine is designed to handle grayscale input directly and often outperforms binarized input where thresholding creates artifacts. Pipeline order: adaptive threshold → grayscale-only → Otsu threshold Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-02-06 21:32:52 -06:00
Eric Gullickson	a07ec324fe	fix: use min-channel grayscale and morphological cleanup for VIN OCR (refs #113 ) All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 35s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 51s Details Deploy to Staging / Verify Staging (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details Replace std-based channel selection (which incorrectly picked green for green-tinted VIN stickers) with per-pixel min(B,G,R). White text stays 255 in all channels while colored backgrounds drop to their weakest channel value, giving 2x contrast improvement. Add morphological opening after thresholding to remove noise speckles from car body surface that were confusing Tesseract's page segmentation. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-02-06 21:23:43 -06:00
Eric Gullickson	0de34983bb	fix: use best-contrast color channel for VIN preprocessing (refs #113 ) All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 36s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 1m7s Details Deploy to Staging / Verify Staging (pull_request) Successful in 10s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 9s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details White text on green VIN stickers has only ~12% contrast in standard grayscale conversion because the green channel dominates luminance. The new _best_contrast_channel method evaluates each RGB channel's standard deviation and selects the one with highest contrast, giving ~2x improvement for green-tinted VIN stickers. Falls back to standard grayscale for neutral-colored images. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-02-06 21:14:56 -06:00
Eric Gullickson	ce2a8d88f9	fix: Mobile image crop fix All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 3m20s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 51s Details Deploy to Staging / Verify Staging (pull_request) Successful in 9s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 7s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details	2026-02-06 20:55:08 -06:00
Eric Gullickson	9ce08cbb89	fix: Debug variables All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 35s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 51s Details Deploy to Staging / Verify Staging (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 7s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details	2026-02-06 20:42:00 -06:00
Eric Gullickson	ff3858f750	fix: add debug image saving gated on LOG_LEVEL=debug (refs #113 ) All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 36s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 21s Details Deploy to Staging / Verify Staging (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 7s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details Save original, adaptive, and Otsu preprocessed images to /tmp/vin-debug/{timestamp}/ when LOG_LEVEL is set to debug. No images saved at info level. Volume mount added for access. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-02-06 20:26:06 -06:00
Eric Gullickson	488a267fc7	fix: Fixed debug env variable. All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 35s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 50s Details Deploy to Staging / Verify Staging (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 7s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details	2026-02-06 20:20:14 -06:00
Eric Gullickson	3f0e243087	fix: Postgres Data paths All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 35s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 19s Details Deploy to Staging / Verify Staging (pull_request) Successful in 2m30s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details	2026-02-06 19:53:37 -06:00
Eric Gullickson	d5696320f1	fix: align VIN OCR logging with unified logging design (refs #113 ) All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 3m25s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 51s Details Deploy to Staging / Verify Staging (pull_request) Successful in 2m36s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 9s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details Replace filesystem-based debug system (VIN_DEBUG_DIR) with standard logger.debug() calls that flow through Loki when LOG_LEVEL=DEBUG. Use .env.logging variable for OCR LOG_LEVEL. Increase image capture quality to 0.95 for better OCR accuracy. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-02-06 19:36:35 -06:00
Eric Gullickson	6a4c2137f7	fix: resolve VIN OCR scanning failures on all images (refs #113 ) All checks were successful Deploy to Staging / Build Images (pull_request) Successful in 35s Details Deploy to Staging / Deploy to Staging (pull_request) Successful in 51s Details Deploy to Staging / Verify Staging (pull_request) Successful in 2m31s Details Deploy to Staging / Notify Staging Ready (pull_request) Successful in 8s Details Deploy to Staging / Notify Staging Failure (pull_request) Has been skipped Details Root cause: Tesseract fragments VINs into multiple words but candidate extraction required continuous 17-char sequences, rejecting all results. Changes: - Fix candidate extraction to concatenate adjacent OCR fragments - Disable Tesseract dictionaries (VINs are not dictionary words) - Set OEM 1 (LSTM engine) for better accuracy - Add PSM 11 (sparse text) and PSM 13 (raw line) fallback modes - Add Otsu's thresholding as alternative preprocessing pipeline - Upscale small images to meet Tesseract's 300 DPI requirement - Remove incorrect B->8 and S->5 transliterations (valid VIN chars) - Fix pre-existing test bug in check digit expected value Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-02-06 15:57:14 -06:00
Eric Gullickson	45aaeab973	chore: update context.json	2026-02-06 15:48:45 -06:00