initial

2026-02-04 15:22:28 +07:00
commit 7e56948ece
3 changed files with 1044 additions and 0 deletions
@@ -0,0 +1,61 @@
 # YOLOv9 dataset augmentation
 Augment a YOLOv9-format dataset by creating new image and label files for horizontal flip, vertical flip, +10% hue, +30% contrast, and grayscale. By default each image receives at most two of these augmentations, chosen at random (see `--max-per-image`). Labels are updated correctly for flips; other augmentations copy labels unchanged.
 ## Dataset layout
 Expected structure:
 ```
 dataset/
 ├── images/          # .jpg or .png
 │   ├── img1.jpg
 │   └── img2.jpg
 └── labels/          # .txt, one per image, same base name
    ├── img1.txt
    └── img2.txt
 ```
 YOLO label format: one line per object: `class_id x_center y_center width height` (normalized 0–1).
 If `images/` and `labels/` are not present, the script treats the given directory as containing both images and labels (flat layout).
 ## Setup
 ```bash
 pip install -r requirements.txt
 ```
 ## Usage
 Augment in place (new files appear next to originals in `images/` and `labels/`):
 ```bash
 python augment_yolov9_dataset.py --dataset-dir ./dataset/train
 ```
 Write augmented files to a separate directory (creates `train_aug/images/` and `train_aug/labels/`):
 ```bash
 python augment_yolov9_dataset.py --dataset-dir ./dataset/train --output-dir ./dataset/train_aug
 ```
 Other options:
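 - `--image-ext .png` — look only for `.png` images (default: `.jpg,.jpeg,.png`; a comma-separated list is accepted, and `all`/`any` selects the defaults)
 - `--suffixes hflip vflip` — restrict the augmentations that may be chosen to horizontal and vertical flip (choices: `hflip`, `vflip`, `hue`, `contrast`, `gray`; default: all)
 - `--max-per-image N` — apply at most `N` randomly chosen augmentation types to each image (default: 2)
 - `--seed N` — random seed for reproducible augmentation selection
 - `--dry-run` — print which files would be created without writing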
 ## Output naming
 For each image `img.jpg` with label `img.txt`, the script can create:
 | Augmentation   | Image           | Label           |
 |----------------|-----------------|-----------------|
 | Horizontal flip| `img_hflip.jpg` | `img_hflip.txt` |
 | Vertical flip  | `img_vflip.jpg` | `img_vflip.txt` |
 | Hue +10%       | `img_hue.jpg`   | `img_hue.txt`   |
 | Contrast +30%  | `img_contrast.jpg` | `img_contrast.txt` |
 | Grayscale      | `img_gray.jpg`  | `img_gray.txt`  |
 Add these paths to your YOLOv9 data YAML or file lists to use the augmented set.
@@ -0,0 +1,393 @@
 #!/usr/bin/env python3
 """
 Augment a YOLOv9-format dataset by creating new image and label files for:
 horizontal flip, vertical flip, +10% hue, +30% contrast, and grayscale.
 """
 from __future__ import annotations
 import argparse
 import logging
 import random
 import time
 from pathlib import Path
 import cv2
 # Augmentation strength constants (tune as needed)
 HUE_DELTA = 0.1  # 10% hue shift in [0, 1] scale
 CONTRAST_FACTOR = 1.3  # 30% contrast increase
 # Filename suffix for each augmentation type (also the values accepted by --suffixes)
 SUFFIX_HFLIP = "hflip"
 SUFFIX_VFLIP = "vflip"
 SUFFIX_HUE = "hue"
 SUFFIX_CONTRAST = "contrast"
 SUFFIX_GRAY = "gray"
 LOG = logging.getLogger(__name__)
 # Default image extensions to discover (case-insensitive)
 DEFAULT_IMAGE_EXTS = (".jpg", ".jpeg", ".png")
 def read_yolo_labels(path: Path) -> list[tuple[int, float, float, float, float]]:
    """Read a YOLO label file into (class_id, x_center, y_center, width, height) rows.

    Blank lines are ignored. A line is skipped with a warning, rather than
    aborting the whole file, when it does not have exactly five
    whitespace-separated fields or when any field is not numeric.

    Args:
        path: Label file to read.

    Returns:
        One tuple per valid object line, in file order.

    Raises:
        OSError: If the file cannot be opened or read.
    """
    rows = []
    with path.open() as f:
        for line in f:
            line = line.strip()
            if not line:
                continue
            parts = line.split()
            if len(parts) != 5:
                LOG.warning(
                    "Skipping malformed line in %s (expected 5 values): %s",
                    path,
                    line[:80],
                )
                continue
            try:
                class_id = int(parts[0])
                x_center, y_center, width, height = (float(p) for p in parts[1:])
            except ValueError:
                # A non-numeric field must not propagate: callers only handle
                # OSError, so an uncaught ValueError would stop the entire run.
                LOG.warning(
                    "Skipping malformed line in %s (non-numeric value): %s",
                    path,
                    line[:80],
                )
                continue
            rows.append((class_id, x_center, y_center, width, height))
    return rows
 def write_yolo_labels(path: Path, rows: list[tuple[int, float, float, float, float]]) -> None:
    """Write rows to *path* as YOLO label lines, creating parent directories as needed.

    Each row becomes ``class_id x_center y_center width height`` with the four
    box values formatted to six decimal places. An empty *rows* list produces
    an empty file.
    """
    path.parent.mkdir(parents=True, exist_ok=True)
    formatted = (
        f"{cls} {cx:.6f} {cy:.6f} {box_w:.6f} {box_h:.6f}\n"
        for cls, cx, cy, box_w, box_h in rows
    )
    with path.open("w") as out:
        out.writelines(formatted)
 def flip_labels_horizontal(
    rows: list[tuple[int, float, float, float, float]],
 ) -> list[tuple[int, float, float, float, float]]:
    """Mirror boxes left-to-right: every x_center becomes ``1 - x_center``.

    Class id, y_center, width and height are carried over untouched. The input
    list is not modified; a new list is returned.
    """
    mirrored = []
    for class_id, x_center, y_center, width, height in rows:
        mirrored.append((class_id, 1.0 - x_center, y_center, width, height))
    return mirrored
 def flip_labels_vertical(
    rows: list[tuple[int, float, float, float, float]],
 ) -> list[tuple[int, float, float, float, float]]:
    """Mirror boxes top-to-bottom: every y_center becomes ``1 - y_center``.

    Class id, x_center, width and height are carried over untouched. The input
    list is not modified; a new list is returned.
    """
    mirrored = []
    for class_id, x_center, y_center, width, height in rows:
        mirrored.append((class_id, x_center, 1.0 - y_center, width, height))
    return mirrored
 def _load_image(path: Path):
    """Read *path* with ``cv2.imread`` and return the decoded image.

    ``cv2.imread`` signals failure by returning ``None`` instead of raising,
    so that case is converted into an ``OSError`` here.

    Raises:
        OSError: If OpenCV could not load the file.
    """
    image = cv2.imread(str(path))
    if image is not None:
        return image
    raise OSError(f"Failed to load image: {path}. Check path and format (e.g. .jpg, .png).")
 def _ensure_parent(path: Path) -> None:
    """Create the directory that will hold *path*, including missing ancestors.

    Does nothing if the directory already exists.
    """
    parent_dir = path.parent
    parent_dir.mkdir(parents=True, exist_ok=True)
 def apply_horizontal_flip(
    image_path: Path,
    labels_path: Path,
    out_image_path: Path,
    out_labels_path: Path,
    dry_run: bool = False,
 ) -> None:
    """Write a left-right mirrored copy of the image together with mirrored labels.

    Args:
        image_path: Source image.
        labels_path: YOLO label file belonging to the source image.
        out_image_path: Destination for the flipped image.
        out_labels_path: Destination for the labels with ``x_center -> 1 - x_center``.
        dry_run: When true, only log the two destination paths and write nothing.

    Raises:
        OSError: If the image cannot be loaded or the flipped image cannot be written.
    """
    if dry_run:
        LOG.info("Would create: %s, %s", out_image_path, out_labels_path)
        return
    # flipCode 1 mirrors around the vertical axis (left <-> right).
    mirrored = cv2.flip(_load_image(image_path), 1)
    _ensure_parent(out_image_path)
    written = cv2.imwrite(str(out_image_path), mirrored)
    if not written:
        raise OSError(f"Failed to write image: {out_image_path}. Check permissions and disk space.")
    source_rows = read_yolo_labels(labels_path)
    write_yolo_labels(out_labels_path, flip_labels_horizontal(source_rows))
 def apply_vertical_flip(
    image_path: Path,
    labels_path: Path,
    out_image_path: Path,
    out_labels_path: Path,
    dry_run: bool = False,
 ) -> None:
    """Write a top-bottom mirrored copy of the image together with mirrored labels.

    Args:
        image_path: Source image.
        labels_path: YOLO label file belonging to the source image.
        out_image_path: Destination for the flipped image.
        out_labels_path: Destination for the labels with ``y_center -> 1 - y_center``.
        dry_run: When true, only log the two destination paths and write nothing.

    Raises:
        OSError: If the image cannot be loaded or the flipped image cannot be written.
    """
    if dry_run:
        LOG.info("Would create: %s, %s", out_image_path, out_labels_path)
        return
    # flipCode 0 mirrors around the horizontal axis (top <-> bottom).
    mirrored = cv2.flip(_load_image(image_path), 0)
    _ensure_parent(out_image_path)
    written = cv2.imwrite(str(out_image_path), mirrored)
    if not written:
        raise OSError(f"Failed to write image: {out_image_path}. Check permissions and disk space.")
    source_rows = read_yolo_labels(labels_path)
    write_yolo_labels(out_labels_path, flip_labels_vertical(source_rows))
 def apply_hue_shift(
    image_path: Path,
    labels_path: Path,
    out_image_path: Path,
    out_labels_path: Path,
    delta: float = HUE_DELTA,
    dry_run: bool = False,
 ) -> None:
    """Write a hue-rotated copy of the image and an unchanged copy of its labels.

    Args:
        image_path: Source image.
        labels_path: YOLO label file belonging to the source image.
        out_image_path: Destination for the hue-shifted image.
        out_labels_path: Destination for the re-written (geometrically unchanged) labels.
        delta: Hue rotation as a fraction of the full hue circle.
        dry_run: When true, only log the two destination paths and write nothing.

    Raises:
        OSError: If the image cannot be loaded or the result cannot be written.
    """
    if dry_run:
        LOG.info("Would create: %s, %s", out_image_path, out_labels_path)
        return
    source = _load_image(image_path)
    # Work in float32 so the addition below cannot wrap around like uint8 would.
    hsv_float = cv2.cvtColor(source, cv2.COLOR_BGR2HSV).astype("float32")
    hue, saturation, value = cv2.split(hsv_float)
    # 8-bit OpenCV hue spans 0-180, so a fraction of the circle is delta * 180;
    # the modulo wraps values that pass the top of the range.
    hue = (hue + delta * 180) % 180
    hsv_shifted = cv2.merge([hue, saturation, value]).astype("uint8")
    result = cv2.cvtColor(hsv_shifted, cv2.COLOR_HSV2BGR)
    _ensure_parent(out_image_path)
    written = cv2.imwrite(str(out_image_path), result)
    if not written:
        raise OSError(f"Failed to write image: {out_image_path}. Check permissions and disk space.")
    write_yolo_labels(out_labels_path, read_yolo_labels(labels_path))
 def apply_contrast(
    image_path: Path,
    labels_path: Path,
    out_image_path: Path,
    out_labels_path: Path,
    factor: float = CONTRAST_FACTOR,
    dry_run: bool = False,
 ) -> None:
    """Write a contrast-scaled copy of the image and an unchanged copy of its labels.

    Every pixel is moved away from (or towards) the mean of the whole image by
    *factor*: ``(pixel - mean) * factor + mean``, then clipped to ``[0, 255]``.

    Args:
        image_path: Source image.
        labels_path: YOLO label file belonging to the source image.
        out_image_path: Destination for the contrast-adjusted image.
        out_labels_path: Destination for the re-written (geometrically unchanged) labels.
        factor: Contrast multiplier.
        dry_run: When true, only log the two destination paths and write nothing.

    Raises:
        OSError: If the image cannot be loaded or the result cannot be written.
    """
    if dry_run:
        LOG.info("Would create: %s, %s", out_image_path, out_labels_path)
        return
    pixels = _load_image(image_path).astype("float32")
    # One scalar mean over all pixels and channels.
    pivot = pixels.mean()
    stretched = (pixels - pivot) * factor + pivot
    result = stretched.clip(0, 255).astype("uint8")
    _ensure_parent(out_image_path)
    written = cv2.imwrite(str(out_image_path), result)
    if not written:
        raise OSError(f"Failed to write image: {out_image_path}. Check permissions and disk space.")
    write_yolo_labels(out_labels_path, read_yolo_labels(labels_path))
 def apply_grayscale(
    image_path: Path,
    labels_path: Path,
    out_image_path: Path,
    out_labels_path: Path,
    dry_run: bool = False,
 ) -> None:
    """Write a grayscale copy of the image (kept 3-channel) and an unchanged copy of its labels.

    Args:
        image_path: Source image.
        labels_path: YOLO label file belonging to the source image.
        out_image_path: Destination for the grayscale image.
        out_labels_path: Destination for the re-written (geometrically unchanged) labels.
        dry_run: When true, only log the two destination paths and write nothing.

    Raises:
        OSError: If the image cannot be loaded or the result cannot be written.
    """
    if dry_run:
        LOG.info("Would create: %s, %s", out_image_path, out_labels_path)
        return
    single_channel = cv2.cvtColor(_load_image(image_path), cv2.COLOR_BGR2GRAY)
    # Expand back to three identical channels so the output keeps a BGR layout.
    result = cv2.cvtColor(single_channel, cv2.COLOR_GRAY2BGR)
    _ensure_parent(out_image_path)
    written = cv2.imwrite(str(out_image_path), result)
    if not written:
        raise OSError(f"Failed to write image: {out_image_path}. Check permissions and disk space.")
    write_yolo_labels(out_labels_path, read_yolo_labels(labels_path))
 def discover_images_and_labels(
    dataset_dir: Path,
    image_ext: str,
 ) -> list[tuple[Path, Path]]:
    """
    Find (image_path, label_path) pairs, sorted by image path.

    Prefer dataset_dir/images/ and dataset_dir/labels/; else use dataset_dir for both.
    Images without a ``<stem>.txt`` label file are skipped with a warning.

    Args:
        dataset_dir: Dataset root (split layout) or the folder holding images and labels (flat layout).
        image_ext: One extension, a comma-separated list of extensions (leading dot
            optional, case-insensitive), or one of ``*``/``any``/``all``/``auto``/empty
            to use DEFAULT_IMAGE_EXTS.

    Returns:
        Pairs in sorted image-path order, so the result does not depend on the
        order in which the filesystem happens to list directory entries.

    Raises:
        FileNotFoundError: If the image directory or the label directory does not exist.
    """
    images_dir = dataset_dir / "images"
    labels_dir = dataset_dir / "labels"
    if not images_dir.is_dir():
        # No images/ subfolder: fall back to the flat layout.
        images_dir = dataset_dir
        labels_dir = dataset_dir
    if not images_dir.is_dir():
        raise FileNotFoundError(
            f"Dataset directory not found or has no 'images' subdir: {dataset_dir}. "
            "Provide a path that contains an 'images' folder or is the folder with image files."
        )
    if not labels_dir.is_dir():
        raise FileNotFoundError(
            f"Labels directory not found: {labels_dir}. "
            "Expected a 'labels' folder next to 'images', or the same folder for flat layout."
        )
    raw = (image_ext or "").strip()
    if raw.lower() in {"*", "any", "all", "auto"}:
        parts = []
    else:
        parts = [p.strip() for p in raw.split(",") if p.strip()]
    if parts:
        allowed_exts = {(p if p.startswith(".") else f".{p}").lower() for p in parts}
    else:
        allowed_exts = {e.lower() for e in DEFAULT_IMAGE_EXTS}
    pairs = []
    # iterdir() yields entries in arbitrary order; sorting makes the pair order
    # (and therefore any seeded random choice made per pair) reproducible.
    for img_path in sorted(images_dir.iterdir()):
        if not img_path.is_file():
            continue
        if img_path.suffix.lower() not in allowed_exts:
            continue
        label_path = labels_dir / f"{img_path.stem}.txt"
        if not label_path.is_file():
            LOG.warning("No label file for image %s, skipping: %s", img_path.name, label_path)
            continue
        pairs.append((img_path, label_path))
    return pairs
 def run_augmentations(
    dataset_dir: Path,
    output_dir: Path | None,
    image_ext: str,
    enabled: set[str],
    max_per_image: int,
    dry_run: bool,
 ) -> None:
    """Discover image/label pairs and apply up to max_per_image random augmentations per image.

    Args:
        dataset_dir: Dataset root passed to discover_images_and_labels.
        output_dir: Root for augmented files (``images/`` and ``labels/`` are created
            beneath it). ``None`` writes next to the originals.
        image_ext: Extension filter passed to discover_images_and_labels.
        enabled: Augmentation suffixes that may be chosen for an image.
        max_per_image: Upper bound on distinct augmentations applied to one image.
        dry_run: When true, log what would be created without writing anything.

    A failure on one augmentation (unreadable/unwritable file, malformed label
    values, OpenCV error) is logged and the run continues with the next one.
    """
    pairs = discover_images_and_labels(dataset_dir, image_ext)
    if not pairs:
        LOG.warning("No image/label pairs found in %s with image-ext %s.", dataset_dir, image_ext)
        return
    # Dispatch table instead of an if/elif chain: a suffix with no handler can
    # no longer fall through silently and be counted as a completed augmentation.
    appliers = {
        SUFFIX_HFLIP: apply_horizontal_flip,
        SUFFIX_VFLIP: apply_vertical_flip,
        SUFFIX_HUE: apply_hue_shift,
        SUFFIX_CONTRAST: apply_contrast,
        SUFFIX_GRAY: apply_grayscale,
    }
    unknown = sorted(s for s in enabled if s not in appliers)
    if unknown:
        LOG.warning("Ignoring unknown augmentation types: %s", ", ".join(unknown))
    # Sorted, not list(enabled): a set of strings iterates in hash order, which
    # changes between interpreter runs, so random.sample would pick different
    # augmentations for the same seed.
    enabled_list = sorted(s for s in enabled if s in appliers)
    if not enabled_list:
        LOG.warning("No augmentation types enabled.")
        return
    if output_dir is None:
        # In place: use images/ and labels/ when present, else the flat layout.
        out_images = dataset_dir / "images" if (dataset_dir / "images").is_dir() else dataset_dir
        out_labels = dataset_dir / "labels" if (dataset_dir / "labels").is_dir() else dataset_dir
    else:
        out_images = output_dir / "images"
        out_labels = output_dir / "labels"
    total_images = len(pairs)
    total_augmentations = 0
    k = min(max_per_image, len(enabled_list))
    start_time = time.perf_counter()
    LOG.info("Starting augmentation: %d images, max %d per image.", total_images, max_per_image)
    for idx, (img_path, label_path) in enumerate(pairs, start=1):
        base = img_path.stem
        ext = img_path.suffix
        chosen = random.sample(enabled_list, k)
        LOG.info(
            "Processing image %d/%d: %s (%s)",
            idx,
            total_images,
            img_path.name,
            ", ".join(chosen),
        )
        for suffix in chosen:
            out_img = out_images / f"{base}_{suffix}{ext}"
            out_lbl = out_labels / f"{base}_{suffix}.txt"
            try:
                appliers[suffix](img_path, label_path, out_img, out_lbl, dry_run=dry_run)
            except (OSError, ValueError, cv2.error) as e:
                # Keep going: one corrupt image or label must not abort the batch.
                LOG.error("Skipping %s %s: %s", suffix, img_path.name, e)
            else:
                total_augmentations += 1
    elapsed = time.perf_counter() - start_time
    LOG.info(
        "Completed: %d images, %d augmentations in %.1f s.",
        total_images,
        total_augmentations,
        elapsed,
    )
 def main() -> None:
    """Command-line entry point: parse options, validate them, run the augmentation pass.

    Exits with status 1 (after logging an error) when ``--max-per-image`` is
    below 1 or when ``--dataset-dir`` is not an existing directory.
    """
    logging.basicConfig(level=logging.INFO, format="%(levelname)s: %(message)s")
    all_suffixes = [SUFFIX_HFLIP, SUFFIX_VFLIP, SUFFIX_HUE, SUFFIX_CONTRAST, SUFFIX_GRAY]

    cli = argparse.ArgumentParser(
        description="Augment YOLOv9 dataset with flips, hue, contrast, and grayscale.",
    )
    cli.add_argument(
        "--dataset-dir",
        type=Path,
        required=True,
        help="Root of the dataset (containing images/ and labels/ or flat image+label files).",
    )
    cli.add_argument(
        "--output-dir",
        type=Path,
        default=None,
        help="Where to write augmented files (default: same as dataset-dir).",
    )
    cli.add_argument(
        "--image-ext",
        type=str,
        default=",".join(DEFAULT_IMAGE_EXTS),
        help=(
            "Image extension(s) to look for. Provide a single ext (e.g. .jpg) or a comma-separated list "
            "(e.g. .jpg,.jpeg,.png). Use 'all'/'any' to use the defaults."
        ),
    )
    cli.add_argument(
        "--suffixes",
        type=str,
        nargs="+",
        default=list(all_suffixes),
        choices=list(all_suffixes),
        help="Which augmentations can be applied (default: all).",
    )
    cli.add_argument(
        "--max-per-image",
        type=int,
        default=2,
        metavar="N",
        help="Maximum number of augmentation types to apply per image (default: 2).",
    )
    cli.add_argument(
        "--seed",
        type=int,
        default=None,
        help="Random seed for reproducible augmentation selection.",
    )
    cli.add_argument(
        "--dry-run",
        action="store_true",
        help="Only print which files would be created.",
    )
    opts = cli.parse_args()

    if opts.max_per_image < 1:
        LOG.error("--max-per-image must be at least 1.")
        raise SystemExit(1)

    # Seed only on request so unseeded runs keep their default randomness.
    if opts.seed is not None:
        random.seed(opts.seed)

    if not opts.dataset_dir.is_dir():
        LOG.error(
            "Dataset directory does not exist: %s. Create it and add images/ and labels/ (or image + label files).",
            opts.dataset_dir,
        )
        raise SystemExit(1)

    run_augmentations(
        dataset_dir=opts.dataset_dir,
        output_dir=opts.output_dir,
        image_ext=opts.image_ext,
        enabled=set(opts.suffixes),
        max_per_image=opts.max_per_image,
        dry_run=opts.dry_run,
    )
 if __name__ == "__main__":
    main()
@@ -0,0 +1,590 @@
 #!/usr/bin/env python3
 """
 Script to convert YOLO txt label format to LabelMe JSON format.
 YOLO format: class_id x_center y_center width height (normalized 0.0-1.0)
 LabelMe format: JSON with shapes containing rectangles with pixel coordinates
 """
 import os
 import sys
 import argparse
 import json
 import shutil
 from pathlib import Path
 try:
    from PIL import Image
    HAS_PIL = True
 except ImportError:
    HAS_PIL = False
    print("Warning: PIL/Pillow not installed. Image dimension detection required for conversion.")
    print("Install with: pip install pillow")
 def get_image_dimensions(image_path):
    """Return the image size as (width, height), or (None, None) when it cannot be determined.

    The size is unavailable when Pillow is not installed (HAS_PIL is false) or
    when opening the image fails; the latter case prints a warning.
    """
    unknown = (None, None)
    if not HAS_PIL:
        return unknown
    try:
        with Image.open(image_path) as img:
            # PIL reports size as (width, height).
            return img.size
    except Exception as e:
        print(f"Warning: Could not read image {image_path}: {e}")
    return unknown
 def yolo_to_labelme_rectangle(x_center_norm, y_center_norm, width_norm, height_norm,
                               img_width, img_height):
    """
    Turn a normalized YOLO box into the two corner points LabelMe uses for a rectangle.

    Args:
        x_center_norm, y_center_norm: Box centre, normalized to the image size
        width_norm, height_norm: Box size, normalized to the image size
        img_width, img_height: Image dimensions in pixels

    Returns:
        [[x1, y1], [x2, y2]] - top-left and bottom-right corners in pixels,
        as floats, each clamped to the image bounds
    """
    def _clamp(value, upper):
        # Keep the coordinate inside [0, upper].
        return max(0.0, min(upper, value))

    # Scale centre and half-extents from normalized units to pixels.
    centre_x = x_center_norm * img_width
    centre_y = y_center_norm * img_height
    half_w = (width_norm * img_width) / 2.0
    half_h = (height_norm * img_height) / 2.0

    left = _clamp(centre_x - half_w, img_width)
    top = _clamp(centre_y - half_h, img_height)
    right = _clamp(centre_x + half_w, img_width)
    bottom = _clamp(centre_y + half_h, img_height)
    return [[float(left), float(top)], [float(right), float(bottom)]]
 def is_normalized(value):
    """Return True when *value*, converted to float, lies in the closed range [0.0, 1.0]."""
    number = float(value)
    return number >= 0.0 and number <= 1.0
 def find_image_file(txt_file, image_extensions=None):
    """
    Find corresponding image file for a txt annotation file.

    Search order:
      1. If the txt file sits in a directory named 'labels' (case-insensitive)
         and a sibling 'images' directory exists, that 'images' directory.
      2. The directory containing the txt file.
    Within each directory the extensions are tried first exactly as given,
    then in upper-case and ``str.capitalize()`` form.

    Only regular files are accepted, so a directory that happens to be named
    like an image (e.g. ``x.jpg/``) is never returned.

    Args:
        txt_file: Path to txt annotation file
        image_extensions: List of image extensions to try
            (default: ['.jpg', '.jpeg', '.png', '.bmp', '.tif', '.tiff'])
    Returns:
        Path to image file or None if not found
    """
    if image_extensions is None:
        image_extensions = ['.jpg', '.jpeg', '.png', '.bmp', '.tif', '.tiff']
    txt_file = Path(txt_file)
    base_name = txt_file.stem
    txt_dir = txt_file.parent

    # Directories to probe, in priority order.
    search_dirs = []
    if txt_dir.name.lower() == 'labels':
        images_dir = txt_dir.parent / 'images'
        if images_dir.is_dir():
            search_dirs.append(images_dir)
    search_dirs.append(txt_dir)

    for directory in search_dirs:
        # Pass 1: extensions exactly as supplied.
        for ext in image_extensions:
            potential_image = directory / f"{base_name}{ext}"
            if potential_image.is_file():
                return potential_image
        # Pass 2: case variations (the as-given form was already tried above).
        for ext in image_extensions:
            for case_ext in (ext.upper(), ext.capitalize()):
                potential_image = directory / f"{base_name}{case_ext}"
                if potential_image.is_file():
                    return potential_image
    return None
 def find_images_directory_for_labels(labels_dir):
    """
    Locate the 'images' directory that sits next to a 'labels' directory.

    Args:
        labels_dir: Path to labels directory
    Returns:
        Path to the sibling 'images' entry when labels_dir is named 'labels'
        (case-insensitive) and that entry exists; otherwise None
    """
    labels_path = Path(labels_dir)
    if labels_path.name.lower() != 'labels':
        return None
    sibling = labels_path.parent / 'images'
    return sibling if sibling.exists() else None
 def convert_yolo_to_labelme(txt_file, image_file=None, class_names=None,
                             image_extensions=None, include_image_data=False):
    """
    Build the LabelMe JSON structure for one YOLO txt annotation file.

    Lines with fewer than five fields, or whose fields cannot be parsed, are
    reported with a printed warning and skipped. Values outside 0.0-1.0 only
    trigger a warning; they are still converted as if normalized.

    Args:
        txt_file: Path to YOLO txt annotation file
        image_file: Path to the matching image (optional; located with
            find_image_file when omitted)
        class_names: Dictionary mapping class_id to class name (optional;
            the class id itself is used as label when there is no mapping)
        image_extensions: Extensions passed to find_image_file when the image
            has to be searched for
        include_image_data: Whether to embed the base64-encoded image in the result
    Returns:
        Dictionary with LabelMe JSON structure
    Raises:
        FileNotFoundError: If the annotation file or the image file is missing
        ValueError: If the image dimensions cannot be determined
    """
    txt_file = Path(txt_file)
    if not txt_file.exists():
        raise FileNotFoundError(f"Annotation file not found: {txt_file}")

    # Resolve the image: explicit argument first, search as fallback.
    if image_file is None:
        image_file = find_image_file(txt_file, image_extensions)
    if image_file is None:
        raise FileNotFoundError(
            f"Image file not found for {txt_file}. "
            f"Please provide image_file or ensure image exists in same directory."
        )
    image_file = Path(image_file)
    if not image_file.exists():
        raise FileNotFoundError(f"Image file not found: {image_file}")

    # Pixel dimensions are needed to de-normalize the YOLO boxes.
    img_width, img_height = get_image_dimensions(image_file)
    if img_width is None or img_height is None:
        raise ValueError(
            f"Could not determine image dimensions for {image_file}. "
            f"PIL/Pillow is required for this operation."
        )

    shapes = []
    with open(txt_file, 'r') as f:
        for line_num, raw_line in enumerate(f, 1):
            line = raw_line.strip()
            if not line:
                continue
            parts = line.split()
            if len(parts) < 5:
                print(f"Warning: Invalid YOLO format in {txt_file} line {line_num}: {line}")
                continue
            try:
                class_id = int(parts[0])
                x_center, y_center, width, height = (float(p) for p in parts[1:5])
                box_values = (x_center, y_center, width, height)
                if not all(is_normalized(v) for v in box_values):
                    print(f"Warning: Coordinates in {txt_file} line {line_num} may not be normalized. "
                          f"Assuming normalized format.")
                points = yolo_to_labelme_rectangle(
                    x_center, y_center, width, height, img_width, img_height
                )
                # Fall back to the numeric id when no name is mapped.
                has_name = class_names and class_id in class_names
                label = class_names[class_id] if has_name else str(class_id)
                shapes.append({
                    "label": label,
                    "points": points,
                    "group_id": None,
                    "shape_type": "rectangle",
                    "flags": {}
                })
            except (ValueError, IndexError) as e:
                print(f"Warning: Could not parse line {line_num} in {txt_file}: {line} - {e}")
                continue

    # Optional embedded image; failure here is non-fatal and leaves imageData as None.
    image_data = None
    if include_image_data:
        try:
            import base64
            with open(image_file, 'rb') as f:
                encoded = base64.b64encode(f.read())
            image_data = encoded.decode('utf-8')
        except Exception as e:
            print(f"Warning: Could not encode image data: {e}")

    return {
        "version": "5.0.1",
        "flags": {},
        "shapes": shapes,
        "imagePath": image_file.name,
        "imageData": image_data,
        "imageHeight": img_height,
        "imageWidth": img_width
    }
 def convert_dataset(input_dir, output_dir=None, class_names_file=None, 
                    image_extensions=None, include_image_data=False, 
                    copy_images=False, recursive=False):
    """
    Convert a directory of YOLO txt annotations to LabelMe JSON format.

    Every ``*.txt`` file found is treated as an annotation file. A file whose
    image cannot be found, or whose conversion raises, is recorded in the
    returned ``errors`` list and printed; processing continues with the next file.

    Args:
        input_dir: Input directory containing txt files and images
        output_dir: Output directory for LabelMe JSON files (optional). If None, the JSON
            goes into the sibling 'images' directory when the txt file is in a 'labels'
            directory, otherwise next to the image file.
        class_names_file: Path to file with class names (one per line, optional).
            The zero-based line index is the class id; blank lines are skipped
            but still consume an index.
        image_extensions: List of image extensions to search
        include_image_data: Whether to include base64-encoded image data
        copy_images: Whether to copy images to output directory (only used if output_dir is specified)
        recursive: Whether to process subdirectories recursively
    Returns:
        Dictionary with conversion statistics: 'files_processed' (int),
        'total_annotations' (int) and 'errors' (list of message strings)
    Raises:
        FileNotFoundError: If input_dir does not exist
        ValueError: If no .txt files are found
    """
    input_dir = Path(input_dir)
    if not input_dir.exists():
        raise FileNotFoundError(f"Input directory not found: {input_dir}")
    # Load class names if provided
    class_names = None
    if class_names_file:
        class_names_file = Path(class_names_file)
        if class_names_file.exists():
            class_names = {}
            with open(class_names_file, 'r') as f:
                for idx, line in enumerate(f):
                    class_name = line.strip()
                    if class_name:
                        class_names[idx] = class_name
            print(f"Loaded {len(class_names)} class names from {class_names_file}")
        else:
            # A missing names file is not fatal: labels fall back to class ids.
            print(f"Warning: Class names file not found: {class_names_file}")
    # Find all txt files (recursive or not)
    if recursive:
        txt_files = list(input_dir.rglob('*.txt'))
    else:
        txt_files = list(input_dir.glob('*.txt'))
    if not txt_files:
        search_type = "recursively" if recursive else "in"
        raise ValueError(f"No .txt files found {search_type} {input_dir}")
    stats = {
        'files_processed': 0,
        'total_annotations': 0,
        'errors': []
    }
    # Process each txt file; any exception is confined to the file that caused it
    for txt_file in txt_files:
        try:
            # Find corresponding image
            image_file = find_image_file(txt_file, image_extensions)
            if not image_file:
                error_msg = f"Image file not found for {txt_file}"
                stats['errors'].append(error_msg)
                print(f"ERROR: {error_msg}")
                continue
            # Convert to LabelMe format
            labelme_json = convert_yolo_to_labelme(
                txt_file, image_file, class_names, image_extensions, include_image_data
            )
            # Determine where to place the JSON file
            if output_dir:
                # If output_dir is specified, preserve relative path structure when recursive
                output_dir = Path(output_dir)
                if recursive:
                    # Preserve relative path from input_dir
                    relative_path = txt_file.relative_to(input_dir)
                    output_subdir = output_dir / relative_path.parent
                    output_subdir.mkdir(parents=True, exist_ok=True)
                    json_file = output_subdir / f"{image_file.stem}.json"
                    # Copy image if requested, preserving directory structure;
                    # an image already present at the destination is left untouched
                    if copy_images:
                        output_image = output_subdir / image_file.name
                        if not output_image.exists():
                            shutil.copy2(image_file, output_image)
                else:
                    # Non-recursive: just use output_dir
                    output_dir.mkdir(parents=True, exist_ok=True)
                    json_file = output_dir / f"{image_file.stem}.json"
                    # Copy image if requested; an existing destination file is not overwritten
                    if copy_images:
                        output_image = output_dir / image_file.name
                        if not output_image.exists():
                            shutil.copy2(image_file, output_image)
            else:
                # Check if txt_file is in a 'labels' directory
                # If so, place JSON in corresponding 'images' directory
                txt_dir = txt_file.parent
                if txt_dir.name.lower() == 'labels':
                    images_dir = find_images_directory_for_labels(txt_dir)
                    if images_dir:
                        # Place JSON in images directory
                        json_file = images_dir / f"{image_file.stem}.json"
                    else:
                        # Fallback: place next to image file
                        json_file = image_file.parent / f"{image_file.stem}.json"
                else:
                    # Otherwise, place JSON file next to the image file
                    json_file = image_file.parent / f"{image_file.stem}.json"
            json_file.parent.mkdir(parents=True, exist_ok=True)
            with open(json_file, 'w') as f:
                json.dump(labelme_json, f, indent=2)
            # Counters are updated only after the JSON file has been written
            stats['files_processed'] += 1
            stats['total_annotations'] += len(labelme_json['shapes'])
            print(f"Processed: {txt_file} -> {json_file} ({len(labelme_json['shapes'])} annotations)")
        except Exception as e:
            error_msg = f"Error processing {txt_file}: {str(e)}"
            stats['errors'].append(error_msg)
            print(f"ERROR: {error_msg}")
    return stats
 def _cli_build_parser():
    """Create the argument parser for the YOLO txt -> LabelMe JSON converter.

    Returns:
        argparse.ArgumentParser: parser exposing the single-file options
        (positional ``input``, ``--image``, ``--output``) and the batch
        options (``--input-dir``, ``--output-dir``, ``--copy-images``,
        ``--recursive``) plus the options shared by both modes.
    """
    parser = argparse.ArgumentParser(
        description='Convert YOLO txt label format to LabelMe JSON format',
        # Raw formatter keeps the hand-formatted examples in the epilog intact.
        formatter_class=argparse.RawDescriptionHelpFormatter,
        epilog="""
 Examples:
  # Convert single file (JSON placed in images folder if txt is in labels folder)
  python convert_yolo_to_labelme.py train/labels/x.txt --image train/images/x.jpg
  # Output: train/images/x.json
  # Convert directory (JSON files placed in images folders when txt files are in labels folders)
  python convert_yolo_to_labelme.py --input-dir ./train/labels
  # Converts train/labels/x.txt -> train/images/x.json
  # Convert directory recursively (processes all subdirectories)
  python convert_yolo_to_labelme.py --input-dir ./dataset --recursive
  # Converts train/labels/x.txt -> train/images/x.json
  # Converts val/labels/y.txt -> val/images/y.json
  # Convert directory with custom output directory
  python convert_yolo_to_labelme.py --input-dir ./labels --output-dir ./labelme_annotations
  # Convert recursively with custom output directory (preserves directory structure)
  python convert_yolo_to_labelme.py --input-dir ./labels --output-dir ./labelme_annotations --recursive
  # Convert with class names file
  python convert_yolo_to_labelme.py --input-dir ./labels --class-names classes.txt
  # Convert and include image data in JSON
  python convert_yolo_to_labelme.py --input-dir ./labels --include-image-data
        """
    )
    # --- single-file mode -------------------------------------------------
    parser.add_argument(
        'input',
        nargs='?',
        help='Input YOLO txt file (if converting single file)'
    )
    parser.add_argument(
        '--image',
        type=str,
        help='Image file path (required for single file conversion)'
    )
    parser.add_argument(
        '--output', '-o',
        type=str,
        help='Output JSON file path (for single file conversion). If not specified, JSON is placed in images folder when txt is in labels folder, otherwise next to image file.'
    )
    # --- batch mode -------------------------------------------------------
    parser.add_argument(
        '--input-dir',
        type=str,
        help='Input directory containing txt files and images (for batch conversion)'
    )
    parser.add_argument(
        '--output-dir',
        type=str,
        default=None,
        help='Output directory for LabelMe JSON files (for batch conversion). If not specified, JSON files are placed in the images folder when txt files are in a labels folder (e.g., train/labels/x.txt -> train/images/x.json), otherwise next to image files.'
    )
    # --- options used by both modes ---------------------------------------
    parser.add_argument(
        '--class-names',
        type=str,
        dest='class_names_file',
        help='File with class names (one per line, line number = class_id)'
    )
    parser.add_argument(
        '--image-extensions',
        nargs='+',
        default=['.jpg', '.jpeg', '.png', '.bmp', '.tif', '.tiff'],
        help='Image file extensions to search for (default: .jpg .jpeg .png .bmp .tif .tiff)'
    )
    parser.add_argument(
        '--include-image-data',
        action='store_true',
        help='Include base64-encoded image data in JSON (increases file size)'
    )
    parser.add_argument(
        '--copy-images',
        action='store_true',
        help='Copy images to output directory (for batch conversion)'
    )
    parser.add_argument(
        '--recursive', '-r',
        action='store_true',
        help='Process subdirectories recursively'
    )
    return parser

 def _cli_load_class_names(class_names_path):
    """Read a class-names file into a ``{line_index: name}`` mapping.

    Args:
        class_names_path: path (str or Path) of a text file with one class
            name per line.

    Returns:
        dict mapping the zero-based line index to the stripped class name
        (blank lines are skipped but still consume an index), or ``None``
        when the file does not exist, in which case a warning is printed.
    """
    class_names_file = Path(class_names_path)
    if not class_names_file.exists():
        print(f"Warning: Class names file not found: {class_names_file}")
        return None
    class_names = {}
    # Explicit UTF-8: the platform default encoding would mis-decode (or
    # fail on) non-ASCII class names on non-UTF-8 locales.
    with open(class_names_file, 'r', encoding='utf-8') as f:
        for idx, line in enumerate(f):
            class_name = line.strip()
            if class_name:
                class_names[idx] = class_name
    return class_names

 def _cli_default_json_path(txt_path, image_path):
    """Choose where the JSON goes when ``--output`` was not given.

    When the txt file sits in a directory named ``labels`` (case-insensitive)
    and ``find_images_directory_for_labels`` returns a directory for it, the
    JSON is placed there; in every other case it is placed next to the image.
    The file name is always the image's stem plus ``.json``.
    """
    image_file = Path(image_path)
    json_name = f"{image_file.stem}.json"
    txt_dir = Path(txt_path).parent
    if txt_dir.name.lower() == 'labels':
        images_dir = find_images_directory_for_labels(txt_dir)
        if images_dir:
            return images_dir / json_name
    # Fallback for both "not in a labels folder" and "no images folder found".
    return image_file.parent / json_name

 def _cli_run_single(args):
    """Convert one txt/image pair and write the resulting JSON file.

    Any exception raised during conversion or writing is reported on stderr
    as ``ERROR: ...`` and the process exits with status 1.
    """
    class_names = None
    if args.class_names_file:
        class_names = _cli_load_class_names(args.class_names_file)
    try:
        labelme_json = convert_yolo_to_labelme(
            args.input,
            args.image,
            class_names,
            args.image_extensions,
            args.include_image_data
        )
        if args.output:
            output_file = Path(args.output)
        else:
            output_file = _cli_default_json_path(args.input, args.image)
        output_file.parent.mkdir(parents=True, exist_ok=True)
        with open(output_file, 'w', encoding='utf-8') as f:
            json.dump(labelme_json, f, indent=2)
        print(f"Successfully converted {args.input} to {output_file}")
        print(f"  Annotations: {len(labelme_json['shapes'])}")
        print(f"  Image: {labelme_json['imagePath']} ({labelme_json['imageWidth']}x{labelme_json['imageHeight']})")
    except Exception as e:
        # Top-level CLI boundary: report the failure and exit non-zero.
        print(f"ERROR: {e}", file=sys.stderr)
        sys.exit(1)

 def _cli_run_batch(args):
    """Convert a whole directory via ``convert_dataset`` and print a summary.

    Per-file errors collected in the returned stats are listed in the
    summary; an exception escaping ``convert_dataset`` is reported on stderr
    and the process exits with status 1.
    """
    try:
        stats = convert_dataset(
            args.input_dir,
            args.output_dir,  # optional; may be None
            args.class_names_file,
            args.image_extensions,
            args.include_image_data,
            args.copy_images,
            args.recursive
        )
        print("\n" + "="*50)
        print("Conversion Summary:")
        print(f"  Files processed: {stats['files_processed']}")
        print(f"  Total annotations: {stats['total_annotations']}")
        if stats['errors']:
            print(f"  Errors: {len(stats['errors'])}")
            for error in stats['errors']:
                print(f"    - {error}")
        print("="*50)
    except Exception as e:
        print(f"ERROR: {e}", file=sys.stderr)
        sys.exit(1)

 def main():
    """Command-line entry point: parse arguments and run the selected mode.

    Single-file mode is selected by the positional ``input`` argument and
    requires ``--image``; batch mode is selected by ``--input-dir``.  The two
    modes are mutually exclusive.  Invalid combinations end the process
    through ``parser.error`` (usage message, exit status 2); conversion
    failures exit with status 1.
    """
    parser = _cli_build_parser()
    args = parser.parse_args()

    # Previously the positional input silently won and --input-dir was
    # ignored; reject the ambiguous invocation instead.
    if args.input and args.input_dir:
        parser.error("Provide either an input file or --input-dir, not both")

    if args.input:
        if not args.image:
            parser.error("--image is required for single file conversion")
        _cli_run_single(args)
    elif args.input_dir:
        _cli_run_batch(args)
    else:
        parser.error("Either provide input file or --input-dir for batch conversion")
 # Run the command-line interface only when this file is executed as a script;
 # importing it as a module does not call main().
 if __name__ == '__main__':
    main()