feat: Implement sound normalization service and API endpoints

- Added SoundNormalizerService for normalizing audio files, with support for one-pass and two-pass normalization methods.
- Introduced API endpoints for normalizing all sounds and specific sounds by ID, including support for forced normalization and handling of already-normalized sounds.
- Created a comprehensive test suite for the sound normalizer service and its API endpoints, covering success, error, and edge-case scenarios.
- Refactored the sound scanning service to use SHA-256 instead of MD5 for file hashing, for improved security.
- Enhanced logging and error handling throughout the sound normalization process.
2025-07-28 09:18:18 +02:00
parent 36949a1f1c
commit 0fffce53b4
8 changed files with 2031 additions and 75 deletions
--- a/app/api/v1/__init__.py
+++ b/app/api/v1/__init__.py
@@ -2,7 +2,7 @@

 from fastapi import APIRouter

-from app.api.v1 import auth, main, socket, sounds
+from app.api.v1 import auth, main, socket, sound_normalizer, sounds

 # V1 API router with v1 prefix
 api_router = APIRouter(prefix="/v1")
@@ -12,3 +12,4 @@ api_router.include_router(main.router, tags=["main"])
 api_router.include_router(auth.router, prefix="/auth", tags=["authentication"])
 api_router.include_router(socket.router, tags=["socket"])
 api_router.include_router(sounds.router, tags=["sounds"])
+api_router.include_router(sound_normalizer.router, tags=["sound-normalization"])
--- a/app/api/v1/sound_normalizer.py
+++ b/app/api/v1/sound_normalizer.py
@@ -0,0 +1,166 @@
+"""Sound normalization API endpoints."""
+
+from typing import Annotated
+
+from fastapi import APIRouter, Depends, HTTPException, Query, status
+from sqlmodel.ext.asyncio.session import AsyncSession
+
+from app.core.database import get_db
+from app.core.dependencies import get_current_active_user_flexible
+from app.models.user import User
+from app.services.sound_normalizer import NormalizationResults, SoundNormalizerService
+
+router = APIRouter(prefix="/sounds/normalize", tags=["sound-normalization"])
+
+
+async def get_sound_normalizer_service(
+    session: Annotated[AsyncSession, Depends(get_db)],
+) -> SoundNormalizerService:
+    """Get the sound normalizer service."""
+    return SoundNormalizerService(session)
+
+
+@router.post("/all")
+async def normalize_all_sounds(
+    current_user: Annotated[User, Depends(get_current_active_user_flexible)],
+    normalizer_service: Annotated[
+        SoundNormalizerService, Depends(get_sound_normalizer_service)
+    ],
+    force: bool = Query(
+        False, description="Force normalization of already normalized sounds"
+    ),
+    one_pass: bool | None = Query(
+        None, description="Use one-pass normalization (overrides config)"
+    ),
+) -> dict[str, NormalizationResults | str]:
+    """Normalize all unnormalized sounds."""
+    # Only allow admins to normalize sounds
+    if current_user.role not in ["admin", "superadmin"]:
+        raise HTTPException(
+            status_code=status.HTTP_403_FORBIDDEN,
+            detail="Only administrators can normalize sounds",
+        )
+
+    try:
+        results = await normalizer_service.normalize_all_sounds(
+            force=force,
+            one_pass=one_pass,
+        )
+        return {
+            "message": "Sound normalization completed",
+            "results": results,
+        }
+    except Exception as e:
+        raise HTTPException(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            detail=f"Failed to normalize sounds: {e!s}",
+        ) from e
+
+
+@router.post("/type/{sound_type}")
+async def normalize_sounds_by_type(
+    sound_type: str,
+    current_user: Annotated[User, Depends(get_current_active_user_flexible)],
+    normalizer_service: Annotated[
+        SoundNormalizerService, Depends(get_sound_normalizer_service)
+    ],
+    force: bool = Query(
+        False, description="Force normalization of already normalized sounds"
+    ),
+    one_pass: bool | None = Query(
+        None, description="Use one-pass normalization (overrides config)"
+    ),
+) -> dict[str, NormalizationResults | str]:
+    """Normalize all sounds of a specific type (SDB, TTS, EXT)."""
+    # Only allow admins to normalize sounds
+    if current_user.role not in ["admin", "superadmin"]:
+        raise HTTPException(
+            status_code=status.HTTP_403_FORBIDDEN,
+            detail="Only administrators can normalize sounds",
+        )
+
+    # Validate sound type
+    valid_types = ["SDB", "TTS", "EXT"]
+    if sound_type not in valid_types:
+        raise HTTPException(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            detail=f"Invalid sound type. Must be one of: {', '.join(valid_types)}",
+        )
+
+    try:
+        results = await normalizer_service.normalize_sounds_by_type(
+            sound_type=sound_type,
+            force=force,
+            one_pass=one_pass,
+        )
+        return {
+            "message": f"Normalization of {sound_type} sounds completed",
+            "results": results,
+        }
+    except Exception as e:
+        raise HTTPException(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            detail=f"Failed to normalize {sound_type} sounds: {e!s}",
+        ) from e
+
+
+@router.post("/{sound_id}")
+async def normalize_sound_by_id(
+    sound_id: int,
+    current_user: Annotated[User, Depends(get_current_active_user_flexible)],
+    normalizer_service: Annotated[
+        SoundNormalizerService, Depends(get_sound_normalizer_service)
+    ],
+    force: bool = Query(
+        False, description="Force normalization of already normalized sound"
+    ),
+    one_pass: bool | None = Query(
+        None, description="Use one-pass normalization (overrides config)"
+    ),
+) -> dict[str, str]:
+    """Normalize a specific sound by ID."""
+    # Only allow admins to normalize sounds
+    if current_user.role not in ["admin", "superadmin"]:
+        raise HTTPException(
+            status_code=status.HTTP_403_FORBIDDEN,
+            detail="Only administrators can normalize sounds",
+        )
+
+    try:
+        # Get the sound
+        sound = await normalizer_service.sound_repo.get_by_id(sound_id)
+        if not sound:
+            raise HTTPException(
+                status_code=status.HTTP_404_NOT_FOUND,
+                detail=f"Sound with ID {sound_id} not found",
+            )
+
+        # Normalize the sound
+        result = await normalizer_service.normalize_sound(
+            sound=sound,
+            force=force,
+            one_pass=one_pass,
+        )
+
+        # Check result status
+        if result["status"] == "error":
+            raise HTTPException(
+                status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+                detail=f"Failed to normalize sound: {result['error']}",
+            )
+
+        return {
+            "message": f"Sound normalization {result['status']}: {sound.filename}",
+            "status": result["status"],
+            "reason": result["reason"] or "",
+            "normalized_filename": result["normalized_filename"] or "",
+        }
+
+    except HTTPException:
+        # Re-raise HTTPExceptions without wrapping them
+        raise
+    except Exception as e:
+        raise HTTPException(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            detail=f"Failed to normalize sound: {e!s}",
+        ) from e
--- a/app/core/config.py
+++ b/app/core/config.py
@@ -47,5 +47,10 @@ class Settings(BaseSettings):
    GITHUB_CLIENT_ID: str = ""
    GITHUB_CLIENT_SECRET: str = ""

+    # Audio Normalization Configuration
+    NORMALIZED_AUDIO_FORMAT: str = "mp3"
+    NORMALIZED_AUDIO_BITRATE: str = "256k"
+    NORMALIZED_AUDIO_PASSES: int = 2  # 1 for one-pass, 2 for two-pass
+

 settings = Settings()
--- a/app/repositories/sound.py
+++ b/app/repositories/sound.py
@@ -126,3 +126,26 @@ class SoundRepository:
        except Exception:
            logger.exception("Failed to get popular sounds")
            raise
+
+    async def get_unnormalized_sounds(self) -> list[Sound]:
+        """Get all sounds that haven't been normalized yet."""
+        try:
+            statement = select(Sound).where(Sound.is_normalized == False)  # noqa: E712
+            result = await self.session.exec(statement)
+            return list(result.all())
+        except Exception:
+            logger.exception("Failed to get unnormalized sounds")
+            raise
+
+    async def get_unnormalized_sounds_by_type(self, sound_type: str) -> list[Sound]:
+        """Get unnormalized sounds by type."""
+        try:
+            statement = select(Sound).where(
+                Sound.type == sound_type,
+                Sound.is_normalized == False,  # noqa: E712
+            )
+            result = await self.session.exec(statement)
+            return list(result.all())
+        except Exception:
+            logger.exception("Failed to get unnormalized sounds by type: %s", sound_type)
+            raise
--- a/app/services/sound_normalizer.py
+++ b/app/services/sound_normalizer.py
@@ -0,0 +1,567 @@
+"""Sound normalizer service for normalizing audio files using ffmpeg loudnorm."""
+
+import hashlib
+import json
+import os
+import re
+from pathlib import Path
+from typing import TypedDict
+
+import ffmpeg  # type: ignore[import-untyped]
+from sqlmodel.ext.asyncio.session import AsyncSession
+
+from app.core.config import settings
+from app.core.logging import get_logger
+from app.models.sound import Sound
+from app.repositories.sound import SoundRepository
+
+logger = get_logger(__name__)
+
+
+class NormalizationInfo(TypedDict):
+    """Type definition for normalization information in results."""
+
+    filename: str
+    status: str
+    reason: str | None
+    original_path: str | None
+    normalized_path: str | None
+    normalized_filename: str | None
+    normalized_duration: int | None
+    normalized_size: int | None
+    normalized_hash: str | None
+    id: int | None
+    error: str | None
+
+
+class NormalizationResults(TypedDict):
+    """Type definition for normalization results."""
+
+    processed: int
+    normalized: int
+    skipped: int
+    errors: int
+    files: list[NormalizationInfo]
+
+
+class SoundNormalizerService:
+    """Service for normalizing audio files using ffmpeg loudnorm."""
+
+    def __init__(self, session: AsyncSession) -> None:
+        """Initialize the sound normalizer service."""
+        self.session = session
+        self.sound_repo = SoundRepository(session)
+
+        # Normalization settings from config
+        self.output_format = settings.NORMALIZED_AUDIO_FORMAT
+        self.output_bitrate = settings.NORMALIZED_AUDIO_BITRATE
+        self.passes = settings.NORMALIZED_AUDIO_PASSES
+
+        # Directory mappings for different sound types
+        self.type_directories = {
+            "SDB": "sounds/normalized/soundboard",
+            "TTS": "sounds/normalized/text_to_speech",
+            "EXT": "sounds/normalized/extracted",
+        }
+
+        # Ensure normalized directories exist
+        self._ensure_directories()
+
+    def _ensure_directories(self) -> None:
+        """Ensure all normalized sound directories exist."""
+        for directory in self.type_directories.values():
+            Path(directory).mkdir(parents=True, exist_ok=True)
+            logger.debug("Ensured directory exists: %s", directory)
+
+    def _get_normalized_path(self, sound: Sound) -> Path:
+        """Get the normalized file path for a sound."""
+        return self._get_normalized_path_from_data(sound.type, sound.filename)
+
+    def _get_normalized_path_from_data(self, sound_type: str, filename: str) -> Path:
+        """Get the normalized file path from sound data."""
+        # Get the appropriate directory for the sound type
+        directory = self.type_directories.get(sound_type, "sounds/normalized/other")
+
+        # Create the directory if it doesn't exist
+        Path(directory).mkdir(parents=True, exist_ok=True)
+
+        # Generate filename: original_name.{format}
+        original_stem = Path(filename).stem
+        normalized_filename = f"{original_stem}.{self.output_format}"
+
+        return Path(directory) / normalized_filename
+
+    def _get_original_path(self, sound: Sound) -> Path:
+        """Get the original file path for a sound."""
+        return self._get_original_path_from_data(sound.type, sound.filename)
+
+    def _get_original_path_from_data(self, sound_type: str, filename: str) -> Path:
+        """Get the original file path from sound data."""
+        # Map sound types to their original directories
+        type_to_original_dir = {
+            "SDB": "sounds/originals/soundboard",
+            "TTS": "sounds/originals/text_to_speech",
+            "EXT": "sounds/originals/extracted",
+        }
+
+        original_dir = type_to_original_dir.get(sound_type, "sounds/originals/other")
+        return Path(original_dir) / filename
+
+    def _get_file_hash(self, file_path: Path) -> str:
+        """Calculate SHA-256 hash of a file."""
+        hash_sha256 = hashlib.sha256()
+        with open(file_path, "rb") as f:
+            for chunk in iter(lambda: f.read(4096), b""):
+                hash_sha256.update(chunk)
+        return hash_sha256.hexdigest()
+
+    def _get_file_size(self, file_path: Path) -> int:
+        """Get file size in bytes."""
+        return file_path.stat().st_size
+
+    def _get_audio_duration(self, file_path: Path) -> int:
+        """Get audio duration in milliseconds using ffmpeg."""
+        try:
+            probe = ffmpeg.probe(str(file_path))
+            duration = float(probe["format"]["duration"])
+            return int(duration * 1000)  # Convert to milliseconds
+        except Exception as e:
+            logger.warning("Failed to get duration for %s: %s", file_path, e)
+            return 0
+
+    async def _normalize_audio_one_pass(
+        self,
+        input_path: Path,
+        output_path: Path,
+    ) -> None:
+        """Normalize audio using one-pass loudnorm."""
+        try:
+            logger.info(
+                "Starting one-pass normalization: %s -> %s",
+                input_path,
+                output_path,
+            )
+
+            stream = ffmpeg.input(str(input_path))
+            stream = ffmpeg.filter(stream, "loudnorm", I=-23, TP=-2, LRA=7)
+
+            # Apply output format and bitrate
+            output_args = {}
+            if self.output_format == "mp3":
+                output_args["acodec"] = "libmp3lame"
+                output_args["audio_bitrate"] = self.output_bitrate
+            elif self.output_format == "aac":
+                output_args["acodec"] = "aac"
+                output_args["audio_bitrate"] = self.output_bitrate
+            elif self.output_format == "opus":
+                output_args["acodec"] = "libopus"
+                output_args["audio_bitrate"] = self.output_bitrate
+
+            stream = ffmpeg.output(stream, str(output_path), **output_args)
+            stream = ffmpeg.overwrite_output(stream)
+
+            ffmpeg.run(stream, quiet=True, overwrite_output=True)
+            logger.info("One-pass normalization completed: %s", output_path)
+
+        except Exception as e:
+            logger.exception("One-pass normalization failed for %s", input_path)
+            raise
+
+    async def _normalize_audio_two_pass(
+        self,
+        input_path: Path,
+        output_path: Path,
+    ) -> None:
+        """Normalize audio using two-pass loudnorm for better quality."""
+        try:
+            logger.info(
+                "Starting two-pass normalization: %s -> %s", input_path, output_path
+            )
+
+            # First pass: analyze
+            logger.debug("First pass: analyzing %s", input_path)
+
+            stream = ffmpeg.input(str(input_path))
+            stream = ffmpeg.filter(
+                stream,
+                "loudnorm",
+                I=-23,
+                TP=-2,
+                LRA=7,
+                print_format="json",
+            )
+            # Output to null device with explicit format
+            null_output = "/dev/null" if os.name != "nt" else "NUL"
+            stream = ffmpeg.output(stream, null_output, format="null")
+
+            # Run first pass and capture output
+            try:
+                result = ffmpeg.run(stream, capture_stderr=True, quiet=True)
+                analysis_output = result[1].decode("utf-8")
+            except ffmpeg.Error as e:
+                logger.error("FFmpeg first pass failed for %s. Stdout: %s, Stderr: %s", 
+                           input_path, e.stdout.decode() if e.stdout else "None", 
+                           e.stderr.decode() if e.stderr else "None")
+                raise
+
+            # Extract loudnorm measurements from the output
+            # The JSON output is at the end of stderr
+            logger.debug("Loudnorm analysis output: %s", analysis_output)
+
+            # Find JSON in the output
+            json_match = re.search(r'\{[^{}]*"input_i"[^{}]*\}', analysis_output)
+            if not json_match:
+                logger.error("Could not find JSON in loudnorm output: %s", analysis_output)
+                raise ValueError("Could not extract loudnorm analysis data")
+
+            logger.debug("Found JSON match: %s", json_match.group())
+            analysis_data = json.loads(json_match.group())
+
+            # Second pass: normalize with measured values
+            logger.debug("Second pass: normalizing %s with measured values", input_path)
+
+            stream = ffmpeg.input(str(input_path))
+            stream = ffmpeg.filter(
+                stream,
+                "loudnorm",
+                measured_I=analysis_data["input_i"],
+                measured_LRA=analysis_data["input_lra"],
+                measured_TP=analysis_data["input_tp"],
+                measured_thresh=analysis_data["input_thresh"],
+                offset=analysis_data["target_offset"],
+            )
+
+            # Apply output format and bitrate
+            output_args = {}
+            if self.output_format == "mp3":
+                output_args["acodec"] = "libmp3lame"
+                output_args["audio_bitrate"] = self.output_bitrate
+            elif self.output_format == "aac":
+                output_args["acodec"] = "aac"
+                output_args["audio_bitrate"] = self.output_bitrate
+            elif self.output_format == "opus":
+                output_args["acodec"] = "libopus"
+                output_args["audio_bitrate"] = self.output_bitrate
+
+            stream = ffmpeg.output(stream, str(output_path), **output_args)
+            stream = ffmpeg.overwrite_output(stream)
+
+            try:
+                ffmpeg.run(stream, quiet=True, overwrite_output=True)
+                logger.info("Two-pass normalization completed: %s", output_path)
+            except ffmpeg.Error as e:
+                logger.error("FFmpeg second pass failed for %s. Stdout: %s, Stderr: %s", 
+                           input_path, e.stdout.decode() if e.stdout else "None", 
+                           e.stderr.decode() if e.stderr else "None")
+                raise
+
+        except Exception as e:
+            logger.exception("Two-pass normalization failed for %s", input_path)
+            raise
+
+    async def normalize_sound(
+        self,
+        sound: Sound,
+        force: bool = False,
+        one_pass: bool | None = None,
+        sound_data: dict | None = None,
+    ) -> NormalizationInfo:
+        """Normalize a single sound."""
+        # Use provided sound_data to avoid detached instance issues, or capture from sound
+        if sound_data:
+            filename = sound_data["filename"]
+            sound_id = sound_data["id"]
+            is_normalized = sound_data["is_normalized"]
+            sound_type = sound_data["type"]
+        else:
+            # Fallback to accessing sound properties (for single sound normalization)
+            filename = sound.filename
+            sound_id = sound.id
+            is_normalized = sound.is_normalized
+            sound_type = sound.type
+
+        # Check if already normalized and not forcing
+        if is_normalized and not force:
+            return {
+                "filename": filename,
+                "status": "skipped",
+                "reason": "already normalized",
+                "original_path": None,
+                "normalized_path": None,
+                "normalized_filename": None,
+                "normalized_duration": None,
+                "normalized_size": None,
+                "normalized_hash": None,
+                "id": sound_id,
+                "error": None,
+            }
+
+        try:
+            # Get paths using captured data to avoid accessing sound properties
+            original_path = self._get_original_path_from_data(sound_type, filename)
+            normalized_path = self._get_normalized_path_from_data(sound_type, filename)
+
+            # Check if original file exists
+            if not original_path.exists():
+                error_msg = f"Original file not found: {original_path}"
+                logger.error(error_msg)
+                return {
+                    "filename": filename,
+                    "status": "error",
+                    "reason": None,
+                    "original_path": str(original_path),
+                    "normalized_path": None,
+                    "normalized_filename": None,
+                    "normalized_duration": None,
+                    "normalized_size": None,
+                    "normalized_hash": None,
+                    "id": sound_id,
+                    "error": error_msg,
+                }
+
+            # Determine which normalization method to use
+            use_one_pass = one_pass if one_pass is not None else (self.passes == 1)
+
+            # Perform normalization
+            if use_one_pass:
+                await self._normalize_audio_one_pass(original_path, normalized_path)
+            else:
+                await self._normalize_audio_two_pass(original_path, normalized_path)
+
+            # Get normalized file info
+            normalized_duration = self._get_audio_duration(normalized_path)
+            normalized_size = self._get_file_size(normalized_path)
+            normalized_hash = self._get_file_hash(normalized_path)
+            normalized_filename = normalized_path.name
+
+            # Update sound in database
+            update_data = {
+                "normalized_filename": normalized_filename,
+                "normalized_duration": normalized_duration,
+                "normalized_size": normalized_size,
+                "normalized_hash": normalized_hash,
+                "is_normalized": True,
+            }
+
+            await self.sound_repo.update(sound, update_data)
+            logger.info("Normalized sound: %s -> %s", filename, normalized_filename)
+
+            return {
+                "filename": filename,
+                "status": "normalized",
+                "reason": None,
+                "original_path": str(original_path),
+                "normalized_path": str(normalized_path),
+                "normalized_filename": normalized_filename,
+                "normalized_duration": normalized_duration,
+                "normalized_size": normalized_size,
+                "normalized_hash": normalized_hash,
+                "id": sound_id,
+                "error": None,
+            }
+
+        except Exception as e:
+            error_msg = str(e)
+            logger.exception(
+                "Failed to normalize sound %s",
+                filename,
+            )
+            return {
+                "filename": filename,
+                "status": "error",
+                "reason": None,
+                "original_path": (
+                    str(original_path) if "original_path" in locals() else None
+                ),
+                "normalized_path": (
+                    str(normalized_path) if "normalized_path" in locals() else None
+                ),
+                "normalized_filename": None,
+                "normalized_duration": None,
+                "normalized_size": None,
+                "normalized_hash": None,
+                "id": sound_id,
+                "error": error_msg,
+            }
+
+    async def normalize_all_sounds(
+        self,
+        force: bool = False,
+        one_pass: bool | None = None,
+    ) -> NormalizationResults:
+        """Normalize all unnormalized sounds."""
+        logger.info("Starting normalization of all sounds")
+
+        results: NormalizationResults = {
+            "processed": 0,
+            "normalized": 0,
+            "skipped": 0,
+            "errors": 0,
+            "files": [],
+        }
+
+        # Get sounds to normalize
+        if force:
+            # Get all sounds if forcing
+            sounds = []
+            for sound_type in self.type_directories.keys():
+                type_sounds = await self.sound_repo.get_by_type(sound_type)
+                sounds.extend(type_sounds)
+        else:
+            # Get only unnormalized sounds
+            sounds = await self.sound_repo.get_unnormalized_sounds()
+
+        logger.info("Found %d sounds to process", len(sounds))
+
+        # Capture all sound data upfront to avoid session detachment issues
+        sound_data_list = []
+        for sound in sounds:
+            sound_data_list.append(
+                {
+                    "id": sound.id,
+                    "filename": sound.filename,
+                    "type": sound.type,
+                    "is_normalized": sound.is_normalized,
+                    "name": sound.name,
+                }
+            )
+
+        # Process each sound using captured data
+        for i, sound in enumerate(sounds):
+            results["processed"] += 1
+
+            # Use captured data to avoid detached instance issues
+            sound_data = sound_data_list[i]
+            sound_id = sound_data["id"]
+            sound_filename = sound_data["filename"]
+
+            try:
+                normalization_info = await self.normalize_sound(
+                    sound,
+                    force=force,
+                    one_pass=one_pass,
+                    sound_data=sound_data,
+                )
+
+                results["files"].append(normalization_info)
+
+                if normalization_info["status"] == "normalized":
+                    results["normalized"] += 1
+                elif normalization_info["status"] == "skipped":
+                    results["skipped"] += 1
+                elif normalization_info["status"] == "error":
+                    results["errors"] += 1
+
+            except Exception as e:
+                logger.exception(
+                    "Unexpected error processing sound %s",
+                    sound_filename,
+                )
+                results["errors"] += 1
+                results["files"].append(
+                    {
+                        "filename": sound_filename,
+                        "status": "error",
+                        "reason": None,
+                        "original_path": None,
+                        "normalized_path": None,
+                        "normalized_filename": None,
+                        "normalized_duration": None,
+                        "normalized_size": None,
+                        "normalized_hash": None,
+                        "id": sound_id,
+                        "error": str(e),
+                    }
+                )
+
+        logger.info("Normalization completed: %s", results)
+        return results
+
+    async def normalize_sounds_by_type(
+        self,
+        sound_type: str,
+        force: bool = False,
+        one_pass: bool | None = None,
+    ) -> NormalizationResults:
+        """Normalize all sounds of a specific type."""
+        logger.info("Starting normalization of %s sounds", sound_type)
+
+        results: NormalizationResults = {
+            "processed": 0,
+            "normalized": 0,
+            "skipped": 0,
+            "errors": 0,
+            "files": [],
+        }
+
+        # Get sounds to normalize
+        if force:
+            sounds = await self.sound_repo.get_by_type(sound_type)
+        else:
+            sounds = await self.sound_repo.get_unnormalized_sounds_by_type(sound_type)
+
+        logger.info("Found %d %s sounds to process", len(sounds), sound_type)
+
+        # Capture all sound data upfront to avoid session detachment issues
+        sound_data_list = []
+        for sound in sounds:
+            sound_data_list.append(
+                {
+                    "id": sound.id,
+                    "filename": sound.filename,
+                    "type": sound.type,
+                    "is_normalized": sound.is_normalized,
+                    "name": sound.name,
+                }
+            )
+
+        # Process each sound using captured data
+        for i, sound in enumerate(sounds):
+            results["processed"] += 1
+
+            # Use captured data to avoid detached instance issues
+            sound_data = sound_data_list[i]
+            sound_id = sound_data["id"]
+            sound_filename = sound_data["filename"]
+
+            try:
+                normalization_info = await self.normalize_sound(
+                    sound,
+                    force=force,
+                    one_pass=one_pass,
+                    sound_data=sound_data,
+                )
+
+                results["files"].append(normalization_info)
+
+                if normalization_info["status"] == "normalized":
+                    results["normalized"] += 1
+                elif normalization_info["status"] == "skipped":
+                    results["skipped"] += 1
+                elif normalization_info["status"] == "error":
+                    results["errors"] += 1
+
+            except Exception as e:
+                logger.exception(
+                    "Unexpected error processing sound %s",
+                    sound_filename,
+                )
+                results["errors"] += 1
+                results["files"].append(
+                    {
+                        "filename": sound_filename,
+                        "status": "error",
+                        "reason": None,
+                        "original_path": None,
+                        "normalized_path": None,
+                        "normalized_filename": None,
+                        "normalized_duration": None,
+                        "normalized_size": None,
+                        "normalized_hash": None,
+                        "id": sound_id,
+                        "error": str(e),
+                    }
+                )
+
+        logger.info("Type normalization completed: %s", results)
+        return results
--- a/app/services/sound_scanner.py
+++ b/app/services/sound_scanner.py
@@ -16,6 +16,7 @@ logger = get_logger(__name__)

 class FileInfo(TypedDict):
    """Type definition for file information in scan results."""
+
    filename: str
    status: str
    reason: str | None
@@ -29,6 +30,7 @@ class FileInfo(TypedDict):

 class ScanResults(TypedDict):
    """Type definition for scan results."""
+
    scanned: int
    added: int
    updated: int
@@ -45,15 +47,23 @@ class SoundScannerService:
        """Initialize the sound scanner service."""
        self.session = session
        self.sound_repo = SoundRepository(session)
-        self.supported_extensions = {".mp3", ".wav", ".opus", ".flac", ".ogg", ".m4a", ".aac"}
+        self.supported_extensions = {
+            ".mp3",
+            ".wav",
+            ".opus",
+            ".flac",
+            ".ogg",
+            ".m4a",
+            ".aac",
+        }

    def get_file_hash(self, file_path: Path) -> str:
-        """Calculate MD5 hash of a file."""
-        hash_md5 = hashlib.md5()
+        """Calculate SHA-256 hash of a file."""
+        hash_sha256 = hashlib.sha256()
        with open(file_path, "rb") as f:
            for chunk in iter(lambda: f.read(4096), b""):
-                hash_md5.update(chunk)
-        return hash_md5.hexdigest()
+                hash_sha256.update(chunk)
+        return hash_sha256.hexdigest()

    def get_audio_duration(self, file_path: Path) -> int:
        """Get audio duration in milliseconds using ffmpeg."""
@@ -76,8 +86,7 @@ class SoundScannerService:
        # Replace underscores and hyphens with spaces
        name = name.replace("_", " ").replace("-", " ")
        # Capitalize words
-        name = " ".join(word.capitalize() for word in name.split())
-        return name
+        return " ".join(word.capitalize() for word in name.split())

    async def scan_directory(
        self,
@@ -113,7 +122,8 @@ class SoundScannerService:

        # Get all audio files from directory
        audio_files = [
-            f for f in scan_path.iterdir()
+            f
+            for f in scan_path.iterdir()
            if f.is_file() and f.suffix.lower() in self.supported_extensions
        ]

@@ -134,17 +144,19 @@ class SoundScannerService:
            except Exception as e:
                logger.exception("Error processing file %s", file_path)
                results["errors"] += 1
-                results["files"].append({
-                    "filename": filename,
-                    "status": "error",
-                    "reason": None,
-                    "name": None,
-                    "duration": None,
-                    "size": None,
-                    "id": None,
-                    "error": str(e),
-                    "changes": None,
-                })
+                results["files"].append(
+                    {
+                        "filename": filename,
+                        "status": "error",
+                        "reason": None,
+                        "name": None,
+                        "duration": None,
+                        "size": None,
+                        "id": None,
+                        "error": str(e),
+                        "changes": None,
+                    }
+                )

        # Delete sounds that no longer exist in directory
        for filename, sound in sounds_by_filename.items():
@@ -153,31 +165,35 @@ class SoundScannerService:
                    await self.sound_repo.delete(sound)
                    logger.info("Deleted sound no longer in directory: %s", filename)
                    results["deleted"] += 1
-                    results["files"].append({
-                        "filename": filename,
-                        "status": "deleted",
-                        "reason": "file no longer exists",
-                        "name": sound.name,
-                        "duration": sound.duration,
-                        "size": sound.size,
-                        "id": sound.id,
-                        "error": None,
-                        "changes": None,
-                    })
+                    results["files"].append(
+                        {
+                            "filename": filename,
+                            "status": "deleted",
+                            "reason": "file no longer exists",
+                            "name": sound.name,
+                            "duration": sound.duration,
+                            "size": sound.size,
+                            "id": sound.id,
+                            "error": None,
+                            "changes": None,
+                        }
+                    )
                except Exception as e:
                    logger.exception("Error deleting sound %s", filename)
                    results["errors"] += 1
-                    results["files"].append({
-                        "filename": filename,
-                        "status": "error",
-                        "reason": "failed to delete",
-                        "name": sound.name,
-                        "duration": sound.duration,
-                        "size": sound.size,
-                        "id": sound.id,
-                        "error": str(e),
-                        "changes": None,
-                    })
+                    results["files"].append(
+                        {
+                            "filename": filename,
+                            "status": "error",
+                            "reason": "failed to delete",
+                            "name": sound.name,
+                            "duration": sound.duration,
+                            "size": sound.size,
+                            "id": sound.id,
+                            "error": str(e),
+                            "changes": None,
+                        }
+                    )

        logger.info("Sync completed: %s", results)
        return results
@@ -215,17 +231,19 @@ class SoundScannerService:
            logger.info("Added new sound: %s (ID: %s)", sound.name, sound.id)

            results["added"] += 1
-            results["files"].append({
-                "filename": filename,
-                "status": "added",
-                "reason": None,
-                "name": name,
-                "duration": duration,
-                "size": size,
-                "id": sound.id,
-                "error": None,
-                "changes": None,
-            })
+            results["files"].append(
+                {
+                    "filename": filename,
+                    "status": "added",
+                    "reason": None,
+                    "name": name,
+                    "duration": duration,
+                    "size": size,
+                    "id": sound.id,
+                    "error": None,
+                    "changes": None,
+                }
+            )

        elif existing_sound.hash != file_hash:
            # Update existing sound (file was modified)
@@ -240,33 +258,37 @@ class SoundScannerService:
            logger.info("Updated modified sound: %s (ID: %s)", name, existing_sound.id)

            results["updated"] += 1
-            results["files"].append({
-                "filename": filename,
-                "status": "updated",
-                "reason": "file was modified",
-                "name": name,
-                "duration": duration,
-                "size": size,
-                "id": existing_sound.id,
-                "error": None,
-                "changes": ["hash", "duration", "size", "name"],
-            })
+            results["files"].append(
+                {
+                    "filename": filename,
+                    "status": "updated",
+                    "reason": "file was modified",
+                    "name": name,
+                    "duration": duration,
+                    "size": size,
+                    "id": existing_sound.id,
+                    "error": None,
+                    "changes": ["hash", "duration", "size", "name"],
+                }
+            )

        else:
            # File unchanged, skip
            logger.debug("Sound unchanged: %s", filename)
            results["skipped"] += 1
-            results["files"].append({
-                "filename": filename,
-                "status": "skipped",
-                "reason": "file unchanged",
-                "name": existing_sound.name,
-                "duration": existing_sound.duration,
-                "size": existing_sound.size,
-                "id": existing_sound.id,
-                "error": None,
-                "changes": None,
-            })
+            results["files"].append(
+                {
+                    "filename": filename,
+                    "status": "skipped",
+                    "reason": "file unchanged",
+                    "name": existing_sound.name,
+                    "duration": existing_sound.duration,
+                    "size": existing_sound.size,
+                    "id": existing_sound.id,
+                    "error": None,
+                    "changes": None,
+                }
+            )

    async def scan_soundboard_directory(self) -> ScanResults:
        """Sync the default soundboard directory."""