# mcma-backend/app/domain/entities/metadata.py

"""Value objects for the metadata-enrichment pipeline (plan §6.2).

Pure data carriers between the enrichment service and its adapters (tag reader,
fingerprinter, AcoustID). No framework imports — these cross the domain boundary.
"""

from dataclasses import dataclass


@dataclass(frozen=True, slots=True)
class AudioTags:
    """Embedded tags read from the file itself (ID3 / Vorbis / MP4 …).

    Every field is optional — files are tagged inconsistently. The reader fills
    what it can and leaves the rest ``None`` for downstream identification.
    """

    title: str | None = None
    artist: str | None = None
    album: str | None = None
    album_artist: str | None = None
    genre: str | None = None
    year: int | None = None
    track_number: int | None = None
    duration_seconds: int | None = None
    bitrate: int | None = None


@dataclass(frozen=True, slots=True)
class Fingerprint:
    """Chromaprint fingerprint plus the decoded duration (both needed by AcoustID)."""

    fingerprint: str
    duration_seconds: int


@dataclass(frozen=True, slots=True)
class RecordingMatch:
    """A single AcoustID result, flattened to the fields enrichment cares about.

    ``acoustid`` is the stable AcoustID identifier (a UUID) — used as the
    dedup key persisted on ``track.acoustid_fingerprint`` (fits the 64-char
    column; the raw fingerprint does not). ``recording_mbid`` is the MusicBrainz
    recording id when present.
    """

    acoustid: str
    score: float
    recording_mbid: str | None = None
    title: str | None = None
    artist: str | None = None
    album: str | None = None
    year: int | None = None