# api/utils/sr_wrapper.py

from typing import Optional, Any
from uuid import uuid4
from urllib.parse import urlparse
import hashlib
import traceback
import logging
import random
import asyncio
import os
import time

import aiohttp
from streamrip.client import TidalClient  # type: ignore
from streamrip.config import Config as StreamripConfig  # type: ignore
from dotenv import load_dotenv
from rapidfuzz import fuzz

# Suppress all logging output from this module and its children
for name in [__name__, "utils.sr_wrapper"]:
    logger = logging.getLogger(name)
    logger.setLevel(logging.CRITICAL)
    logger.propagate = False
    for handler in logger.handlers:
        handler.setLevel(logging.CRITICAL)
# Also set the root logger to CRITICAL as a last resort (may affect global logging)
logging.getLogger().setLevel(logging.CRITICAL)

load_dotenv()

class SRUtil:
"""
StreamRip API Utility Class
"""

    def __init__(self) -> None:
        """Initialize the StreamRip utility and its Tidal client."""
        self.streamrip_config = StreamripConfig.defaults()
        self.streamrip_config.session.tidal.user_id = os.getenv("tidal_user_id", "")
        self.streamrip_config.session.tidal.access_token = os.getenv(
            "tidal_access_token", ""
        )
        self.streamrip_config.session.tidal.refresh_token = os.getenv(
            "tidal_refresh_token", ""
        )
        self.streamrip_config.session.tidal.token_expiry = os.getenv(
            "tidal_token_expiry", ""
        )
        self.streamrip_config.session.tidal.country_code = os.getenv(
            "tidal_country_code", ""
        )
        self.streamrip_config.session.tidal.quality = int(
            os.getenv("tidal_default_quality", "2")
        )
        self.streamrip_config.session.conversion.enabled = False
        self.streamrip_config.session.downloads.folder = os.getenv(
            "tidal_download_folder", ""
        )
        self.streamrip_client = TidalClient(self.streamrip_config)

        self.MAX_CONCURRENT_METADATA_REQUESTS = 2
        self.METADATA_RATE_LIMIT = 1.25  # minimum seconds between metadata requests
        self.METADATA_SEMAPHORE = asyncio.Semaphore(
            self.MAX_CONCURRENT_METADATA_REQUESTS
        )
        self.LAST_METADATA_REQUEST = 0.0
        self.MAX_METADATA_RETRIES = 5
        self.METADATA_ALBUM_CACHE: dict[str, dict] = {}
        self.RETRY_DELAY = 1.0  # seconds between retries
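
    # A minimal sketch of the .env file this class expects (values below are
    # placeholders, not real credentials); each key is read in __init__ via
    # os.getenv:
    #
    #   tidal_user_id=12345678
    #   tidal_access_token=eyJhbGciOi...
    #   tidal_refresh_token=abcdef0123...
    #   tidal_token_expiry=1735689600
    #   tidal_country_code=US
    #   tidal_default_quality=2
    #   tidal_download_folder=/tmp/tidal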

    async def rate_limited_request(self, func, *args, **kwargs):
        """Run an async callable under the metadata semaphore, spacing requests
        out by METADATA_RATE_LIMIT seconds."""
        async with self.METADATA_SEMAPHORE:
            now = time.time()
            elapsed = now - self.LAST_METADATA_REQUEST
            if elapsed < self.METADATA_RATE_LIMIT:
                await asyncio.sleep(self.METADATA_RATE_LIMIT - elapsed)
            result = await func(*args, **kwargs)
            self.LAST_METADATA_REQUEST = time.time()
            return result

    def is_fuzzy_match(self, expected, actual, threshold=80):
        """Return True if the two strings fuzzy-match at or above threshold."""
        if not expected or not actual:
            return False
        return fuzz.token_set_ratio(expected.lower(), actual.lower()) >= threshold

    def is_metadata_match(
        self,
        expected_artist,
        expected_album,
        expected_title,
        found_artist,
        found_album,
        found_title,
        threshold=80,
    ):
        """Return True if artist, album (when given), and title all fuzzy-match."""
        artist_match = self.is_fuzzy_match(expected_artist, found_artist, threshold)
        album_match = (
            self.is_fuzzy_match(expected_album, found_album, threshold)
            if expected_album
            else True
        )
        title_match = self.is_fuzzy_match(expected_title, found_title, threshold)
        return artist_match and album_match and title_match
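
    # Hedged usage sketch: any streamrip client coroutine can be funneled
    # through rate_limited_request so that at most
    # MAX_CONCURRENT_METADATA_REQUESTS calls run concurrently, spaced by
    # METADATA_RATE_LIMIT seconds:
    #
    #   metadata = await self.rate_limited_request(
    #       self.streamrip_client.get_metadata, "12345", "track"
    #   )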

    def dedupe_by_key(self, key: str, entries: list[dict]) -> list[dict]:
        """Deduplicate dicts by a key, comparing values case-insensitively."""
        deduped = {}
        for entry in entries:
            norm = entry[key].strip().lower()
            if norm not in deduped:
                deduped[norm] = entry
        return list(deduped.values())

    def format_duration(self, seconds):
        """Format a duration in seconds as M:SS (e.g. 125 -> "2:05"), or None."""
        if not seconds:
            return None
        m, s = divmod(seconds, 60)
        return f"{m}:{s:02}"

    def _get_tidal_cover_url(self, uuid, size):
        """Generate a Tidal cover URL.

        :param uuid: valid cover UUID string
        :param size: image edge length in pixels; one of 80, 160, 320, 640, 1280
        """
        TIDAL_COVER_URL = (
            "https://resources.tidal.com/images/{uuid}/{width}x{height}.jpg"
        )
        possibles = (80, 160, 320, 640, 1280)
        assert size in possibles, f"size must be in {possibles}"
        return TIDAL_COVER_URL.format(
            uuid=uuid.replace("-", "/"),
            height=size,
            width=size,
        )
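
    # For example, a hypothetical cover UUID "aaaa-bbbb-cccc" at size 640
    # yields https://resources.tidal.com/images/aaaa/bbbb/cccc/640x640.jpg
    # (the dashes become path separators).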

    def combine_album_track_metadata(
        self, album_json: dict | None, track_json: dict
    ) -> dict:
        """
        Combine album-level and track-level metadata into a unified tag dictionary.
        Track-level metadata overrides album-level where relevant.
        """
        album_json = album_json or {}
        # Album-level
        combined = {
            "album": album_json.get("title"),
            "album_artist": album_json.get("artist", {}).get("name"),
            "release_date": album_json.get("releaseDate"),
            "album_type": album_json.get("type"),
            "total_tracks": album_json.get("numberOfTracks"),
            "upc": album_json.get("upc"),
            "album_copyright": album_json.get("copyright"),
            "album_cover_id": album_json.get("cover"),
            "album_cover_url": (
                f"https://resources.tidal.com/images/{album_json.get('cover')}/1280x1280.jpg"
                if album_json.get("cover")
                else None
            ),
        }
        # Track-level (overrides or adds to album info)
        combined.update(
            {
                "title": track_json.get("title"),
                "artist": track_json.get("artist", {}).get("name"),
                "artists": [a.get("name") for a in track_json.get("artists", [])],
                "track_number": track_json.get("trackNumber"),
                "disc_number": track_json.get("volumeNumber"),
                "duration": track_json.get("duration"),
                "isrc": track_json.get("isrc"),
                "bpm": track_json.get("bpm"),
                "explicit": track_json.get("explicit"),
                "replaygain": track_json.get("replayGain"),
                "peak": track_json.get("peak"),
                "lyrics": track_json.get("lyrics"),
                "track_copyright": track_json.get("copyright"),
                "cover_id": track_json.get("album", {}).get("cover")
                or album_json.get("cover"),
                "cover_url": (
                    f"https://resources.tidal.com/images/{track_json.get('album', {}).get('cover', album_json.get('cover'))}/1280x1280.jpg"
                    if (track_json.get("album", {}).get("cover") or album_json.get("cover"))
                    else None
                ),
            }
        )
        return combined
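
    # Sketch of the merge with hypothetical, minimal Tidal-shaped JSON:
    #
    #   album = {"title": "In Rainbows", "artist": {"name": "Radiohead"}}
    #   track = {"title": "Nude", "artist": {"name": "Radiohead"},
    #            "trackNumber": 3}
    #   combined = self.combine_album_track_metadata(album, track)
    #   # combined["album"] == "In Rainbows", combined["track_number"] == 3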
def combine_album_with_all_tracks(
self, album_json: dict[str, Any]
) -> list[dict[str, Any]]:
"""Return a list of combined metadata dicts for all tracks in an album JSON."""
return [
self.combine_album_track_metadata(album_json, t)
for t in album_json.get("tracks", [])
]

    async def get_artists_by_name(self, artist_name: str) -> Optional[list]:
        """Get artist(s) by name. Retry login only on authentication failure;
        rate limit and retry on 400/429 responses."""
        artists_out: list[dict] = []
        max_retries = 4
        delay = 1.0
        for attempt in range(max_retries):
            try:
                artists = await self.streamrip_client.search(
                    media_type="artist", query=artist_name
                )
                break
            except AttributeError:
                # Client was not logged in yet; authenticate and retry.
                await self.streamrip_client.login()
                if attempt == max_retries - 1:
                    return None
            except Exception as e:
                msg = str(e)
                if ("400" in msg or "429" in msg) and attempt < max_retries - 1:
                    await asyncio.sleep(delay)
                    delay *= 2  # exponential backoff
                    continue
                return None
        else:
            return None
        artists = artists[0].get("items", [])
        if not artists:
            return None
        artists_out = [
            {
                "artist": res["name"],
                "id": res["id"],
            }
            for res in artists
            if "name" in res and "id" in res
        ]
        artists_out = self.dedupe_by_key("artist", artists_out)  # Remove duplicates
        return artists_out

    async def get_albums_by_artist_id(self, artist_id: int) -> Optional[list | dict]:
        """Get albums by artist ID. Retry login only on authentication failure;
        rate limit and retry on 400/429 responses."""
        artist_id_str: str = str(artist_id)
        albums_out: list[dict] = []
        max_retries = 4
        delay = 1.0
        for attempt in range(max_retries):
            try:
                metadata = await self.streamrip_client.get_metadata(
                    item_id=artist_id_str, media_type="artist"
                )
                break
            except AttributeError:
                # Client was not logged in yet; authenticate and retry.
                await self.streamrip_client.login()
                if attempt == max_retries - 1:
                    return None
            except Exception as e:
                msg = str(e)
                if ("400" in msg or "429" in msg) and attempt < max_retries - 1:
                    await asyncio.sleep(delay)
                    delay *= 2  # exponential backoff
                    continue
                return None
        else:
            return None
        if not metadata:
            return None
        albums = self.dedupe_by_key("title", metadata.get("albums", []))
        albums_out = [
            {
                "artist": ", ".join(artist["name"] for artist in album["artists"]),
                "album": album["title"],
                "id": album["id"],
                "release_date": album.get("releaseDate", "Unknown"),
            }
            for album in albums
            if "title" in album and "id" in album and "artists" in album
        ]
        return albums_out

    async def get_album_by_name(self, artist: str, album: str) -> Optional[dict]:
        """Get album by artist and album name using the artist ID and fuzzy
        matching. Searches with the first 8 characters of the artist name,
        then the first 12 if no match is found. (The success notification
        lives in add_cover_art.py.)
        """
        for trunc in (8, 12):
            search_artist = artist[:trunc]
            artists = await self.get_artists_by_name(search_artist)
            if not artists:
                continue
            # Pick the artist whose name best fuzzy-matches the query.
            best_artist = None
            best_artist_score = 0
            for a in artists:
                score = fuzz.token_set_ratio(artist, a["artist"])
                if score > best_artist_score:
                    best_artist = a
                    best_artist_score = int(score)
            if not best_artist or best_artist_score < 85:
                continue
            artist_id = best_artist["id"]
            albums = await self.get_albums_by_artist_id(artist_id)
            if not albums:
                continue
            # Pick the album whose title best fuzzy-matches the query.
            best_album = None
            best_album_score = 0
            for alb in albums:
                score = fuzz.token_set_ratio(album, alb["album"])
                if score > best_album_score:
                    best_album = alb
                    best_album_score = int(score)
            if best_album and best_album_score >= 85:
                return best_album
        return None
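
    # Hedged usage sketch ("sr" is a hypothetical SRUtil instance): returns one
    # of the dicts built by get_albums_by_artist_id, or None when no fuzzy
    # match clears the 85 threshold:
    #
    #   best = await sr.get_album_by_name("Radiohead", "OK Computer")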

    async def get_cover_by_album_id(
        self, album_id: int, size: int = 640
    ) -> Optional[str]:
        """Get cover URL by album ID. Retry login only on authentication failure."""
        if size not in [80, 160, 320, 640, 1280]:
            return None
        album_id_str: str = str(album_id)
        for attempt in range(2):
            try:
                metadata = await self.streamrip_client.get_metadata(
                    item_id=album_id_str, media_type="album"
                )
                break
            except AttributeError:
                # Client was not logged in yet; authenticate and retry once.
                await self.streamrip_client.login()
                if attempt == 1:
                    return None
        else:
            return None
        if not metadata:
            return None
        cover_id = metadata.get("cover")
        if not cover_id:
            return None
        return self._get_tidal_cover_url(cover_id, size)

    async def get_tracks_by_album_id(
        self, album_id: int, quality: str = "FLAC"
    ) -> Optional[list | dict]:
        """Get tracks by album ID.
        Args:
            album_id (int): The ID of the album.
        Returns:
            Optional[list[dict]]: List of tracks, or None if not found.
        """
        album_id_str = str(album_id)
        await self.streamrip_client.login()
        metadata = await self.streamrip_client.get_metadata(
            item_id=album_id_str, media_type="album"
        )
        if not metadata:
            logging.warning("No metadata found for album ID: %s", album_id)
            return None
        track_list = metadata.get("tracks", [])
        tracks_out: list[dict] = [
            {
                "id": track.get("id"),
                "artist": track.get("artist", {}).get("name"),
                "title": track.get("title"),
                "duration": self.format_duration(track.get("duration", 0)),
                "version": track.get("version"),
                "audioQuality": track.get("audioQuality"),
            }
            for track in track_list
        ]
        return tracks_out

    async def get_tracks_by_artist_song(
        self, artist: str, song: str, n: int = 0
    ) -> Optional[list]:
        """Get tracks by artist and song name.
        Args:
            artist (str): The name of the artist.
            song (str): The name of the song.
        Returns:
            Optional[list]: The track results, or [] if the search fails.
        """
        if not self.streamrip_client.logged_in:
            await self.streamrip_client.login()
        try:
            search_res = await self.streamrip_client.search(
                media_type="track",
                query=f"{artist} - {song}",
            )
            logging.critical("Result: %s", search_res)
            return search_res[0].get("items", [])
        except Exception as e:
            traceback.print_exc()
            logging.critical("Search Exception: %s", str(e))
            # Retry up to 3 times before giving up.
            if n < 3:
                return await self.get_tracks_by_artist_song(artist, song, n + 1)
            return []

    async def get_stream_url_by_track_id(
        self, track_id: int, quality: str = "FLAC"
    ) -> Optional[str]:
        """Get stream URL by track ID.
        Args:
            track_id (int): The ID of the track.
            quality (str): The quality of the stream; "FLAC" (default) or "Lossy".
        Returns:
            Optional[str]: The stream URL, or None if not found.
        """
        if quality not in ["FLAC", "Lossy"]:
            logging.error("Invalid quality requested: %s", quality)
            return None
        quality_int: int = int(self.streamrip_config.session.tidal.quality)
        match quality:
            case "FLAC":
                quality_int = 2
            case "Lossy":
                quality_int = 1
        track_id_str: str = str(track_id)
        await self.streamrip_client.login()
        try:
            logging.critical("Using quality_int: %s", quality_int)
            track = await self.streamrip_client.get_downloadable(
                track_id=track_id_str, quality=quality_int
            )
        except AttributeError:
            # Client was not logged in yet; authenticate and retry once.
            await self.streamrip_client.login()
            track = await self.streamrip_client.get_downloadable(
                track_id=track_id_str, quality=quality_int
            )
        if not track:
            logging.warning("No track found for ID: %s", track_id)
            return None
        stream_url = track.url
        if not stream_url:
            logging.warning("No stream URL found for track ID: %s", track_id)
            return None
        return stream_url

    async def get_metadata_by_track_id(self, track_id: int) -> Optional[dict]:
        """
        Fetch track + album metadata with retries, caching album data.
        Returns the combined metadata dict, or None after exhausting retries.
        """
        for attempt in range(1, self.MAX_METADATA_RETRIES + 1):
            try:
                await self.streamrip_client.login()
                # Track metadata
                metadata = await self.rate_limited_request(
                    self.streamrip_client.get_metadata, str(track_id), "track"
                )
                album_id = metadata.get("album", {}).get("id")
                album_metadata = None
                if album_id:
                    # Check the cache before hitting the API again.
                    if album_id in self.METADATA_ALBUM_CACHE:
                        album_metadata = self.METADATA_ALBUM_CACHE[album_id]
                    else:
                        album_metadata = await self.rate_limited_request(
                            self.streamrip_client.get_metadata, album_id, "album"
                        )
                        if album_metadata:
                            self.METADATA_ALBUM_CACHE[album_id] = album_metadata
                if not album_metadata:
                    return None
                # Combine track + album metadata
                combined_metadata: dict = self.combine_album_track_metadata(
                    album_metadata, metadata
                )
                logging.info(
                    "Combined metadata for track ID %s (attempt %d): %s",
                    track_id,
                    attempt,
                    combined_metadata,
                )
                return combined_metadata
            except Exception as e:
                # Exponential backoff with jitter for 429s or other errors
                delay = self.RETRY_DELAY * (2 ** (attempt - 1)) + random.uniform(
                    0, 0.5
                )
                logging.warning(
                    "Metadata fetch failed for track %s (attempt %d/%d): %s. Retrying in %.2fs",
                    track_id,
                    attempt,
                    self.MAX_METADATA_RETRIES,
                    str(e),
                    delay,
                )
                if attempt < self.MAX_METADATA_RETRIES:
                    await asyncio.sleep(delay)
                else:
                    logging.error(
                        "Metadata fetch failed permanently for track %s after %d attempts",
                        track_id,
                        self.MAX_METADATA_RETRIES,
                    )
                    return None
        return None

    async def download(self, track_id: int, quality: str = "LOSSLESS") -> bool | str:
        """Download a track.
        Args:
            track_id (int): The ID of the track.
            quality (str): The quality of the stream, default "LOSSLESS".
        Returns:
            str: The download path on success.
            bool: False on failure.
        """
        try:
            await self.streamrip_client.login()
            track_url = await self.get_stream_url_by_track_id(track_id)
            if not track_url:
                return False
            parsed_url = urlparse(track_url)
            parsed_url_filename = os.path.basename(parsed_url.path)
            parsed_url_ext = os.path.splitext(parsed_url_filename)[1]  # keeps the dot
            unique = hashlib.sha256(uuid4().bytes).hexdigest()[:16]
            dl_folder_path = (
                f"{self.streamrip_config.session.downloads.folder}/{unique}"
            )
            os.makedirs(dl_folder_path, exist_ok=True)
            dl_path = f"{dl_folder_path}/{track_id}{parsed_url_ext}"
            async with aiohttp.ClientSession() as session:
                async with session.get(
                    track_url, headers={}, timeout=aiohttp.ClientTimeout(total=60)
                ) as resp:
                    resp.raise_for_status()
                    with open(dl_path, "wb") as f:
                        async for chunk in resp.content.iter_chunked(1024 * 64):
                            f.write(chunk)
            return dl_path
        except Exception as e:
            logging.critical("Error: %s", str(e))
            return False
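

# A minimal end-to-end sketch (assumes valid Tidal credentials in .env and
# network access); illustrative only, not part of the module's API:
if __name__ == "__main__":

    async def _demo() -> None:
        sr = SRUtil()
        artists = await sr.get_artists_by_name("Radiohead")
        print(artists)
        if artists:
            albums = await sr.get_albums_by_artist_id(artists[0]["id"])
            print(albums)

    asyncio.run(_demo())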