522 lines
20 KiB
Python
522 lines
20 KiB
Python
from typing import Optional, Any
|
|
from uuid import uuid4
|
|
from urllib.parse import urlparse
|
|
import hashlib
|
|
import traceback
|
|
import logging
|
|
# Quiet the named loggers used by this module: only CRITICAL records pass,
# nothing is propagated to ancestor loggers, and any handler that is already
# attached is raised to CRITICAL as well.
for name in (__name__, "utils.sr_wrapper"):
    logger = logging.getLogger(name)
    logger.propagate = False
    logger.setLevel(logging.CRITICAL)
    for handler in logger.handlers:
        handler.setLevel(logging.CRITICAL)

# Last resort: raise the root logger to CRITICAL too.
# NOTE: this is a process-wide side effect of importing this module; calls
# made through the module-level ``logging.*`` helpers go to the root logger,
# so anything below CRITICAL is dropped.
logging.getLogger().setLevel(logging.CRITICAL)
|
|
import random
|
|
import asyncio
|
|
import os
|
|
import aiohttp
|
|
import time
|
|
from streamrip.client import TidalClient # type: ignore
|
|
from streamrip.config import Config as StreamripConfig # type: ignore
|
|
from dotenv import load_dotenv
|
|
from rapidfuzz import fuzz
|
|
|
|
|
|
|
|
load_dotenv()
|
|
|
|
|
|
class SRUtil:
|
|
"""
|
|
StreamRip API Utility Class
|
|
"""
|
|
|
|
def __init__(self) -> None:
    """Initialize the StreamRip utility from environment variables.

    Starts from ``StreamripConfig.defaults()``, fills the Tidal session
    fields from the ``tidal_*`` environment variables, creates the
    ``TidalClient`` and sets up the state used for metadata rate limiting,
    retries and album caching.
    """
    self.streamrip_config = StreamripConfig.defaults()

    # Tidal credentials / session settings (empty string when unset).
    self.streamrip_config.session.tidal.user_id = os.getenv("tidal_user_id", "")
    self.streamrip_config.session.tidal.access_token = os.getenv(
        "tidal_access_token", ""
    )
    self.streamrip_config.session.tidal.refresh_token = os.getenv(
        "tidal_refresh_token", ""
    )
    self.streamrip_config.session.tidal.token_expiry = os.getenv(
        "tidal_token_expiry", ""
    )
    self.streamrip_config.session.tidal.country_code = os.getenv(
        "tidal_country_code", ""
    )
    # ``or 2`` also covers a variable that is set but empty, which would
    # otherwise make int("") raise ValueError.
    self.streamrip_config.session.tidal.quality = int(
        os.getenv("tidal_default_quality") or 2
    )
    self.streamrip_config.session.conversion.enabled = False
    self.streamrip_config.session.downloads.folder = os.getenv(
        "tidal_download_folder", ""
    )
    self.streamrip_client = TidalClient(self.streamrip_config)

    # Metadata throttling state, consumed by rate_limited_request().
    self.MAX_CONCURRENT_METADATA_REQUESTS = 2
    self.METADATA_RATE_LIMIT = 1.25  # minimum seconds since the last request
    self.METADATA_SEMAPHORE = asyncio.Semaphore(self.MAX_CONCURRENT_METADATA_REQUESTS)
    self.LAST_METADATA_REQUEST = 0  # time.time() of the last request; 0 = never

    # Retry / cache state, consumed by get_metadata_by_track_id().
    self.MAX_METADATA_RETRIES = 5
    self.METADATA_ALBUM_CACHE: dict[str, dict] = {}
    self.RETRY_DELAY = 1.0  # seconds between retries
|
|
|
|
async def rate_limited_request(self, func, *args, **kwargs):
    """Await ``func(*args, **kwargs)`` under the metadata rate limit.

    At most ``MAX_CONCURRENT_METADATA_REQUESTS`` calls run at once (enforced
    by ``METADATA_SEMAPHORE``), and a call sleeps until at least
    ``METADATA_RATE_LIMIT`` seconds have passed since the previously
    recorded request.

    Args:
        func: Coroutine function to call.
        *args: Positional arguments forwarded to ``func``.
        **kwargs: Keyword arguments forwarded to ``func``.

    Returns:
        Whatever ``func`` returns. Exceptions from ``func`` propagate and
        leave the recorded timestamp unchanged.
    """
    async with self.METADATA_SEMAPHORE:
        elapsed = time.time() - self.LAST_METADATA_REQUEST
        if elapsed < self.METADATA_RATE_LIMIT:
            await asyncio.sleep(self.METADATA_RATE_LIMIT - elapsed)
        result = await func(*args, **kwargs)
        # Record the timestamp under the attribute the check above reads.
        # It used to be stored only as ``last_request_time``, so
        # LAST_METADATA_REQUEST stayed 0 and the limit was never applied.
        self.LAST_METADATA_REQUEST = time.time()
        # Kept in sync for any code that still reads the old attribute name.
        self.last_request_time = self.LAST_METADATA_REQUEST
        return result
|
|
|
|
def is_fuzzy_match(self, expected, actual, threshold=80):
    """Return True when two strings are similar enough.

    Both values are lower-cased and compared with
    ``fuzz.token_set_ratio``; the result is True when the score is at
    least ``threshold``. A missing/empty value on either side is never a
    match.
    """
    if expected and actual:
        score = fuzz.token_set_ratio(expected.lower(), actual.lower())
        return score >= threshold
    return False
|
|
|
|
def is_metadata_match(self, expected_artist, expected_album, expected_title, found_artist, found_album, found_title, threshold=80):
    """Return True when artist, album and title all fuzzy-match.

    Each pair is checked with ``is_fuzzy_match`` using the same
    ``threshold``. The album check is skipped (counts as a match) when no
    expected album is given.
    """
    checks = [
        self.is_fuzzy_match(expected_artist, found_artist, threshold),
        # An empty/None expected album means "don't care".
        self.is_fuzzy_match(expected_album, found_album, threshold)
        if expected_album
        else True,
        self.is_fuzzy_match(expected_title, found_title, threshold),
    ]
    return all(checks)
|
|
|
|
def dedupe_by_key(self, key: str, entries: list[dict]) -> list[dict]:
    """Drop entries whose ``key`` value duplicates an earlier one.

    Values are compared after stripping surrounding whitespace and
    lower-casing; the first entry for each normalized value wins and the
    input order is preserved.

    Entries where ``key`` is missing or not a string cannot be normalized;
    they are kept as-is instead of raising, so callers can filter them
    afterwards.

    Args:
        key: Dictionary key to dedupe on.
        entries: Dictionaries to dedupe.

    Returns:
        A new list with duplicates removed.
    """
    seen: set[str] = set()
    unique: list[dict] = []
    for entry in entries:
        value = entry.get(key)
        if not isinstance(value, str):
            unique.append(entry)
            continue
        norm = value.strip().lower()
        if norm not in seen:
            seen.add(norm)
            unique.append(entry)
    return unique
|
|
|
|
def format_duration(self, seconds):
    """Format a duration in seconds as ``"M:SS"``.

    Args:
        seconds: Duration in seconds. Fractional values are truncated to
            whole seconds so the result never contains decimals.

    Returns:
        The formatted string, or None when ``seconds`` is falsy
        (``None`` or ``0``). Minutes are not folded into hours, so one hour
        is rendered as ``"60:00"``.
    """
    if not seconds:
        return None
    minutes, secs = divmod(int(seconds), 60)
    return f"{minutes}:{secs:02}"
|
|
|
|
def _get_tidal_cover_url(self, uuid, size):
    """Generate a tidal cover url.

    :param uuid: VALID uuid string; its dashes become path separators
    :param size: edge length in pixels, one of 80, 160, 320, 640, 1280
    :raises AssertionError: if ``size`` is not one of the supported values
    """
    TIDAL_COVER_URL = "https://resources.tidal.com/images/{uuid}/{width}x{height}.jpg"
    possibles = (80, 160, 320, 640, 1280)
    if size not in possibles:
        # Raised explicitly (rather than via ``assert``) so the check still
        # runs under ``python -O``; the exception type is unchanged.
        raise AssertionError(f"size must be in {possibles}")
    return TIDAL_COVER_URL.format(
        uuid=uuid.replace("-", "/"),
        height=size,
        width=size,
    )
|
|
|
|
|
|
|
|
def combine_album_track_metadata(
|
|
self, album_json: dict | None, track_json: dict
|
|
) -> dict:
|
|
"""
|
|
Combine album-level and track-level metadata into a unified tag dictionary.
|
|
Track-level metadata overrides album-level where relevant.
|
|
"""
|
|
album_json = album_json or {}
|
|
|
|
# Album-level
|
|
combined = {
|
|
"album": album_json.get("title"),
|
|
"album_artist": album_json.get("artist", {}).get("name"),
|
|
"release_date": album_json.get("releaseDate"),
|
|
"album_type": album_json.get("type"),
|
|
"total_tracks": album_json.get("numberOfTracks"),
|
|
"upc": album_json.get("upc"),
|
|
"album_copyright": album_json.get("copyright"),
|
|
"album_cover_id": album_json.get("cover"),
|
|
"album_cover_url": f"https://resources.tidal.com/images/{album_json.get('cover')}/1280x1280.jpg"
|
|
if album_json.get("cover")
|
|
else None,
|
|
}
|
|
|
|
# Track-level (overrides or adds to album info)
|
|
combined.update(
|
|
{
|
|
"title": track_json.get("title"),
|
|
"artist": track_json.get("artist", {}).get("name"),
|
|
"artists": [a.get("name") for a in track_json.get("artists", [])],
|
|
"track_number": track_json.get("trackNumber"),
|
|
"disc_number": track_json.get("volumeNumber"),
|
|
"duration": track_json.get("duration"),
|
|
"isrc": track_json.get("isrc"),
|
|
"bpm": track_json.get("bpm"),
|
|
"explicit": track_json.get("explicit"),
|
|
"replaygain": track_json.get("replayGain"),
|
|
"peak": track_json.get("peak"),
|
|
"lyrics": track_json.get("lyrics"),
|
|
"track_copyright": track_json.get("copyright"),
|
|
"cover_id": track_json.get("album", {}).get("cover") or album_json.get("cover"),
|
|
"cover_url": (
|
|
f"https://resources.tidal.com/images/{track_json.get('album', {}).get('cover', album_json.get('cover'))}/1280x1280.jpg"
|
|
if (track_json.get("album", {}).get("cover") or album_json.get("cover"))
|
|
else None
|
|
),
|
|
}
|
|
)
|
|
|
|
return combined
|
|
|
|
|
|
def combine_album_with_all_tracks(
    self, album_json: dict[str, Any]
) -> list[dict[str, Any]]:
    """Build one combined metadata dict per track listed in an album JSON.

    Every entry under the album's ``"tracks"`` key is merged with the album
    itself via ``combine_album_track_metadata``; an album without that key
    yields an empty list.
    """
    merged: list[dict[str, Any]] = []
    for track in album_json.get("tracks", []):
        merged.append(self.combine_album_track_metadata(album_json, track))
    return merged
|
|
|
|
async def get_artists_by_name(self, artist_name: str) -> Optional[list]:
    """Search for artists by name.

    Up to four attempts are made. An ``AttributeError`` from the client is
    treated as "not logged in": the client logs in and the search is
    retried. An error whose message contains "400" or "429" is retried
    after a delay that doubles each time (starting at one second). Any
    other error gives up immediately.

    Args:
        artist_name: Search query.

    Returns:
        A list of ``{"artist": name, "id": id}`` dicts with duplicate names
        removed, or None when the search failed or found nothing.
    """
    max_retries = 4
    delay = 1.0
    search_results = None
    for attempt in range(max_retries):
        try:
            search_results = await self.streamrip_client.search(
                media_type="artist", query=artist_name
            )
            break
        except AttributeError:
            await self.streamrip_client.login()
            if attempt == max_retries - 1:
                return None
        except Exception as e:
            msg = str(e)
            if ("400" in msg or "429" in msg) and attempt < max_retries - 1:
                await asyncio.sleep(delay)
                delay *= 2
                continue
            return None
    else:
        return None

    # An empty result page means "no match"; indexing it would raise.
    if not search_results:
        return None
    items = search_results[0].get("items", [])
    if not items:
        return None
    artists_out = [
        {
            "artist": res["name"],
            "id": res["id"],
        }
        for res in items
        if "name" in res and "id" in res
    ]
    return self.dedupe_by_key("artist", artists_out)  # Remove duplicates
|
|
|
|
async def get_albums_by_artist_id(self, artist_id: int) -> Optional[list | dict]:
|
|
"""Get albums by artist ID. Retry login only on authentication failure. Rate limit and retry on 400/429."""
|
|
import asyncio
|
|
artist_id_str: str = str(artist_id)
|
|
albums_out: list[dict] = []
|
|
max_retries = 4
|
|
delay = 1.0
|
|
for attempt in range(max_retries):
|
|
try:
|
|
metadata = await self.streamrip_client.get_metadata(
|
|
item_id=artist_id_str, media_type="artist"
|
|
)
|
|
break
|
|
except AttributeError:
|
|
await self.streamrip_client.login()
|
|
if attempt == max_retries - 1:
|
|
return None
|
|
except Exception as e:
|
|
msg = str(e)
|
|
if ("400" in msg or "429" in msg) and attempt < max_retries - 1:
|
|
await asyncio.sleep(delay)
|
|
delay *= 2
|
|
continue
|
|
else:
|
|
return None
|
|
else:
|
|
return None
|
|
if not metadata:
|
|
return None
|
|
albums = self.dedupe_by_key("title", metadata.get("albums", []))
|
|
albums_out = [
|
|
{
|
|
"artist": ", ".join(artist["name"] for artist in album["artists"]),
|
|
"album": album["title"],
|
|
"id": album["id"],
|
|
"release_date": album.get("releaseDate", "Unknown"),
|
|
}
|
|
for album in albums
|
|
if "title" in album and "id" in album and "artists" in album
|
|
]
|
|
return albums_out
|
|
|
|
async def get_album_by_name(self, artist: str, album: str) -> Optional[dict]:
    """Find an album by artist name and album title using fuzzy matching.

    The artist search is run with the first 8 characters of ``artist`` and,
    if that yields no acceptable album, again with the first 12. In each
    round the best-scoring artist and then the best-scoring album of that
    artist are chosen with ``fuzz.token_set_ratio`` against the full
    names; both must score at least 85.

    Returns:
        The album dict as produced by ``get_albums_by_artist_id``, or None
        when neither round finds a match.
    """

    def pick_best(wanted, entries, field):
        """Return (entry, score) for the highest-scoring entry, or (None, 0)."""
        winner, winner_score = None, 0
        for entry in entries:
            ratio = fuzz.token_set_ratio(wanted, entry[field])
            if ratio > winner_score:
                # The running best is kept as a truncated int.
                winner, winner_score = entry, int(ratio)
        return winner, winner_score

    for prefix_len in (8, 12):
        candidates = await self.get_artists_by_name(artist[:prefix_len])
        if not candidates:
            continue

        top_artist, artist_score = pick_best(artist, candidates, "artist")
        if not top_artist or artist_score < 85:
            continue

        discography = await self.get_albums_by_artist_id(top_artist["id"])
        if not discography:
            continue

        top_album, album_score = pick_best(album, discography, "album")
        if top_album and album_score >= 85:
            return top_album

    return None
|
|
|
|
async def get_cover_by_album_id(self, album_id: int, size: int = 640) -> Optional[str]:
    """Return the cover image URL for an album.

    The album metadata is requested at most twice; an ``AttributeError``
    from the client triggers a login before the second try (and before
    giving up). Other exceptions propagate to the caller.

    Args:
        album_id: Album ID; sent to the client as a string.
        size: Edge length in pixels; must be 80, 160, 320, 640 or 1280.

    Returns:
        The URL built by ``_get_tidal_cover_url``, or None when ``size`` is
        unsupported, both tries failed, or the album has no cover.
    """
    if size not in (80, 160, 320, 640, 1280):
        return None

    album_key: str = str(album_id)
    tries_left = 2
    while True:
        tries_left -= 1
        try:
            album_meta = await self.streamrip_client.get_metadata(
                item_id=album_key, media_type="album"
            )
        except AttributeError:
            await self.streamrip_client.login()
            if tries_left == 0:
                return None
        else:
            break

    cover_id = album_meta.get("cover") if album_meta else None
    if not cover_id:
        return None
    return self._get_tidal_cover_url(cover_id, size)
|
|
|
|
|
|
async def get_tracks_by_album_id(
|
|
self, album_id: int, quality: str = "FLAC"
|
|
) -> Optional[list | dict]:
|
|
"""Get tracks by album ID
|
|
Args:
|
|
album_id (int): The ID of the album.
|
|
Returns:
|
|
Optional[list[dict]]: List of tracks or None if not found.
|
|
"""
|
|
album_id_str = str(album_id)
|
|
await self.streamrip_client.login()
|
|
metadata = await self.streamrip_client.get_metadata(
|
|
item_id=album_id_str, media_type="album"
|
|
)
|
|
if not metadata:
|
|
logging.warning("No metadata found for album ID: %s", album_id)
|
|
return None
|
|
|
|
track_list = metadata.get("tracks", [])
|
|
tracks_out: list[dict] = [
|
|
{
|
|
"id": track.get("id"),
|
|
"artist": track.get("artist").get("name"),
|
|
"title": track.get("title"),
|
|
"duration": self.format_duration(track.get("duration", 0)),
|
|
"version": track.get("version"),
|
|
"audioQuality": track.get("audioQuality"),
|
|
}
|
|
for track in track_list
|
|
]
|
|
return tracks_out
|
|
|
|
async def get_tracks_by_artist_song(self, artist: str, song: str, n: int = 0) -> Optional[list]:
    """Search for tracks by artist and song name

    The query sent to the client is ``"<artist> - <song>"``. A failed search
    is retried until the attempt counter (starting at ``n``) reaches 3.

    Args:
        artist (str): The name of the artist.
        song (str): The name of the song.
        n (int): Attempt counter to start from; callers normally leave it
            at 0, which allows up to four attempts.
    Returns:
        Optional[list]: The ``items`` of the first search result page, or an
        empty list when the search returned nothing or every attempt failed.
    TODO: Reimplement using StreamRip
    """
    attempt = n
    while True:
        if not self.streamrip_client.logged_in:
            await self.streamrip_client.login()
        try:
            search_res = await self.streamrip_client.search(
                media_type="track",
                query=f"{artist} - {song}",
            )
            logging.critical("Result: %s", search_res)
            if not search_res:
                # Nothing found is a final answer, not an error to retry.
                return []
            # Returned directly: the previous ``finally: return []``
            # replaced this value (and every other one) with an empty list.
            return search_res[0].get("items")
        except Exception as e:
            traceback.print_exc()
            logging.critical("Search Exception: %s", str(e))
            if attempt >= 3:
                return []
            attempt += 1
|
|
# return []
|
|
|
|
async def get_stream_url_by_track_id(
    self, track_id: int, quality: str = "FLAC"
) -> Optional[str]:
    """Get stream URL by track ID

    Args:
        track_id (int): The ID of the track.
        quality (str): ``"FLAC"`` (default, sent to the client as quality 2)
            or ``"Lossy"`` (quality 1). Any other value is rejected.
    Returns:
        Optional[str]: The stream URL, or None if the quality is invalid or
        no downloadable / URL was returned.
    """
    if quality not in ("FLAC", "Lossy"):
        logging.error("Invalid quality requested: %s", quality)
        return None
    # Both accepted values map to a fixed level, so the configured default
    # quality is not consulted here.
    quality_int: int = {"FLAC": 2, "Lossy": 1}[quality]
    track_id_str: str = str(track_id)

    await self.streamrip_client.login()

    try:
        logging.critical("Using quality_int: %s", quality_int)
        track = await self.streamrip_client.get_downloadable(
            track_id=track_id_str, quality=quality_int
        )
    except AttributeError:
        # Treated as "session not ready": log in again and retry once.
        await self.streamrip_client.login()
        track = await self.streamrip_client.get_downloadable(
            track_id=track_id_str, quality=quality_int
        )
    if not track:
        logging.warning("No track found for ID: %s", track_id)
        return None
    stream_url = track.url
    if not stream_url:
        logging.warning("No stream URL found for track ID: %s", track_id)
        return None
    return stream_url
|
|
|
|
async def get_metadata_by_track_id(self, track_id: int) -> Optional[dict]:
    """
    Fetch a track's metadata merged with its album's metadata.

    Each attempt logs in, requests the track through
    ``rate_limited_request`` and then the album (served from
    ``METADATA_ALBUM_CACHE`` when already present, stored there after a
    successful fetch). Any exception triggers a retry after an
    exponentially growing delay with random jitter, up to
    ``MAX_METADATA_RETRIES`` attempts.

    Returns the dict produced by ``combine_album_track_metadata``, or None
    when the track has no album ID, the album lookup returns nothing, or
    all attempts fail.
    """
    attempt_limit = self.MAX_METADATA_RETRIES
    attempt = 0
    while attempt < attempt_limit:
        attempt += 1
        try:
            await self.streamrip_client.login()

            track_meta = await self.rate_limited_request(
                self.streamrip_client.get_metadata, str(track_id), "track"
            )

            album_id = track_meta.get("album", {}).get("id")
            if not album_id:
                # Without an album there is nothing to combine with.
                return None

            if album_id in self.METADATA_ALBUM_CACHE:
                album_meta = self.METADATA_ALBUM_CACHE[album_id]
            else:
                album_meta = await self.rate_limited_request(
                    self.streamrip_client.get_metadata, album_id, "album"
                )
                if album_meta:
                    self.METADATA_ALBUM_CACHE[album_id] = album_meta

            if not album_meta:
                return None

            merged: dict = self.combine_album_track_metadata(album_meta, track_meta)
            logging.info(
                "Combined metadata for track ID %s (attempt %d): %s",
                track_id,
                attempt,
                merged,
            )
            return merged

        except Exception as e:
            # Exponential backoff with jitter for 429 or other errors
            delay = self.RETRY_DELAY * (2 ** (attempt - 1)) + random.uniform(0, 0.5)
            logging.warning(
                "Metadata fetch failed for track %s (attempt %d/%d): %s. Retrying in %.2fs",
                track_id,
                attempt,
                self.MAX_METADATA_RETRIES,
                str(e),
                delay,
            )
            if attempt >= self.MAX_METADATA_RETRIES:
                logging.error(
                    "Metadata fetch failed permanently for track %s after %d attempts",
                    track_id,
                    self.MAX_METADATA_RETRIES,
                )
                return None
            await asyncio.sleep(delay)
    return None
|
|
|
|
|
|
async def download(self, track_id: int, quality: str = "LOSSLESS") -> bool | str:
|
|
"""Download track
|
|
Args:
|
|
track_id (int)
|
|
quality (str): The quality of the stream, default is "LOSSLESS". Other options: HIGH, LOW
|
|
Returns:
|
|
bool
|
|
"""
|
|
try:
|
|
await self.streamrip_client.login()
|
|
track_url = await self.get_stream_url_by_track_id(track_id)
|
|
if not track_url:
|
|
return False
|
|
parsed_url = urlparse(track_url)
|
|
parsed_url_filename = os.path.basename(parsed_url.path)
|
|
parsed_url_ext = os.path.splitext(parsed_url_filename)[1]
|
|
unique = hashlib.sha256(uuid4().bytes).hexdigest()[:16]
|
|
dl_folder_path = (
|
|
f"{self.streamrip_config.session.downloads.folder}/{unique}"
|
|
)
|
|
dl_path = f"{dl_folder_path}/{track_id}.{parsed_url_ext}"
|
|
async with aiohttp.ClientSession() as session:
|
|
async with session.get(
|
|
track_url, headers={}, timeout=aiohttp.ClientTimeout(total=60)
|
|
) as resp:
|
|
resp.raise_for_status()
|
|
with open(dl_path, "wb") as f:
|
|
async for chunk in resp.content.iter_chunked(1024 * 64):
|
|
f.write(chunk)
|
|
return dl_path
|
|
except Exception as e:
|
|
logging.critical("Error: %s", str(e))
|
|
return False
|