progress -- change get to search for lrclib

This commit is contained in:
codey 2025-01-14 10:04:05 -05:00
parent 9d8d38081a
commit f86d5a4fec
6 changed files with 113 additions and 8 deletions

View File

@ -123,8 +123,14 @@ class LyricSearch(FastAPI):
aggregate_search = aggregate.Aggregate()
result = await aggregate_search.search(data.a, data.s)
if not result:
return {
'err': True,
'errorText': 'Sources exhausted, lyrics not located.',
}
result = result.dict()
result['lyrics'] = regex.sub(r'(\s/\s|\n)', '<br>', result['lyrics']).strip()
result['confidence'] = f'{float(result.get('confidence', 0)):.2f}'
return result

View File

@ -8,6 +8,7 @@ sys.path.insert(1,'..')
sys.path.insert(1,'..')
from . import cache
from . import genius
from . import lrclib
class Aggregate:
"""Aggregate all source methods"""
@ -20,12 +21,18 @@ class Aggregate:
async def search(self, artist: str, song: str) -> Optional[LyricsResult]:
cache_search = cache.Cache()
genius_search = genius.Genius()
lrclib_search = lrclib.LRCLib()
search = None
if "cache" not in self.exclude_methods:
# First, try cache
search = await cache_search.search(artist, song)
if not search:
print("Cache: NOT FOUND!")
# Then try LRCLib
if "lrclib" not in self.exclude_methods:
search = await lrclib_search.search(artist, song)
if not search:
print("LRCLib: Not found!")
# Then try Genius
if "genius" in self.exclude_methods:
return # Skipped last possible source, return None

View File

@ -48,7 +48,8 @@ class Cache:
for ext in self.sqlite_exts:
await db_conn.load_extension(ext)
async with await db_conn.executescript(self.cache_pre_query) as _db_cursor:
search_query = 'SELECT id, artist, song, lyrics, src, confidence FROM lyrics WHERE editdist3((artist || " " || song), (? || " " || ?))\
search_query = 'SELECT id, artist, song, lyrics, src, confidence FROM lyrics\
WHERE editdist3((artist || " " || song), (? || " " || ?))\
<= 410 ORDER BY editdist3((artist || " " || song), ?) ASC LIMIT 10'
search_params = (artist.strip(), song.strip(),
f"{artist.strip()} {song.strip()}")

View File

@ -0,0 +1,82 @@
#!/usr/bin/env python3.12
# pylint: disable=bare-except, broad-exception-caught, wrong-import-position
import sys
sys.path.insert(1,'..')
import traceback
from aiohttp import ClientTimeout, ClientSession
from lyric_search_new import utils
from lyric_search_new.constructors import LyricsResult
from . import common
class InvalidResponseException(Exception):
    """Raised when an LRCLib response body is too short or not the expected JSON."""
class LRCLib:
    """LRCLib Search Module

    Looks up plain-text lyrics for one artist/song pair through the LRCLib
    HTTP API and wraps a sufficiently confident hit in a LyricsResult.
    """

    def __init__(self):
        self.label = "LRCLib"
        self.lrclib_url = "https://lrclib.net/api/get"
        self.headers = common.SCRAPE_HEADERS
        self.timeout = ClientTimeout(connect=2, sock_read=4)
        self.datautils = utils.DataUtils()
        self.matcher = utils.TrackMatcher()

    @staticmethod
    def _extract_fields(search_data):
        """
        Validate a decoded LRCLib response and pull out the fields we use.
        @search_data: the decoded JSON body of the response
        Returns a tuple of (artistName, trackName, plainLyrics).
        Raises InvalidResponseException when the body is not a dict, or when
        any of the three fields is missing or is not a string.
        """
        if not isinstance(search_data, dict):
            raise InvalidResponseException("Invalid JSON.")
        # .get() rather than indexing: a missing key should produce the
        # descriptive InvalidResponseException below, not a bare KeyError.
        for key in ('artistName', 'trackName', 'plainLyrics'):
            if not isinstance(search_data.get(key), str):
                raise InvalidResponseException(
                    f"Invalid JSON: Cannot find {key} key.\n{search_data}")
        return (search_data['artistName'],
                search_data['trackName'],
                search_data['plainLyrics'])

    async def search(self, artist: str, song: str):
        """
        @artist: the artist to search
        @song: the song to search
        Returns a LyricsResult when LRCLib yields a track the matcher accepts,
        otherwise None (no suitable match, invalid response, or any error
        raised while requesting/processing, which is printed as a traceback).
        """
        try:
            artist = artist.strip().lower()
            song = song.strip().lower()
            async with ClientSession() as client:
                async with client.get(self.lrclib_url,
                                      params={
                                          'artist_name': artist,
                                          'track_name': song,
                                      },
                                      timeout=self.timeout,
                                      headers=self.headers) as request:
                    request.raise_for_status()
                    text = await request.text()
                    if len(text) < 100:
                        raise InvalidResponseException("Search response text was invalid (len < 100 chars.)")
                    search_data = await request.json()

            (returned_artist,
             returned_song,
             returned_lyrics) = self._extract_fields(search_data)
            returned_lyrics = self.datautils.scrub_lyrics(returned_lyrics)

            input_track = f"{artist} - {song}"
            # Score the track LRCLib actually returned (not the query against
            # itself); lowercased so it is compared on the same footing as the
            # lowercased input above.
            returned_track = f"{returned_artist} - {returned_song}".lower()
            # find_best_match returns None (not a tuple) when the best score
            # is below its threshold, so do not unpack the result directly.
            match = self.matcher.find_best_match(input_track=input_track,
                                                 candidate_tracks=[(0, returned_track)])
            confidence = match[1] if match else None
            if not confidence:
                print(f"I have no confidence! {confidence}, input_track: {input_track}; candidates: {[returned_track]}")
                return None  # No suitable match found
            print("Returning!")
            return LyricsResult(artist=returned_artist,
                                song=returned_song,
                                src=self.label,
                                lyrics=returned_lyrics,
                                confidence=confidence)
        except Exception:
            # Best-effort source: report the failure and let the caller fall
            # through to the next one. Exception (not a bare except) so task
            # cancellation and KeyboardInterrupt still propagate.
            traceback.print_exc()
            return None

View File

@ -4,7 +4,7 @@
import asyncio
import sys
sys.path.insert(1, '.')
import sources.cache, sources.genius, sources.aggregate
import sources.cache, sources.genius, sources.aggregate, sources.lrclib
test_artist = "hopsin"
test_song = "ill mind of hopsin 5"
@ -28,6 +28,14 @@ async def test_genius(artist=None, song=None):
result = await genius.search(artist, song)
print(result)
async def test_lrclib(artist=None, song=None):
    """Run a single LRCLib search and print whatever it returns.

    Uses the module-level test_artist/test_song pair unless both an artist
    and a song are supplied.
    """
    if not (artist and song):
        artist, song = test_artist, test_song
    print(await sources.lrclib.LRCLib().search(artist, song))
async def test_aggregate(artist=None, song=None):
if not artist or not song:
artist = test_artist
@ -40,5 +48,6 @@ async def test_aggregate(artist=None, song=None):
loop = asyncio.new_event_loop()
# loop.run_until_complete(test_genius())
loop.run_until_complete(test_cache(artist=test_artist, song=test_song))
loop.run_until_complete(test_lrclib())
# loop.run_until_complete(test_cache(artist=test_artist, song=test_song))
# loop.run_until_complete(test_aggregate())

View File

@ -55,7 +55,7 @@ class TrackMatcher:
best_match = candidate
# Return the match only if it meets the threshold
return (best_match, best_score) if best_score >= self.threshold else None
return (best_match, round(best_score, 2)) if best_score >= self.threshold else None
def _normalize_string(self, text: str) -> str:
"""