98 lines
4.7 KiB
Python
Raw Normal View History

2025-01-12 20:19:48 -05:00
#!/usr/bin/env python3.12
2025-01-14 11:10:13 -05:00
# pylint: disable=wrong-import-order, wrong-import-position, bare-except, broad-exception-caught
2025-01-12 20:19:48 -05:00
2025-01-13 20:47:39 -05:00
import os
2025-01-14 11:10:13 -05:00
import logging
2025-01-13 20:47:39 -05:00
import sys
2025-01-14 11:10:13 -05:00
import traceback
2025-01-13 20:47:39 -05:00
sys.path.insert(1,'..')
2025-01-14 07:45:34 -05:00
sys.path.insert(1,'.')
2025-01-13 20:47:39 -05:00
from typing import Optional
2025-01-14 07:45:34 -05:00
import aiosqlite as sqlite3
2025-01-13 20:47:39 -05:00
from lyric_search_new import utils
from lyric_search_new.constructors import LyricsResult
2025-01-14 11:10:13 -05:00
# Root logger (getLogger() is called without a name).
logger = logging.getLogger()
# Name of the root logger's level (e.g. "DEBUG"), sampled once when this module
# is imported; it is not refreshed if the level is changed afterwards.
log_level = logging.getLevelName(logger.level)
2025-01-12 20:19:48 -05:00
class Cache:
    """Cache Search Module

    Looks lyrics up in a local SQLite database of cached results, using the
    editdist3() SQL function for fuzzy artist/song matching.
    """

    def __init__(self):
        # Path of the SQLite database holding the cached lyrics.
        self.cache_db: str = os.path.join("/", "var",
                                          "lib", "singerdbs",
                                          "cached_lyrics.db")
        # Pragmas run on every new connection before the search query.
        self.cache_pre_query: str = "pragma journal_mode = WAL; pragma synchronous = normal; pragma temp_store = memory; pragma mmap_size = 30000000000;"
        # Loadable SQLite extensions; presumably spellfix1 is what provides
        # editdist3() used by search() -- TODO confirm.
        self.sqlite_exts: list[str] = ['/usr/local/lib/python3.11/dist-packages/spellfix1.cpython-311-x86_64-linux-gnu.so']
        # Source name used in log messages.
        self.label: str = "Cache"

    def get_matched(self, sqlite_rows: list[sqlite3.Row], matched_candidate: tuple,
                    confidence: float) -> Optional[LyricsResult]:
        """
        Get Matched Result
        @sqlite_rows: rows shaped (id, artist, song, lyrics, src, confidence)
        @matched_candidate: tuple whose first element is the id of the chosen row
        @confidence: confidence to report (the confidence stored in the row is ignored)
        Returns:
            - LyricsResult built from the row with the matching id, **None** if no row has that id
        """
        matched_id: int = matched_candidate[0]
        for row in sqlite_rows:
            if row[0] == matched_id:
                (_id, artist, song, lyrics, original_src, _confidence) = row
                return LyricsResult(
                    artist=artist,
                    song=song,
                    lyrics=lyrics,
                    src=f"{original_src} (cached, id: {_id})",
                    confidence=confidence)
        return None

    async def search(self, artist: str, song: str) -> Optional[LyricsResult]:
        """
        @artist: the artist to search
        @song: the song to search
        Passing "!" for both artist and song returns one random cached entry.
        Returns:
            - LyricsResult corresponding to nearest match found (if found), **None** otherwise
        Any ordinary error (database, extension loading, matching) is swallowed and
        reported as **None**; task cancellation and interpreter-exit signals propagate.
        """
        try:
            artist = artist.strip().lower()
            song = song.strip().lower()
            random_search: bool = artist == "!" and song == "!"
            if random_search:
                search_query: str = 'SELECT id, artist, song, lyrics, src, confidence FROM lyrics ORDER BY RANDOM() LIMIT 1'
                search_params: Optional[tuple] = None
            else:
                # Keep the 10 closest rows whose editdist3 cost is at most 410.
                # SQL string literals are single-quoted so the query does not
                # depend on SQLite's legacy double-quoted-string fallback.
                search_query = (
                    "SELECT id, artist, song, lyrics, src, confidence FROM lyrics "
                    "WHERE editdist3((artist || ' ' || song), (? || ' ' || ?)) <= 410 "
                    "ORDER BY editdist3((artist || ' ' || song), ?) ASC LIMIT 10"
                )
                search_params = (artist, song, f"{artist} {song}")

            logging.info("Searching %s - %s on %s",
                         artist, song, self.label)
            async with sqlite3.connect(self.cache_db, timeout=2) as db_conn:
                await db_conn.enable_load_extension(True)
                for ext in self.sqlite_exts:
                    await db_conn.load_extension(ext)
                async with await db_conn.executescript(self.cache_pre_query) as _db_cursor:
                    async with await _db_cursor.execute(search_query, search_params) as db_cursor:
                        results: list = await db_cursor.fetchall()

            # Nothing cached (or nothing close enough): no match, for both the
            # fuzzy and the random path.
            if not results:
                return None

            result_tracks: list = [
                (_id, f"{_artist} - {_song}")
                for (_id, _artist, _song, _lyrics, _src, _confidence) in results
            ]
            if random_search:
                # The single random row is the match, with full confidence.
                best_match: Optional[tuple] = (result_tracks[0], float(1))
            else:
                matcher = utils.TrackMatcher()
                best_match = matcher.find_best_match(input_track=f"{artist} - {song}",
                                                     candidate_tracks=result_tracks)
            if not best_match:
                return None
            (candidate, confidence) = best_match
            logging.info("Result found on %s", self.label)
            return self.get_matched(sqlite_rows=results,
                                    matched_candidate=candidate,
                                    confidence=confidence)
        except Exception:
            # Best-effort lookup: failures mean "no cached result". Only
            # Exception is caught so asyncio.CancelledError, KeyboardInterrupt
            # and SystemExit are not swallowed.
            if log_level == "DEBUG":
                traceback.print_exc()
            return None
2025-01-13 20:47:39 -05:00