revisions

This commit is contained in:
2025-01-14 11:10:13 -05:00
parent 3c23bc93f6
commit f3336b09ac
5 changed files with 58 additions and 37 deletions

View File

@@ -33,8 +33,6 @@ class TrackMatcher:
# Normalize input track
input_track = self._normalize_string(input_track)
print(f"input_track: {input_track}")
best_match = None
best_score = 0
@@ -64,7 +62,6 @@ class TrackMatcher:
"""
# Remove special characters and convert to lowercase
text = regex.sub(r'[^\w\s-]', '', text).lower()
print(f"Text: {text}")
# Normalize spaces
text = ' '.join(text.split())
return text
@@ -89,7 +86,7 @@ class DataUtils:
Data Utils
"""
def scrub_lyrics(self, lyrics: str) -> str:
# Regex chain
"""Regex Chain"""
lyrics = regex.sub(r'(\[.*?\])(\s){0,}(\:){0,1}', '', lyrics)
lyrics = regex.sub(r'(\d?)(Embed\b)', '', lyrics, flags=regex.IGNORECASE)
lyrics = regex.sub(r'\n{2}', '\n', lyrics) # Gaps between verses