mirror of https://github.com/Nezreka/SoulSync.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
592 lines
24 KiB
592 lines
24 KiB
"""
|
|
Hydrabase P2P metadata client.
|
|
|
|
Sends search requests over a shared WebSocket connection and returns
|
|
results normalized to the same dataclass types used by SpotifyClient
|
|
and iTunesClient (Track, Artist, Album).
|
|
"""
|
|
|
|
import json
|
|
import logging
|
|
import re
|
|
import time
|
|
from typing import List, Optional, Callable, Tuple
|
|
|
|
from core.itunes_client import Track, Artist, Album
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
class HydrabaseClient:
|
|
"""
|
|
Synchronous metadata client that queries the Hydrabase P2P network.
|
|
|
|
Shares the WebSocket connection and lock with HydrabaseWorker.
|
|
All search methods block until a response is received (with timeout).
|
|
"""
|
|
|
|
def __init__(self, get_ws_and_lock: Callable[[], Tuple]):
|
|
"""
|
|
Args:
|
|
get_ws_and_lock: Callable returning (ws, lock) tuple.
|
|
Same callable used by HydrabaseWorker.
|
|
"""
|
|
self.get_ws_and_lock = get_ws_and_lock
|
|
self.timeout = 8 # seconds
|
|
self.last_peer_count = None
|
|
self.last_peer_count_time = None
|
|
|
|
def is_connected(self) -> bool:
|
|
ws, lock = self.get_ws_and_lock()
|
|
if ws is None:
|
|
return False
|
|
try:
|
|
return ws.connected
|
|
except Exception:
|
|
return False
|
|
|
|
def _extract_stats(self, data):
|
|
"""Extract peer stats from any message that contains them."""
|
|
if isinstance(data, dict) and 'stats' in data:
|
|
stats = data['stats']
|
|
if isinstance(stats, dict) and 'connectedPeers' in stats:
|
|
self.last_peer_count = stats['connectedPeers']
|
|
self.last_peer_count_time = time.time()
|
|
|
|
@staticmethod
|
|
def _extract_results(data) -> Optional[list]:
|
|
"""Extract results array from a response dict. Returns None if not a results message."""
|
|
if not isinstance(data, dict):
|
|
return None
|
|
if 'response' in data:
|
|
resp = data['response']
|
|
return resp if isinstance(resp, list) else [resp]
|
|
if 'results' in data:
|
|
return data['results']
|
|
if 'data' in data:
|
|
result = data['data']
|
|
return result if isinstance(result, list) else [result]
|
|
return None
|
|
|
|
def _send_and_recv(self, request_type: str, query: str) -> Optional[list]:
|
|
"""Send a search request and return the response array.
|
|
|
|
Uses a nonce for request-response correlation and loops on recv()
|
|
to drain any interleaved stats/heartbeat messages from the server.
|
|
"""
|
|
ws, lock = self.get_ws_and_lock()
|
|
if ws is None:
|
|
return None
|
|
try:
|
|
if not ws.connected:
|
|
return None
|
|
except Exception:
|
|
return None
|
|
|
|
nonce = int(time.time() * 1000)
|
|
payload = json.dumps({
|
|
'request': {
|
|
'type': request_type,
|
|
'query': query
|
|
},
|
|
'nonce': nonce
|
|
})
|
|
|
|
try:
|
|
with lock:
|
|
ws.settimeout(self.timeout)
|
|
ws.send(payload)
|
|
|
|
deadline = time.time() + self.timeout
|
|
while True:
|
|
remaining = deadline - time.time()
|
|
if remaining <= 0:
|
|
logger.warning(f"Hydrabase response timeout for ({request_type}, '{query}')")
|
|
return None
|
|
|
|
ws.settimeout(remaining)
|
|
raw = ws.recv()
|
|
data = json.loads(raw)
|
|
|
|
# Always extract stats from any message
|
|
self._extract_stats(data)
|
|
|
|
# Bare list — results with no envelope
|
|
if isinstance(data, list):
|
|
return data
|
|
|
|
if not isinstance(data, dict):
|
|
continue
|
|
|
|
# Response has our nonce — definitely ours
|
|
if data.get('nonce') == nonce:
|
|
results = self._extract_results(data)
|
|
logger.debug(f"Hydrabase matched nonce for ({request_type}, '{query}'): {len(results) if results else 0} results")
|
|
return results if results is not None else []
|
|
|
|
# Response has results but no nonce (server doesn't echo nonces)
|
|
if 'nonce' not in data:
|
|
results = self._extract_results(data)
|
|
if results is not None:
|
|
logger.debug(f"Hydrabase no-nonce results for ({request_type}, '{query}'): {len(results)} results")
|
|
return results
|
|
# Stats-only message with no nonce — skip and recv again
|
|
logger.debug(f"Hydrabase draining non-result message for ({request_type}, '{query}')")
|
|
continue
|
|
|
|
# Has a nonce but not ours — stale response, skip it
|
|
logger.debug(f"Hydrabase draining stale nonce {data.get('nonce')} (ours={nonce}) for ({request_type}, '{query}')")
|
|
|
|
except Exception as e:
|
|
logger.error(f"Hydrabase query failed ({request_type}, '{query}'): {e}")
|
|
return None
|
|
|
|
@staticmethod
|
|
def _normalize_artists(artists_raw) -> list:
|
|
"""Normalize artists to a list of strings (Hydrabase may send dicts or strings)."""
|
|
if not artists_raw or not isinstance(artists_raw, list):
|
|
return []
|
|
result = []
|
|
for a in artists_raw:
|
|
if isinstance(a, str):
|
|
result.append(a)
|
|
elif isinstance(a, dict):
|
|
result.append(a.get('name', ''))
|
|
else:
|
|
result.append(str(a))
|
|
return [x for x in result if x]
|
|
|
|
@staticmethod
|
|
def _normalize_release_date(date_str: str) -> str:
|
|
"""Strip time portion from ISO dates like '1995-01-01T08:00:00Z' -> '1995-01-01'."""
|
|
if not date_str:
|
|
return date_str
|
|
# Match YYYY-MM-DD at the start, discard the rest
|
|
match = re.match(r'(\d{4}(?:-\d{2}(?:-\d{2})?)?)', date_str)
|
|
return match.group(1) if match else date_str
|
|
|
|
# ==================== Track Methods ====================
|
|
|
|
def search_tracks(self, query: str, limit: int = 20) -> List[Track]:
|
|
results = self._send_and_recv('tracks', query)
|
|
if not results:
|
|
return []
|
|
|
|
tracks = []
|
|
for item in results[:limit]:
|
|
try:
|
|
ext_urls = dict(item.get('external_urls', {}) or {})
|
|
if item.get('soul_id'):
|
|
ext_urls['hydrabase_soul_id'] = str(item['soul_id'])
|
|
if item.get('plugin_id'):
|
|
ext_urls['hydrabase_plugin'] = item['plugin_id'].lower()
|
|
tracks.append(Track(
|
|
id=str(item.get('id', '')),
|
|
name=item.get('name', ''),
|
|
artists=self._normalize_artists(item.get('artists', [])),
|
|
album=item.get('album', ''),
|
|
duration_ms=item.get('duration_ms', 0),
|
|
popularity=item.get('popularity', 0),
|
|
preview_url=item.get('preview_url'),
|
|
external_urls=ext_urls,
|
|
image_url=item.get('image_url'),
|
|
release_date=self._normalize_release_date(item.get('release_date', ''))
|
|
))
|
|
except Exception as e:
|
|
logger.debug(f"Skipping malformed Hydrabase track: {e}")
|
|
return tracks
|
|
|
|
# ==================== Artist Methods ====================
|
|
|
|
def search_artists(self, query: str, limit: int = 20) -> List[Artist]:
|
|
results = self._send_and_recv('artists', query)
|
|
if not results:
|
|
return []
|
|
|
|
artists = []
|
|
for item in results[:limit]:
|
|
try:
|
|
ext_urls = dict(item.get('external_urls', {}) or {})
|
|
if item.get('soul_id'):
|
|
ext_urls['hydrabase_soul_id'] = str(item['soul_id'])
|
|
if item.get('plugin_id'):
|
|
ext_urls['hydrabase_plugin'] = item['plugin_id'].lower()
|
|
artists.append(Artist(
|
|
id=str(item.get('id', '')),
|
|
name=item.get('name', ''),
|
|
popularity=item.get('popularity', 0),
|
|
genres=item.get('genres', []),
|
|
followers=item.get('followers', 0),
|
|
image_url=item.get('image_url'),
|
|
external_urls=ext_urls
|
|
))
|
|
except Exception as e:
|
|
logger.debug(f"Skipping malformed Hydrabase artist: {e}")
|
|
return artists
|
|
|
|
# ==================== Album Methods ====================
|
|
|
|
def search_albums(self, query: str, limit: int = 20) -> List[Album]:
|
|
results = self._send_and_recv('albums', query)
|
|
if not results:
|
|
return []
|
|
|
|
albums = []
|
|
for item in results[:limit]:
|
|
try:
|
|
# Use the plugin's native ID (iTunes/Spotify) so downstream
|
|
# endpoints can look it up. Carry soul_id in external_urls
|
|
# for Hydrabase-specific lookups (album.tracks).
|
|
ext_urls = dict(item.get('external_urls', {}) or {})
|
|
soul_id = item.get('soul_id', '')
|
|
if soul_id:
|
|
ext_urls['hydrabase_soul_id'] = str(soul_id)
|
|
albums.append(Album(
|
|
id=str(item.get('id', soul_id)),
|
|
name=item.get('name', ''),
|
|
artists=self._normalize_artists(item.get('artists', [])),
|
|
release_date=self._normalize_release_date(item.get('release_date', '')),
|
|
total_tracks=item.get('total_tracks', 0),
|
|
album_type=item.get('album_type', 'album'),
|
|
image_url=item.get('image_url'),
|
|
external_urls=ext_urls
|
|
))
|
|
except Exception as e:
|
|
logger.debug(f"Skipping malformed Hydrabase album: {e}")
|
|
return albums
|
|
|
|
# ==================== Discography Methods ====================
|
|
|
|
def search_discography(self, artist_name: str, limit: int = 50) -> List[Album]:
|
|
"""Fetch an artist's discography (albums + singles) from Hydrabase."""
|
|
results = self._send_and_recv('artist.albums', artist_name)
|
|
if not results:
|
|
results = self._send_and_recv('discography', artist_name)
|
|
if not results:
|
|
return []
|
|
|
|
albums = []
|
|
for item in results[:limit]:
|
|
try:
|
|
ext_urls = dict(item.get('external_urls', {}) or {})
|
|
soul_id = item.get('soul_id', '')
|
|
if soul_id:
|
|
ext_urls['hydrabase_soul_id'] = str(soul_id)
|
|
albums.append(Album(
|
|
id=str(item.get('id', soul_id)),
|
|
name=item.get('name', ''),
|
|
artists=self._normalize_artists(item.get('artists', [])),
|
|
release_date=self._normalize_release_date(item.get('release_date', '')),
|
|
total_tracks=item.get('total_tracks', 0),
|
|
album_type=item.get('album_type', 'album'),
|
|
image_url=item.get('image_url'),
|
|
external_urls=ext_urls
|
|
))
|
|
except Exception as e:
|
|
logger.debug(f"Skipping malformed Hydrabase discography album: {e}")
|
|
return albums
|
|
|
|
# ==================== Detail Methods (Spotify-compatible dict format) ====================
|
|
|
|
def get_track_details(self, track_id: str) -> Optional[dict]:
|
|
"""Get detailed track information including album data — Spotify-compatible dict.
|
|
|
|
Sends 'track.details' request. If the server doesn't support it,
|
|
falls back to a track search by ID and builds the enhanced dict from
|
|
whatever we get back.
|
|
"""
|
|
results = self._send_and_recv('track.details', track_id)
|
|
if not results:
|
|
results = self._send_and_recv('tracks', track_id)
|
|
if not results:
|
|
return None
|
|
|
|
item = results[0] if results else None
|
|
if not item or not isinstance(item, dict):
|
|
return None
|
|
|
|
artists = item.get('artists', [])
|
|
primary_artist = artists[0] if artists else 'Unknown Artist'
|
|
if isinstance(primary_artist, dict):
|
|
primary_artist = primary_artist.get('name', 'Unknown Artist')
|
|
|
|
album_name = item.get('album', '') or item.get('album_name', '')
|
|
release_date = self._normalize_release_date(item.get('release_date', ''))
|
|
|
|
return {
|
|
'id': str(item.get('id', '')),
|
|
'name': item.get('name', ''),
|
|
'track_number': item.get('track_number', 0),
|
|
'disc_number': item.get('disc_number', 1),
|
|
'duration_ms': item.get('duration_ms', 0),
|
|
'explicit': item.get('explicit', False),
|
|
'artists': [primary_artist] if isinstance(primary_artist, str) else artists,
|
|
'primary_artist': primary_artist,
|
|
'album': {
|
|
'id': str(item.get('album_id', item.get('soul_id', ''))),
|
|
'name': album_name,
|
|
'total_tracks': item.get('total_tracks', 0),
|
|
'release_date': release_date,
|
|
'album_type': item.get('album_type', 'album'),
|
|
'artists': [primary_artist] if isinstance(primary_artist, str) else artists,
|
|
},
|
|
'is_album_track': (item.get('total_tracks', 0) or 0) > 1,
|
|
'image_url': item.get('image_url'),
|
|
'external_urls': item.get('external_urls', {}),
|
|
'_source': 'hydrabase',
|
|
}
|
|
|
|
def get_album(self, album_id: str, include_tracks: bool = True) -> Optional[dict]:
|
|
"""Get album information with tracks — Spotify-compatible dict.
|
|
|
|
Sends 'album.get' request. Falls back to 'album' search if the
|
|
server doesn't support the detailed endpoint.
|
|
"""
|
|
results = self._send_and_recv('album.get', album_id)
|
|
if not results:
|
|
results = self._send_and_recv('albums', album_id)
|
|
if not results:
|
|
return None
|
|
|
|
item = results[0] if results else None
|
|
if not item or not isinstance(item, dict):
|
|
return None
|
|
|
|
artists_raw = item.get('artists', [])
|
|
artist_dicts = []
|
|
for a in artists_raw:
|
|
if isinstance(a, dict):
|
|
artist_dicts.append(a)
|
|
elif isinstance(a, str):
|
|
artist_dicts.append({'name': a, 'id': ''})
|
|
|
|
image_url = item.get('image_url', '')
|
|
images = []
|
|
if image_url:
|
|
images = [
|
|
{'url': image_url, 'height': 600, 'width': 600},
|
|
{'url': image_url, 'height': 300, 'width': 300},
|
|
]
|
|
|
|
release_date = self._normalize_release_date(item.get('release_date', ''))
|
|
total_tracks = item.get('total_tracks', 0)
|
|
|
|
album_type = item.get('album_type', 'album')
|
|
if not album_type or album_type == 'album':
|
|
if total_tracks and total_tracks <= 3:
|
|
album_type = 'single'
|
|
elif total_tracks and total_tracks <= 6:
|
|
album_type = 'ep'
|
|
|
|
album_result = {
|
|
'id': str(item.get('soul_id', item.get('id', ''))),
|
|
'name': item.get('name', ''),
|
|
'images': images,
|
|
'artists': artist_dicts,
|
|
'release_date': release_date,
|
|
'total_tracks': total_tracks,
|
|
'album_type': album_type,
|
|
'external_urls': item.get('external_urls', {}),
|
|
'uri': f"hydrabase:album:{item.get('soul_id', item.get('id', ''))}",
|
|
'_source': 'hydrabase',
|
|
}
|
|
|
|
if include_tracks:
|
|
tracks_data = self.get_album_tracks_dict(album_id)
|
|
if tracks_data and isinstance(tracks_data, dict) and 'items' in tracks_data:
|
|
album_result['tracks'] = tracks_data
|
|
else:
|
|
album_result['tracks'] = {'items': [], 'total': 0}
|
|
|
|
return album_result
|
|
|
|
def get_album_tracks(self, album_id: str, limit: int = 50) -> List[Track]:
|
|
"""Fetch tracks for an album — returns Track dataclass list.
|
|
|
|
Used by existing web_server.py endpoints that expect List[Track].
|
|
"""
|
|
results = self._send_and_recv('album.tracks', album_id)
|
|
if not results:
|
|
return []
|
|
|
|
tracks = []
|
|
for item in results[:limit]:
|
|
try:
|
|
tracks.append(Track(
|
|
id=str(item.get('id', '')),
|
|
name=item.get('name', ''),
|
|
artists=self._normalize_artists(item.get('artists', [])),
|
|
album=item.get('album', ''),
|
|
duration_ms=item.get('duration_ms', 0),
|
|
popularity=item.get('popularity', 0),
|
|
preview_url=item.get('preview_url'),
|
|
external_urls=item.get('external_urls'),
|
|
image_url=item.get('image_url'),
|
|
release_date=self._normalize_release_date(item.get('release_date', '')),
|
|
track_number=item.get('track_number'),
|
|
disc_number=item.get('disc_number'),
|
|
))
|
|
except Exception as e:
|
|
logger.debug(f"Skipping malformed Hydrabase album track: {e}")
|
|
return tracks
|
|
|
|
def get_album_tracks_dict(self, album_id: str, limit: int = 50) -> Optional[dict]:
|
|
"""Fetch tracks for an album — Spotify-compatible dict format.
|
|
|
|
Returns {items: List[Dict], total: int, limit: int, next: None}.
|
|
Used by get_album() for Spotify-compatible interface parity.
|
|
"""
|
|
results = self._send_and_recv('album.tracks', album_id)
|
|
if not results:
|
|
return None
|
|
|
|
tracks = []
|
|
for item in results[:limit]:
|
|
try:
|
|
artists_raw = item.get('artists', [])
|
|
artist_dicts = [{'name': a} if isinstance(a, str) else a for a in artists_raw]
|
|
|
|
tracks.append({
|
|
'id': str(item.get('id', '')),
|
|
'name': item.get('name', ''),
|
|
'artists': artist_dicts,
|
|
'album': {
|
|
'id': str(album_id),
|
|
'name': item.get('album', ''),
|
|
'images': [{'url': item.get('image_url', ''), 'height': 300, 'width': 300}] if item.get('image_url') else [],
|
|
'release_date': self._normalize_release_date(item.get('release_date', '')),
|
|
},
|
|
'duration_ms': item.get('duration_ms', 0),
|
|
'track_number': item.get('track_number', 0),
|
|
'disc_number': item.get('disc_number', 1),
|
|
'explicit': item.get('explicit', False),
|
|
'preview_url': item.get('preview_url'),
|
|
'external_urls': item.get('external_urls', {}),
|
|
'uri': f"hydrabase:track:{item.get('id', '')}",
|
|
'_source': 'hydrabase',
|
|
})
|
|
except Exception as e:
|
|
logger.debug(f"Skipping malformed Hydrabase album track: {e}")
|
|
|
|
tracks.sort(key=lambda t: (t.get('disc_number', 1), t.get('track_number', 0)))
|
|
|
|
return {
|
|
'items': tracks,
|
|
'total': len(tracks),
|
|
'limit': limit,
|
|
'next': None,
|
|
}
|
|
|
|
def get_artist(self, artist_id: str) -> Optional[dict]:
|
|
"""Get detailed artist info — Spotify-compatible dict.
|
|
|
|
Sends 'artist.get' request. Falls back to 'artists' search if the
|
|
server doesn't support the detailed endpoint.
|
|
"""
|
|
results = self._send_and_recv('artist.get', artist_id)
|
|
if not results:
|
|
results = self._send_and_recv('artists', artist_id)
|
|
if not results:
|
|
return None
|
|
|
|
item = results[0] if results else None
|
|
if not item or not isinstance(item, dict):
|
|
return None
|
|
|
|
image_url = item.get('image_url', '')
|
|
images = []
|
|
if image_url:
|
|
images = [
|
|
{'url': image_url, 'height': 600, 'width': 600},
|
|
{'url': image_url, 'height': 300, 'width': 300},
|
|
]
|
|
|
|
genres = item.get('genres', [])
|
|
if not genres and item.get('genre'):
|
|
genres = [item['genre']]
|
|
|
|
return {
|
|
'id': str(item.get('id', '')),
|
|
'name': item.get('name', ''),
|
|
'images': images,
|
|
'genres': genres,
|
|
'popularity': item.get('popularity', 0),
|
|
'followers': {'total': item.get('followers', 0)},
|
|
'external_urls': item.get('external_urls', {}),
|
|
'uri': f"hydrabase:artist:{item.get('id', '')}",
|
|
'_source': 'hydrabase',
|
|
}
|
|
|
|
def _get_artist_image_from_albums(self, artist_id: str):
|
|
"""Get artist image from their album art — stub for interface parity with iTunes/Deezer clients."""
|
|
try:
|
|
albums = self.get_artist_albums(artist_id, limit=5)
|
|
if albums:
|
|
for album in albums:
|
|
if album.image_url:
|
|
return album.image_url
|
|
except Exception:
|
|
pass
|
|
return None
|
|
|
|
def get_artist_albums(self, artist_id: str, album_type: str = 'album,single', limit: int = 50) -> List[Album]:
|
|
"""Get albums by artist — returns Album dataclass list.
|
|
|
|
Uses the discography endpoint under the hood since Hydrabase
|
|
indexes by artist name rather than ID. Falls back to search_discography
|
|
if 'artist.albums' isn't supported.
|
|
"""
|
|
results = self._send_and_recv('artist.albums', artist_id)
|
|
if not results:
|
|
# Fallback: try discography with the ID as a name query
|
|
results = self._send_and_recv('discography', artist_id)
|
|
if not results:
|
|
return []
|
|
|
|
# Filter by album_type if requested
|
|
type_filter = set(album_type.split(',')) if album_type else None
|
|
|
|
albums = []
|
|
for item in results[:limit]:
|
|
try:
|
|
item_type = item.get('album_type', 'album')
|
|
if type_filter and item_type not in type_filter:
|
|
continue
|
|
ext_urls = dict(item.get('external_urls', {}) or {})
|
|
soul_id = item.get('soul_id', '')
|
|
if soul_id:
|
|
ext_urls['hydrabase_soul_id'] = str(soul_id)
|
|
albums.append(Album(
|
|
id=str(item.get('id', soul_id)),
|
|
name=item.get('name', ''),
|
|
artists=self._normalize_artists(item.get('artists', [])),
|
|
release_date=self._normalize_release_date(item.get('release_date', '')),
|
|
total_tracks=item.get('total_tracks', 0),
|
|
album_type=item_type,
|
|
image_url=item.get('image_url'),
|
|
external_urls=ext_urls,
|
|
))
|
|
except Exception as e:
|
|
logger.debug(f"Skipping malformed Hydrabase artist album: {e}")
|
|
return albums
|
|
|
|
def get_track_features(self, track_id: str) -> None:
|
|
"""Audio features not available from Hydrabase."""
|
|
return None
|
|
|
|
# ==================== Interface parity ====================
|
|
|
|
def is_authenticated(self) -> bool:
|
|
"""Matches iTunes/Deezer/Spotify interface — True if connected."""
|
|
return self.is_connected()
|
|
|
|
def reload_config(self):
|
|
"""No-op for interface parity with iTunes/Deezer/Spotify."""
|
|
pass
|
|
|
|
# ==================== Raw access (for comparison) ====================
|
|
|
|
def search_raw(self, query: str, search_type: str) -> Optional[list]:
|
|
"""Return raw Hydrabase results without normalization (for comparison UI)."""
|
|
return self._send_and_recv(search_type, query)
|