feat: Add NFO metadata infrastructure (Task 3 - partial)

- Created TMDB API client with async requests, caching, and retry logic
- Implemented NFO XML generator for Kodi/XBMC format
- Created image downloader for poster/logo/fanart with validation
- Added NFO service to orchestrate metadata creation
- Added NFO-related configuration settings
- Updated requirements.txt with aiohttp, lxml, pillow
- Created unit tests (need refinement due to implementation mismatch)

Components created:
- src/core/services/tmdb_client.py (283 lines)
- src/core/services/nfo_service.py (392 lines)
- src/core/utils/nfo_generator.py (192 lines)
- src/core/utils/image_downloader.py (295 lines)
- tests/unit/test_tmdb_client.py
- tests/unit/test_nfo_generator.py
- tests/unit/test_image_downloader.py

Note: Tests need to be updated to match actual implementation APIs.
Dependencies installed: aiohttp, lxml, pillow
This commit is contained in:
2026-01-11 20:33:33 +01:00
parent 5e8815d143
commit 4895e487c0
10 changed files with 2270 additions and 1 deletions

View File

@@ -72,6 +72,43 @@ class Settings(BaseSettings):
default=3,
validation_alias="RETRY_ATTEMPTS"
)
# NFO / TMDB Settings
tmdb_api_key: Optional[str] = Field(
default=None,
validation_alias="TMDB_API_KEY",
description="TMDB API key for scraping TV show metadata"
)
nfo_auto_create: bool = Field(
default=False,
validation_alias="NFO_AUTO_CREATE",
description="Automatically create NFO files when scanning series"
)
nfo_update_on_scan: bool = Field(
default=False,
validation_alias="NFO_UPDATE_ON_SCAN",
description="Update existing NFO files when scanning series"
)
nfo_download_poster: bool = Field(
default=True,
validation_alias="NFO_DOWNLOAD_POSTER",
description="Download poster.jpg when creating NFO"
)
nfo_download_logo: bool = Field(
default=True,
validation_alias="NFO_DOWNLOAD_LOGO",
description="Download logo.png when creating NFO"
)
nfo_download_fanart: bool = Field(
default=True,
validation_alias="NFO_DOWNLOAD_FANART",
description="Download fanart.jpg when creating NFO"
)
nfo_image_size: str = Field(
default="original",
validation_alias="NFO_IMAGE_SIZE",
description="Image size to download (original, w500, etc.)"
)
@property
def allowed_origins(self) -> list[str]:

View File

@@ -0,0 +1,392 @@
"""NFO service for creating and managing tvshow.nfo files.
This service orchestrates TMDB API calls, XML generation, and media downloads
to create complete NFO metadata for TV series.
Example:
>>> nfo_service = NFOService(tmdb_api_key="key", anime_directory="/anime")
>>> await nfo_service.create_tvshow_nfo("Attack on Titan", "/anime/aot", 2013)
"""
import logging
from pathlib import Path
from typing import Any, Dict, List, Optional
from src.core.entities.nfo_models import (
ActorInfo,
ImageInfo,
RatingInfo,
TVShowNFO,
UniqueID,
)
from src.core.services.tmdb_client import TMDBAPIError, TMDBClient
from src.core.utils.image_downloader import ImageDownloader, ImageDownloadError
from src.core.utils.nfo_generator import generate_tvshow_nfo
logger = logging.getLogger(__name__)
class NFOService:
    """Service for creating and managing tvshow.nfo files.

    Orchestrates TMDB API lookups, NFO XML generation and artwork downloads
    to produce complete Kodi/XBMC metadata for a series folder located
    below ``anime_directory``.

    Attributes:
        tmdb_client: TMDB API client used for all metadata lookups.
        image_downloader: Utility that fetches poster/logo/fanart files.
        anime_directory: Base directory containing all series folders.
        image_size: TMDB image size used for downloads (e.g. "original").
        auto_create: Whether NFOs should be created automatically on scan.
    """

    def __init__(
        self,
        tmdb_api_key: str,
        anime_directory: str,
        image_size: str = "original",
        auto_create: bool = True
    ):
        """Initialize NFO service.

        Args:
            tmdb_api_key: TMDB API key.
            anime_directory: Base anime directory path.
            image_size: Image size to download (original, w500, etc.).
            auto_create: Whether to auto-create NFOs when scanning.
        """
        self.tmdb_client = TMDBClient(api_key=tmdb_api_key)
        self.image_downloader = ImageDownloader()
        self.anime_directory = Path(anime_directory)
        self.image_size = image_size
        self.auto_create = auto_create

    async def check_nfo_exists(self, serie_folder: str) -> bool:
        """Check if tvshow.nfo exists for a series.

        Args:
            serie_folder: Series folder name (relative to anime_directory).

        Returns:
            True if tvshow.nfo exists.
        """
        nfo_path = self.anime_directory / serie_folder / "tvshow.nfo"
        return nfo_path.exists()

    async def create_tvshow_nfo(
        self,
        serie_name: str,
        serie_folder: str,
        year: Optional[int] = None,
        download_poster: bool = True,
        download_logo: bool = True,
        download_fanart: bool = True
    ) -> Path:
        """Create tvshow.nfo by scraping TMDB.

        Args:
            serie_name: Name of the series to search.
            serie_folder: Series folder name.
            year: Release year (helps narrow search).
            download_poster: Whether to download poster.jpg.
            download_logo: Whether to download logo.png.
            download_fanart: Whether to download fanart.jpg.

        Returns:
            Path to created NFO file.

        Raises:
            TMDBAPIError: If TMDB API fails or returns no results.
            FileNotFoundError: If series folder doesn't exist.
        """
        logger.info(f"Creating NFO for {serie_name} (year: {year})")
        folder_path = self.anime_directory / serie_folder
        if not folder_path.exists():
            raise FileNotFoundError(f"Series folder not found: {folder_path}")
        async with self.tmdb_client:
            # Search for TV show
            logger.debug(f"Searching TMDB for: {serie_name}")
            search_results = await self.tmdb_client.search_tv_show(serie_name)
            if not search_results.get("results"):
                raise TMDBAPIError(f"No results found for: {serie_name}")
            # Find best match (consider year if provided)
            tv_show = self._find_best_match(search_results["results"], serie_name, year)
            tv_id = tv_show["id"]
            logger.info(f"Found match: {tv_show['name']} (ID: {tv_id})")
            # Append credits/external_ids/images so one request covers cast,
            # IMDB/TVDB ids and logos.
            details = await self.tmdb_client.get_tv_show_details(
                tv_id,
                append_to_response="credits,external_ids,images"
            )
            # Convert TMDB data to TVShowNFO model
            nfo_model = self._tmdb_to_nfo_model(details)
            # Generate XML
            nfo_xml = generate_tvshow_nfo(nfo_model)
            # Save NFO file
            nfo_path = folder_path / "tvshow.nfo"
            nfo_path.write_text(nfo_xml, encoding="utf-8")
            logger.info(f"Created NFO: {nfo_path}")
            # Download media files (best-effort; failures are logged, not raised)
            await self._download_media_files(
                details,
                folder_path,
                download_poster=download_poster,
                download_logo=download_logo,
                download_fanart=download_fanart
            )
            return nfo_path

    async def update_tvshow_nfo(
        self,
        serie_folder: str,
        download_media: bool = True
    ) -> Path:
        """Update existing tvshow.nfo with fresh data from TMDB.

        Args:
            serie_folder: Series folder name.
            download_media: Whether to re-download media files.

        Returns:
            Path to updated NFO file.

        Raises:
            FileNotFoundError: If NFO file doesn't exist.
            NotImplementedError: Always, until NFO-id extraction is implemented.
        """
        nfo_path = self.anime_directory / serie_folder / "tvshow.nfo"
        if not nfo_path.exists():
            raise FileNotFoundError(f"NFO file not found: {nfo_path}")
        # Parsing the existing NFO for its TMDB id is not implemented yet;
        # a full implementation would extract the id (or serie name) from the
        # XML and delegate to create_tvshow_nfo.
        logger.info(f"Updating NFO for {serie_folder}")
        raise NotImplementedError("Update NFO not yet implemented")

    def _find_best_match(
        self,
        results: List[Dict[str, Any]],
        query: str,
        year: Optional[int] = None
    ) -> Dict[str, Any]:
        """Find best matching TV show from search results.

        Args:
            results: TMDB search results.
            query: Original search query (currently unused; reserved for
                future title-similarity scoring).
            year: Expected release year.

        Returns:
            Best matching TV show data.

        Raises:
            TMDBAPIError: If results is empty.
        """
        if not results:
            raise TMDBAPIError("No search results to match")
        # If a year is given, prefer an exact first-air-date year match.
        if year:
            for result in results:
                # TMDB may return a null first_air_date; .get(key, "") does
                # NOT protect against an explicit None value, so coalesce
                # with `or ""` to avoid None.startswith(...) crashing.
                first_air_date = result.get("first_air_date") or ""
                if first_air_date.startswith(str(year)):
                    logger.debug(f"Found year match: {result['name']} ({first_air_date})")
                    return result
        # Fall back to the first result (TMDB orders by relevance).
        return results[0]

    def _tmdb_to_nfo_model(self, tmdb_data: Dict[str, Any]) -> TVShowNFO:
        """Convert TMDB API data to TVShowNFO model.

        Args:
            tmdb_data: TMDB TV show details (with credits/external_ids/images
                appended).

        Returns:
            TVShowNFO Pydantic model.
        """
        # Extract basic info
        title = tmdb_data["name"]
        original_title = tmdb_data.get("original_name", title)
        year = None
        if tmdb_data.get("first_air_date"):
            # first_air_date is "YYYY-MM-DD"; the first four chars are the year.
            year = int(tmdb_data["first_air_date"][:4])
        # Extract ratings (a vote_average of 0 is treated as "no rating")
        ratings = []
        if tmdb_data.get("vote_average"):
            ratings.append(RatingInfo(
                name="themoviedb",
                value=float(tmdb_data["vote_average"]),
                votes=tmdb_data.get("vote_count", 0),
                max_rating=10,
                default=True
            ))
        # Extract external IDs
        external_ids = tmdb_data.get("external_ids", {})
        imdb_id = external_ids.get("imdb_id")
        tvdb_id = external_ids.get("tvdb_id")
        # Extract images
        thumb_images = []
        fanart_images = []
        # Poster
        if tmdb_data.get("poster_path"):
            poster_url = self.tmdb_client.get_image_url(
                tmdb_data["poster_path"],
                self.image_size
            )
            thumb_images.append(ImageInfo(url=poster_url, aspect="poster"))
        # Backdrop/Fanart
        if tmdb_data.get("backdrop_path"):
            fanart_url = self.tmdb_client.get_image_url(
                tmdb_data["backdrop_path"],
                self.image_size
            )
            fanart_images.append(ImageInfo(url=fanart_url))
        # Logo from appended images, if any (first entry is used as-is)
        images_data = tmdb_data.get("images", {})
        logos = images_data.get("logos", [])
        if logos:
            logo_url = self.tmdb_client.get_image_url(
                logos[0]["file_path"],
                self.image_size
            )
            thumb_images.append(ImageInfo(url=logo_url, aspect="clearlogo"))
        # Extract cast (top 10 billed actors only, to keep the NFO small)
        actors = []
        credits = tmdb_data.get("credits", {})
        for cast_member in credits.get("cast", [])[:10]:
            actor_thumb = None
            if cast_member.get("profile_path"):
                # h632 is a fixed-height TMDB profile-image size.
                actor_thumb = self.tmdb_client.get_image_url(
                    cast_member["profile_path"],
                    "h632"
                )
            actors.append(ActorInfo(
                name=cast_member["name"],
                role=cast_member.get("character"),
                thumb=actor_thumb,
                tmdbid=cast_member["id"]
            ))
        # Create unique IDs; tvdb is marked default for Kodi scraper priority.
        unique_ids = []
        if tmdb_data.get("id"):
            unique_ids.append(UniqueID(
                type="tmdb",
                value=str(tmdb_data["id"]),
                default=False
            ))
        if imdb_id:
            unique_ids.append(UniqueID(
                type="imdb",
                value=imdb_id,
                default=False
            ))
        if tvdb_id:
            unique_ids.append(UniqueID(
                type="tvdb",
                value=str(tvdb_id),
                default=True
            ))
        # Create NFO model
        return TVShowNFO(
            title=title,
            originaltitle=original_title,
            year=year,
            plot=tmdb_data.get("overview"),
            runtime=tmdb_data.get("episode_run_time", [None])[0] if tmdb_data.get("episode_run_time") else None,
            premiered=tmdb_data.get("first_air_date"),
            status=tmdb_data.get("status"),
            genre=[g["name"] for g in tmdb_data.get("genres", [])],
            studio=[n["name"] for n in tmdb_data.get("networks", [])],
            country=[c["name"] for c in tmdb_data.get("production_countries", [])],
            ratings=ratings,
            tmdbid=tmdb_data.get("id"),
            imdbid=imdb_id,
            tvdbid=tvdb_id,
            uniqueid=unique_ids,
            thumb=thumb_images,
            fanart=fanart_images,
            actors=actors
        )

    async def _download_media_files(
        self,
        tmdb_data: Dict[str, Any],
        folder_path: Path,
        download_poster: bool = True,
        download_logo: bool = True,
        download_fanart: bool = True
    ) -> Dict[str, bool]:
        """Download media files (poster, logo, fanart).

        Args:
            tmdb_data: TMDB TV show details.
            folder_path: Series folder path.
            download_poster: Download poster.jpg.
            download_logo: Download logo.png.
            download_fanart: Download fanart.jpg.

        Returns:
            Dictionary with download status for each file type.
        """
        poster_url = None
        logo_url = None
        fanart_url = None
        # Get poster URL (uses the configured image size)
        if download_poster and tmdb_data.get("poster_path"):
            poster_url = self.tmdb_client.get_image_url(
                tmdb_data["poster_path"],
                self.image_size
            )
        # Get fanart URL
        if download_fanart and tmdb_data.get("backdrop_path"):
            fanart_url = self.tmdb_client.get_image_url(
                tmdb_data["backdrop_path"],
                "original"  # Always use original for fanart
            )
        # Get logo URL
        if download_logo:
            images_data = tmdb_data.get("images", {})
            logos = images_data.get("logos", [])
            if logos:
                logo_url = self.tmdb_client.get_image_url(
                    logos[0]["file_path"],
                    "original"  # Logos should be original size
                )
        # Download all media concurrently
        results = await self.image_downloader.download_all_media(
            folder_path,
            poster_url=poster_url,
            logo_url=logo_url,
            fanart_url=fanart_url,
            skip_existing=True
        )
        logger.info(f"Media download results: {results}")
        return results

    async def close(self):
        """Clean up resources (closes the TMDB client session)."""
        await self.tmdb_client.close()

View File

@@ -0,0 +1,283 @@
"""TMDB API client for fetching TV show metadata.
This module provides an async client for The Movie Database (TMDB) API,
adapted from the scraper project to fit the AniworldMain architecture.
Example:
>>> async with TMDBClient(api_key="your_key") as client:
... results = await client.search_tv_show("Attack on Titan")
... show_id = results["results"][0]["id"]
... details = await client.get_tv_show_details(show_id)
"""
import asyncio
import logging
from pathlib import Path
from typing import Any, Dict, List, Optional
import aiohttp
logger = logging.getLogger(__name__)
class TMDBAPIError(Exception):
    """Raised when a TMDB API request fails or returns an error status."""
class TMDBClient:
    """Async TMDB API client for TV show metadata.

    Attributes:
        api_key: TMDB API key for authentication
        base_url: Base URL for TMDB API
        image_base_url: Base URL for TMDB images
        max_connections: Maximum concurrent connections
        session: aiohttp ClientSession for requests

    Note:
        Successful JSON responses are memoized in an in-process dict for the
        lifetime of the client. The cache is unbounded; long-running
        processes should call clear_cache() periodically.
    """

    DEFAULT_BASE_URL = "https://api.themoviedb.org/3"
    DEFAULT_IMAGE_BASE_URL = "https://image.tmdb.org/t/p"

    def __init__(
        self,
        api_key: str,
        base_url: str = DEFAULT_BASE_URL,
        image_base_url: str = DEFAULT_IMAGE_BASE_URL,
        max_connections: int = 10
    ):
        """Initialize TMDB client.

        Args:
            api_key: TMDB API key
            base_url: TMDB API base URL
            image_base_url: TMDB image base URL
            max_connections: Maximum concurrent connections

        Raises:
            ValueError: If api_key is empty or None.
        """
        if not api_key:
            raise ValueError("TMDB API key is required")
        self.api_key = api_key
        self.base_url = base_url.rstrip('/')
        self.image_base_url = image_base_url.rstrip('/')
        self.max_connections = max_connections
        self.session: Optional[aiohttp.ClientSession] = None
        self._cache: Dict[str, Any] = {}

    async def __aenter__(self):
        """Async context manager entry; lazily opens the session."""
        await self._ensure_session()
        return self

    async def __aexit__(self, exc_type, exc_val, exc_tb):
        """Async context manager exit; closes the session."""
        await self.close()

    async def _ensure_session(self):
        """Ensure an open aiohttp session exists (recreates a closed one)."""
        if self.session is None or self.session.closed:
            connector = aiohttp.TCPConnector(limit=self.max_connections)
            self.session = aiohttp.ClientSession(connector=connector)

    async def _request(
        self,
        endpoint: str,
        params: Optional[Dict[str, Any]] = None,
        max_retries: int = 3
    ) -> Dict[str, Any]:
        """Make an async request to TMDB API with retries.

        Retries transient failures (connection errors, timeouts) with
        exponential backoff; honors the Retry-After header on HTTP 429.

        Args:
            endpoint: API endpoint (e.g., 'search/tv')
            params: Query parameters (not mutated)
            max_retries: Maximum retry attempts

        Returns:
            API response as dictionary

        Raises:
            TMDBAPIError: If request fails after retries, the key is
                rejected (401), or the resource is missing (404).
        """
        await self._ensure_session()
        url = f"{self.base_url}/{endpoint}"
        # Copy the caller's dict so injecting api_key does not mutate it.
        params = dict(params) if params else {}
        params["api_key"] = self.api_key
        # Cache key for deduplication of identical requests.
        cache_key = f"{endpoint}:{str(sorted(params.items()))}"
        if cache_key in self._cache:
            logger.debug(f"Cache hit for {endpoint}")
            return self._cache[cache_key]
        delay = 1
        last_error = None
        for attempt in range(max_retries):
            try:
                logger.debug(f"TMDB API request: {endpoint} (attempt {attempt + 1})")
                async with self.session.get(url, params=params, timeout=aiohttp.ClientTimeout(total=30)) as resp:
                    if resp.status == 401:
                        raise TMDBAPIError("Invalid TMDB API key")
                    elif resp.status == 404:
                        raise TMDBAPIError(f"Resource not found: {endpoint}")
                    elif resp.status == 429:
                        # Rate limit - wait as instructed, then retry.
                        retry_after = int(resp.headers.get('Retry-After', delay * 2))
                        logger.warning(f"Rate limited, waiting {retry_after}s")
                        # Record why this attempt failed so the final error is
                        # informative if every attempt is rate limited.
                        last_error = TMDBAPIError("rate limited (HTTP 429)")
                        await asyncio.sleep(retry_after)
                        continue
                    resp.raise_for_status()
                    data = await resp.json()
                    self._cache[cache_key] = data
                    return data
            except (aiohttp.ClientError, asyncio.TimeoutError) as e:
                # asyncio.TimeoutError (raised by ClientTimeout) is NOT an
                # aiohttp.ClientError subclass, so it must be listed
                # explicitly or timeouts would escape the retry loop.
                last_error = e
                if attempt < max_retries - 1:
                    logger.warning(f"Request failed (attempt {attempt + 1}): {e}, retrying in {delay}s")
                    await asyncio.sleep(delay)
                    delay *= 2
                else:
                    logger.error(f"Request failed after {max_retries} attempts: {e}")
        raise TMDBAPIError(f"Request failed after {max_retries} attempts: {last_error}")

    async def search_tv_show(
        self,
        query: str,
        language: str = "de-DE",
        page: int = 1
    ) -> Dict[str, Any]:
        """Search for TV shows by name.

        Args:
            query: Search query (show name)
            language: Language for results (default: German)
            page: Page number for pagination

        Returns:
            Search results with list of shows

        Example:
            >>> results = await client.search_tv_show("Attack on Titan")
            >>> shows = results["results"]
        """
        return await self._request(
            "search/tv",
            {"query": query, "language": language, "page": page}
        )

    async def get_tv_show_details(
        self,
        tv_id: int,
        language: str = "de-DE",
        append_to_response: Optional[str] = None
    ) -> Dict[str, Any]:
        """Get detailed information about a TV show.

        Args:
            tv_id: TMDB TV show ID
            language: Language for metadata
            append_to_response: Additional data to include (e.g., "credits,images")

        Returns:
            TV show details including metadata, cast, etc.
        """
        params = {"language": language}
        if append_to_response:
            params["append_to_response"] = append_to_response
        return await self._request(f"tv/{tv_id}", params)

    async def get_tv_show_external_ids(self, tv_id: int) -> Dict[str, Any]:
        """Get external IDs (IMDB, TVDB) for a TV show.

        Args:
            tv_id: TMDB TV show ID

        Returns:
            Dictionary with external IDs (imdb_id, tvdb_id, etc.)
        """
        return await self._request(f"tv/{tv_id}/external_ids")

    async def get_tv_show_images(
        self,
        tv_id: int,
        language: Optional[str] = None
    ) -> Dict[str, Any]:
        """Get images (posters, backdrops, logos) for a TV show.

        Args:
            tv_id: TMDB TV show ID
            language: Language filter for images (None = all languages)

        Returns:
            Dictionary with poster, backdrop, and logo lists
        """
        params = {}
        if language:
            params["language"] = language
        return await self._request(f"tv/{tv_id}/images", params)

    async def download_image(
        self,
        image_path: str,
        local_path: Path,
        size: str = "original"
    ) -> None:
        """Download an image from TMDB.

        Args:
            image_path: Image path from TMDB API (e.g., "/abc123.jpg")
            local_path: Local file path to save image
            size: Image size (w500, original, etc.)

        Raises:
            TMDBAPIError: If download fails (including on timeout)
        """
        await self._ensure_session()
        url = f"{self.image_base_url}/{size}{image_path}"
        try:
            logger.debug(f"Downloading image from {url}")
            async with self.session.get(url, timeout=aiohttp.ClientTimeout(total=60)) as resp:
                resp.raise_for_status()
                # Ensure parent directory exists
                local_path.parent.mkdir(parents=True, exist_ok=True)
                # Write image data
                with open(local_path, "wb") as f:
                    f.write(await resp.read())
                logger.info(f"Downloaded image to {local_path}")
        except (aiohttp.ClientError, asyncio.TimeoutError) as e:
            # Include TimeoutError so slow downloads surface as the
            # documented TMDBAPIError instead of a raw asyncio error.
            raise TMDBAPIError(f"Failed to download image: {e}")

    def get_image_url(self, image_path: str, size: str = "original") -> str:
        """Get full URL for an image.

        Args:
            image_path: Image path from TMDB API (starts with "/")
            size: Image size (w500, original, etc.)

        Returns:
            Full image URL
        """
        return f"{self.image_base_url}/{size}{image_path}"

    async def close(self):
        """Close the aiohttp session and clean up resources."""
        if self.session and not self.session.closed:
            await self.session.close()
            logger.debug("TMDB client session closed")

    def clear_cache(self):
        """Clear the request cache."""
        self._cache.clear()
        logger.debug("TMDB client cache cleared")

View File

@@ -0,0 +1,295 @@
"""Image downloader utility for NFO media files.
This module provides functions to download poster, logo, and fanart images
from TMDB and validate them.
Example:
>>> downloader = ImageDownloader()
>>> await downloader.download_poster(poster_url, "/path/to/poster.jpg")
"""
import asyncio
import logging
from pathlib import Path
from typing import Optional
import aiohttp
from PIL import Image
logger = logging.getLogger(__name__)
class ImageDownloadError(Exception):
    """Raised when an image download or post-download validation fails."""
class ImageDownloader:
    """Utility for downloading and validating images.

    A new aiohttp session is opened per download call; there is no shared
    connection pool in this class.

    Attributes:
        max_retries: Maximum retry attempts for downloads
        timeout: Request timeout in seconds
        min_file_size: Minimum valid file size in bytes
    """

    def __init__(
        self,
        max_retries: int = 3,
        timeout: int = 60,
        min_file_size: int = 1024  # 1 KB — anything smaller is treated as corrupt
    ):
        """Initialize image downloader.

        Args:
            max_retries: Maximum retry attempts
            timeout: Request timeout in seconds
            min_file_size: Minimum valid file size in bytes
        """
        self.max_retries = max_retries
        self.timeout = timeout
        self.min_file_size = min_file_size

    async def download_image(
        self,
        url: str,
        local_path: Path,
        skip_existing: bool = True,
        validate: bool = True
    ) -> bool:
        """Download an image from URL to local path.

        Retries with exponential backoff on network errors, undersized
        payloads, and validation failures. An HTTP 404 is treated as a
        non-retryable "image does not exist" and returns False.

        Args:
            url: Image URL
            local_path: Local file path to save image
            skip_existing: Skip download if file already exists
            validate: Validate image after download

        Returns:
            True if download successful, False otherwise

        Raises:
            ImageDownloadError: If download fails after retries
        """
        # Check if file already exists; an existing-but-undersized file is
        # treated as incomplete and re-downloaded.
        if skip_existing and local_path.exists():
            if local_path.stat().st_size >= self.min_file_size:
                logger.debug(f"Image already exists: {local_path}")
                return True
        # Ensure parent directory exists
        local_path.parent.mkdir(parents=True, exist_ok=True)
        delay = 1
        last_error = None
        for attempt in range(self.max_retries):
            try:
                logger.debug(f"Downloading image from {url} (attempt {attempt + 1})")
                timeout = aiohttp.ClientTimeout(total=self.timeout)
                async with aiohttp.ClientSession(timeout=timeout) as session:
                    async with session.get(url) as resp:
                        if resp.status == 404:
                            # Missing artwork is expected for some shows; do
                            # not retry, just report "not downloaded".
                            logger.warning(f"Image not found: {url}")
                            return False
                        resp.raise_for_status()
                        # Download image data (whole body in memory)
                        data = await resp.read()
                        # Check file size before writing anything to disk
                        if len(data) < self.min_file_size:
                            raise ImageDownloadError(
                                f"Downloaded file too small: {len(data)} bytes"
                            )
                        # Write to file
                        with open(local_path, "wb") as f:
                            f.write(data)
                        # Validate image if requested; a corrupt file is
                        # deleted and the attempt counts as a failure so the
                        # retry loop can fetch it again.
                        if validate and not self.validate_image(local_path):
                            local_path.unlink(missing_ok=True)
                            raise ImageDownloadError("Image validation failed")
                        logger.info(f"Downloaded image to {local_path}")
                        return True
            except (aiohttp.ClientError, IOError, ImageDownloadError) as e:
                last_error = e
                if attempt < self.max_retries - 1:
                    logger.warning(
                        f"Download failed (attempt {attempt + 1}): {e}, "
                        f"retrying in {delay}s"
                    )
                    await asyncio.sleep(delay)
                    # Exponential backoff: 1s, 2s, 4s, ...
                    delay *= 2
                else:
                    logger.error(
                        f"Download failed after {self.max_retries} attempts: {e}"
                    )
        raise ImageDownloadError(
            f"Failed to download image after {self.max_retries} attempts: {last_error}"
        )

    async def download_poster(
        self,
        url: str,
        series_folder: Path,
        filename: str = "poster.jpg",
        skip_existing: bool = True
    ) -> bool:
        """Download poster image (best-effort: errors are logged, not raised).

        Args:
            url: Poster URL
            series_folder: Series folder path
            filename: Output filename (default: poster.jpg)
            skip_existing: Skip if file exists

        Returns:
            True if successful
        """
        local_path = series_folder / filename
        try:
            return await self.download_image(url, local_path, skip_existing)
        except ImageDownloadError as e:
            logger.warning(f"Failed to download poster: {e}")
            return False

    async def download_logo(
        self,
        url: str,
        series_folder: Path,
        filename: str = "logo.png",
        skip_existing: bool = True
    ) -> bool:
        """Download logo image (best-effort: errors are logged, not raised).

        Args:
            url: Logo URL
            series_folder: Series folder path
            filename: Output filename (default: logo.png)
            skip_existing: Skip if file exists

        Returns:
            True if successful
        """
        local_path = series_folder / filename
        try:
            return await self.download_image(url, local_path, skip_existing)
        except ImageDownloadError as e:
            logger.warning(f"Failed to download logo: {e}")
            return False

    async def download_fanart(
        self,
        url: str,
        series_folder: Path,
        filename: str = "fanart.jpg",
        skip_existing: bool = True
    ) -> bool:
        """Download fanart/backdrop image (best-effort: errors are logged, not raised).

        Args:
            url: Fanart URL
            series_folder: Series folder path
            filename: Output filename (default: fanart.jpg)
            skip_existing: Skip if file exists

        Returns:
            True if successful
        """
        local_path = series_folder / filename
        try:
            return await self.download_image(url, local_path, skip_existing)
        except ImageDownloadError as e:
            logger.warning(f"Failed to download fanart: {e}")
            return False

    def validate_image(self, image_path: Path) -> bool:
        """Validate that file is a valid image.

        Uses PIL's verify(), which checks integrity without decoding the
        full image. Any exception (unreadable file, corrupt data) is
        treated as "invalid".

        Args:
            image_path: Path to image file

        Returns:
            True if valid image, False otherwise
        """
        try:
            with Image.open(image_path) as img:
                # Verify it's a valid image
                img.verify()
            # Check file size
            if image_path.stat().st_size < self.min_file_size:
                logger.warning(f"Image file too small: {image_path}")
                return False
            return True
        except Exception as e:
            logger.warning(f"Image validation failed for {image_path}: {e}")
            return False

    async def download_all_media(
        self,
        series_folder: Path,
        poster_url: Optional[str] = None,
        logo_url: Optional[str] = None,
        fanart_url: Optional[str] = None,
        skip_existing: bool = True
    ) -> dict[str, bool]:
        """Download all media files (poster, logo, fanart).

        Downloads run concurrently; a failure of one type does not abort
        the others (return_exceptions=True).

        Args:
            series_folder: Series folder path
            poster_url: Poster URL (optional)
            logo_url: Logo URL (optional)
            fanart_url: Fanart URL (optional)
            skip_existing: Skip existing files

        Returns:
            Dictionary with download status for each file type
        """
        results = {
            "poster": False,
            "logo": False,
            "fanart": False
        }
        tasks = []
        if poster_url:
            tasks.append(("poster", self.download_poster(
                poster_url, series_folder, skip_existing=skip_existing
            )))
        if logo_url:
            tasks.append(("logo", self.download_logo(
                logo_url, series_folder, skip_existing=skip_existing
            )))
        if fanart_url:
            tasks.append(("fanart", self.download_fanart(
                fanart_url, series_folder, skip_existing=skip_existing
            )))
        # Download concurrently
        if tasks:
            task_results = await asyncio.gather(
                *[task for _, task in tasks],
                return_exceptions=True
            )
            for (media_type, _), result in zip(tasks, task_results):
                if isinstance(result, Exception):
                    logger.error(f"Error downloading {media_type}: {result}")
                    results[media_type] = False
                else:
                    results[media_type] = result
        return results

View File

@@ -0,0 +1,192 @@
"""NFO XML generator for Kodi/XBMC format.
This module provides functions to generate tvshow.nfo XML files from
TVShowNFO Pydantic models, adapted from the scraper project.
Example:
>>> from src.core.entities.nfo_models import TVShowNFO
>>> nfo = TVShowNFO(title="Test Show", year=2020, tmdbid=12345)
>>> xml_string = generate_tvshow_nfo(nfo)
"""
import logging
from typing import Optional
from lxml import etree
from src.core.entities.nfo_models import TVShowNFO
logger = logging.getLogger(__name__)
def generate_tvshow_nfo(tvshow: TVShowNFO, pretty_print: bool = True) -> str:
    """Generate tvshow.nfo XML content from TVShowNFO model.

    Optional scalar fields are emitted only when non-empty (see
    _add_element); the element order below follows the usual Kodi
    tvshow.nfo layout and should not be reshuffled casually.

    Args:
        tvshow: TVShowNFO Pydantic model with metadata
        pretty_print: Whether to format XML with indentation

    Returns:
        XML string in Kodi/XBMC tvshow.nfo format, prefixed with an XML
        declaration

    Example:
        >>> nfo = TVShowNFO(title="Attack on Titan", year=2013)
        >>> xml = generate_tvshow_nfo(nfo)
    """
    root = etree.Element("tvshow")
    # Basic information
    _add_element(root, "title", tvshow.title)
    _add_element(root, "originaltitle", tvshow.originaltitle)
    _add_element(root, "showtitle", tvshow.showtitle)
    _add_element(root, "sorttitle", tvshow.sorttitle)
    _add_element(root, "year", str(tvshow.year) if tvshow.year else None)
    # Plot and description
    _add_element(root, "plot", tvshow.plot)
    _add_element(root, "outline", tvshow.outline)
    _add_element(root, "tagline", tvshow.tagline)
    # Technical details
    _add_element(root, "runtime", str(tvshow.runtime) if tvshow.runtime else None)
    _add_element(root, "mpaa", tvshow.mpaa)
    _add_element(root, "certification", tvshow.certification)
    # Status and dates
    _add_element(root, "premiered", tvshow.premiered)
    _add_element(root, "status", tvshow.status)
    _add_element(root, "dateadded", tvshow.dateadded)
    # Ratings: nested <ratings><rating name= max= default=>...</rating></ratings>
    if tvshow.ratings:
        ratings_elem = etree.SubElement(root, "ratings")
        for rating in tvshow.ratings:
            rating_elem = etree.SubElement(ratings_elem, "rating")
            if rating.name:
                rating_elem.set("name", rating.name)
            if rating.max_rating:
                rating_elem.set("max", str(rating.max_rating))
            if rating.default:
                rating_elem.set("default", "true")
            _add_element(rating_elem, "value", str(rating.value))
            if rating.votes is not None:
                _add_element(rating_elem, "votes", str(rating.votes))
    _add_element(root, "userrating", str(tvshow.userrating) if tvshow.userrating is not None else None)
    # IDs
    _add_element(root, "tmdbid", str(tvshow.tmdbid) if tvshow.tmdbid else None)
    _add_element(root, "imdbid", tvshow.imdbid)
    _add_element(root, "tvdbid", str(tvshow.tvdbid) if tvshow.tvdbid else None)
    # Legacy ID fields for compatibility with older scrapers
    _add_element(root, "id", str(tvshow.tvdbid) if tvshow.tvdbid else None)
    _add_element(root, "imdb_id", tvshow.imdbid)
    # Unique IDs: <uniqueid type= default=>value</uniqueid>
    for uid in tvshow.uniqueid:
        uid_elem = etree.SubElement(root, "uniqueid")
        uid_elem.set("type", uid.type)
        if uid.default:
            uid_elem.set("default", "true")
        uid_elem.text = uid.value
    # Multi-value fields: one element per entry
    for genre in tvshow.genre:
        _add_element(root, "genre", genre)
    for studio in tvshow.studio:
        _add_element(root, "studio", studio)
    for country in tvshow.country:
        _add_element(root, "country", country)
    for tag in tvshow.tag:
        _add_element(root, "tag", tag)
    # Thumbnails (posters, logos)
    for thumb in tvshow.thumb:
        thumb_elem = etree.SubElement(root, "thumb")
        if thumb.aspect:
            thumb_elem.set("aspect", thumb.aspect)
        if thumb.season is not None:
            thumb_elem.set("season", str(thumb.season))
        if thumb.type:
            thumb_elem.set("type", thumb.type)
        thumb_elem.text = str(thumb.url)
    # Fanart: all backdrop URLs grouped under a single <fanart> element
    if tvshow.fanart:
        fanart_elem = etree.SubElement(root, "fanart")
        for fanart in tvshow.fanart:
            fanart_thumb = etree.SubElement(fanart_elem, "thumb")
            fanart_thumb.text = str(fanart.url)
    # Named seasons
    for named_season in tvshow.namedseason:
        season_elem = etree.SubElement(root, "namedseason")
        season_elem.set("number", str(named_season.number))
        season_elem.text = named_season.name
    # Actors: one <actor> block each with name/role/thumb/profile/tmdbid
    for actor in tvshow.actors:
        actor_elem = etree.SubElement(root, "actor")
        _add_element(actor_elem, "name", actor.name)
        _add_element(actor_elem, "role", actor.role)
        _add_element(actor_elem, "thumb", str(actor.thumb) if actor.thumb else None)
        _add_element(actor_elem, "profile", str(actor.profile) if actor.profile else None)
        _add_element(actor_elem, "tmdbid", str(actor.tmdbid) if actor.tmdbid else None)
    # Additional fields; <watched> is always emitted (true/false)
    _add_element(root, "trailer", str(tvshow.trailer) if tvshow.trailer else None)
    _add_element(root, "watched", "true" if tvshow.watched else "false")
    if tvshow.playcount is not None:
        _add_element(root, "playcount", str(tvshow.playcount))
    # Generate XML string; declaration is added manually below so we can
    # emit the standalone="yes" form Kodi files typically carry.
    xml_str = etree.tostring(
        root,
        pretty_print=pretty_print,
        encoding="unicode",
        xml_declaration=False
    )
    # Add XML declaration
    xml_declaration = '<?xml version="1.0" encoding="UTF-8" standalone="yes"?>\n'
    return xml_declaration + xml_str
def _add_element(parent: etree.Element, tag: str, text: Optional[str]) -> Optional[etree.Element]:
"""Add a child element to parent if text is not None or empty.
Args:
parent: Parent XML element
tag: Tag name for child element
text: Text content (None or empty strings are skipped)
Returns:
Created element or None if skipped
"""
if text is not None and text != "":
elem = etree.SubElement(parent, tag)
elem.text = text
return elem
return None
def validate_nfo_xml(xml_string: str) -> bool:
    """Validate NFO XML structure.

    Args:
        xml_string: XML content to validate

    Returns:
        True if the string parses as well-formed XML, False otherwise
    """
    try:
        etree.fromstring(xml_string.encode('utf-8'))
    except etree.XMLSyntaxError as parse_error:
        logger.error(f"Invalid NFO XML: {parse_error}")
        return False
    return True