# devine/devine/core/tracks/tracks.py

from __future__ import annotations

import logging
import subprocess
from functools import partial
from pathlib import Path
from typing import Callable, Iterator, Optional, Sequence, Union

from langcodes import Language, closest_supported_match
from rich.progress import BarColumn, Progress, SpinnerColumn, TextColumn, TimeRemainingColumn
from rich.table import Table
from rich.tree import Tree

from devine.core.config import config
from devine.core.console import console
from devine.core.constants import LANGUAGE_MAX_DISTANCE, AnyTrack, TrackT
from devine.core.tracks.audio import Audio
from devine.core.tracks.chapters import Chapter, Chapters
from devine.core.tracks.subtitle import Subtitle
from devine.core.tracks.track import Track
from devine.core.tracks.video import Video
from devine.core.utilities import is_close_match, sanitize_filename
from devine.core.utils.collections import as_list, flatten


class Tracks:
    """
    Video, Audio, Subtitle, and Chapter Track Store.
    It provides convenience functions for listing, sorting, and selecting tracks.
    """

    # Display rank of each track type; lower values are listed first.
    # __str__() uses the values as its sort key (looked up by exact type) and
    # tree() walks the keys in this order to group tracks by type.
    TRACK_ORDER_MAP = {
        Video: 0,
        Audio: 1,
        Subtitle: 2,
        Chapter: 3
    }

    def __init__(self, *args: Union[Tracks, Sequence[Union[AnyTrack, Chapter, Chapters]], Track, Chapter, Chapters]):
        self.videos: list[Video] = []
        self.audio: list[Audio] = []
        self.subtitles: list[Subtitle] = []
        self.chapters = Chapters()

        if args:
            self.add(args)

    def __iter__(self) -> Iterator[AnyTrack]:
        return iter(as_list(self.videos, self.audio, self.subtitles))

    def __len__(self) -> int:
        return len(self.videos) + len(self.audio) + len(self.subtitles)

    def __add__(
        self,
        other: Union[Tracks, Sequence[Union[AnyTrack, Chapter, Chapters]], Track, Chapter, Chapters]
    ) -> Tracks:
        """
        Support `tracks + other` by adding `other` to this store via add().

        The left-hand store is modified in place and is itself the return value;
        no new Tracks object is created. Since add() is called with its default
        warn_only=False, a duplicate track raises ValueError.
        """
        self.add(other)
        return self

    def __repr__(self) -> str:
        return "{name}({items})".format(
            name=self.__class__.__name__,
            items=", ".join([f"{k}={repr(v)}" for k, v in self.__dict__.items()])
        )

    def __str__(self) -> str:
        rep = {
            Video: [],
            Audio: [],
            Subtitle: [],
            Chapter: []
        }
        tracks = [*list(self), *self.chapters]

        for track in sorted(tracks, key=lambda t: self.TRACK_ORDER_MAP[type(t)]):
            if not rep[type(track)]:
                count = sum(type(x) is type(track) for x in tracks)
                rep[type(track)].append("{count} {type} Track{plural}{colon}".format(
                    count=count,
                    type=track.__class__.__name__,
                    plural="s" if count != 1 else "",
                    colon=":" if count > 0 else ""
                ))
            rep[type(track)].append(str(track))

        for type_ in list(rep):
            if not rep[type_]:
                del rep[type_]
                continue
            rep[type_] = "\n".join(
                [rep[type_][0]] +
                [f"├─ {x}" for x in rep[type_][1:-1]] +
                [f"└─ {rep[type_][-1]}"]
            )
        rep = "\n".join(list(rep.values()))

        return rep

    def tree(self, add_progress: bool = False) -> tuple[Tree, list[partial]]:
        all_tracks = [*list(self), *self.chapters]

        progress_callables = []

        tree = Tree("", hide_root=True)
        for track_type in self.TRACK_ORDER_MAP:
            tracks = list(x for x in all_tracks if isinstance(x, track_type))
            if not tracks:
                continue
            num_tracks = len(tracks)
            track_type_plural = track_type.__name__ + ("s" if track_type != Audio and num_tracks != 1 else "")
            tracks_tree = tree.add(f"[repr.number]{num_tracks}[/] {track_type_plural}")
            for track in tracks:
                if add_progress and track_type != Chapter:
                    progress = Progress(
                        SpinnerColumn(finished_text=""),
                        BarColumn(),
                        "•",
                        TimeRemainingColumn(compact=True, elapsed_when_finished=True),
                        "•",
                        TextColumn("[progress.data.speed]{task.fields[downloaded]}"),
                        console=console,
                        speed_estimate_period=10
                    )
                    task = progress.add_task("", downloaded="-")
                    progress_callables.append(partial(progress.update, task_id=task))
                    track_table = Table.grid()
                    track_table.add_row(str(track)[6:], style="text2")
                    track_table.add_row(progress)
                    tracks_tree.add(track_table)
                else:
                    tracks_tree.add(str(track)[6:], style="text2")

        return tree, progress_callables

    def exists(self, by_id: Optional[str] = None, by_url: Optional[Union[str, list[str]]] = None) -> bool:
        """Check if a track already exists by various methods."""
        if by_id:  # recommended
            return any(x.id == by_id for x in self)
        if by_url:
            return any(x.url == by_url for x in self)
        return False

    def add(
        self,
        tracks: Union[Tracks, Sequence[Union[AnyTrack, Chapter, Chapters]], Track, Chapter, Chapters],
        warn_only: bool = False
    ) -> None:
        """Add a provided track to its appropriate array and ensuring it's not a duplicate."""
        if isinstance(tracks, Tracks):
            tracks = [*list(tracks), *tracks.chapters]

        duplicates = 0
        for track in flatten(tracks):
            if self.exists(by_id=track.id):
                if not warn_only:
                    raise ValueError(
                        "One or more of the provided Tracks is a duplicate. "
                        "Track IDs must be unique but accurate using static values. The "
                        "value should stay the same no matter when you request the same "
                        "content. Use a value that has relation to the track content "
                        "itself and is static or permanent and not random/RNG data that "
                        "wont change each refresh or conflict in edge cases."
                    )
                duplicates += 1
                continue

            if isinstance(track, Video):
                self.videos.append(track)
            elif isinstance(track, Audio):
                self.audio.append(track)
            elif isinstance(track, Subtitle):
                self.subtitles.append(track)
            elif isinstance(track, Chapter):
                self.chapters.add(track)
            else:
                raise ValueError("Track type was not set or is invalid.")

        log = logging.getLogger("Tracks")

        if duplicates:
            log.warning(f" - Found and skipped {duplicates} duplicate tracks...")

    def sort_videos(self, by_language: Optional[Sequence[Union[str, Language]]] = None) -> None:
        """Sort video tracks by bitrate, and optionally language."""
        if not self.videos:
            return
        # bitrate
        self.videos.sort(
            key=lambda x: float(x.bitrate or 0.0),
            reverse=True
        )
        # language
        for language in reversed(by_language or []):
            if str(language) == "all":
                language = next((x.language for x in self.videos if x.is_original_lang), "")
            if not language:
                continue
            self.videos.sort(key=lambda x: str(x.language))
            self.videos.sort(key=lambda x: not is_close_match(language, [x.language]))

    def sort_audio(self, by_language: Optional[Sequence[Union[str, Language]]] = None) -> None:
        """Sort audio tracks by bitrate, descriptive, and optionally language."""
        if not self.audio:
            return
        # bitrate
        self.audio.sort(
            key=lambda x: float(x.bitrate or 0.0),
            reverse=True
        )
        # descriptive
        self.audio.sort(key=lambda x: str(x.language) if x.descriptive else "")
        # language
        for language in reversed(by_language or []):
            if str(language) == "all":
                language = next((x.language for x in self.audio if x.is_original_lang), "")
            if not language:
                continue
            self.audio.sort(key=lambda x: str(x.language))
            self.audio.sort(key=lambda x: not is_close_match(language, [x.language]))

    def sort_subtitles(self, by_language: Optional[Sequence[Union[str, Language]]] = None) -> None:
        """
        Sort subtitle tracks by various track attributes to a common P2P standard.
        You may optionally provide a sequence of languages to prioritize to the top.

        Section Order:
          - by_language groups prioritized to top, and ascending alphabetically
          - then rest ascending alphabetically after the prioritized groups
          (Each section ascending alphabetically, but separated)

        Language Group Order:
          - Forced
          - Normal
          - Hard of Hearing (SDH/CC)
          (Least to most captions expected in the subtitle)
        """
        if not self.subtitles:
            return
        # language groups
        self.subtitles.sort(key=lambda x: str(x.language))
        self.subtitles.sort(key=lambda x: x.sdh or x.cc)
        self.subtitles.sort(key=lambda x: x.forced, reverse=True)
        # sections
        for language in reversed(by_language or []):
            if str(language) == "all":
                language = next((x.language for x in self.subtitles if x.is_original_lang), "")
            if not language:
                continue
            self.subtitles.sort(key=lambda x: is_close_match(language, [x.language]), reverse=True)

    def select_video(self, x: Callable[[Video], bool]) -> None:
        self.videos = list(filter(x, self.videos))

    def select_audio(self, x: Callable[[Audio], bool]) -> None:
        self.audio = list(filter(x, self.audio))

    def select_subtitles(self, x: Callable[[Subtitle], bool]) -> None:
        self.subtitles = list(filter(x, self.subtitles))

    def by_resolutions(self, resolutions: list[int], per_resolution: int = 0) -> None:
        # Note: Do not merge these list comprehensions. They must be done separately so the results
        # from the 16:9 canvas check is only used if there's no exact height resolution match.
        selected = []
        for resolution in resolutions:
            matches = [  # exact matches
                x
                for x in self.videos
                if x.height == resolution
            ]
            if not matches:
                matches = [  # 16:9 canvas matches
                    x
                    for x in self.videos
                    if int(x.width * (9 / 16)) == resolution
                ]
            selected.extend(matches[:per_resolution or None])
        self.videos = selected

    @staticmethod
    def by_language(tracks: list[TrackT], languages: list[str], per_language: int = 0) -> list[TrackT]:
        """
        Pick the tracks matching each requested language, grouped in request order.

        Parameters:
            tracks: Tracks to choose from; the list itself is not modified.
            languages: Languages to select, in the order the results should appear.
            per_language: Maximum tracks kept per language; 0 keeps every match.

        A track matches when closest_supported_match() returns a truthy result for
        its language against the requested one within LANGUAGE_MAX_DISTANCE.
        """
        limit = per_language or None
        picked = []
        for wanted in languages:
            matching = [
                track
                for track in tracks
                if closest_supported_match(track.language, [wanted], LANGUAGE_MAX_DISTANCE)
            ]
            picked += matching[:limit]
        return picked

    def mux(self, title: str, delete: bool = True, progress: Optional[partial] = None) -> tuple[Path, int]:
        """
        Multiplex all the Tracks into a Matroska Container file.

        Parameters:
            title: Set the Matroska Container file title. Usually displayed in players
                instead of the filename if set.
            delete: Delete all track files after multiplexing.
            progress: Update a rich progress bar via `completed=...`. This must be the
                progress object's update() func, pre-set with task id via functools.partial.
        """
        cl = [
            "mkvmerge",
            "--no-date",  # remove dates from the output for security
        ]

        if config.muxing.get("set_title", True):
            cl.extend(["--title", title])

        for i, vt in enumerate(self.videos):
            if not vt.path or not vt.path.exists():
                raise ValueError("Video Track must be downloaded before muxing...")
            if callable(vt.OnMultiplex):
                vt.OnMultiplex()
            cl.extend([
                "--language", f"0:{vt.language}",
                "--default-track", f"0:{i == 0}",
                "--original-flag", f"0:{vt.is_original_lang}",
                "--compression", "0:none",  # disable extra compression
                "(", str(vt.path), ")"
            ])

        for i, at in enumerate(self.audio):
            if not at.path or not at.path.exists():
                raise ValueError("Audio Track must be downloaded before muxing...")
            if callable(at.OnMultiplex):
                at.OnMultiplex()
            cl.extend([
                "--track-name", f"0:{at.get_track_name() or ''}",
                "--language", f"0:{at.language}",
                "--default-track", f"0:{i == 0}",
                "--visual-impaired-flag", f"0:{at.descriptive}",
                "--original-flag", f"0:{at.is_original_lang}",
                "--compression", "0:none",  # disable extra compression
                "(", str(at.path), ")"
            ])

        for st in self.subtitles:
            if not st.path or not st.path.exists():
                raise ValueError("Text Track must be downloaded before muxing...")
            if callable(st.OnMultiplex):
                st.OnMultiplex()
            default = bool(self.audio and is_close_match(st.language, [self.audio[0].language]) and st.forced)
            cl.extend([
                "--track-name", f"0:{st.get_track_name() or ''}",
                "--language", f"0:{st.language}",
                "--sub-charset", "0:UTF-8",
                "--forced-track", f"0:{st.forced}",
                "--default-track", f"0:{default}",
                "--hearing-impaired-flag", f"0:{st.sdh}",
                "--original-flag", f"0:{st.is_original_lang}",
                "--compression", "0:none",  # disable extra compression (probably zlib)
                "(", str(st.path), ")"
            ])

        if self.chapters:
            chapters_path = config.directories.temp / config.filenames.chapters.format(
                title=sanitize_filename(title),
                random=self.chapters.id
            )
            self.chapters.dump(chapters_path, fallback_name=config.chapter_fallback_name)
            cl.extend(["--chapter-charset", "UTF-8", "--chapters", str(chapters_path)])
        else:
            chapters_path = None

        output_path = (
            self.videos[0].path.with_suffix(".muxed.mkv") if self.videos else
            self.audio[0].path.with_suffix(".muxed.mka") if self.audio else
            self.subtitles[0].path.with_suffix(".muxed.mks") if self.subtitles else
            chapters_path.with_suffix(".muxed.mkv") if self.chapters else
            None
        )
        if not output_path:
            raise ValueError("No tracks provided, at least one track must be provided.")

        # let potential failures go to caller, caller should handle
        try:
            p = subprocess.Popen([
                *cl,
                "--output", str(output_path),
                "--gui-mode"
            ], text=True, stdout=subprocess.PIPE)
            for line in iter(p.stdout.readline, ""):
                if "progress" in line:
                    progress(total=100, completed=int(line.strip()[14:-1]))
            return output_path, p.wait()
        finally:
            if chapters_path:
                # regardless of delete param, we delete as it's a file we made during muxing
                chapters_path.unlink()
            if delete:
                for track in self:
                    track.delete()


# Names exported by `from <this module> import *`.
__all__ = ("Tracks",)