feat: moved cli helpers to seperate file

feat: completely dynamified the datasource import
feat: auto import pages in page module
2024-05-27 13:41:24 +02:00 · 2024-05-24 17:00:39 +02:00 · 2024-05-24 15:46:42 +02:00 · 2024-05-24 15:28:47 +02:00 · 2024-05-24 14:46:38 +02:00 · 2024-05-24 13:21:07 +02:00
28 changed files with 1075 additions and 761 deletions
--- a/.vscode/launch.json
+++ b/.vscode/launch.json
@@ -17,6 +17,12 @@
            "request": "launch",
            "program": "development/actual_donwload.py",
            "console": "integratedTerminal"
        },
        {
            "name": "Python Debugger: Music Kraken",
            "type": "debugpy",
            "request": "launch", // run the module
            "module": "music_kraken",
        }
    ]
 }
--- a/.vscode/settings.json
+++ b/.vscode/settings.json
@@ -27,6 +27,7 @@
        "Gitea",
        "iframe",
        "isrc",
        "itemprop",
        "levenshtein",
        "metallum",
        "MUSICBRAINZ",
--- a/development/actual_donwload.py
+++ b/development/actual_donwload.py
@@ -6,9 +6,10 @@ logging.getLogger().setLevel(logging.DEBUG)
 if __name__ == "__main__":
    commands = [
-        "s: #a I'm in a coffin",
+        "s: #a Crystal F",
-        "0",
+        "10",
-        "d: 0",
+        "1",
        "3",
    ]
--- a/music_kraken/audio/metadata.py
+++ b/music_kraken/audio/metadata.py
@@ -93,6 +93,10 @@ def write_metadata_to_target(metadata: Metadata, target: Target, song: Song):
            # resize the image to the preferred resolution
            img.thumbnail((main_settings["preferred_artwork_resolution"], main_settings["preferred_artwork_resolution"]))
            # https://stackoverflow.com/a/59476938/16804841
            if img.mode != 'RGB':
                img = img.convert('RGB')
            img.save(converted_target.file_path, "JPEG")
        # https://stackoverflow.com/questions/70228440/mutagen-how-can-i-correctly-embed-album-art-into-mp3-file-so-that-i-can-see-t
--- a/music_kraken/cli/main_downloader.py
+++ b/music_kraken/cli/main_downloader.py
@@ -1,89 +1,25 @@
 import random
 from typing import Set, Type, Dict, List
 from pathlib import Path
 import re
 from pathlib import Path
 from typing import Dict, Generator, List, Set, Type
-from .utils import cli_function
+from .. import console
-from .options.first_config import initial_config
+from ..download import Downloader, Page, components
-
+from ..download.results import GoToResults
-from ..utils import output, BColors
+from ..download.results import Option as ResultOption
-from ..utils.config import write_config, main_settings
+from ..download.results import PageResults, Results
-from ..utils.shared import URL_PATTERN
+from ..objects import Album, Artist, DatabaseObject, Song
-from ..utils.string_processing import fit_to_file_system
+from ..utils import BColors, output
-from ..utils.support_classes.query import Query
+from ..utils.config import main_settings, write_config
-from ..utils.support_classes.download_result import DownloadResult
+from ..utils.enums.colors import BColors
 from ..utils.exception import MKInvalidInputException
 from ..utils.exception.download import UrlNotFoundException
-from ..utils.enums.colors import BColors
+from ..utils.shared import URL_PATTERN
-from .. import console
+from ..utils.string_processing import fit_to_file_system
-
+from ..utils.support_classes.download_result import DownloadResult
-from ..download.results import Results, Option, PageResults, GoToResults
+from ..utils.support_classes.query import Query
-from ..download.page_attributes import Pages
+from .options.first_config import initial_config
-from ..pages import Page
+from .utils import ask_for_bool, cli_function
 from ..objects import Song, Album, Artist, DatabaseObject
 """
 This is the implementation of the Shell
 # Behaviour
 ## Searching
 ```mkshell
 > s: {querry or url}
 # examples
 > s: https://musify.club/release/some-random-release-183028492
 > s: r: #a an Artist #r some random Release
 ```
 Searches for an url, or an query
 ### Query Syntax
 ```
 #a {artist} #r {release} #t {track}
 ```
 You can escape stuff like `#` doing this: `\#`
 ## Downloading
 To download something, you either need a direct link, or you need to have already searched for options
 ```mkshell
 > d: {option ids or direct url}
 # examples
 > d: 0, 3, 4
 > d: 1
 > d: https://musify.club/release/some-random-release-183028492
 ```
 ## Misc
 ### Exit
 ```mkshell
 > q
 > quit
 > exit
 > abort
 ```
 ### Current Options
 ```mkshell
 > .
 ```
 ### Previous Options
 ```
 > ..
 ```
 """
 EXIT_COMMANDS = {"q", "quit", "exit", "abort"}
 ALPHABET = "abcdefghijklmnopqrstuvwxyz"
@@ -91,50 +27,19 @@ PAGE_NAME_FILL = "-"
 MAX_PAGE_LEN = 21
 def get_existing_genre() -> List[str]:
    """
    gets the name of all subdirectories of shared.MUSIC_DIR,
    but filters out all directories, where the name matches with any patern
    from shared.NOT_A_GENRE_REGEX.
    """
    existing_genres: List[str] = []
    # get all subdirectories of MUSIC_DIR, not the files in the dir.
    existing_subdirectories: List[Path] = [f for f in main_settings["music_directory"].iterdir() if f.is_dir()]
    for subdirectory in existing_subdirectories:
        name: str = subdirectory.name
        if not any(re.match(regex_pattern, name) for regex_pattern in main_settings["not_a_genre_regex"]):
            existing_genres.append(name)
    existing_genres.sort()
    return existing_genres
 def get_genre():
-    existing_genres = get_existing_genre()
+    select_genre = components.GenreSelect()
-    for i, genre_option in enumerate(existing_genres):
+    select_genre._ask_for_creating_option = lambda key: ask_for_bool(f"Create the genre \"{key}\"")
        print(f"{i + 1:0>2}: {genre_option}")
-    while True:
+    genre: Optional[components.Option] = None
        genre = input("Id or new genre: ")
-        if genre.isdigit():
+    while genre is None:
-            genre_id = int(genre) - 1
+        for genre in select_genre:
-            if genre_id >= len(existing_genres):
+            print(genre)
                print(f"No genre under the id {genre_id + 1}.")
                continue
-            return existing_genres[genre_id]
+        genre = select_genre.choose(input("Id or new genre: "))
-        new_genre = fit_to_file_system(genre)
+    return genre.value
        agree_inputs = {"y", "yes", "ok"}
        verification = input(f"create new genre \"{new_genre}\"? (Y/N): ").lower()
        if verification in agree_inputs:
            return new_genre
 def help_message():
@@ -143,7 +48,7 @@ def help_message():
    print()
-class Downloader:
+class CliDownloader:
    def __init__(
            self,
            exclude_pages: Set[Type[Page]] = None,
@@ -153,7 +58,7 @@ class Downloader:
            genre: str = None,
            process_metadata_anyway: bool = False,
    ) -> None:
-        self.pages: Pages = Pages(exclude_pages=exclude_pages, exclude_shady=exclude_shady)
+        self.pages: Downloader = Downloader(exclude_pages=exclude_pages, exclude_shady=exclude_shady)
        self.page_dict: Dict[str, Type[Page]] = dict()
@@ -177,7 +82,7 @@ class Downloader:
        page_count = 0
        for option in self.current_results.formatted_generator():
-            if isinstance(option, Option):
+            if isinstance(option, ResultOption):
                r = f"{BColors.GREY.value}{option.index:0{self.option_digits}}{BColors.ENDC.value} {option.music_object.option_string}"
                print(r)
            else:
@@ -446,7 +351,7 @@ def download(
        else:
            print(f"{BColors.FAIL.value}Something went wrong configuring.{BColors.ENDC.value}")
-    shell = Downloader(genre=genre, process_metadata_anyway=process_metadata_anyway)
+    shell = CliDownloader(genre=genre, process_metadata_anyway=process_metadata_anyway)
    if command_list is not None:
        for command in command_list:
--- a/music_kraken/cli/utils.py
+++ b/music_kraken/cli/utils.py
@@ -39,4 +39,8 @@ def print_cute_message():
        print(message)
 AGREE_INPUTS = {"y", "yes", "ok"}
 def ask_for_bool(msg: str) -> bool:
    i = input(msg + " (Y/N):").lower()
    return i in AGREE_INPUTS
--- a/music_kraken/connection/cache.py
+++ b/music_kraken/connection/cache.py
@@ -137,13 +137,13 @@ class Cache:
        )
        self._write_attribute(cache_attribute)
-        cache_path = fit_to_file_system(Path(module_path, name), hidden_ok=True)
+        cache_path = fit_to_file_system(Path(module_path, name.replace("/", "_")), hidden_ok=True)
        with cache_path.open("wb") as content_file:
            self.logger.debug(f"writing cache to {cache_path}")
            content_file.write(content)
    def get(self, name: str) -> Optional[CacheResult]:
-        path = fit_to_file_system(Path(self._dir, self.module, name), hidden_ok=True)
+        path = fit_to_file_system(Path(self._dir, self.module, name.replace("/", "_")), hidden_ok=True)
        if not path.is_file():
            return None
@@ -166,7 +166,7 @@ class Cache:
            if ca.name == "":
                continue
-            file = fit_to_file_system(Path(self._dir, ca.module, ca.name), hidden_ok=True)
+            file = fit_to_file_system(Path(self._dir, ca.module, ca.name.replace("/", "_")), hidden_ok=True)
            if not ca.is_valid:
                self.logger.debug(f"deleting cache {ca.id}")
--- a/music_kraken/download/init.py
+++ b/music_kraken/download/init.py
@@ -1,8 +1,36 @@
-from dataclasses import dataclass, field
+from __future__ import annotations
 from typing import Set
-from ..utils.config import main_settings
+import logging
 import random
 import re
 from collections import defaultdict
 from copy import copy
 from dataclasses import dataclass, field
 from pathlib import Path
 from string import Formatter
 from typing import (TYPE_CHECKING, Any, Callable, Dict, Generator, List,
                    Optional, Set, Tuple, Type, TypedDict, Union)
 import requests
 from bs4 import BeautifulSoup
 from ..audio import correct_codec, write_metadata_to_target
 from ..connection import Connection
 from ..objects import Album, Artist, Collection
 from ..objects import DatabaseObject as DataObject
 from ..objects import Label, Options, Song, Source, Target
 from ..utils import BColors, output, trace
 from ..utils.config import main_settings, youtube_settings
 from ..utils.enums import ALL_SOURCE_TYPES, SourceType
 from ..utils.enums.album import AlbumType
 from ..utils.exception import MKComposeException, MKMissingNameException
 from ..utils.exception.download import UrlNotFoundException
 from ..utils.path_manager import LOCATIONS
 from ..utils.shared import DEBUG_PAGES
 from ..utils.string_processing import fit_to_file_system
 from ..utils.support_classes.download_result import DownloadResult
 from ..utils.support_classes.query import Query
 from .results import SearchResults
@dataclass
@@ -19,3 +47,409 @@ class DownloadOptions:
    download_again_if_found: bool = False
    process_audio_if_found: bool = False
    process_metadata_if_found: bool = True
 fetch_map = {
    Song: "fetch_song",
    Album: "fetch_album",
    Artist: "fetch_artist",
    Label: "fetch_label",
 }
 class Downloader:
    def __init__(
        self, 
        auto_register_pages: bool = True, 
        download_options: DownloadOptions = None, 
        fetch_options: FetchOptions = None, 
        **kwargs
    ):
        self.LOGGER = logging.getLogger("download")
        self.download_options: DownloadOptions = download_options or DownloadOptions()
        self.fetch_options: FetchOptions = fetch_options or FetchOptions()
        self._registered_pages: Dict[Type[Page], Set[Page]] = defaultdict(set)
        if auto_register_pages:
            self.scan_for_pages(**kwargs)
    def register_page(self, page_type: Type[Page], **kwargs):
        if page_type in self._registered_pages:
            return
        self._registered_pages[page_type].add(page_type(
            download_options=self.download_options, 
            fetch_options=self.fetch_options, 
            **kwargs
        ))
    def deregister_page(self, page_type: Type[Page]):
        if page_type not in _registered_pages:
            return
        for p in self._registered_pages[page_type]:
            p.__del__()
        del self._registered_pages[page_type]
    def scan_for_pages(self, **kwargs):
        # assuming the wanted pages are the leaf classes of the interface
        from .. import pages
        leaf_classes = []
        class_list = [Page]
        while len(class_list):
            _class = class_list.pop()
            class_subclasses = _class.__subclasses__()
            if len(class_subclasses) == 0:
                if _class.REGISTER:
                    leaf_classes.append(_class)
            else:
                class_list.extend(class_subclasses)
        if Page in leaf_classes:
            self.LOGGER.warn("couldn't find any data source")
            return
        for leaf_class in leaf_classes:
            self.register_page(leaf_class, **kwargs)
    def get_pages(self, *page_types: List[Type[Page]]) -> Generator[Page, None, None]:
        if len(page_types) == 0:
            page_types = _registered_pages.keys()
        for page_type in page_types:
            yield from self._registered_pages[page_type]
    def search(self, query: Query) -> SearchResults:
        result = SearchResults()
        for page in self.get_pages():
            result.add(
                page=type(page),
                search_result=page.search(query=query)
            )
        return result
    def fetch_details(self, data_object: DataObject, stop_at_level: int = 1, **kwargs) -> DataObject:
        source: Source
        for source in data_object.source_collection.get_sources(source_type_sorting={
            "only_with_page": True,
        }):
            new_data_object = self.fetch_from_source(source=source, stop_at_level=stop_at_level)
            if new_data_object is not None:
                data_object.merge(new_data_object)
        return data_object
    def fetch_from_source(self, source: Source, **kwargs) -> Optional[DataObject]:
        if not source.has_page:
            return None
        source_type = source.page.get_source_type(source=source)
        if source_type is None:
            self.LOGGER.debug(f"Could not determine source type for {source}.")
            return None
        func = getattr(source.page, fetch_map[source_type])
        # fetching the data object and marking it as fetched
        data_object: DataObject = func(source=source, **kwargs)
        data_object.mark_as_fetched(source.hash_url)
        return data_object
    def fetch_from_url(self, url: str) -> Optional[DataObject]:
        source = Source.match_url(url, ALL_SOURCE_TYPES.MANUAL)
        if source is None:
            return None
        return self.fetch_from_source(source=source)
    def _skip_object(self, data_object: DataObject) -> bool:
        if isinstance(data_object, Album):
            if not self.download_options.download_all and data_object.album_type in self.download_options.album_type_blacklist:
                return True
        return False
    def download(self, data_object: DataObject, genre: str, **kwargs) -> DownloadResult:
        # fetch the given object
        self.fetch_details(data_object)
        output(f"\nDownloading {data_object.option_string}...", color=BColors.BOLD)
        # fetching all parent objects (e.g. if you only download a song)
        if not kwargs.get("fetched_upwards", False):
            to_fetch: List[DataObject] = [data_object]
            while len(to_fetch) > 0:
                new_to_fetch = []
                for d in to_fetch:
                    if self._skip_object(d):
                        continue
                    self.fetch_details(d)
                    for c in d.get_parent_collections():
                        new_to_fetch.extend(c)
                to_fetch = new_to_fetch
            kwargs["fetched_upwards"] = True
        # download all children
        download_result: DownloadResult = DownloadResult()
        for c in data_object.get_child_collections():
            for d in c:
                if self._skip_object(d):
                    continue
                download_result.merge(self.download(d, genre, **kwargs))
        # actually download if the object is a song
        if isinstance(data_object, Song):
            """
            TODO
            add the traced artist and album to the naming.
            I am able to do that, because duplicate values are removed later on.
            """
            self._download_song(data_object, naming={
                "genre": [genre],
                "audio_format": [main_settings["audio_format"]],
            })
        return download_result
    def _extract_fields_from_template(self, path_template: str) -> Set[str]:
        return set(re.findall(r"{([^}]+)}", path_template))
    def _parse_path_template(self, path_template: str, naming: Dict[str, List[str]]) -> str:
        field_names: Set[str] = self._extract_fields_from_template(path_template)
        for field in field_names:
            if len(naming[field]) == 0:
                raise MKMissingNameException(f"Missing field for {field}.")
            path_template = path_template.replace(f"{{{field}}}", naming[field][0])
        return path_template
    def _download_song(self, song: Song, naming: dict) -> DownloadOptions:
        """
        TODO
        Search the song in the file system.
        """
        r = DownloadResult(total=1)
        # pre process the data recursively
        song.compile()
        # manage the naming
        naming: Dict[str, List[str]] = defaultdict(list, naming)
        naming["song"].append(song.title_value)
        naming["isrc"].append(song.isrc)
        naming["album"].extend(a.title_value for a in song.album_collection)
        naming["album_type"].extend(a.album_type.value for a in song.album_collection)
        naming["artist"].extend(a.name for a in song.artist_collection)
        naming["artist"].extend(a.name for a in song.feature_artist_collection)
        for a in song.album_collection:
            naming["label"].extend([l.title_value for l in a.label_collection])
        # removing duplicates from the naming, and process the strings
        for key, value in naming.items():
            # https://stackoverflow.com/a/17016257
            naming[key] = list(dict.fromkeys(value))
        song.genre = naming["genre"][0]
        # manage the targets
        tmp: Target = Target.temp(file_extension=main_settings["audio_format"])
        song.target_collection.append(Target(
            relative_to_music_dir=True,
            file_path=Path(
                self._parse_path_template(main_settings["download_path"], naming=naming), 
                self._parse_path_template(main_settings["download_file"], naming=naming),
            )
        ))
        for target in song.target_collection:
            if target.exists:
                output(f'{target.file_path} {BColors.OKGREEN.value}[already exists]', color=BColors.GREY)
                r.found_on_disk += 1
                if not self.download_options.download_again_if_found:
                    target.copy_content(tmp)
            else:
                target.create_path()
                output(f'{target.file_path}', color=BColors.GREY)
        # this streams from every available source until something succeeds, setting the skip intervals to the values of the according source
        used_source: Optional[Source] = None
        skip_intervals: List[Tuple[float, float]] = []
        for source in song.source_collection.get_sources(source_type_sorting={
            "only_with_page": True,
            "sort_key": lambda page: page.download_priority,
            "reverse": True,
        }):
            if tmp.exists:
                break
            used_source = source
            streaming_results = source.page.download_song_to_target(source=source, target=tmp, desc="download")
            skip_intervals = source.page.get_skip_intervals(song=song, source=source)
            # if something has been downloaded but it somehow failed, delete the file
            if streaming_results.is_fatal_error and tmp.exists:
                tmp.delete()
        # if everything went right, the file should exist now
        if not tmp.exists:
            if used_source is None:
                r.error_message = f"No source found for {song.option_string}."
            else:
                r.error_message = f"Something went wrong downloading {song.option_string}."
            return r
        # post process the audio
        found_on_disk = used_source is None
        if not found_on_disk or self.download_options.process_audio_if_found:
            correct_codec(target=tmp, skip_intervals=skip_intervals)
            r.sponsor_segments = len(skip_intervals)
        if used_source is not None:
            used_source.page.post_process_hook(song=song, temp_target=tmp)
        if not found_on_disk or self.download_options.process_metadata_if_found:
            write_metadata_to_target(metadata=song.metadata, target=tmp, song=song)
        # copy the tmp target to the final locations
        for target in song.target_collection:
            tmp.copy_content(target)
        tmp.delete()
        return r
    def fetch_url(self, url: str, **kwargs) -> DataObject:
        source = Source.match_url(url, ALL_SOURCE_TYPES.MANUAL)
        if source is None or source.page is None:
            raise UrlNotFoundException(url=url)
        return source.page.fetch_object_from_source(source=source, **kwargs)
 class Page:
    REGISTER = True
    SOURCE_TYPE: SourceType
    LOGGER: logging.Logger
    def __new__(cls, *args, **kwargs):
        cls.LOGGER = logging.getLogger(cls.__name__)
        return super().__new__(cls)
    @classmethod
    def is_leaf_page(cls) -> bool:
        return len(cls.__subclasses__()) == 0
    def __init__(self, download_options: DownloadOptions = None, fetch_options: FetchOptions = None, **kwargs):
        self.SOURCE_TYPE.register_page(self)
        self.download_options: DownloadOptions = download_options or DownloadOptions()
        self.fetch_options: FetchOptions = fetch_options or FetchOptions()
    def __del__(self):
        self.SOURCE_TYPE.deregister_page()
    def _search_regex(self, pattern, string, default=None, fatal=True, flags=0, group=None):
        """
        Perform a regex search on the given string, using a single or a list of
        patterns returning the first matching group.
        In case of failure return a default value or raise a WARNING or a
        RegexNotFoundError, depending on fatal, specifying the field name.
        """
        if isinstance(pattern, str):
            mobj = re.search(pattern, string, flags)
        else:
            for p in pattern:
                mobj = re.search(p, string, flags)
                if mobj:
                    break
        if mobj:
            if group is None:
                # return the first matching group
                return next(g for g in mobj.groups() if g is not None)
            elif isinstance(group, (list, tuple)):
                return tuple(mobj.group(g) for g in group)
            else:
                return mobj.group(group)
        return default
    def get_source_type(self, source: Source) -> Optional[Type[DataObject]]:
        return None
    def get_soup_from_response(self, r: requests.Response) -> BeautifulSoup:
        return BeautifulSoup(r.content, "html.parser")
    # to search stuff
    def search(self, query: Query) -> List[DataObject]:
        music_object = query.music_object
        search_functions = {
            Song: self.song_search,
            Album: self.album_search,
            Artist: self.artist_search,
            Label: self.label_search
        }
        if type(music_object) in search_functions:
            r = search_functions[type(music_object)](music_object)
            if r is not None and len(r) > 0:
                return r
        r = []
        for default_query in query.default_search:
            for single_option in self.general_search(default_query):
                r.append(single_option)
        return r
    def general_search(self, search_query: str) -> List[DataObject]:
        return []
    def label_search(self, label: Label) -> List[Label]:
        return []
    def artist_search(self, artist: Artist) -> List[Artist]:
        return []
    def album_search(self, album: Album) -> List[Album]:
        return []
    def song_search(self, song: Song) -> List[Song]:
        return []
    # to fetch stuff
    def fetch_song(self, source: Source, stop_at_level: int = 1) -> Song:
        return Song()
    def fetch_album(self, source: Source, stop_at_level: int = 1) -> Album:
        return Album()
    def fetch_artist(self, source: Source, stop_at_level: int = 1) -> Artist:
        return Artist()
    def fetch_label(self, source: Source, stop_at_level: int = 1) -> Label:
        return Label()
    # to download stuff
    def get_skip_intervals(self, song: Song, source: Source) -> List[Tuple[float, float]]:
        return []
    def post_process_hook(self, song: Song, temp_target: Target, **kwargs):
        pass
    def download_song_to_target(self, source: Source, target: Target, desc: str = None) -> DownloadResult:
        return DownloadResult()
--- a/music_kraken/download/components.py
+++ b/music_kraken/download/components.py
@@ -0,0 +1,158 @@
 import re
 from pathlib import Path
 from typing import Any, Callable, Dict, Generator, List, Optional
 from ..utils.config import main_settings
 from ..utils.exception import MKComposeException
 from ..utils.string_processing import unify
 class Option:
    """
    This could represent a data object, a string or a page.
    """
    def __init__(
        self, 
        value: Any, 
        text: Optional[str] = None, 
        keys: List[Any] = None, 
        hidden: bool = False, 
        parse_key: Callable[[Any], Any] = lambda x: x,
    ):
        self._parse_key: Callable[[Any], Any] = parse_key
        self.value = value
        self.text = text or str(value)
        self.hidden = hidden
        self._raw_keys = set(keys or [])
        self._raw_keys.add(self.text)
        self.keys = set(self.parse_key(key) for key in self._raw_keys)
    def register_key(self, key: Any):
        self._raw_keys.add(key)
        self.keys.add(self._parse_key(key))
    @property
    def parse_key(self) -> Callable[[Any], Any]:
        return self._parse_key
    @parse_key.setter
    def parse_key(self, value: Callable[[Any], Any]):
        self._parse_key = value
        self.keys = set(self._parse_key(key) for key in self._raw_keys)
    def __str__(self):
        return self.text
 class Select:
    def __init__(
        self, 
        options: Generator[Option, None, None] = None, 
        option_factory: Callable[[Any], Option] = None,
        raw_options: List[Any] = None,
        parse_option_key: Callable[[Any], Any] = lambda x: x,
        ask_for_creating_option: Callable[[Option], bool] = lambda x: True,
        sort: bool = False,
        **kwargs
    ):
        self._parse_option_key: Callable[[Any], Any] = parse_option_key
        self._ask_for_creating_option: Callable[[Option], bool] = ask_for_creating_option
        self._key_to_option: Dict[Any, Option] = dict()
        self._options: List[Option] = []
        options = options or []
        self.option_factory: Optional[Callable[[Any], Option]] = option_factory
        if self.can_create_options:
            _raw_options = raw_options or []
            if sort:
                _raw_options = sorted(_raw_options)
            for raw_option in _raw_options:
                self.append(self.option_factory(raw_option))
        elif raw_options is not None:
            raise MKComposeException("Cannot create options without a factory.")
        self.extend(options)
    @property
    def can_create_options(self) -> bool:
        return self.option_factory is not None
    def append(self, option: Option):
        option.parse_key = self._parse_option_key
        self._options.append(option)
        for key in option.keys:
            self._key_to_option[key] = option
    def extend(self, options: List[Option]):
        for option in options:
            self.append(option)
    def __iter__(self) -> Generator[Option, None, None]:
        for option in self._options:
            if option.hidden:
                continue
            yield option
    def __contains__(self, key: Any) -> bool:
        return key in self._key_to_option
    def __getitem__(self, key: Any) -> Option:
        return self._key_to_option[key]
    def create_option(self, key: Any, **kwargs) -> Option:
        if not self.can_create_options:
            raise MKComposeException("Cannot create options without a factory.")
        option = self.option_factory(key, **kwargs)
        self.append(option)
        return option
    def choose(self, key: Any) -> Optional[Option]:
        if key not in self:
            if self.can_create_options and self._ask_for_creating_option(key):
                return self.create_option(key)
            return None
        return self[key]
 class StringSelect(Select):
    def __init__(self, **kwargs):
        self._current_index = 0
        kwargs["option_factory"] = self.next_option
        kwargs["parse_option_key"] = lambda x: unify(str(x))
        super().__init__(**kwargs)
    def next_option(self, value: Any) -> Optional[Option]:
        o = Option(value=value, keys=[self._current_index], text=f"{self._current_index:0>2}: {value}")
        self._current_index += 1
        return o
 class GenreSelect(StringSelect):
    @staticmethod
    def is_valid_genre(genre: Path) -> bool:
        """
        gets the name of all subdirectories of shared.MUSIC_DIR,
        but filters out all directories, where the name matches with any Patern
        from shared.NOT_A_GENRE_REGEX.
        """
        if not genre.is_dir():
            return False
        if any(re.match(regex_pattern, genre.name) for regex_pattern in main_settings["not_a_genre_regex"]):
            return False
        return True
    def __init__(self):
        super().__init__(sort=True, raw_options=(genre.name for genre in filter(self.is_valid_genre, main_settings["music_directory"].iterdir())))
--- a/music_kraken/download/page_attributes.py
+++ b/music_kraken/download/page_attributes.py
@@ -1,327 +0,0 @@
 from typing import Tuple, Type, Dict, Set, Optional, List
 from collections import defaultdict
 from pathlib import Path
 import re
 import logging
 from . import FetchOptions, DownloadOptions
 from .results import SearchResults
 from ..objects import (
    DatabaseObject as DataObject,
    Collection,
    Target,
    Source,
    Options,
    Song,
    Album,
    Artist,
    Label,
 )
 from ..audio import write_metadata_to_target, correct_codec
 from ..utils import output, BColors
 from ..utils.string_processing import fit_to_file_system
 from ..utils.config import youtube_settings, main_settings
 from ..utils.path_manager import LOCATIONS
 from ..utils.enums import SourceType, ALL_SOURCE_TYPES
 from ..utils.support_classes.download_result import DownloadResult
 from ..utils.support_classes.query import Query
 from ..utils.support_classes.download_result import DownloadResult
 from ..utils.exception import MKMissingNameException
 from ..utils.exception.download import UrlNotFoundException
 from ..utils.shared import DEBUG_PAGES
 from ..pages import Page, EncyclopaediaMetallum, Musify, YouTube, YoutubeMusic, Bandcamp, INDEPENDENT_DB_OBJECTS
 ALL_PAGES: Set[Type[Page]] = {
    # EncyclopaediaMetallum,
    Musify,
    YoutubeMusic,
    Bandcamp
 }
 if youtube_settings["use_youtube_alongside_youtube_music"]:
    ALL_PAGES.add(YouTube)
 AUDIO_PAGES: Set[Type[Page]] = {
    Musify,
    YouTube,
    YoutubeMusic,
    Bandcamp
 }
 SHADY_PAGES: Set[Type[Page]] = {
    Musify,
 }
 fetch_map = {
    Song: "fetch_song",
    Album: "fetch_album",
    Artist: "fetch_artist",
    Label: "fetch_label",
 }
 if DEBUG_PAGES:
    DEBUGGING_PAGE = Bandcamp
    print(f"Only downloading from page {DEBUGGING_PAGE}.")
    ALL_PAGES = {DEBUGGING_PAGE}
    AUDIO_PAGES = ALL_PAGES.union(AUDIO_PAGES)
 class Pages:
    def __init__(self, exclude_pages: Set[Type[Page]] = None, exclude_shady: bool = False, download_options: DownloadOptions = None, fetch_options: FetchOptions = None):
        self.LOGGER = logging.getLogger("download")
        self.download_options: DownloadOptions = download_options or DownloadOptions()
        self.fetch_options: FetchOptions = fetch_options or FetchOptions()
        # initialize all page instances
        self._page_instances: Dict[Type[Page], Page] = dict()
        self._source_to_page: Dict[SourceType, Type[Page]] = dict()
        exclude_pages = exclude_pages if exclude_pages is not None else set()
        if exclude_shady:
            exclude_pages = exclude_pages.union(SHADY_PAGES)
        if not exclude_pages.issubset(ALL_PAGES):
            raise ValueError(f"The excluded pages have to be a subset of all pages: {exclude_pages} | {ALL_PAGES}")
        def _set_to_tuple(page_set: Set[Type[Page]]) -> Tuple[Type[Page], ...]:
            return tuple(sorted(page_set, key=lambda page: page.__name__))
        self._pages_set: Set[Type[Page]] = ALL_PAGES.difference(exclude_pages)
        self.pages: Tuple[Type[Page], ...] = _set_to_tuple(self._pages_set)
        self._audio_pages_set: Set[Type[Page]] = self._pages_set.intersection(AUDIO_PAGES)
        self.audio_pages: Tuple[Type[Page], ...] = _set_to_tuple(self._audio_pages_set)
        for page_type in self.pages:
            self._page_instances[page_type] = page_type(fetch_options=self.fetch_options, download_options=self.download_options)
            self._source_to_page[page_type.SOURCE_TYPE] = page_type
    def _get_page_from_enum(self, source_page: SourceType) -> Page:
        if source_page not in self._source_to_page:
            return None
        return self._page_instances[self._source_to_page[source_page]]
    def search(self, query: Query) -> SearchResults:
        result = SearchResults()
        for page_type in self.pages:
            result.add(
                page=page_type,
                search_result=self._page_instances[page_type].search(query=query)
            )
        return result
    def fetch_details(self, data_object: DataObject, stop_at_level: int = 1, **kwargs) -> DataObject:
        if not isinstance(data_object, INDEPENDENT_DB_OBJECTS):
            return data_object
        source: Source
        for source in data_object.source_collection.get_sources(source_type_sorting={
            "only_with_page": True,
        }):
            new_data_object = self.fetch_from_source(source=source, stop_at_level=stop_at_level)
            if new_data_object is not None:
                data_object.merge(new_data_object)
        return data_object
    def fetch_from_source(self, source: Source, **kwargs) -> Optional[DataObject]:
        if not source.has_page:
            return None
        source_type = source.page.get_source_type(source=source)
        if source_type is None:
            self.LOGGER.debug(f"Could not determine source type for {source}.")
            return None
        func = getattr(source.page, fetch_map[source_type])
        # fetching the data object and marking it as fetched
        data_object: DataObject = func(source=source, **kwargs)
        data_object.mark_as_fetched(source.hash_url)
        return data_object
    def fetch_from_url(self, url: str) -> Optional[DataObject]:
        source = Source.match_url(url, ALL_SOURCE_TYPES.MANUAL)
        if source is None:
            return None
        return self.fetch_from_source(source=source)
    def _skip_object(self, data_object: DataObject) -> bool:
        if isinstance(data_object, Album):
            if not self.download_options.download_all and data_object.album_type in self.download_options.album_type_blacklist:
                return True
        return False
    def download(self, data_object: DataObject, genre: str, **kwargs) -> DownloadResult:
        # fetch the given object
        self.fetch_details(data_object)
        output(f"\nDownloading {data_object.option_string}...", color=BColors.BOLD)
        # fetching all parent objects (e.g. if you only download a song)
        if not kwargs.get("fetched_upwards", False):
            to_fetch: List[DataObject] = [data_object]
            while len(to_fetch) > 0:
                new_to_fetch = []
                for d in to_fetch:
                    if self._skip_object(d):
                        continue
                    self.fetch_details(d)
                    for c in d.get_parent_collections():
                        new_to_fetch.extend(c)
                to_fetch = new_to_fetch
            kwargs["fetched_upwards"] = True
        # download all children
        download_result: DownloadResult = DownloadResult()
        for c in data_object.get_child_collections():
            for d in c:
                if self._skip_object(d):
                    continue
                download_result.merge(self.download(d, genre, **kwargs))
        # actually download if the object is a song
        if isinstance(data_object, Song):
            """
            TODO
            add the traced artist and album to the naming.
            I am able to do that, because duplicate values are removed later on.
            """
            self._download_song(data_object, naming={
                "genre": [genre],
                "audio_format": [main_settings["audio_format"]],
            })
        return download_result
    def _extract_fields_from_template(self, path_template: str) -> Set[str]:
        return set(re.findall(r"{([^}]+)}", path_template))
    def _parse_path_template(self, path_template: str, naming: Dict[str, List[str]]) -> str:
        field_names: Set[str] = self._extract_fields_from_template(path_template)
        for field in field_names:
            if len(naming[field]) == 0:
                raise MKMissingNameException(f"Missing field for {field}.")
            path_template = path_template.replace(f"{{{field}}}", naming[field][0])
        return path_template
    def _download_song(self, song: Song, naming: dict) -> DownloadOptions:
        """
        TODO
        Search the song in the file system.
        """
        r = DownloadResult(total=1)
        # pre process the data recursively
        song.compile()
        # manage the naming
        naming: Dict[str, List[str]] = defaultdict(list, naming)
        naming["song"].append(song.title_value)
        naming["isrc"].append(song.isrc)
        naming["album"].extend(a.title_value for a in song.album_collection)
        naming["album_type"].extend(a.album_type.value for a in song.album_collection)
        naming["artist"].extend(a.name for a in song.artist_collection)
        naming["artist"].extend(a.name for a in song.feature_artist_collection)
        for a in song.album_collection:
            naming["label"].extend([l.title_value for l in a.label_collection])
        # removing duplicates from the naming, and process the strings
        for key, value in naming.items():
            # https://stackoverflow.com/a/17016257
            naming[key] = list(dict.fromkeys(value))
        song.genre = naming["genre"][0]
        # manage the targets
        tmp: Target = Target.temp(file_extension=main_settings["audio_format"])
        song.target_collection.append(Target(
            relative_to_music_dir=True,
            file_path=Path(
                self._parse_path_template(main_settings["download_path"], naming=naming), 
                self._parse_path_template(main_settings["download_file"], naming=naming),
            )
        ))
        for target in song.target_collection:
            if target.exists:
                output(f'{target.file_path} {BColors.OKGREEN.value}[already exists]', color=BColors.GREY)
                r.found_on_disk += 1
                if not self.download_options.download_again_if_found:
                    target.copy_content(tmp)
            else:
                target.create_path()
                output(f'{target.file_path}', color=BColors.GREY)
        # this streams from every available source until something succeeds, setting the skip intervals to the values of the according source
        used_source: Optional[Source] = None
        skip_intervals: List[Tuple[float, float]] = []
        for source in song.source_collection.get_sources(source_type_sorting={
            "only_with_page": True,
            "sort_key": lambda page: page.download_priority,
            "reverse": True,
        }):
            if tmp.exists:
                break
            used_source = source
            streaming_results = source.page.download_song_to_target(source=source, target=tmp, desc="download")
            skip_intervals = source.page.get_skip_intervals(song=song, source=source)
            # if something has been downloaded but it somehow failed, delete the file
            if streaming_results.is_fatal_error and tmp.exists:
                tmp.delete()
        # if everything went right, the file should exist now
        if not tmp.exists:
            if used_source is None:
                r.error_message = f"No source found for {song.option_string}."
            else:
                r.error_message = f"Something went wrong downloading {song.option_string}."
            return r
        # post process the audio
        found_on_disk = used_source is None
        if not found_on_disk or self.download_options.process_audio_if_found:
            correct_codec(target=tmp, skip_intervals=skip_intervals)
            r.sponsor_segments = len(skip_intervals)
        if used_source is not None:
            used_source.page.post_process_hook(song=song, temp_target=tmp)
        if not found_on_disk or self.download_options.process_metadata_if_found:
            write_metadata_to_target(metadata=song.metadata, target=tmp, song=song)
        # copy the tmp target to the final locations
        for target in song.target_collection:
            tmp.copy_content(target)
        tmp.delete()
        return r
    def fetch_url(self, url: str, stop_at_level: int = 2) -> Tuple[Type[Page], DataObject]:
        source = Source.match_url(url, ALL_SOURCE_TYPES.MANUAL)
        if source is None:
            raise UrlNotFoundException(url=url)
        _actual_page = self._source_to_page[source.source_type]
        return _actual_page, self._page_instances[_actual_page].fetch_object_from_source(source=source, stop_at_level=stop_at_level)
--- a/music_kraken/download/results.py
+++ b/music_kraken/download/results.py
@@ -1,8 +1,12 @@
-from typing import Tuple, Type, Dict, List, Generator, Union
+from __future__ import annotations
 from dataclasses import dataclass
 from typing import TYPE_CHECKING, Dict, Generator, List, Tuple, Type, Union
 from ..objects import DatabaseObject
-from ..pages import Page, EncyclopaediaMetallum, Musify
+
 if TYPE_CHECKING:
    from . import Page
@dataclass
--- a/music_kraken/objects/artwork.py
+++ b/music_kraken/objects/artwork.py
@@ -59,4 +59,6 @@ class Artwork:
                self._variant_mapping[key] = value
    def __eq__(self, other: Artwork) -> bool:
        if not isinstance(other, Artwork):
            return False
        return any(a == b for a, b in zip(self._variant_mapping.keys(), other._variant_mapping.keys()))
--- a/music_kraken/objects/formatted_text.py
+++ b/music_kraken/objects/formatted_text.py
@@ -37,11 +37,19 @@ class FormattedText:
    @property
    def markdown(self) -> str:
        return md(self.html).strip()
    @markdown.setter
    def markdown(self, value: str) -> None:
        self.html = mistune.markdown(value)
    @property
    def plain(self) -> str:
        md = self.markdown
        return md.replace("\n\n", "\n")
    @plain.setter
    def plain(self, value: str) -> None:
        self.html = mistune.markdown(plain_to_markdown(value))
    def __str__(self) -> str:
        return self.markdown
--- a/music_kraken/pages/init.py
+++ b/music_kraken/pages/init.py
@@ -1,7 +1,52 @@
-from .encyclopaedia_metallum import EncyclopaediaMetallum
+import importlib
-from .musify import Musify
+import inspect
-from .youtube import YouTube
+import logging
-from .youtube_music import YoutubeMusic
+import pkgutil
-from .bandcamp import Bandcamp
+import sys
 from collections import defaultdict
 from copy import copy
 from pathlib import Path
 from typing import Dict, Generator, List, Set, Type
-from .abstract import Page, INDEPENDENT_DB_OBJECTS
+from ._bandcamp import Bandcamp
 from ._encyclopaedia_metallum import EncyclopaediaMetallum
 from ._genius import Genius
 from ._musify import Musify
 from ._youtube import YouTube
 from ._youtube_music import YoutubeMusic
 def import_children():
    _page_directory = Path(__file__).parent
    _stem_blacklist = set(["__pycache__", "__init__"])
    for _file in _page_directory.iterdir():
        if _file.stem in _stem_blacklist:
            continue
        logging.debug(f"importing {_file.absolute()}")
        exec(f"from . import {_file.stem}")
 # module_blacklist = set(sys.modules.keys())
 import_children()
 """
 classes = set()
 print(__name__)
 for module_name, module in sys.modules.items():
    if module_name in module_blacklist or not module_name.startswith(__name__):
        continue
    print("scanning module", module_name)
    for name, obj in inspect.getmembers(module, predicate=inspect.isclass):
        _module = obj.__module__
        if _module.startswith(__name__) and hasattr(obj, "SOURCE_TYPE"):
            print("checking object", name, obj.__module__)
            classes.add(obj)
    print()
 print(*(c.__name__ for c in classes), sep=",\t")
 __all__ = [c.__name__ for c in classes]
 """
--- a/music_kraken/pages/_bandcamp.py
+++ b/music_kraken/pages/_bandcamp.py
@@ -1,33 +1,22 @@
 from typing import List, Optional, Type
 from urllib.parse import urlparse, urlunparse
 import json
 from enum import Enum
-from bs4 import BeautifulSoup
+from typing import List, Optional, Type
-import pycountry
+from urllib.parse import urlparse, urlunparse
 import pycountry
 from bs4 import BeautifulSoup
 from ..objects import Source, DatabaseObject
 from .abstract import Page
 from ..objects import (
    Artist,
    Source,
    SourceType,
    Song,
    Album,
    Label,
    Target,
    Contact,
    ID3Timestamp,
    Lyrics,
    FormattedText,
    Artwork,
 )
 from ..connection import Connection
 from ..download import Page
 from ..objects import (Album, Artist, Artwork, Contact, DatabaseObject,
                       FormattedText, ID3Timestamp, Label, Lyrics, Song,
                       Source, SourceType, Target)
 from ..utils import dump_to_file
-from ..utils.enums import SourceType, ALL_SOURCE_TYPES
+from ..utils.config import logging_settings, main_settings
-from ..utils.support_classes.download_result import DownloadResult
+from ..utils.enums import ALL_SOURCE_TYPES, SourceType
 from ..utils.string_processing import clean_song_title
 from ..utils.config import main_settings, logging_settings
 from ..utils.shared import DEBUG
 from ..utils.string_processing import clean_song_title
 from ..utils.support_classes.download_result import DownloadResult
 if DEBUG:
    from ..utils import dump_to_file
--- a/music_kraken/pages/_encyclopaedia_metallum.py
+++ b/music_kraken/pages/_encyclopaedia_metallum.py
@@ -1,31 +1,20 @@
 from collections import defaultdict
-from typing import List, Optional, Dict, Type, Union
+from typing import Dict, List, Optional, Type, Union
-from bs4 import BeautifulSoup
+from urllib.parse import urlencode, urlparse
 import pycountry
-from urllib.parse import urlparse, urlencode
+from bs4 import BeautifulSoup
 from ..connection import Connection
-from ..utils.config import logging_settings
+from ..download import Page
-from .abstract import Page
+from ..objects import (Album, Artist, DatabaseObject, FormattedText,
-from ..utils.enums import SourceType, ALL_SOURCE_TYPES
+                       ID3Timestamp, Label, Lyrics, Options, Song, Source)
 from ..utils.enums.album import AlbumType
 from ..utils.support_classes.query import Query
 from ..objects import (
    Lyrics,
    Artist,
    Source,
    Song,
    Album,
    ID3Timestamp,
    FormattedText,
    Label,
    Options,
    DatabaseObject
 )
 from ..utils.shared import DEBUG
 from ..utils import dump_to_file
-
+from ..utils.config import logging_settings
-
+from ..utils.enums import ALL_SOURCE_TYPES, SourceType
 from ..utils.enums.album import AlbumType
 from ..utils.shared import DEBUG
 from ..utils.support_classes.query import Query
 ALBUM_TYPE_MAP: Dict[str, AlbumType] = defaultdict(lambda: AlbumType.OTHER, {
    "Full-length": AlbumType.STUDIO_ALBUM,
@@ -207,6 +196,7 @@ def create_grid(
 class EncyclopaediaMetallum(Page):
    REGISTER = False
    SOURCE_TYPE = ALL_SOURCE_TYPES.ENCYCLOPAEDIA_METALLUM
    LOGGER = logging_settings["metal_archives_logger"]
--- a/music_kraken/pages/_genius.py
+++ b/music_kraken/pages/_genius.py
@@ -0,0 +1,286 @@
 import json
 from enum import Enum
 from typing import List, Optional, Type
 from urllib.parse import urlencode, urlparse, urlunparse
 import pycountry
 from bs4 import BeautifulSoup
 from ..connection import Connection
 from ..download import Page
 from ..objects import (Album, Artist, Artwork, Contact, DatabaseObject,
                       FormattedText, ID3Timestamp, Label, Lyrics, Song,
                       Source, SourceType, Target)
 from ..utils import dump_to_file, traverse_json_path
 from ..utils.config import logging_settings, main_settings
 from ..utils.enums import ALL_SOURCE_TYPES, SourceType
 from ..utils.shared import DEBUG
 from ..utils.string_processing import clean_song_title
 from ..utils.support_classes.download_result import DownloadResult
 if DEBUG:
    from ..utils import dump_to_file
 class Genius(Page):
    SOURCE_TYPE = ALL_SOURCE_TYPES.GENIUS
    HOST = "genius.com"
    def __init__(self, *args, **kwargs):
        self.connection: Connection = Connection(
            host="https://genius.com/",
            logger=self.LOGGER,
            module="genius",
        )
        super().__init__(*args, **kwargs)
    def get_source_type(self, source: Source) -> Optional[Type[DatabaseObject]]:
        path = source.parsed_url.path.replace("/", "")
        if path.startswith("artists"):
            return Artist
        if path.startswith("albums"):
            return Album
        return Song
    def add_to_artwork(self, artwork: Artwork, url: str):
        if url is None:
            return
        url_frags = url.split(".")
        if len(url_frags) < 2:
            artwork.append(url=url)
            return
        dimensions = url_frags[-2].split("x")
        if len(dimensions) < 2:
            artwork.append(url=url)
            return
        if len(dimensions) == 3:
            dimensions = dimensions[:-1]
        try:
            artwork.append(url=url, width=int(dimensions[0]), height=int(dimensions[1]))
        except ValueError:
            artwork.append(url=url)
    def parse_api_object(self, data: dict) -> Optional[DatabaseObject]:
        if data is None:
            return None
        object_type = data.get("_type")
        artwork = Artwork()
        self.add_to_artwork(artwork, data.get("header_image_url"))
        self.add_to_artwork(artwork, data.get("image_url"))
        additional_sources: List[Source] = []
        source: Source = Source(self.SOURCE_TYPE, data.get("url"), additional_data={
            "id": data.get("id"),
            "slug": data.get("slug"),
            "api_path": data.get("api_path"),
        })
        notes = FormattedText()
        description = data.get("description") or {}
        if "html" in description:
            notes.html = description["html"]
        elif "markdown" in description:
            notes.markdown = description["markdown"]
        elif "description_preview" in data:
            notes.plaintext = data["description_preview"]
        if source.url is None:
            return None
        if object_type == "artist":
            if data.get("instagram_name") is not None:
                additional_sources.append(Source(ALL_SOURCE_TYPES.INSTAGRAM, f"https://www.instagram.com/{data['instagram_name']}/"))
            if data.get("facebook_name") is not None:
                additional_sources.append(Source(ALL_SOURCE_TYPES.FACEBOOK, f"https://www.facebook.com/{data['facebook_name']}/"))
            if data.get("twitter_name") is not None:
                additional_sources.append(Source(ALL_SOURCE_TYPES.TWITTER, f"https://x.com/{data['twitter_name']}/"))
            return Artist(
                name=data["name"].strip() if data.get("name") is not None else None,
                source_list=[source],
                artwork=artwork,
                notes=notes,
            )
        if object_type == "album":
            self.add_to_artwork(artwork, data.get("cover_art_thumbnail_url"))
            self.add_to_artwork(artwork, data.get("cover_art_url"))
            for cover_art in data.get("cover_arts", []):
                self.add_to_artwork(artwork, cover_art.get("image_url"))
                self.add_to_artwork(artwork, cover_art.get("thumbnail_image_url"))
            return Album(
                title=data.get("name").strip(),
                source_list=[source],
                artist_list=[self.parse_api_object(data.get("artist"))],
                artwork=artwork,
                date=ID3Timestamp(**data.get("release_date_components", {})),
            )
        if object_type == "song":
            self.add_to_artwork(artwork, data.get("song_art_image_thumbnail_url"))
            self.add_to_artwork(artwork, data.get("song_art_image_url"))
            main_artist_list = []
            featured_artist_list = []
            _artist_name = None
            primary_artist = self.parse_api_object(data.get("primary_artist"))
            if primary_artist is not None:
                _artist_name = primary_artist.name
                main_artist_list.append(primary_artist)
            for feature_artist in (*(data.get("featured_artists") or []), *(data.get("producer_artists") or []), *(data.get("writer_artists") or [])):
                artist = self.parse_api_object(feature_artist)
                if artist is not None:
                    featured_artist_list.append(artist)
            return Song(
                title=clean_song_title(data.get("title"), artist_name=_artist_name),
                source_list=[source],
                artwork=artwork,
                feature_artist_list=featured_artist_list,
                artist_list=main_artist_list,
            )
        return None
    def general_search(self, search_query: str, **kwargs) -> List[DatabaseObject]:
        results = []
        search_params = {
            "q": search_query,
        }
        r = self.connection.get("https://genius.com/api/search/multi?" + urlencode(search_params), name=f"search_{search_query}")
        if r is None:
            return results
        dump_to_file("search_genius.json", r.text, is_json=True, exit_after_dump=False)
        data = r.json()
        for elements in traverse_json_path(data, "response.sections", default=[]):
            hits = elements.get("hits", [])
            for hit in hits:
                parsed = self.parse_api_object(hit.get("result"))
                if parsed is not None:
                    results.append(parsed)
        return results
    def fetch_artist(self, source: Source, stop_at_level: int = 1) -> Artist:
        artist: Artist = Artist()
        # https://genius.com/api/artists/24527/albums?page=1
        r = self.connection.get(source.url, name=source.url)
        if r is None:
            return artist
        soup = self.get_soup_from_response(r)
        # find the content attribute in the meta tag which is contained in the head
        data_container = soup.find("meta", {"itemprop": "page_data"})
        if data_container is not None:
            content = data_container["content"]
            dump_to_file("genius_itemprop_artist.json", content, is_json=True, exit_after_dump=False)
            data = json.loads(content)
            artist = self.parse_api_object(data.get("artist"))
            for e in (data.get("artist_albums") or []):
                r = self.parse_api_object(e)
                if not isinstance(r, Album):
                    continue
                artist.album_collection.append(r)
            for e in (data.get("artist_songs") or []):
                r = self.parse_api_object(e)
                if not isinstance(r, Song):
                    continue
                """
                TODO
                fetch the album for these songs, because the api doesn't 
                return them
                """
                artist.album_collection.extend(r.album_collection)
        artist.source_collection.append(source)
        return artist
    def fetch_album(self, source: Source, stop_at_level: int = 1) -> Album:
        album: Album = Album()
        # https://genius.com/api/artists/24527/albums?page=1
        r = self.connection.get(source.url, name=source.url)
        if r is None:
            return album
        soup = self.get_soup_from_response(r)
        # find the content attribute in the meta tag which is contained in the head
        data_container = soup.find("meta", {"itemprop": "page_data"})
        if data_container is not None:
            content = data_container["content"]
            dump_to_file("genius_itemprop_album.json", content, is_json=True, exit_after_dump=False)
            data = json.loads(content)
            album = self.parse_api_object(data.get("album"))
            for e in data.get("album_appearances", []):
                r = self.parse_api_object(e.get("song"))
                if not isinstance(r, Song):
                    continue
                album.song_collection.append(r)
        album.source_collection.append(source)
        return album
    def get_json_content_from_response(self, response, start: str, end: str) -> Optional[str]:
        content = response.text
        start_index = content.find(start)
        if start_index < 0:
            return None
        start_index += len(start)
        end_index = content.find(end, start_index)
        if end_index < 0:
            return None
        return content[start_index:end_index]
    def fetch_song(self, source: Source, stop_at_level: int = 1) -> Song:
        song: Song = Song()
        r = self.connection.get(source.url, name=source.url)
        if r is None:
            return song
        # get the contents that are between `JSON.parse('` and `');`
        content = self.get_json_content_from_response(r, start="window.__PRELOADED_STATE__ = JSON.parse('", end="');\n      window.__APP_CONFIG__ = ")
        if content is not None:
            content = content.replace("\\\\", "\\").replace('\\"', '"').replace("\\'", "'")
            data = json.loads(content)
            lyrics_html = traverse_json_path(data, "songPage.lyricsData.body.html", default=None)
            if lyrics_html is not None:
                song.lyrics_collection.append(Lyrics(FormattedText(html=lyrics_html)))
            dump_to_file("genius_song_script_json.json", content, is_json=True, exit_after_dump=False)
        soup = self.get_soup_from_response(r)
        for lyrics in soup.find_all("div", {"data-lyrics-container": "true"}):
            lyrics_object = Lyrics(FormattedText(html=lyrics.prettify()))
            song.lyrics_collection.append(lyrics_object)
        song.source_collection.append(source)
        return song
--- a/music_kraken/pages/_musify.py
+++ b/music_kraken/pages/_musify.py
@@ -1,34 +1,23 @@
 from collections import defaultdict
 from dataclasses import dataclass
 from enum import Enum
-from typing import List, Optional, Type, Union, Generator, Dict, Any
+from typing import Any, Dict, Generator, List, Optional, Type, Union
 from urllib.parse import urlparse
 import pycountry
 from bs4 import BeautifulSoup
 from ..connection import Connection
-from .abstract import Page
+from ..download import Page
-from ..utils.enums import SourceType, ALL_SOURCE_TYPES
+from ..objects import (Album, Artist, Artwork, DatabaseObject, FormattedText,
-from ..utils.enums.album import AlbumType, AlbumStatus
+                       ID3Timestamp, Label, Lyrics, Song, Source, Target)
-from ..objects import (
+from ..utils import shared, string_processing
    Artist,
    Source,
    Song,
    Album,
    ID3Timestamp,
    FormattedText,
    Label,
    Target,
    DatabaseObject,
    Lyrics,
    Artwork
 )
 from ..utils.config import logging_settings, main_settings
-from ..utils import string_processing, shared
+from ..utils.enums import ALL_SOURCE_TYPES, SourceType
 from ..utils.enums.album import AlbumStatus, AlbumType
 from ..utils.string_processing import clean_song_title
 from ..utils.support_classes.query import Query
 from ..utils.support_classes.download_result import DownloadResult
 from ..utils.support_classes.query import Query
 """
 https://musify.club/artist/ghost-bath-280348?_pjax=#bodyContent
--- a/music_kraken/pages/_youtube.py
+++ b/music_kraken/pages/_youtube.py
@@ -1,29 +1,19 @@
 from typing import List, Optional, Type, Tuple
 from urllib.parse import urlparse, urlunparse, parse_qs
 from enum import Enum
 from typing import List, Optional, Tuple, Type
 from urllib.parse import parse_qs, urlparse, urlunparse
 import python_sponsorblock
 from ..objects import Source, DatabaseObject, Song, Target
 from .abstract import Page
 from ..objects import (
    Artist,
    Source,
    Song,
    Album,
    Label,
    Target,
    FormattedText,
    ID3Timestamp
 )
 from ..connection import Connection
 from ..download import Page
 from ..objects import (Album, Artist, DatabaseObject, FormattedText,
                       ID3Timestamp, Label, Song, Source, Target)
 from ..utils.config import logging_settings, main_settings, youtube_settings
 from ..utils.enums import ALL_SOURCE_TYPES, SourceType
 from ..utils.string_processing import clean_song_title
 from ..utils.enums import SourceType, ALL_SOURCE_TYPES
 from ..utils.support_classes.download_result import DownloadResult
-from ..utils.config import youtube_settings, main_settings, logging_settings
+from ._youtube_music.super_youtube import (SuperYouTube, YouTubeUrl,
-
+                                           YouTubeUrlType, get_invidious_url)
 from .youtube_music.super_youtube import SuperYouTube, YouTubeUrl, get_invidious_url, YouTubeUrlType
 """
 - https://yt.artemislena.eu/api/v1/search?q=Zombiez+-+Topic&page=1&date=none&type=channel&duration=none&sort=relevance
@@ -38,7 +28,7 @@ def get_piped_url(path: str = "", params: str = "", query: str = "", fragment: s
 class YouTube(SuperYouTube):
-    # CHANGE
+    REGISTER = youtube_settings["use_youtube_alongside_youtube_music"]
    SOURCE_TYPE = ALL_SOURCE_TYPES.YOUTUBE
    def __init__(self, *args, **kwargs):
--- a/music_kraken/pages/_youtube_music/init.py
+++ b/music_kraken/pages/_youtube_music/init.py
--- a/music_kraken/pages/_youtube_music/_list_render.py
+++ b/music_kraken/pages/_youtube_music/_list_render.py
@@ -3,7 +3,6 @@ from enum import Enum
 from ...utils.config import logging_settings
 from ...objects import Source, DatabaseObject
 from ..abstract import Page
 from ...objects import (
    Artist,
    Source,
--- a/music_kraken/pages/_youtube_music/_music_object_render.py
+++ b/music_kraken/pages/_youtube_music/_music_object_render.py
@@ -6,7 +6,6 @@ from ...utils.string_processing import clean_song_title
 from ...utils.enums import SourceType, ALL_SOURCE_TYPES
 from ...objects import Source, DatabaseObject
 from ..abstract import Page
 from ...objects import (
    Artist,
    Source,
--- a/music_kraken/pages/_youtube_music/super_youtube.py
+++ b/music_kraken/pages/_youtube_music/super_youtube.py
@@ -1,26 +1,17 @@
 from typing import List, Optional, Type, Tuple
 from urllib.parse import urlparse, urlunparse, parse_qs
 from enum import Enum
-import requests
+from typing import List, Optional, Tuple, Type
 from urllib.parse import parse_qs, urlparse, urlunparse
 import python_sponsorblock
 import requests
 from ...objects import Source, DatabaseObject, Song, Target
 from ..abstract import Page
 from ...objects import (
    Artist,
    Source,
    Song,
    Album,
    Label,
    Target,
    FormattedText,
    ID3Timestamp
 )
 from ...connection import Connection
 from ...download import Page
 from ...objects import (Album, Artist, DatabaseObject, FormattedText,
                        ID3Timestamp, Label, Song, Source, Target)
 from ...utils.config import logging_settings, main_settings, youtube_settings
 from ...utils.enums import ALL_SOURCE_TYPES, SourceType
 from ...utils.support_classes.download_result import DownloadResult
 from ...utils.config import youtube_settings, logging_settings, main_settings
 from ...utils.enums import SourceType, ALL_SOURCE_TYPES
 def get_invidious_url(path: str = "", params: str = "", query: str = "", fragment: str = "") -> str:
--- a/music_kraken/pages/_youtube_music/youtube_music.py
+++ b/music_kraken/pages/_youtube_music/youtube_music.py
@@ -1,46 +1,33 @@
-from __future__ import unicode_literals, annotations
+from __future__ import annotations, unicode_literals
-from typing import Dict, List, Optional, Set, Type
+import json
 from urllib.parse import urlparse, urlunparse, quote, parse_qs, urlencode
 import logging
 import random
 import json
 from dataclasses import dataclass
 import re
 from functools import lru_cache
 from collections import defaultdict
 from dataclasses import dataclass
 from functools import lru_cache
 from typing import Dict, List, Optional, Set, Type
 from urllib.parse import parse_qs, quote, urlencode, urlparse, urlunparse
 import youtube_dl
 from youtube_dl.extractor.youtube import YoutubeIE
 from youtube_dl.utils import DownloadError
 from ...connection import Connection
 from ...download import Page
 from ...objects import Album, Artist, Artwork
 from ...objects import DatabaseObject as DataObject
 from ...objects import (FormattedText, ID3Timestamp, Label, Lyrics, Song,
                        Source, Target)
 from ...utils import dump_to_file, get_current_millis, traverse_json_path
 from ...utils.config import logging_settings, main_settings, youtube_settings
 from ...utils.enums import ALL_SOURCE_TYPES, SourceType
 from ...utils.enums.album import AlbumType
 from ...utils.exception.config import SettingValueError
 from ...utils.config import main_settings, youtube_settings, logging_settings
 from ...utils.shared import DEBUG, DEBUG_YOUTUBE_INITIALIZING
 from ...utils.string_processing import clean_song_title
 from ...utils import get_current_millis, traverse_json_path
 from ...utils import dump_to_file
 from ..abstract import Page
 from ...objects import (
    DatabaseObject as DataObject,
    Source,
    FormattedText,
    ID3Timestamp,
    Artwork,
    Artist,
    Song,
    Album,
    Label,
    Target,
    Lyrics,
 )
 from ...connection import Connection
 from ...utils.enums import SourceType, ALL_SOURCE_TYPES
 from ...utils.enums.album import AlbumType
 from ...utils.support_classes.download_result import DownloadResult
 from ._list_render import parse_renderer
 from ._music_object_render import parse_run_element
 from .super_youtube import SuperYouTube
--- a/music_kraken/pages/abstract.py
+++ b/music_kraken/pages/abstract.py
@@ -1,157 +0,0 @@
 import logging
 import random
 import re
 from copy import copy
 from pathlib import Path
 from typing import Optional, Union, Type, Dict, Set, List, Tuple, TypedDict
 from string import Formatter
 from dataclasses import dataclass, field
 import requests
 from bs4 import BeautifulSoup
 from ..connection import Connection
 from ..objects import (
    Song,
    Source,
    Album,
    Artist,
    Target,
    DatabaseObject,
    Options,
    Collection,
    Label,
 )
 from ..utils.enums import SourceType
 from ..utils.enums.album import AlbumType
 from ..audio import write_metadata_to_target, correct_codec
 from ..utils.config import main_settings
 from ..utils.support_classes.query import Query
 from ..utils.support_classes.download_result import DownloadResult
 from ..utils.string_processing import fit_to_file_system
 from ..utils import trace, output, BColors
 INDEPENDENT_DB_OBJECTS = Union[Label, Album, Artist, Song]
 INDEPENDENT_DB_TYPES = Union[Type[Song], Type[Album], Type[Artist], Type[Label]]
@dataclass
 class FetchOptions:
    download_all: bool = False
    album_type_blacklist: Set[AlbumType] = field(default_factory=lambda: set(AlbumType(a) for a in main_settings["album_type_blacklist"]))
@dataclass
 class DownloadOptions:
    download_all: bool = False
    album_type_blacklist: Set[AlbumType] = field(default_factory=lambda: set(AlbumType(a) for a in main_settings["album_type_blacklist"]))
    process_audio_if_found: bool = False
    process_metadata_if_found: bool = True
 class Page:
    SOURCE_TYPE: SourceType
    LOGGER: logging.Logger
    def __new__(cls, *args, **kwargs):
        cls.LOGGER = logging.getLogger(cls.__name__)
        return super().__new__(cls)
    def __init__(self, download_options: DownloadOptions = None, fetch_options: FetchOptions = None):
        self.SOURCE_TYPE.register_page(self)
        self.download_options: DownloadOptions = download_options or DownloadOptions()
        self.fetch_options: FetchOptions = fetch_options or FetchOptions()
    def _search_regex(self, pattern, string, default=None, fatal=True, flags=0, group=None):
        """
        Perform a regex search on the given string, using a single or a list of
        patterns returning the first matching group.
        In case of failure return a default value or raise a WARNING or a
        RegexNotFoundError, depending on fatal, specifying the field name.
        """
        if isinstance(pattern, str):
            mobj = re.search(pattern, string, flags)
        else:
            for p in pattern:
                mobj = re.search(p, string, flags)
                if mobj:
                    break
        if mobj:
            if group is None:
                # return the first matching group
                return next(g for g in mobj.groups() if g is not None)
            elif isinstance(group, (list, tuple)):
                return tuple(mobj.group(g) for g in group)
            else:
                return mobj.group(group)
        return default
    def get_source_type(self, source: Source) -> Optional[Type[DatabaseObject]]:
        return None
    def get_soup_from_response(self, r: requests.Response) -> BeautifulSoup:
        return BeautifulSoup(r.content, "html.parser")
    # to search stuff
    def search(self, query: Query) -> List[DatabaseObject]:
        music_object = query.music_object
        search_functions = {
            Song: self.song_search,
            Album: self.album_search,
            Artist: self.artist_search,
            Label: self.label_search
        }
        if type(music_object) in search_functions:
            r = search_functions[type(music_object)](music_object)
            if r is not None and len(r) > 0:
                return r
        r = []
        for default_query in query.default_search:
            for single_option in self.general_search(default_query):
                r.append(single_option)
        return r
    def general_search(self, search_query: str) -> List[DatabaseObject]:
        return []
    def label_search(self, label: Label) -> List[Label]:
        return []
    def artist_search(self, artist: Artist) -> List[Artist]:
        return []
    def album_search(self, album: Album) -> List[Album]:
        return []
    def song_search(self, song: Song) -> List[Song]:
        return []
    # to fetch stuff
    def fetch_song(self, source: Source, stop_at_level: int = 1) -> Song:
        return Song()
    def fetch_album(self, source: Source, stop_at_level: int = 1) -> Album:
        return Album()
    def fetch_artist(self, source: Source, stop_at_level: int = 1) -> Artist:
        return Artist()
    def fetch_label(self, source: Source, stop_at_level: int = 1) -> Label:
        return Label()
    # to download stuff
    def get_skip_intervals(self, song: Song, source: Source) -> List[Tuple[float, float]]:
        return []
    def post_process_hook(self, song: Song, temp_target: Target, **kwargs):
        pass
    def download_song_to_target(self, source: Source, target: Target, desc: str = None) -> DownloadResult:
        return DownloadResult()
--- a/music_kraken/utils/enums/init.py
+++ b/music_kraken/utils/enums/init.py
@@ -17,6 +17,9 @@ class SourceType:
    def register_page(self, page: Page):
        self.page = page
    def deregister_page(self):
        self.page = None
    def __hash__(self):
        return hash(self.name)
--- a/music_kraken/utils/exception/init.py
+++ b/music_kraken/utils/exception/init.py
@@ -3,6 +3,9 @@ class MKBaseException(Exception):
        self.message = message
        super().__init__(message, **kwargs)
 # Compose exceptions. Those usually mean a bug on my side.
 class MKComposeException(MKBaseException):
    pass
 # Downloading
 class MKDownloadException(MKBaseException):
--- a/music_kraken/utils/shared.py
+++ b/music_kraken/utils/shared.py
@@ -15,11 +15,11 @@ __stage__ = os.getenv("STAGE", "prod")
 DEBUG = (__stage__ == "dev") and True
 DEBUG_LOGGING = DEBUG and False
 DEBUG_TRACE = DEBUG and True
-DEBUG_OBJECT_TRACE = DEBUG and True
+DEBUG_OBJECT_TRACE = DEBUG and False
 DEBUG_OBJECT_TRACE_CALLSTACK = DEBUG_OBJECT_TRACE and False
 DEBUG_YOUTUBE_INITIALIZING = DEBUG and False
 DEBUG_PAGES = DEBUG and False
-DEBUG_DUMP = DEBUG and False
+DEBUG_DUMP = DEBUG and True
 DEBUG_PRINT_ID = DEBUG and True
 if DEBUG:
Author	SHA1	Message	Date
Lars Noack	49145a7d93	feat: moved cli helpers to seperate file All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-27 13:41:24 +02:00
Lars Noack	0f2229b0f2	feat: completely dynamified the datasource import All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-24 17:00:39 +02:00
Lars Noack	5af95f1b03	feat: auto import pages in page module	2024-05-24 15:46:42 +02:00
Lars Noack	c24cf701c1	fix: pages were not in the subclasses because the module was never importet	2024-05-24 15:28:47 +02:00
Lars Noack	cef87460a7	draft All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-24 14:46:38 +02:00
Lars Noack	c0fbd16929	feat: basic select layout	2024-05-24 13:21:07 +02:00
Lars Noack	b5a5559f7b	feat: created layout for option All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-23 18:05:18 +02:00
Lars Noack	906ddb679d	draft: All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-23 17:27:24 +02:00
Lars Noack	cd2e7d7173	draft: moving page interface to downloader module All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-23 16:33:40 +02:00
Lars Noack	c683394228	feat: imports	2024-05-23 16:13:47 +02:00
Lars Noack	aafbba3b1c	feat: implemented consistent settings All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-23 14:36:19 +02:00
Lars Noack	40e9366a0b	feat: implemented the new page mechanics in the downloader	2024-05-23 14:32:31 +02:00
Lars Noack	8255ad5264	feat: added detection to autoscann pages All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-23 14:24:20 +02:00
Lars Noack	2aa0f02fa5	Merge branch 'adding_genius' into experimental All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-23 13:36:10 +02:00
Lars Noack	344da0a0bf	fix: converting pictures to rgb before saving All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-22 15:20:26 +02:00
Lars Noack	49dc7093c8	fix: genius fallback All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-22 15:18:43 +02:00
Lars Noack	90f70638b4	feat: better lyrics support All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-21 17:55:08 +02:00
Lars Noack	7b4eee858a	feat: parsed script json All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-21 17:14:58 +02:00
Lars Noack	f61b34dd40	feat: improved feature artists by also adding writer and producer to it All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-21 16:52:01 +02:00
Lars Noack	688b4fd357	feat: getting the album tracklist All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-21 16:47:38 +02:00
Lars Noack	769d27dc5c	feat: album details All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-21 16:43:52 +02:00
Lars Noack	f5d953d9ce	feat: theoretically fetching feature songs All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-21 16:34:04 +02:00
Lars Noack	46b64b8f8d	feat: fetched the flat artist details	2024-05-21 16:23:05 +02:00
Lars Noack	adfce16d2a	feat: fetched the flat artist details	2024-05-21 16:21:58 +02:00
Lars Noack	e4fd9faf12	feat: detecting url type	2024-05-21 15:57:09 +02:00
Lars Noack	f6caee41a8	feat: finished searching genious All checks were successful ci/woodpecker/push/woodpecker Pipeline was successful Details	2024-05-21 15:52:41 +02:00
Lars Noack	068c749c38	feat: implemented artist search	2024-05-21 15:27:10 +02:00