Compare commits
	
		
			32 Commits
		
	
	
		
			main
			...
			850c68f3e5
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
| 850c68f3e5 | |||
| 7219048422 | |||
| 49145a7d93 | |||
| 0f2229b0f2 | |||
| 5af95f1b03 | |||
| c24cf701c1 | |||
| cef87460a7 | |||
| c0fbd16929 | |||
| b5a5559f7b | |||
| 906ddb679d | |||
| cd2e7d7173 | |||
| c683394228 | |||
| aafbba3b1c | |||
| 40e9366a0b | |||
| 8255ad5264 | |||
| 2aa0f02fa5 | |||
| 7b0b830d64 | |||
| 1ba6c97f5a | |||
| c8cbfc7cb9 | |||
| 344da0a0bf | |||
| 49dc7093c8 | |||
| 90f70638b4 | |||
| 7b4eee858a | |||
| f61b34dd40 | |||
| 688b4fd357 | |||
| 769d27dc5c | |||
| f5d953d9ce | |||
| 46b64b8f8d | |||
| adfce16d2a | |||
| e4fd9faf12 | |||
| f6caee41a8 | |||
| 068c749c38 | 
							
								
								
									
										6
									
								
								.vscode/launch.json
									
									
									
									
										vendored
									
									
								
							
							
						
						
									
										6
									
								
								.vscode/launch.json
									
									
									
									
										vendored
									
									
								
							| @@ -17,6 +17,12 @@ | |||||||
|             "request": "launch", |             "request": "launch", | ||||||
|             "program": "development/actual_donwload.py", |             "program": "development/actual_donwload.py", | ||||||
|             "console": "integratedTerminal" |             "console": "integratedTerminal" | ||||||
|  |         }, | ||||||
|  |         { | ||||||
|  |             "name": "Python Debugger: Music Kraken", | ||||||
|  |             "type": "debugpy", | ||||||
|  |             "request": "launch", // run the module | ||||||
|  |             "module": "music_kraken", | ||||||
|         } |         } | ||||||
|     ] |     ] | ||||||
| } | } | ||||||
							
								
								
									
										1
									
								
								.vscode/settings.json
									
									
									
									
										vendored
									
									
								
							
							
						
						
									
										1
									
								
								.vscode/settings.json
									
									
									
									
										vendored
									
									
								
							| @@ -27,6 +27,7 @@ | |||||||
|         "Gitea", |         "Gitea", | ||||||
|         "iframe", |         "iframe", | ||||||
|         "isrc", |         "isrc", | ||||||
|  |         "itemprop", | ||||||
|         "levenshtein", |         "levenshtein", | ||||||
|         "metallum", |         "metallum", | ||||||
|         "MUSICBRAINZ", |         "MUSICBRAINZ", | ||||||
|   | |||||||
| @@ -6,9 +6,10 @@ logging.getLogger().setLevel(logging.DEBUG) | |||||||
|  |  | ||||||
| if __name__ == "__main__": | if __name__ == "__main__": | ||||||
|     commands = [ |     commands = [ | ||||||
|         "s: #a I'm in a coffin", |         "s: #a Crystal F", | ||||||
|         "0", |         "10", | ||||||
|         "d: 0", |         "1", | ||||||
|  |         "3", | ||||||
|     ] |     ] | ||||||
|  |  | ||||||
|      |      | ||||||
|   | |||||||
| @@ -93,6 +93,10 @@ def write_metadata_to_target(metadata: Metadata, target: Target, song: Song): | |||||||
|             # resize the image to the preferred resolution |             # resize the image to the preferred resolution | ||||||
|             img.thumbnail((main_settings["preferred_artwork_resolution"], main_settings["preferred_artwork_resolution"])) |             img.thumbnail((main_settings["preferred_artwork_resolution"], main_settings["preferred_artwork_resolution"])) | ||||||
|  |  | ||||||
|  |             # https://stackoverflow.com/a/59476938/16804841 | ||||||
|  |             if img.mode != 'RGB': | ||||||
|  |                 img = img.convert('RGB') | ||||||
|  |  | ||||||
|             img.save(converted_target.file_path, "JPEG") |             img.save(converted_target.file_path, "JPEG") | ||||||
|  |  | ||||||
|         # https://stackoverflow.com/questions/70228440/mutagen-how-can-i-correctly-embed-album-art-into-mp3-file-so-that-i-can-see-t |         # https://stackoverflow.com/questions/70228440/mutagen-how-can-i-correctly-embed-album-art-into-mp3-file-so-that-i-can-see-t | ||||||
|   | |||||||
| @@ -1,89 +1,25 @@ | |||||||
| import random | import random | ||||||
| from typing import Set, Type, Dict, List |  | ||||||
| from pathlib import Path |  | ||||||
| import re | import re | ||||||
|  | from pathlib import Path | ||||||
|  | from typing import Dict, Generator, List, Set, Type | ||||||
|  |  | ||||||
| from .utils import cli_function | from .. import console | ||||||
| from .options.first_config import initial_config | from ..download import Downloader, Page, components | ||||||
|  | from ..download.results import GoToResults | ||||||
| from ..utils import output, BColors | from ..download.results import Option as ResultOption | ||||||
| from ..utils.config import write_config, main_settings | from ..download.results import PageResults, Results | ||||||
| from ..utils.shared import URL_PATTERN | from ..objects import Album, Artist, DatabaseObject, Song | ||||||
| from ..utils.string_processing import fit_to_file_system | from ..utils import BColors, output | ||||||
| from ..utils.support_classes.query import Query | from ..utils.config import main_settings, write_config | ||||||
| from ..utils.support_classes.download_result import DownloadResult | from ..utils.enums.colors import BColors | ||||||
| from ..utils.exception import MKInvalidInputException | from ..utils.exception import MKInvalidInputException | ||||||
| from ..utils.exception.download import UrlNotFoundException | from ..utils.exception.download import UrlNotFoundException | ||||||
| from ..utils.enums.colors import BColors | from ..utils.shared import HELP_MESSAGE, URL_PATTERN | ||||||
| from .. import console | from ..utils.string_processing import fit_to_file_system | ||||||
|  | from ..utils.support_classes.download_result import DownloadResult | ||||||
| from ..download.results import Results, Option, PageResults, GoToResults | from ..utils.support_classes.query import Query | ||||||
| from ..download.page_attributes import Pages | from .options.first_config import initial_config | ||||||
| from ..pages import Page | from .utils import ask_for_bool, cli_function | ||||||
| from ..objects import Song, Album, Artist, DatabaseObject |  | ||||||
|  |  | ||||||
| """ |  | ||||||
| This is the implementation of the Shell |  | ||||||
|  |  | ||||||
| # Behaviour |  | ||||||
|  |  | ||||||
| ## Searching |  | ||||||
|  |  | ||||||
| ```mkshell |  | ||||||
| > s: {querry or url} |  | ||||||
|  |  | ||||||
| # examples |  | ||||||
| > s: https://musify.club/release/some-random-release-183028492 |  | ||||||
| > s: r: #a an Artist #r some random Release |  | ||||||
| ``` |  | ||||||
|  |  | ||||||
| Searches for an url, or an query |  | ||||||
|  |  | ||||||
| ### Query Syntax |  | ||||||
|  |  | ||||||
| ``` |  | ||||||
| #a {artist} #r {release} #t {track} |  | ||||||
| ``` |  | ||||||
|  |  | ||||||
| You can escape stuff like `#` doing this: `\#` |  | ||||||
|  |  | ||||||
| ## Downloading |  | ||||||
|  |  | ||||||
| To download something, you either need a direct link, or you need to have already searched for options |  | ||||||
|  |  | ||||||
| ```mkshell |  | ||||||
| > d: {option ids or direct url} |  | ||||||
|  |  | ||||||
| # examples |  | ||||||
| > d: 0, 3, 4 |  | ||||||
| > d: 1 |  | ||||||
| > d: https://musify.club/release/some-random-release-183028492 |  | ||||||
| ``` |  | ||||||
|  |  | ||||||
| ## Misc |  | ||||||
|  |  | ||||||
| ### Exit |  | ||||||
|  |  | ||||||
| ```mkshell |  | ||||||
| > q |  | ||||||
| > quit |  | ||||||
| > exit |  | ||||||
| > abort |  | ||||||
| ``` |  | ||||||
|  |  | ||||||
| ### Current Options |  | ||||||
|  |  | ||||||
| ```mkshell |  | ||||||
| > . |  | ||||||
| ``` |  | ||||||
|  |  | ||||||
| ### Previous Options |  | ||||||
|  |  | ||||||
| ``` |  | ||||||
| > .. |  | ||||||
| ``` |  | ||||||
|  |  | ||||||
| """ |  | ||||||
|  |  | ||||||
| EXIT_COMMANDS = {"q", "quit", "exit", "abort"} | EXIT_COMMANDS = {"q", "quit", "exit", "abort"} | ||||||
| ALPHABET = "abcdefghijklmnopqrstuvwxyz" | ALPHABET = "abcdefghijklmnopqrstuvwxyz" | ||||||
| @@ -91,59 +27,29 @@ PAGE_NAME_FILL = "-" | |||||||
| MAX_PAGE_LEN = 21 | MAX_PAGE_LEN = 21 | ||||||
|  |  | ||||||
|  |  | ||||||
| def get_existing_genre() -> List[str]: |  | ||||||
|     """ |  | ||||||
|     gets the name of all subdirectories of shared.MUSIC_DIR, |  | ||||||
|     but filters out all directories, where the name matches with any patern |  | ||||||
|     from shared.NOT_A_GENRE_REGEX. |  | ||||||
|     """ |  | ||||||
|     existing_genres: List[str] = [] |  | ||||||
|  |  | ||||||
|     # get all subdirectories of MUSIC_DIR, not the files in the dir. |  | ||||||
|     existing_subdirectories: List[Path] = [f for f in main_settings["music_directory"].iterdir() if f.is_dir()] |  | ||||||
|  |  | ||||||
|     for subdirectory in existing_subdirectories: |  | ||||||
|         name: str = subdirectory.name |  | ||||||
|  |  | ||||||
|         if not any(re.match(regex_pattern, name) for regex_pattern in main_settings["not_a_genre_regex"]): |  | ||||||
|             existing_genres.append(name) |  | ||||||
|  |  | ||||||
|     existing_genres.sort() |  | ||||||
|  |  | ||||||
|     return existing_genres |  | ||||||
|  |  | ||||||
|  |  | ||||||
| def get_genre(): | def get_genre(): | ||||||
|     existing_genres = get_existing_genre() |     select_genre = components.GenreSelect() | ||||||
|     for i, genre_option in enumerate(existing_genres): |     select_genre._ask_for_creating_option = lambda key: ask_for_bool(f"Create the genre \"{key}\"") | ||||||
|         print(f"{i + 1:0>2}: {genre_option}") |  | ||||||
|  |  | ||||||
|     while True: |     genre: Optional[components.Option] = None | ||||||
|         genre = input("Id or new genre: ") |  | ||||||
|  |  | ||||||
|         if genre.isdigit(): |     while genre is None: | ||||||
|             genre_id = int(genre) - 1 |         for genre in select_genre: | ||||||
|             if genre_id >= len(existing_genres): |             print(genre) | ||||||
|                 print(f"No genre under the id {genre_id + 1}.") |  | ||||||
|                 continue |  | ||||||
|  |  | ||||||
|             return existing_genres[genre_id] |         genre = select_genre.choose(input("Id or new genre: ")) | ||||||
|  |  | ||||||
|         new_genre = fit_to_file_system(genre) |     return genre.value | ||||||
|  |  | ||||||
|         agree_inputs = {"y", "yes", "ok"} |  | ||||||
|         verification = input(f"create new genre \"{new_genre}\"? (Y/N): ").lower() |  | ||||||
|         if verification in agree_inputs: |  | ||||||
|             return new_genre |  | ||||||
|  |  | ||||||
|  |  | ||||||
| def help_message(): | def help_message(): | ||||||
|  |     print(HELP_MESSAGE) | ||||||
|     print() |     print() | ||||||
|     print(random.choice(main_settings["happy_messages"])) |     print(random.choice(main_settings["happy_messages"])) | ||||||
|     print() |     print() | ||||||
|  |  | ||||||
|  |  | ||||||
| class Downloader: | class CliDownloader: | ||||||
|     def __init__( |     def __init__( | ||||||
|             self, |             self, | ||||||
|             exclude_pages: Set[Type[Page]] = None, |             exclude_pages: Set[Type[Page]] = None, | ||||||
| @@ -153,7 +59,7 @@ class Downloader: | |||||||
|             genre: str = None, |             genre: str = None, | ||||||
|             process_metadata_anyway: bool = False, |             process_metadata_anyway: bool = False, | ||||||
|     ) -> None: |     ) -> None: | ||||||
|         self.pages: Pages = Pages(exclude_pages=exclude_pages, exclude_shady=exclude_shady) |         self.pages: Downloader = Downloader(exclude_pages=exclude_pages, exclude_shady=exclude_shady) | ||||||
|  |  | ||||||
|         self.page_dict: Dict[str, Type[Page]] = dict() |         self.page_dict: Dict[str, Type[Page]] = dict() | ||||||
|  |  | ||||||
| @@ -177,7 +83,7 @@ class Downloader: | |||||||
|  |  | ||||||
|         page_count = 0 |         page_count = 0 | ||||||
|         for option in self.current_results.formatted_generator(): |         for option in self.current_results.formatted_generator(): | ||||||
|             if isinstance(option, Option): |             if isinstance(option, ResultOption): | ||||||
|                 r = f"{BColors.GREY.value}{option.index:0{self.option_digits}}{BColors.ENDC.value} {option.music_object.option_string}" |                 r = f"{BColors.GREY.value}{option.index:0{self.option_digits}}{BColors.ENDC.value} {option.music_object.option_string}" | ||||||
|                 print(r) |                 print(r) | ||||||
|             else: |             else: | ||||||
| @@ -446,7 +352,7 @@ def download( | |||||||
|         else: |         else: | ||||||
|             print(f"{BColors.FAIL.value}Something went wrong configuring.{BColors.ENDC.value}") |             print(f"{BColors.FAIL.value}Something went wrong configuring.{BColors.ENDC.value}") | ||||||
|  |  | ||||||
|     shell = Downloader(genre=genre, process_metadata_anyway=process_metadata_anyway) |     shell = CliDownloader(genre=genre, process_metadata_anyway=process_metadata_anyway) | ||||||
|  |  | ||||||
|     if command_list is not None: |     if command_list is not None: | ||||||
|         for command in command_list: |         for command in command_list: | ||||||
|   | |||||||
| @@ -1,3 +1,4 @@ | |||||||
|  | from ..utils import BColors | ||||||
| from ..utils.shared import get_random_message | from ..utils.shared import get_random_message | ||||||
|  |  | ||||||
|  |  | ||||||
| @@ -39,4 +40,8 @@ def print_cute_message(): | |||||||
|         print(message) |         print(message) | ||||||
|  |  | ||||||
|  |  | ||||||
|  | AGREE_INPUTS = {"y", "yes", "ok"} | ||||||
|  | def ask_for_bool(msg: str) -> bool: | ||||||
|  |     i = input(f"{msg} ({BColors.OKGREEN.value}Y{BColors.ENDC.value}/{BColors.FAIL.value}N{BColors.ENDC.value})? ").lower() | ||||||
|  |     return i in AGREE_INPUTS | ||||||
|      |      | ||||||
| @@ -6,6 +6,7 @@ from typing import List, Optional | |||||||
| from functools import lru_cache | from functools import lru_cache | ||||||
| import logging | import logging | ||||||
|  |  | ||||||
|  | from ..utils import output, BColors | ||||||
| from ..utils.config import main_settings | from ..utils.config import main_settings | ||||||
| from ..utils.string_processing import fit_to_file_system | from ..utils.string_processing import fit_to_file_system | ||||||
|  |  | ||||||
| @@ -136,13 +137,13 @@ class Cache: | |||||||
|         ) |         ) | ||||||
|         self._write_attribute(cache_attribute) |         self._write_attribute(cache_attribute) | ||||||
|  |  | ||||||
|         cache_path = fit_to_file_system(Path(module_path, name), hidden_ok=True) |         cache_path = fit_to_file_system(Path(module_path, name.replace("/", "_")), hidden_ok=True) | ||||||
|         with cache_path.open("wb") as content_file: |         with cache_path.open("wb") as content_file: | ||||||
|             self.logger.debug(f"writing cache to {cache_path}") |             self.logger.debug(f"writing cache to {cache_path}") | ||||||
|             content_file.write(content) |             content_file.write(content) | ||||||
|  |  | ||||||
|     def get(self, name: str) -> Optional[CacheResult]: |     def get(self, name: str) -> Optional[CacheResult]: | ||||||
|         path = fit_to_file_system(Path(self._dir, self.module, name), hidden_ok=True) |         path = fit_to_file_system(Path(self._dir, self.module, name.replace("/", "_")), hidden_ok=True) | ||||||
|  |  | ||||||
|         if not path.is_file(): |         if not path.is_file(): | ||||||
|             return None |             return None | ||||||
| @@ -165,7 +166,7 @@ class Cache: | |||||||
|             if ca.name == "": |             if ca.name == "": | ||||||
|                 continue |                 continue | ||||||
|  |  | ||||||
|             file = fit_to_file_system(Path(self._dir, ca.module, ca.name), hidden_ok=True) |             file = fit_to_file_system(Path(self._dir, ca.module, ca.name.replace("/", "_")), hidden_ok=True) | ||||||
|  |  | ||||||
|             if not ca.is_valid: |             if not ca.is_valid: | ||||||
|                 self.logger.debug(f"deleting cache {ca.id}") |                 self.logger.debug(f"deleting cache {ca.id}") | ||||||
| @@ -204,9 +205,12 @@ class Cache: | |||||||
|         for path in self._dir.iterdir(): |         for path in self._dir.iterdir(): | ||||||
|             if path.is_dir(): |             if path.is_dir(): | ||||||
|                 for file in path.iterdir(): |                 for file in path.iterdir(): | ||||||
|  |                     output(f"Deleting file {file}", color=BColors.GREY) | ||||||
|                     file.unlink() |                     file.unlink() | ||||||
|  |                 output(f"Deleting folder {path}", color=BColors.HEADER) | ||||||
|                 path.rmdir() |                 path.rmdir() | ||||||
|             else: |             else: | ||||||
|  |                 output(f"Deleting folder {path}", color=BColors.HEADER) | ||||||
|                 path.unlink() |                 path.unlink() | ||||||
|  |  | ||||||
|         self.cached_attributes.clear() |         self.cached_attributes.clear() | ||||||
|   | |||||||
| @@ -1,8 +1,36 @@ | |||||||
| from dataclasses import dataclass, field | from __future__ import annotations | ||||||
| from typing import Set |  | ||||||
|  |  | ||||||
| from ..utils.config import main_settings | import logging | ||||||
|  | import random | ||||||
|  | import re | ||||||
|  | from collections import defaultdict | ||||||
|  | from copy import copy | ||||||
|  | from dataclasses import dataclass, field | ||||||
|  | from pathlib import Path | ||||||
|  | from string import Formatter | ||||||
|  | from typing import (TYPE_CHECKING, Any, Callable, Dict, Generator, List, | ||||||
|  |                     Optional, Set, Tuple, Type, TypedDict, Union) | ||||||
|  |  | ||||||
|  | import requests | ||||||
|  | from bs4 import BeautifulSoup | ||||||
|  |  | ||||||
|  | from ..audio import correct_codec, write_metadata_to_target | ||||||
|  | from ..connection import Connection | ||||||
|  | from ..objects import Album, Artist, Collection | ||||||
|  | from ..objects import DatabaseObject as DataObject | ||||||
|  | from ..objects import Label, Options, Song, Source, Target | ||||||
|  | from ..utils import BColors, output, trace | ||||||
|  | from ..utils.config import main_settings, youtube_settings | ||||||
|  | from ..utils.enums import ALL_SOURCE_TYPES, SourceType | ||||||
| from ..utils.enums.album import AlbumType | from ..utils.enums.album import AlbumType | ||||||
|  | from ..utils.exception import MKComposeException, MKMissingNameException | ||||||
|  | from ..utils.exception.download import UrlNotFoundException | ||||||
|  | from ..utils.path_manager import LOCATIONS | ||||||
|  | from ..utils.shared import DEBUG_PAGES | ||||||
|  | from ..utils.string_processing import fit_to_file_system | ||||||
|  | from ..utils.support_classes.download_result import DownloadResult | ||||||
|  | from ..utils.support_classes.query import Query | ||||||
|  | from .results import SearchResults | ||||||
|  |  | ||||||
|  |  | ||||||
| @dataclass | @dataclass | ||||||
| @@ -19,3 +47,409 @@ class DownloadOptions: | |||||||
|     download_again_if_found: bool = False |     download_again_if_found: bool = False | ||||||
|     process_audio_if_found: bool = False |     process_audio_if_found: bool = False | ||||||
|     process_metadata_if_found: bool = True |     process_metadata_if_found: bool = True | ||||||
|  |  | ||||||
|  |  | ||||||
|  | fetch_map = { | ||||||
|  |     Song: "fetch_song", | ||||||
|  |     Album: "fetch_album", | ||||||
|  |     Artist: "fetch_artist", | ||||||
|  |     Label: "fetch_label", | ||||||
|  | } | ||||||
|  |  | ||||||
|  |  | ||||||
|  | class Downloader: | ||||||
|  |     def __init__( | ||||||
|  |         self,  | ||||||
|  |         auto_register_pages: bool = True,  | ||||||
|  |         download_options: DownloadOptions = None,  | ||||||
|  |         fetch_options: FetchOptions = None,  | ||||||
|  |         **kwargs | ||||||
|  |     ): | ||||||
|  |         self.LOGGER = logging.getLogger("download") | ||||||
|  |          | ||||||
|  |         self.download_options: DownloadOptions = download_options or DownloadOptions() | ||||||
|  |         self.fetch_options: FetchOptions = fetch_options or FetchOptions() | ||||||
|  |  | ||||||
|  |         self._registered_pages: Dict[Type[Page], Set[Page]] = defaultdict(set) | ||||||
|  |         if auto_register_pages: | ||||||
|  |             self.scan_for_pages(**kwargs) | ||||||
|  |  | ||||||
|  |     def register_page(self, page_type: Type[Page], **kwargs): | ||||||
|  |         if page_type in self._registered_pages: | ||||||
|  |             return | ||||||
|  |  | ||||||
|  |         self._registered_pages[page_type].add(page_type( | ||||||
|  |             download_options=self.download_options,  | ||||||
|  |             fetch_options=self.fetch_options,  | ||||||
|  |             **kwargs | ||||||
|  |         )) | ||||||
|  |  | ||||||
|  |     def deregister_page(self, page_type: Type[Page]): | ||||||
|  |         if page_type not in _registered_pages: | ||||||
|  |             return | ||||||
|  |  | ||||||
|  |         for p in self._registered_pages[page_type]: | ||||||
|  |             p.__del__() | ||||||
|  |         del self._registered_pages[page_type] | ||||||
|  |  | ||||||
|  |     def scan_for_pages(self, **kwargs): | ||||||
|  |         # assuming the wanted pages are the leaf classes of the interface | ||||||
|  |         from .. import pages | ||||||
|  |          | ||||||
|  |         leaf_classes = [] | ||||||
|  |  | ||||||
|  |         class_list = [Page] | ||||||
|  |         while len(class_list): | ||||||
|  |             _class = class_list.pop() | ||||||
|  |             class_subclasses = _class.__subclasses__() | ||||||
|  |  | ||||||
|  |             if len(class_subclasses) == 0: | ||||||
|  |                 if _class.REGISTER: | ||||||
|  |                     leaf_classes.append(_class) | ||||||
|  |             else: | ||||||
|  |                 class_list.extend(class_subclasses) | ||||||
|  |  | ||||||
|  |         if Page in leaf_classes: | ||||||
|  |             self.LOGGER.warn("couldn't find any data source") | ||||||
|  |             return | ||||||
|  |         for leaf_class in leaf_classes: | ||||||
|  |             self.register_page(leaf_class, **kwargs) | ||||||
|  |  | ||||||
|  |     def get_pages(self, *page_types: List[Type[Page]]) -> Generator[Page, None, None]: | ||||||
|  |         if len(page_types) == 0: | ||||||
|  |             page_types = _registered_pages.keys() | ||||||
|  |  | ||||||
|  |         for page_type in page_types: | ||||||
|  |             yield from self._registered_pages[page_type] | ||||||
|  |  | ||||||
|  |     def search(self, query: Query) -> SearchResults: | ||||||
|  |         result = SearchResults() | ||||||
|  |          | ||||||
|  |         for page in self.get_pages(): | ||||||
|  |             result.add( | ||||||
|  |                 page=type(page), | ||||||
|  |                 search_result=page.search(query=query) | ||||||
|  |             ) | ||||||
|  |              | ||||||
|  |         return result | ||||||
|  |      | ||||||
|  |     def fetch_details(self, data_object: DataObject, stop_at_level: int = 1, **kwargs) -> DataObject: | ||||||
|  |         source: Source | ||||||
|  |         for source in data_object.source_collection.get_sources(source_type_sorting={ | ||||||
|  |             "only_with_page": True, | ||||||
|  |         }): | ||||||
|  |             new_data_object = self.fetch_from_source(source=source, stop_at_level=stop_at_level) | ||||||
|  |             if new_data_object is not None: | ||||||
|  |                 data_object.merge(new_data_object) | ||||||
|  |  | ||||||
|  |         return data_object | ||||||
|  |  | ||||||
|  |     def fetch_from_source(self, source: Source, **kwargs) -> Optional[DataObject]: | ||||||
|  |         if not source.has_page: | ||||||
|  |             return None | ||||||
|  |          | ||||||
|  |         source_type = source.page.get_source_type(source=source) | ||||||
|  |         if source_type is None: | ||||||
|  |             self.LOGGER.debug(f"Could not determine source type for {source}.") | ||||||
|  |             return None | ||||||
|  |  | ||||||
|  |         func = getattr(source.page, fetch_map[source_type]) | ||||||
|  |          | ||||||
|  |         # fetching the data object and marking it as fetched | ||||||
|  |         data_object: DataObject = func(source=source, **kwargs) | ||||||
|  |         data_object.mark_as_fetched(source.hash_url) | ||||||
|  |         return data_object | ||||||
|  |  | ||||||
|  |     def fetch_from_url(self, url: str) -> Optional[DataObject]: | ||||||
|  |         source = Source.match_url(url, ALL_SOURCE_TYPES.MANUAL) | ||||||
|  |         if source is None: | ||||||
|  |             return None | ||||||
|  |          | ||||||
|  |         return self.fetch_from_source(source=source) | ||||||
|  |      | ||||||
|  |     def _skip_object(self, data_object: DataObject) -> bool: | ||||||
|  |         if isinstance(data_object, Album): | ||||||
|  |             if not self.download_options.download_all and data_object.album_type in self.download_options.album_type_blacklist: | ||||||
|  |                 return True | ||||||
|  |          | ||||||
|  |         return False | ||||||
|  |  | ||||||
|  |     def download(self, data_object: DataObject, genre: str, **kwargs) -> DownloadResult: | ||||||
|  |         # fetch the given object | ||||||
|  |         self.fetch_details(data_object) | ||||||
|  |         output(f"\nDownloading {data_object.option_string}...", color=BColors.BOLD) | ||||||
|  |          | ||||||
|  |         # fetching all parent objects (e.g. if you only download a song) | ||||||
|  |         if not kwargs.get("fetched_upwards", False): | ||||||
|  |             to_fetch: List[DataObject] = [data_object] | ||||||
|  |  | ||||||
|  |             while len(to_fetch) > 0: | ||||||
|  |                 new_to_fetch = [] | ||||||
|  |                 for d in to_fetch: | ||||||
|  |                     if self._skip_object(d): | ||||||
|  |                         continue | ||||||
|  |  | ||||||
|  |                     self.fetch_details(d) | ||||||
|  |  | ||||||
|  |                     for c in d.get_parent_collections(): | ||||||
|  |                         new_to_fetch.extend(c) | ||||||
|  |  | ||||||
|  |                 to_fetch = new_to_fetch | ||||||
|  |              | ||||||
|  |             kwargs["fetched_upwards"] = True | ||||||
|  |          | ||||||
|  |         # download all children | ||||||
|  |         download_result: DownloadResult = DownloadResult() | ||||||
|  |         for c in data_object.get_child_collections(): | ||||||
|  |             for d in c: | ||||||
|  |                 if self._skip_object(d): | ||||||
|  |                     continue | ||||||
|  |  | ||||||
|  |                 download_result.merge(self.download(d, genre, **kwargs)) | ||||||
|  |  | ||||||
|  |         # actually download if the object is a song | ||||||
|  |         if isinstance(data_object, Song): | ||||||
|  |             """ | ||||||
|  |             TODO | ||||||
|  |             add the traced artist and album to the naming. | ||||||
|  |             I am able to do that, because duplicate values are removed later on. | ||||||
|  |             """ | ||||||
|  |  | ||||||
|  |             self._download_song(data_object, naming={ | ||||||
|  |                 "genre": [genre], | ||||||
|  |                 "audio_format": [main_settings["audio_format"]], | ||||||
|  |             }) | ||||||
|  |  | ||||||
|  |         return download_result | ||||||
|  |  | ||||||
|  |     def _extract_fields_from_template(self, path_template: str) -> Set[str]: | ||||||
|  |         return set(re.findall(r"{([^}]+)}", path_template)) | ||||||
|  |  | ||||||
|  |     def _parse_path_template(self, path_template: str, naming: Dict[str, List[str]]) -> str: | ||||||
|  |         field_names: Set[str] = self._extract_fields_from_template(path_template) | ||||||
|  |          | ||||||
|  |         for field in field_names: | ||||||
|  |             if len(naming[field]) == 0: | ||||||
|  |                 raise MKMissingNameException(f"Missing field for {field}.") | ||||||
|  |  | ||||||
|  |             path_template = path_template.replace(f"{{{field}}}", naming[field][0]) | ||||||
|  |  | ||||||
|  |         return path_template | ||||||
|  |  | ||||||
|  |     def _download_song(self, song: Song, naming: dict) -> DownloadOptions: | ||||||
|  |         """ | ||||||
|  |         TODO | ||||||
|  |         Search the song in the file system. | ||||||
|  |         """ | ||||||
|  |         r = DownloadResult(total=1) | ||||||
|  |          | ||||||
|  |         # pre process the data recursively | ||||||
|  |         song.compile() | ||||||
|  |          | ||||||
|  |         # manage the naming | ||||||
|  |         naming: Dict[str, List[str]] = defaultdict(list, naming) | ||||||
|  |         naming["song"].append(song.title_value) | ||||||
|  |         naming["isrc"].append(song.isrc) | ||||||
|  |         naming["album"].extend(a.title_value for a in song.album_collection) | ||||||
|  |         naming["album_type"].extend(a.album_type.value for a in song.album_collection) | ||||||
|  |         naming["artist"].extend(a.name for a in song.artist_collection) | ||||||
|  |         naming["artist"].extend(a.name for a in song.feature_artist_collection) | ||||||
|  |         for a in song.album_collection: | ||||||
|  |             naming["label"].extend([l.title_value for l in a.label_collection]) | ||||||
|  |         # removing duplicates from the naming, and process the strings | ||||||
|  |         for key, value in naming.items(): | ||||||
|  |             # https://stackoverflow.com/a/17016257 | ||||||
|  |             naming[key] = list(dict.fromkeys(value)) | ||||||
|  |         song.genre = naming["genre"][0] | ||||||
|  |  | ||||||
|  |         # manage the targets | ||||||
|  |         tmp: Target = Target.temp(file_extension=main_settings["audio_format"]) | ||||||
|  |  | ||||||
|  |         song.target_collection.append(Target( | ||||||
|  |             relative_to_music_dir=True, | ||||||
|  |             file_path=Path( | ||||||
|  |                 self._parse_path_template(main_settings["download_path"], naming=naming),  | ||||||
|  |                 self._parse_path_template(main_settings["download_file"], naming=naming), | ||||||
|  |             ) | ||||||
|  |         )) | ||||||
|  |         for target in song.target_collection: | ||||||
|  |             if target.exists: | ||||||
|  |                 output(f'{target.file_path} {BColors.OKGREEN.value}[already exists]', color=BColors.GREY) | ||||||
|  |                 r.found_on_disk += 1 | ||||||
|  |  | ||||||
|  |                 if not self.download_options.download_again_if_found: | ||||||
|  |                     target.copy_content(tmp) | ||||||
|  |             else: | ||||||
|  |                 target.create_path() | ||||||
|  |                 output(f'{target.file_path}', color=BColors.GREY) | ||||||
|  |  | ||||||
|  |         # this streams from every available source until something succeeds, setting the skip intervals to the values of the according source | ||||||
|  |         used_source: Optional[Source] = None | ||||||
|  |         skip_intervals: List[Tuple[float, float]] = [] | ||||||
|  |         for source in song.source_collection.get_sources(source_type_sorting={ | ||||||
|  |             "only_with_page": True, | ||||||
|  |             "sort_key": lambda page: page.download_priority, | ||||||
|  |             "reverse": True, | ||||||
|  |         }): | ||||||
|  |             if tmp.exists: | ||||||
|  |                 break | ||||||
|  |  | ||||||
|  |             used_source = source | ||||||
|  |             streaming_results = source.page.download_song_to_target(source=source, target=tmp, desc="download") | ||||||
|  |             skip_intervals = source.page.get_skip_intervals(song=song, source=source) | ||||||
|  |  | ||||||
|  |             # if something has been downloaded but it somehow failed, delete the file | ||||||
|  |             if streaming_results.is_fatal_error and tmp.exists: | ||||||
|  |                 tmp.delete() | ||||||
|  |  | ||||||
|  |         # if everything went right, the file should exist now | ||||||
|  |         if not tmp.exists: | ||||||
|  |             if used_source is None: | ||||||
|  |                 r.error_message = f"No source found for {song.option_string}." | ||||||
|  |             else: | ||||||
|  |                 r.error_message = f"Something went wrong downloading {song.option_string}." | ||||||
|  |             return r | ||||||
|  |  | ||||||
|  |         # post process the audio | ||||||
|  |         found_on_disk = used_source is None | ||||||
|  |         if not found_on_disk or self.download_options.process_audio_if_found: | ||||||
|  |             correct_codec(target=tmp, skip_intervals=skip_intervals) | ||||||
|  |             r.sponsor_segments = len(skip_intervals) | ||||||
|  |  | ||||||
|  |         if used_source is not None: | ||||||
|  |             used_source.page.post_process_hook(song=song, temp_target=tmp) | ||||||
|  |  | ||||||
|  |         if not found_on_disk or self.download_options.process_metadata_if_found: | ||||||
|  |             write_metadata_to_target(metadata=song.metadata, target=tmp, song=song) | ||||||
|  |  | ||||||
|  |         # copy the tmp target to the final locations | ||||||
|  |         for target in song.target_collection: | ||||||
|  |             tmp.copy_content(target) | ||||||
|  |  | ||||||
|  |         tmp.delete() | ||||||
|  |         return r | ||||||
|  |  | ||||||
|  |     def fetch_url(self, url: str, **kwargs) -> DataObject: | ||||||
|  |         source = Source.match_url(url, ALL_SOURCE_TYPES.MANUAL) | ||||||
|  |          | ||||||
|  |         if source is None or source.page is None: | ||||||
|  |             raise UrlNotFoundException(url=url) | ||||||
|  |          | ||||||
|  |         return source.page.fetch_object_from_source(source=source, **kwargs) | ||||||
|  |  | ||||||
|  |  | ||||||
|  | class Page: | ||||||
|  |     REGISTER = True | ||||||
|  |     SOURCE_TYPE: SourceType | ||||||
|  |     LOGGER: logging.Logger | ||||||
|  |  | ||||||
|  |     def __new__(cls, *args, **kwargs): | ||||||
|  |         cls.LOGGER = logging.getLogger(cls.__name__) | ||||||
|  |         return super().__new__(cls) | ||||||
|  |  | ||||||
|  |     @classmethod | ||||||
|  |     def is_leaf_page(cls) -> bool: | ||||||
|  |         return len(cls.__subclasses__()) == 0 | ||||||
|  |  | ||||||
|  |     def __init__(self, download_options: DownloadOptions = None, fetch_options: FetchOptions = None, **kwargs): | ||||||
|  |         self.SOURCE_TYPE.register_page(self) | ||||||
|  |          | ||||||
|  |         self.download_options: DownloadOptions = download_options or DownloadOptions() | ||||||
|  |         self.fetch_options: FetchOptions = fetch_options or FetchOptions() | ||||||
|  |  | ||||||
|  |     def __del__(self): | ||||||
|  |         self.SOURCE_TYPE.deregister_page() | ||||||
|  |  | ||||||
|  |     def _search_regex(self, pattern, string, default=None, fatal=True, flags=0, group=None): | ||||||
|  |         """ | ||||||
|  |         Perform a regex search on the given string, using a single or a list of | ||||||
|  |         patterns returning the first matching group. | ||||||
|  |         In case of failure return a default value or raise a WARNING or a | ||||||
|  |         RegexNotFoundError, depending on fatal, specifying the field name. | ||||||
|  |         """ | ||||||
|  |  | ||||||
|  |         if isinstance(pattern, str): | ||||||
|  |             mobj = re.search(pattern, string, flags) | ||||||
|  |         else: | ||||||
|  |             for p in pattern: | ||||||
|  |                 mobj = re.search(p, string, flags) | ||||||
|  |                 if mobj: | ||||||
|  |                     break | ||||||
|  |  | ||||||
|  |         if mobj: | ||||||
|  |             if group is None: | ||||||
|  |                 # return the first matching group | ||||||
|  |                 return next(g for g in mobj.groups() if g is not None) | ||||||
|  |             elif isinstance(group, (list, tuple)): | ||||||
|  |                 return tuple(mobj.group(g) for g in group) | ||||||
|  |             else: | ||||||
|  |                 return mobj.group(group) | ||||||
|  |  | ||||||
|  |         return default | ||||||
|  |  | ||||||
|  |     def get_source_type(self, source: Source) -> Optional[Type[DataObject]]: | ||||||
|  |         return None | ||||||
|  |  | ||||||
|  |     def get_soup_from_response(self, r: requests.Response) -> BeautifulSoup: | ||||||
|  |         return BeautifulSoup(r.content, "html.parser") | ||||||
|  |  | ||||||
|  |     # to search stuff | ||||||
|  |     def search(self, query: Query) -> List[DataObject]: | ||||||
|  |         music_object = query.music_object | ||||||
|  |  | ||||||
|  |         search_functions = { | ||||||
|  |             Song: self.song_search, | ||||||
|  |             Album: self.album_search, | ||||||
|  |             Artist: self.artist_search, | ||||||
|  |             Label: self.label_search | ||||||
|  |         } | ||||||
|  |  | ||||||
|  |         if type(music_object) in search_functions: | ||||||
|  |             r = search_functions[type(music_object)](music_object) | ||||||
|  |             if r is not None and len(r) > 0: | ||||||
|  |                 return r | ||||||
|  |  | ||||||
|  |         r = [] | ||||||
|  |         for default_query in query.default_search: | ||||||
|  |             for single_option in self.general_search(default_query): | ||||||
|  |                 r.append(single_option) | ||||||
|  |  | ||||||
|  |         return r | ||||||
|  |  | ||||||
|  |     def general_search(self, search_query: str) -> List[DataObject]: | ||||||
|  |         return [] | ||||||
|  |  | ||||||
|  |     def label_search(self, label: Label) -> List[Label]: | ||||||
|  |         return [] | ||||||
|  |  | ||||||
|  |     def artist_search(self, artist: Artist) -> List[Artist]: | ||||||
|  |         return [] | ||||||
|  |  | ||||||
|  |     def album_search(self, album: Album) -> List[Album]: | ||||||
|  |         return [] | ||||||
|  |  | ||||||
|  |     def song_search(self, song: Song) -> List[Song]: | ||||||
|  |         return [] | ||||||
|  |  | ||||||
|  |     # to fetch stuff | ||||||
|  |     def fetch_song(self, source: Source, stop_at_level: int = 1) -> Song: | ||||||
|  |         return Song() | ||||||
|  |  | ||||||
|  |     def fetch_album(self, source: Source, stop_at_level: int = 1) -> Album: | ||||||
|  |         return Album() | ||||||
|  |  | ||||||
|  |     def fetch_artist(self, source: Source, stop_at_level: int = 1) -> Artist: | ||||||
|  |         return Artist() | ||||||
|  |  | ||||||
|  |     def fetch_label(self, source: Source, stop_at_level: int = 1) -> Label: | ||||||
|  |         return Label() | ||||||
|  |  | ||||||
|  |     # to download stuff | ||||||
|  |     def get_skip_intervals(self, song: Song, source: Source) -> List[Tuple[float, float]]: | ||||||
|  |         return [] | ||||||
|  |  | ||||||
|  |     def post_process_hook(self, song: Song, temp_target: Target, **kwargs): | ||||||
|  |         pass | ||||||
|  |  | ||||||
|  |     def download_song_to_target(self, source: Source, target: Target, desc: str = None) -> DownloadResult: | ||||||
|  |         return DownloadResult() | ||||||
|   | |||||||
							
								
								
									
										160
									
								
								music_kraken/download/components.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										160
									
								
								music_kraken/download/components.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,160 @@ | |||||||
|  | import re | ||||||
|  | from pathlib import Path | ||||||
|  | from typing import Any, Callable, Dict, Generator, List, Optional | ||||||
|  |  | ||||||
|  | from ..utils.config import main_settings | ||||||
|  | from ..utils.exception import MKComposeException | ||||||
|  | from ..utils.string_processing import unify | ||||||
|  |  | ||||||
|  |  | ||||||
|  | class Option: | ||||||
|  |     """ | ||||||
|  |     This could represent a data object, a string or a page. | ||||||
|  |     """ | ||||||
|  |  | ||||||
|  |     def __init__( | ||||||
|  |         self,  | ||||||
|  |         value: Any,  | ||||||
|  |         text: Optional[str] = None,  | ||||||
|  |         keys: List[Any] = None,  | ||||||
|  |         hidden: bool = False,  | ||||||
|  |         parse_key: Callable[[Any], Any] = lambda x: x, | ||||||
|  |     ): | ||||||
|  |         self._parse_key: Callable[[Any], Any] = parse_key | ||||||
|  |          | ||||||
|  |         self.value = value | ||||||
|  |         self.text = text or str(value) | ||||||
|  |         self.hidden = hidden | ||||||
|  |  | ||||||
|  |         self._raw_keys = set(keys or []) | ||||||
|  |         self._raw_keys.add(self.text) | ||||||
|  |         self._raw_keys.add(self.value) | ||||||
|  |         self._raw_keys.add(str(self.value)) | ||||||
|  |         self.keys = set(self.parse_key(key) for key in self._raw_keys) | ||||||
|  |      | ||||||
|  |     def register_key(self, key: Any): | ||||||
|  |         self._raw_keys.add(key) | ||||||
|  |         self.keys.add(self._parse_key(key)) | ||||||
|  |  | ||||||
|  |     @property | ||||||
|  |     def parse_key(self) -> Callable[[Any], Any]: | ||||||
|  |         return self._parse_key | ||||||
|  |  | ||||||
|  |     @parse_key.setter | ||||||
|  |     def parse_key(self, value: Callable[[Any], Any]): | ||||||
|  |         self._parse_key = value | ||||||
|  |         self.keys = set(self._parse_key(key) for key in self._raw_keys) | ||||||
|  |  | ||||||
|  |     def __str__(self): | ||||||
|  |         return self.text | ||||||
|  |  | ||||||
|  |  | ||||||
|  | class Select: | ||||||
|  |     def __init__( | ||||||
|  |         self,  | ||||||
|  |         options: Generator[Option, None, None] = None,  | ||||||
|  |         option_factory: Callable[[Any], Option] = None, | ||||||
|  |         raw_options: List[Any] = None, | ||||||
|  |         parse_option_key: Callable[[Any], Any] = lambda x: x, | ||||||
|  |         ask_for_creating_option: Callable[[Option], bool] = lambda x: True, | ||||||
|  |         sort: bool = False, | ||||||
|  |         **kwargs | ||||||
|  |     ): | ||||||
|  |         self._parse_option_key: Callable[[Any], Any] = parse_option_key | ||||||
|  |         self._ask_for_creating_option: Callable[[Option], bool] = ask_for_creating_option | ||||||
|  |  | ||||||
|  |         self._key_to_option: Dict[Any, Option] = dict() | ||||||
|  |         self._options: List[Option] = [] | ||||||
|  |  | ||||||
|  |         options = options or [] | ||||||
|  |         self.option_factory: Optional[Callable[[Any], Option]] = option_factory | ||||||
|  |         if self.can_create_options: | ||||||
|  |             _raw_options = raw_options or [] | ||||||
|  |             if sort: | ||||||
|  |                 _raw_options = sorted(_raw_options) | ||||||
|  |  | ||||||
|  |             for raw_option in _raw_options: | ||||||
|  |                 self.append(self.option_factory(raw_option)) | ||||||
|  |         elif raw_options is not None: | ||||||
|  |             raise MKComposeException("Cannot create options without a factory.") | ||||||
|  |  | ||||||
|  |         self.extend(options) | ||||||
|  |  | ||||||
|  |     @property | ||||||
|  |     def can_create_options(self) -> bool: | ||||||
|  |         return self.option_factory is not None | ||||||
|  |  | ||||||
|  |     def append(self, option: Option): | ||||||
|  |         option.parse_key = self._parse_option_key | ||||||
|  |         self._options.append(option) | ||||||
|  |         for key in option.keys: | ||||||
|  |             self._key_to_option[key] = option | ||||||
|  |  | ||||||
|  |     def extend(self, options: List[Option]): | ||||||
|  |         for option in options: | ||||||
|  |             self.append(option) | ||||||
|  |  | ||||||
|  |     def __iter__(self) -> Generator[Option, None, None]: | ||||||
|  |         for option in self._options: | ||||||
|  |             if option.hidden: | ||||||
|  |                 continue | ||||||
|  |              | ||||||
|  |             yield option | ||||||
|  |  | ||||||
|  |     def __contains__(self, key: Any) -> bool: | ||||||
|  |         return self._parse_option_key(key) in self._key_to_option | ||||||
|  |  | ||||||
|  |     def __getitem__(self, key: Any) -> Option: | ||||||
|  |         return self._key_to_option[self._parse_option_key(key)] | ||||||
|  |  | ||||||
|  |     def create_option(self, key: Any, **kwargs) -> Option: | ||||||
|  |         if not self.can_create_options: | ||||||
|  |             raise MKComposeException("Cannot create options without a factory.") | ||||||
|  |  | ||||||
|  |         option = self.option_factory(key, **kwargs) | ||||||
|  |         self.append(option) | ||||||
|  |         return option | ||||||
|  |  | ||||||
|  |     def choose(self, key: Any) -> Optional[Option]: | ||||||
|  |         if key not in self: | ||||||
|  |             if self.can_create_options and self._ask_for_creating_option(key): | ||||||
|  |                 return self.create_option(key) | ||||||
|  |             return None | ||||||
|  |  | ||||||
|  |         return self[key] | ||||||
|  |  | ||||||
|  |  | ||||||
|  |  | ||||||
|  | class StringSelect(Select): | ||||||
|  |     def __init__(self, **kwargs): | ||||||
|  |         self._current_index = 0 | ||||||
|  |         kwargs["option_factory"] = self.next_option | ||||||
|  |         kwargs["parse_option_key"] = lambda x: unify(str(x)) | ||||||
|  |  | ||||||
|  |         super().__init__(**kwargs) | ||||||
|  |  | ||||||
|  |     def next_option(self, value: Any) -> Optional[Option]: | ||||||
|  |         o = Option(value=value, keys=[self._current_index], text=f"{self._current_index:0>2}: {value}") | ||||||
|  |         self._current_index += 1 | ||||||
|  |         return o | ||||||
|  |  | ||||||
|  |  | ||||||
|  | class GenreSelect(StringSelect): | ||||||
|  |     @staticmethod | ||||||
|  |     def is_valid_genre(genre: Path) -> bool: | ||||||
|  |         """ | ||||||
|  |         gets the name of all subdirectories of shared.MUSIC_DIR, | ||||||
|  |         but filters out all directories, where the name matches with any Patern | ||||||
|  |         from shared.NOT_A_GENRE_REGEX. | ||||||
|  |         """ | ||||||
|  |         if not genre.is_dir(): | ||||||
|  |             return False | ||||||
|  |  | ||||||
|  |         if any(re.match(regex_pattern, genre.name) for regex_pattern in main_settings["not_a_genre_regex"]): | ||||||
|  |             return False | ||||||
|  |  | ||||||
|  |         return True | ||||||
|  |  | ||||||
|  |     def __init__(self): | ||||||
|  |         super().__init__(sort=True, raw_options=(genre.name for genre in filter(self.is_valid_genre, main_settings["music_directory"].iterdir()))) | ||||||
|  |  | ||||||
| @@ -1,327 +0,0 @@ | |||||||
| from typing import Tuple, Type, Dict, Set, Optional, List |  | ||||||
| from collections import defaultdict |  | ||||||
| from pathlib import Path |  | ||||||
| import re |  | ||||||
| import logging |  | ||||||
|  |  | ||||||
| from . import FetchOptions, DownloadOptions |  | ||||||
| from .results import SearchResults |  | ||||||
| from ..objects import ( |  | ||||||
|     DatabaseObject as DataObject, |  | ||||||
|     Collection, |  | ||||||
|     Target, |  | ||||||
|     Source, |  | ||||||
|     Options, |  | ||||||
|     Song, |  | ||||||
|     Album, |  | ||||||
|     Artist, |  | ||||||
|     Label, |  | ||||||
| ) |  | ||||||
| from ..audio import write_metadata_to_target, correct_codec |  | ||||||
| from ..utils import output, BColors |  | ||||||
| from ..utils.string_processing import fit_to_file_system |  | ||||||
| from ..utils.config import youtube_settings, main_settings |  | ||||||
| from ..utils.path_manager import LOCATIONS |  | ||||||
| from ..utils.enums import SourceType, ALL_SOURCE_TYPES |  | ||||||
| from ..utils.support_classes.download_result import DownloadResult |  | ||||||
| from ..utils.support_classes.query import Query |  | ||||||
| from ..utils.support_classes.download_result import DownloadResult |  | ||||||
| from ..utils.exception import MKMissingNameException |  | ||||||
| from ..utils.exception.download import UrlNotFoundException |  | ||||||
| from ..utils.shared import DEBUG_PAGES |  | ||||||
|  |  | ||||||
| from ..pages import Page, EncyclopaediaMetallum, Musify, YouTube, YoutubeMusic, Bandcamp, INDEPENDENT_DB_OBJECTS |  | ||||||
|  |  | ||||||
|  |  | ||||||
| ALL_PAGES: Set[Type[Page]] = { |  | ||||||
|     # EncyclopaediaMetallum, |  | ||||||
|     Musify, |  | ||||||
|     YoutubeMusic, |  | ||||||
|     Bandcamp |  | ||||||
| } |  | ||||||
|  |  | ||||||
| if youtube_settings["use_youtube_alongside_youtube_music"]: |  | ||||||
|     ALL_PAGES.add(YouTube) |  | ||||||
|  |  | ||||||
| AUDIO_PAGES: Set[Type[Page]] = { |  | ||||||
|     Musify, |  | ||||||
|     YouTube, |  | ||||||
|     YoutubeMusic, |  | ||||||
|     Bandcamp |  | ||||||
| } |  | ||||||
|  |  | ||||||
| SHADY_PAGES: Set[Type[Page]] = { |  | ||||||
|     Musify, |  | ||||||
| } |  | ||||||
|  |  | ||||||
| fetch_map = { |  | ||||||
|     Song: "fetch_song", |  | ||||||
|     Album: "fetch_album", |  | ||||||
|     Artist: "fetch_artist", |  | ||||||
|     Label: "fetch_label", |  | ||||||
| } |  | ||||||
|  |  | ||||||
| if DEBUG_PAGES: |  | ||||||
|     DEBUGGING_PAGE = Bandcamp |  | ||||||
|     print(f"Only downloading from page {DEBUGGING_PAGE}.") |  | ||||||
|  |  | ||||||
|     ALL_PAGES = {DEBUGGING_PAGE} |  | ||||||
|     AUDIO_PAGES = ALL_PAGES.union(AUDIO_PAGES) |  | ||||||
|  |  | ||||||
|  |  | ||||||
| class Pages: |  | ||||||
|     def __init__(self, exclude_pages: Set[Type[Page]] = None, exclude_shady: bool = False, download_options: DownloadOptions = None, fetch_options: FetchOptions = None): |  | ||||||
|         self.LOGGER = logging.getLogger("download") |  | ||||||
|          |  | ||||||
|         self.download_options: DownloadOptions = download_options or DownloadOptions() |  | ||||||
|         self.fetch_options: FetchOptions = fetch_options or FetchOptions() |  | ||||||
|  |  | ||||||
|         # initialize all page instances |  | ||||||
|         self._page_instances: Dict[Type[Page], Page] = dict() |  | ||||||
|         self._source_to_page: Dict[SourceType, Type[Page]] = dict() |  | ||||||
|          |  | ||||||
|         exclude_pages = exclude_pages if exclude_pages is not None else set() |  | ||||||
|          |  | ||||||
|         if exclude_shady: |  | ||||||
|             exclude_pages = exclude_pages.union(SHADY_PAGES) |  | ||||||
|          |  | ||||||
|         if not exclude_pages.issubset(ALL_PAGES): |  | ||||||
|             raise ValueError(f"The excluded pages have to be a subset of all pages: {exclude_pages} | {ALL_PAGES}") |  | ||||||
|          |  | ||||||
|         def _set_to_tuple(page_set: Set[Type[Page]]) -> Tuple[Type[Page], ...]: |  | ||||||
|             return tuple(sorted(page_set, key=lambda page: page.__name__)) |  | ||||||
|          |  | ||||||
|         self._pages_set: Set[Type[Page]] = ALL_PAGES.difference(exclude_pages) |  | ||||||
|         self.pages: Tuple[Type[Page], ...] = _set_to_tuple(self._pages_set) |  | ||||||
|  |  | ||||||
|         self._audio_pages_set: Set[Type[Page]] = self._pages_set.intersection(AUDIO_PAGES) |  | ||||||
|         self.audio_pages: Tuple[Type[Page], ...] = _set_to_tuple(self._audio_pages_set) |  | ||||||
|          |  | ||||||
|         for page_type in self.pages: |  | ||||||
|             self._page_instances[page_type] = page_type(fetch_options=self.fetch_options, download_options=self.download_options) |  | ||||||
|             self._source_to_page[page_type.SOURCE_TYPE] = page_type |  | ||||||
|  |  | ||||||
|     def _get_page_from_enum(self, source_page: SourceType) -> Page: |  | ||||||
|         if source_page not in self._source_to_page: |  | ||||||
|             return None |  | ||||||
|         return self._page_instances[self._source_to_page[source_page]] |  | ||||||
|  |  | ||||||
|     def search(self, query: Query) -> SearchResults: |  | ||||||
|         result = SearchResults() |  | ||||||
|          |  | ||||||
|         for page_type in self.pages: |  | ||||||
|             result.add( |  | ||||||
|                 page=page_type, |  | ||||||
|                 search_result=self._page_instances[page_type].search(query=query) |  | ||||||
|             ) |  | ||||||
|              |  | ||||||
|         return result |  | ||||||
|      |  | ||||||
|     def fetch_details(self, data_object: DataObject, stop_at_level: int = 1, **kwargs) -> DataObject: |  | ||||||
|         if not isinstance(data_object, INDEPENDENT_DB_OBJECTS): |  | ||||||
|             return data_object |  | ||||||
|          |  | ||||||
|         source: Source |  | ||||||
|         for source in data_object.source_collection.get_sources(source_type_sorting={ |  | ||||||
|             "only_with_page": True, |  | ||||||
|         }): |  | ||||||
|             new_data_object = self.fetch_from_source(source=source, stop_at_level=stop_at_level) |  | ||||||
|             if new_data_object is not None: |  | ||||||
|                 data_object.merge(new_data_object) |  | ||||||
|  |  | ||||||
|         return data_object |  | ||||||
|  |  | ||||||
|     def fetch_from_source(self, source: Source, **kwargs) -> Optional[DataObject]: |  | ||||||
|         if not source.has_page: |  | ||||||
|             return None |  | ||||||
|          |  | ||||||
|         source_type = source.page.get_source_type(source=source) |  | ||||||
|         if source_type is None: |  | ||||||
|             self.LOGGER.debug(f"Could not determine source type for {source}.") |  | ||||||
|             return None |  | ||||||
|  |  | ||||||
|         func = getattr(source.page, fetch_map[source_type]) |  | ||||||
|          |  | ||||||
|         # fetching the data object and marking it as fetched |  | ||||||
|         data_object: DataObject = func(source=source, **kwargs) |  | ||||||
|         data_object.mark_as_fetched(source.hash_url) |  | ||||||
|         return data_object |  | ||||||
|  |  | ||||||
|     def fetch_from_url(self, url: str) -> Optional[DataObject]: |  | ||||||
|         source = Source.match_url(url, ALL_SOURCE_TYPES.MANUAL) |  | ||||||
|         if source is None: |  | ||||||
|             return None |  | ||||||
|          |  | ||||||
|         return self.fetch_from_source(source=source) |  | ||||||
|      |  | ||||||
|     def _skip_object(self, data_object: DataObject) -> bool: |  | ||||||
|         if isinstance(data_object, Album): |  | ||||||
|             if not self.download_options.download_all and data_object.album_type in self.download_options.album_type_blacklist: |  | ||||||
|                 return True |  | ||||||
|          |  | ||||||
|         return False |  | ||||||
|  |  | ||||||
|     def download(self, data_object: DataObject, genre: str, **kwargs) -> DownloadResult: |  | ||||||
|         # fetch the given object |  | ||||||
|         self.fetch_details(data_object) |  | ||||||
|         output(f"\nDownloading {data_object.option_string}...", color=BColors.BOLD) |  | ||||||
|          |  | ||||||
|         # fetching all parent objects (e.g. if you only download a song) |  | ||||||
|         if not kwargs.get("fetched_upwards", False): |  | ||||||
|             to_fetch: List[DataObject] = [data_object] |  | ||||||
|  |  | ||||||
|             while len(to_fetch) > 0: |  | ||||||
|                 new_to_fetch = [] |  | ||||||
|                 for d in to_fetch: |  | ||||||
|                     if self._skip_object(d): |  | ||||||
|                         continue |  | ||||||
|  |  | ||||||
|                     self.fetch_details(d) |  | ||||||
|  |  | ||||||
|                     for c in d.get_parent_collections(): |  | ||||||
|                         new_to_fetch.extend(c) |  | ||||||
|  |  | ||||||
|                 to_fetch = new_to_fetch |  | ||||||
|              |  | ||||||
|             kwargs["fetched_upwards"] = True |  | ||||||
|          |  | ||||||
|         # download all children |  | ||||||
|         download_result: DownloadResult = DownloadResult() |  | ||||||
|         for c in data_object.get_child_collections(): |  | ||||||
|             for d in c: |  | ||||||
|                 if self._skip_object(d): |  | ||||||
|                     continue |  | ||||||
|  |  | ||||||
|                 download_result.merge(self.download(d, genre, **kwargs)) |  | ||||||
|  |  | ||||||
|         # actually download if the object is a song |  | ||||||
|         if isinstance(data_object, Song): |  | ||||||
|             """ |  | ||||||
|             TODO |  | ||||||
|             add the traced artist and album to the naming. |  | ||||||
|             I am able to do that, because duplicate values are removed later on. |  | ||||||
|             """ |  | ||||||
|  |  | ||||||
|             self._download_song(data_object, naming={ |  | ||||||
|                 "genre": [genre], |  | ||||||
|                 "audio_format": [main_settings["audio_format"]], |  | ||||||
|             }) |  | ||||||
|  |  | ||||||
|         return download_result |  | ||||||
|  |  | ||||||
|     def _extract_fields_from_template(self, path_template: str) -> Set[str]: |  | ||||||
|         return set(re.findall(r"{([^}]+)}", path_template)) |  | ||||||
|  |  | ||||||
|     def _parse_path_template(self, path_template: str, naming: Dict[str, List[str]]) -> str: |  | ||||||
|         field_names: Set[str] = self._extract_fields_from_template(path_template) |  | ||||||
|          |  | ||||||
|         for field in field_names: |  | ||||||
|             if len(naming[field]) == 0: |  | ||||||
|                 raise MKMissingNameException(f"Missing field for {field}.") |  | ||||||
|  |  | ||||||
|             path_template = path_template.replace(f"{{{field}}}", naming[field][0]) |  | ||||||
|  |  | ||||||
|         return path_template |  | ||||||
|  |  | ||||||
|     def _download_song(self, song: Song, naming: dict) -> DownloadOptions: |  | ||||||
|         """ |  | ||||||
|         TODO |  | ||||||
|         Search the song in the file system. |  | ||||||
|         """ |  | ||||||
|         r = DownloadResult(total=1) |  | ||||||
|          |  | ||||||
|         # pre process the data recursively |  | ||||||
|         song.compile() |  | ||||||
|          |  | ||||||
|         # manage the naming |  | ||||||
|         naming: Dict[str, List[str]] = defaultdict(list, naming) |  | ||||||
|         naming["song"].append(song.title_value) |  | ||||||
|         naming["isrc"].append(song.isrc) |  | ||||||
|         naming["album"].extend(a.title_value for a in song.album_collection) |  | ||||||
|         naming["album_type"].extend(a.album_type.value for a in song.album_collection) |  | ||||||
|         naming["artist"].extend(a.name for a in song.artist_collection) |  | ||||||
|         naming["artist"].extend(a.name for a in song.feature_artist_collection) |  | ||||||
|         for a in song.album_collection: |  | ||||||
|             naming["label"].extend([l.title_value for l in a.label_collection]) |  | ||||||
|         # removing duplicates from the naming, and process the strings |  | ||||||
|         for key, value in naming.items(): |  | ||||||
|             # https://stackoverflow.com/a/17016257 |  | ||||||
|             naming[key] = list(dict.fromkeys(value)) |  | ||||||
|         song.genre = naming["genre"][0] |  | ||||||
|  |  | ||||||
|         # manage the targets |  | ||||||
|         tmp: Target = Target.temp(file_extension=main_settings["audio_format"]) |  | ||||||
|  |  | ||||||
|         song.target_collection.append(Target( |  | ||||||
|             relative_to_music_dir=True, |  | ||||||
|             file_path=Path( |  | ||||||
|                 self._parse_path_template(main_settings["download_path"], naming=naming),  |  | ||||||
|                 self._parse_path_template(main_settings["download_file"], naming=naming), |  | ||||||
|             ) |  | ||||||
|         )) |  | ||||||
|         for target in song.target_collection: |  | ||||||
|             if target.exists: |  | ||||||
|                 output(f'{target.file_path} {BColors.OKGREEN.value}[already exists]', color=BColors.GREY) |  | ||||||
|                 r.found_on_disk += 1 |  | ||||||
|  |  | ||||||
|                 if not self.download_options.download_again_if_found: |  | ||||||
|                     target.copy_content(tmp) |  | ||||||
|             else: |  | ||||||
|                 target.create_path() |  | ||||||
|                 output(f'{target.file_path}', color=BColors.GREY) |  | ||||||
|  |  | ||||||
|         # this streams from every available source until something succeeds, setting the skip intervals to the values of the according source |  | ||||||
|         used_source: Optional[Source] = None |  | ||||||
|         skip_intervals: List[Tuple[float, float]] = [] |  | ||||||
|         for source in song.source_collection.get_sources(source_type_sorting={ |  | ||||||
|             "only_with_page": True, |  | ||||||
|             "sort_key": lambda page: page.download_priority, |  | ||||||
|             "reverse": True, |  | ||||||
|         }): |  | ||||||
|             if tmp.exists: |  | ||||||
|                 break |  | ||||||
|  |  | ||||||
|             used_source = source |  | ||||||
|             streaming_results = source.page.download_song_to_target(source=source, target=tmp, desc="download") |  | ||||||
|             skip_intervals = source.page.get_skip_intervals(song=song, source=source) |  | ||||||
|  |  | ||||||
|             # if something has been downloaded but it somehow failed, delete the file |  | ||||||
|             if streaming_results.is_fatal_error and tmp.exists: |  | ||||||
|                 tmp.delete() |  | ||||||
|  |  | ||||||
|         # if everything went right, the file should exist now |  | ||||||
|         if not tmp.exists: |  | ||||||
|             if used_source is None: |  | ||||||
|                 r.error_message = f"No source found for {song.option_string}." |  | ||||||
|             else: |  | ||||||
|                 r.error_message = f"Something went wrong downloading {song.option_string}." |  | ||||||
|             return r |  | ||||||
|  |  | ||||||
|         # post process the audio |  | ||||||
|         found_on_disk = used_source is None |  | ||||||
|         if not found_on_disk or self.download_options.process_audio_if_found: |  | ||||||
|             correct_codec(target=tmp, skip_intervals=skip_intervals) |  | ||||||
|             r.sponsor_segments = len(skip_intervals) |  | ||||||
|  |  | ||||||
|         if used_source is not None: |  | ||||||
|             used_source.page.post_process_hook(song=song, temp_target=tmp) |  | ||||||
|  |  | ||||||
|         if not found_on_disk or self.download_options.process_metadata_if_found: |  | ||||||
|             write_metadata_to_target(metadata=song.metadata, target=tmp, song=song) |  | ||||||
|  |  | ||||||
|         # copy the tmp target to the final locations |  | ||||||
|         for target in song.target_collection: |  | ||||||
|             tmp.copy_content(target) |  | ||||||
|  |  | ||||||
|         tmp.delete() |  | ||||||
|         return r |  | ||||||
|  |  | ||||||
|     def fetch_url(self, url: str, stop_at_level: int = 2) -> Tuple[Type[Page], DataObject]: |  | ||||||
|         source = Source.match_url(url, ALL_SOURCE_TYPES.MANUAL) |  | ||||||
|          |  | ||||||
|         if source is None: |  | ||||||
|             raise UrlNotFoundException(url=url) |  | ||||||
|          |  | ||||||
|         _actual_page = self._source_to_page[source.source_type] |  | ||||||
|          |  | ||||||
|         return _actual_page, self._page_instances[_actual_page].fetch_object_from_source(source=source, stop_at_level=stop_at_level) |  | ||||||
| @@ -1,8 +1,12 @@ | |||||||
| from typing import Tuple, Type, Dict, List, Generator, Union | from __future__ import annotations | ||||||
|  |  | ||||||
| from dataclasses import dataclass | from dataclasses import dataclass | ||||||
|  | from typing import TYPE_CHECKING, Dict, Generator, List, Tuple, Type, Union | ||||||
|  |  | ||||||
| from ..objects import DatabaseObject | from ..objects import DatabaseObject | ||||||
| from ..pages import Page, EncyclopaediaMetallum, Musify |  | ||||||
|  | if TYPE_CHECKING: | ||||||
|  |     from . import Page | ||||||
|  |  | ||||||
|  |  | ||||||
| @dataclass | @dataclass | ||||||
|   | |||||||
| @@ -59,4 +59,6 @@ class Artwork: | |||||||
|                 self._variant_mapping[key] = value |                 self._variant_mapping[key] = value | ||||||
|  |  | ||||||
|     def __eq__(self, other: Artwork) -> bool: |     def __eq__(self, other: Artwork) -> bool: | ||||||
|  |         if not isinstance(other, Artwork): | ||||||
|  |             return False | ||||||
|         return any(a == b for a, b in zip(self._variant_mapping.keys(), other._variant_mapping.keys())) |         return any(a == b for a, b in zip(self._variant_mapping.keys(), other._variant_mapping.keys())) | ||||||
|   | |||||||
| @@ -38,11 +38,19 @@ class FormattedText: | |||||||
|     def markdown(self) -> str: |     def markdown(self) -> str: | ||||||
|         return md(self.html).strip() |         return md(self.html).strip() | ||||||
|      |      | ||||||
|  |     @markdown.setter | ||||||
|  |     def markdown(self, value: str) -> None: | ||||||
|  |         self.html = mistune.markdown(value) | ||||||
|  |  | ||||||
|     @property |     @property | ||||||
|     def plain(self) -> str: |     def plain(self) -> str: | ||||||
|         md = self.markdown |         md = self.markdown | ||||||
|         return md.replace("\n\n", "\n") |         return md.replace("\n\n", "\n") | ||||||
|      |      | ||||||
|  |     @plain.setter | ||||||
|  |     def plain(self, value: str) -> None: | ||||||
|  |         self.html = mistune.markdown(plain_to_markdown(value)) | ||||||
|  |  | ||||||
|     def __str__(self) -> str: |     def __str__(self) -> str: | ||||||
|         return self.markdown |         return self.markdown | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,7 +1,52 @@ | |||||||
| from .encyclopaedia_metallum import EncyclopaediaMetallum | import importlib | ||||||
| from .musify import Musify | import inspect | ||||||
| from .youtube import YouTube | import logging | ||||||
| from .youtube_music import YoutubeMusic | import pkgutil | ||||||
| from .bandcamp import Bandcamp | import sys | ||||||
|  | from collections import defaultdict | ||||||
|  | from copy import copy | ||||||
|  | from pathlib import Path | ||||||
|  | from typing import Dict, Generator, List, Set, Type | ||||||
|  |  | ||||||
| from .abstract import Page, INDEPENDENT_DB_OBJECTS | from ._bandcamp import Bandcamp | ||||||
|  | from ._encyclopaedia_metallum import EncyclopaediaMetallum | ||||||
|  | from ._genius import Genius | ||||||
|  | from ._musify import Musify | ||||||
|  | from ._youtube import YouTube | ||||||
|  | from ._youtube_music import YoutubeMusic | ||||||
|  |  | ||||||
|  |  | ||||||
|  | def import_children(): | ||||||
|  |     _page_directory = Path(__file__).parent | ||||||
|  |     _stem_blacklist = set(["__pycache__", "__init__"]) | ||||||
|  |  | ||||||
|  |     for _file in _page_directory.iterdir(): | ||||||
|  |         if _file.stem in _stem_blacklist: | ||||||
|  |             continue | ||||||
|  |          | ||||||
|  |         logging.debug(f"importing {_file.absolute()}") | ||||||
|  |         exec(f"from . import {_file.stem}") | ||||||
|  |  | ||||||
|  | # module_blacklist = set(sys.modules.keys()) | ||||||
|  | import_children() | ||||||
|  |  | ||||||
|  | """ | ||||||
|  | classes = set() | ||||||
|  |  | ||||||
|  | print(__name__) | ||||||
|  | for module_name, module in sys.modules.items(): | ||||||
|  |     if module_name in module_blacklist or not module_name.startswith(__name__): | ||||||
|  |         continue | ||||||
|  |  | ||||||
|  |     print("scanning module", module_name) | ||||||
|  |     for name, obj in inspect.getmembers(module, predicate=inspect.isclass): | ||||||
|  |         _module = obj.__module__ | ||||||
|  |         if _module.startswith(__name__) and hasattr(obj, "SOURCE_TYPE"): | ||||||
|  |             print("checking object", name, obj.__module__) | ||||||
|  |             classes.add(obj) | ||||||
|  |     print() | ||||||
|  |  | ||||||
|  | print(*(c.__name__ for c in classes), sep=",\t") | ||||||
|  |  | ||||||
|  | __all__ = [c.__name__ for c in classes] | ||||||
|  | """ | ||||||
| @@ -1,33 +1,22 @@ | |||||||
| from typing import List, Optional, Type |  | ||||||
| from urllib.parse import urlparse, urlunparse |  | ||||||
| import json | import json | ||||||
| from enum import Enum | from enum import Enum | ||||||
| from bs4 import BeautifulSoup | from typing import List, Optional, Type | ||||||
| import pycountry | from urllib.parse import urlparse, urlunparse | ||||||
|  | 
 | ||||||
|  | import pycountry | ||||||
|  | from bs4 import BeautifulSoup | ||||||
| 
 | 
 | ||||||
| from ..objects import Source, DatabaseObject |  | ||||||
| from .abstract import Page |  | ||||||
| from ..objects import ( |  | ||||||
|     Artist, |  | ||||||
|     Source, |  | ||||||
|     SourceType, |  | ||||||
|     Song, |  | ||||||
|     Album, |  | ||||||
|     Label, |  | ||||||
|     Target, |  | ||||||
|     Contact, |  | ||||||
|     ID3Timestamp, |  | ||||||
|     Lyrics, |  | ||||||
|     FormattedText, |  | ||||||
|     Artwork, |  | ||||||
| ) |  | ||||||
| from ..connection import Connection | from ..connection import Connection | ||||||
|  | from ..download import Page | ||||||
|  | from ..objects import (Album, Artist, Artwork, Contact, DatabaseObject, | ||||||
|  |                        FormattedText, ID3Timestamp, Label, Lyrics, Song, | ||||||
|  |                        Source, SourceType, Target) | ||||||
| from ..utils import dump_to_file | from ..utils import dump_to_file | ||||||
| from ..utils.enums import SourceType, ALL_SOURCE_TYPES | from ..utils.config import logging_settings, main_settings | ||||||
| from ..utils.support_classes.download_result import DownloadResult | from ..utils.enums import ALL_SOURCE_TYPES, SourceType | ||||||
| from ..utils.string_processing import clean_song_title |  | ||||||
| from ..utils.config import main_settings, logging_settings |  | ||||||
| from ..utils.shared import DEBUG | from ..utils.shared import DEBUG | ||||||
|  | from ..utils.string_processing import clean_song_title | ||||||
|  | from ..utils.support_classes.download_result import DownloadResult | ||||||
| 
 | 
 | ||||||
| if DEBUG: | if DEBUG: | ||||||
|     from ..utils import dump_to_file |     from ..utils import dump_to_file | ||||||
| @@ -1,31 +1,20 @@ | |||||||
| from collections import defaultdict | from collections import defaultdict | ||||||
| from typing import List, Optional, Dict, Type, Union | from typing import Dict, List, Optional, Type, Union | ||||||
| from bs4 import BeautifulSoup | from urllib.parse import urlencode, urlparse | ||||||
|  | 
 | ||||||
| import pycountry | import pycountry | ||||||
| from urllib.parse import urlparse, urlencode | from bs4 import BeautifulSoup | ||||||
| 
 | 
 | ||||||
| from ..connection import Connection | from ..connection import Connection | ||||||
| from ..utils.config import logging_settings | from ..download import Page | ||||||
| from .abstract import Page | from ..objects import (Album, Artist, DatabaseObject, FormattedText, | ||||||
| from ..utils.enums import SourceType, ALL_SOURCE_TYPES |                        ID3Timestamp, Label, Lyrics, Options, Song, Source) | ||||||
| from ..utils.enums.album import AlbumType |  | ||||||
| from ..utils.support_classes.query import Query |  | ||||||
| from ..objects import ( |  | ||||||
|     Lyrics, |  | ||||||
|     Artist, |  | ||||||
|     Source, |  | ||||||
|     Song, |  | ||||||
|     Album, |  | ||||||
|     ID3Timestamp, |  | ||||||
|     FormattedText, |  | ||||||
|     Label, |  | ||||||
|     Options, |  | ||||||
|     DatabaseObject |  | ||||||
| ) |  | ||||||
| from ..utils.shared import DEBUG |  | ||||||
| from ..utils import dump_to_file | from ..utils import dump_to_file | ||||||
| 
 | from ..utils.config import logging_settings | ||||||
| 
 | from ..utils.enums import ALL_SOURCE_TYPES, SourceType | ||||||
|  | from ..utils.enums.album import AlbumType | ||||||
|  | from ..utils.shared import DEBUG | ||||||
|  | from ..utils.support_classes.query import Query | ||||||
| 
 | 
 | ||||||
| ALBUM_TYPE_MAP: Dict[str, AlbumType] = defaultdict(lambda: AlbumType.OTHER, { | ALBUM_TYPE_MAP: Dict[str, AlbumType] = defaultdict(lambda: AlbumType.OTHER, { | ||||||
|     "Full-length": AlbumType.STUDIO_ALBUM, |     "Full-length": AlbumType.STUDIO_ALBUM, | ||||||
| @@ -207,6 +196,7 @@ def create_grid( | |||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
| class EncyclopaediaMetallum(Page): | class EncyclopaediaMetallum(Page): | ||||||
|  |     REGISTER = False | ||||||
|     SOURCE_TYPE = ALL_SOURCE_TYPES.ENCYCLOPAEDIA_METALLUM |     SOURCE_TYPE = ALL_SOURCE_TYPES.ENCYCLOPAEDIA_METALLUM | ||||||
|     LOGGER = logging_settings["metal_archives_logger"] |     LOGGER = logging_settings["metal_archives_logger"] | ||||||
|      |      | ||||||
							
								
								
									
										286
									
								
								music_kraken/pages/_genius.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										286
									
								
								music_kraken/pages/_genius.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,286 @@ | |||||||
|  | import json | ||||||
|  | from enum import Enum | ||||||
|  | from typing import List, Optional, Type | ||||||
|  | from urllib.parse import urlencode, urlparse, urlunparse | ||||||
|  |  | ||||||
|  | import pycountry | ||||||
|  | from bs4 import BeautifulSoup | ||||||
|  |  | ||||||
|  | from ..connection import Connection | ||||||
|  | from ..download import Page | ||||||
|  | from ..objects import (Album, Artist, Artwork, Contact, DatabaseObject, | ||||||
|  |                        FormattedText, ID3Timestamp, Label, Lyrics, Song, | ||||||
|  |                        Source, SourceType, Target) | ||||||
|  | from ..utils import dump_to_file, traverse_json_path | ||||||
|  | from ..utils.config import logging_settings, main_settings | ||||||
|  | from ..utils.enums import ALL_SOURCE_TYPES, SourceType | ||||||
|  | from ..utils.shared import DEBUG | ||||||
|  | from ..utils.string_processing import clean_song_title | ||||||
|  | from ..utils.support_classes.download_result import DownloadResult | ||||||
|  |  | ||||||
|  | if DEBUG: | ||||||
|  |     from ..utils import dump_to_file | ||||||
|  |  | ||||||
|  |  | ||||||
|  | class Genius(Page): | ||||||
|  |     SOURCE_TYPE = ALL_SOURCE_TYPES.GENIUS | ||||||
|  |     HOST = "genius.com" | ||||||
|  |  | ||||||
|  |     def __init__(self, *args, **kwargs): | ||||||
|  |         self.connection: Connection = Connection( | ||||||
|  |             host="https://genius.com/", | ||||||
|  |             logger=self.LOGGER, | ||||||
|  |             module="genius", | ||||||
|  |         ) | ||||||
|  |  | ||||||
|  |         super().__init__(*args, **kwargs) | ||||||
|  |  | ||||||
|  |     def get_source_type(self, source: Source) -> Optional[Type[DatabaseObject]]: | ||||||
|  |         path = source.parsed_url.path.replace("/", "") | ||||||
|  |          | ||||||
|  |         if path.startswith("artists"): | ||||||
|  |             return Artist | ||||||
|  |         if path.startswith("albums"): | ||||||
|  |             return Album | ||||||
|  |  | ||||||
|  |         return Song | ||||||
|  |  | ||||||
|  |     def add_to_artwork(self, artwork: Artwork, url: str): | ||||||
|  |         if url is None: | ||||||
|  |             return | ||||||
|  |          | ||||||
|  |         url_frags = url.split(".") | ||||||
|  |         if len(url_frags) < 2: | ||||||
|  |             artwork.append(url=url) | ||||||
|  |             return | ||||||
|  |  | ||||||
|  |         dimensions = url_frags[-2].split("x") | ||||||
|  |         if len(dimensions) < 2: | ||||||
|  |             artwork.append(url=url) | ||||||
|  |             return | ||||||
|  |  | ||||||
|  |         if len(dimensions) == 3: | ||||||
|  |             dimensions = dimensions[:-1] | ||||||
|  |          | ||||||
|  |         try: | ||||||
|  |             artwork.append(url=url, width=int(dimensions[0]), height=int(dimensions[1])) | ||||||
|  |         except ValueError: | ||||||
|  |             artwork.append(url=url) | ||||||
|  |  | ||||||
|  |     def parse_api_object(self, data: dict) -> Optional[DatabaseObject]: | ||||||
|  |         if data is None: | ||||||
|  |             return None | ||||||
|  |         object_type = data.get("_type") | ||||||
|  |  | ||||||
|  |         artwork = Artwork() | ||||||
|  |         self.add_to_artwork(artwork, data.get("header_image_url")) | ||||||
|  |         self.add_to_artwork(artwork, data.get("image_url")) | ||||||
|  |          | ||||||
|  |         additional_sources: List[Source] = [] | ||||||
|  |         source: Source = Source(self.SOURCE_TYPE, data.get("url"), additional_data={ | ||||||
|  |             "id": data.get("id"), | ||||||
|  |             "slug": data.get("slug"), | ||||||
|  |             "api_path": data.get("api_path"), | ||||||
|  |         }) | ||||||
|  |  | ||||||
|  |         notes = FormattedText() | ||||||
|  |         description = data.get("description") or {} | ||||||
|  |         if "html" in description: | ||||||
|  |             notes.html = description["html"] | ||||||
|  |         elif "markdown" in description: | ||||||
|  |             notes.markdown = description["markdown"] | ||||||
|  |         elif "description_preview" in data: | ||||||
|  |             notes.plaintext = data["description_preview"] | ||||||
|  |  | ||||||
|  |         if source.url is None: | ||||||
|  |             return None | ||||||
|  |  | ||||||
|  |         if object_type == "artist": | ||||||
|  |             if data.get("instagram_name") is not None: | ||||||
|  |                 additional_sources.append(Source(ALL_SOURCE_TYPES.INSTAGRAM, f"https://www.instagram.com/{data['instagram_name']}/")) | ||||||
|  |             if data.get("facebook_name") is not None: | ||||||
|  |                 additional_sources.append(Source(ALL_SOURCE_TYPES.FACEBOOK, f"https://www.facebook.com/{data['facebook_name']}/")) | ||||||
|  |             if data.get("twitter_name") is not None: | ||||||
|  |                 additional_sources.append(Source(ALL_SOURCE_TYPES.TWITTER, f"https://x.com/{data['twitter_name']}/")) | ||||||
|  |  | ||||||
|  |             return Artist( | ||||||
|  |                 name=data["name"].strip() if data.get("name") is not None else None, | ||||||
|  |                 source_list=[source], | ||||||
|  |                 artwork=artwork, | ||||||
|  |                 notes=notes, | ||||||
|  |             ) | ||||||
|  |  | ||||||
|  |         if object_type == "album": | ||||||
|  |             self.add_to_artwork(artwork, data.get("cover_art_thumbnail_url")) | ||||||
|  |             self.add_to_artwork(artwork, data.get("cover_art_url")) | ||||||
|  |  | ||||||
|  |             for cover_art in data.get("cover_arts", []): | ||||||
|  |                 self.add_to_artwork(artwork, cover_art.get("image_url")) | ||||||
|  |                 self.add_to_artwork(artwork, cover_art.get("thumbnail_image_url")) | ||||||
|  |  | ||||||
|  |             return Album( | ||||||
|  |                 title=data.get("name").strip(), | ||||||
|  |                 source_list=[source], | ||||||
|  |                 artist_list=[self.parse_api_object(data.get("artist"))], | ||||||
|  |                 artwork=artwork, | ||||||
|  |                 date=ID3Timestamp(**data.get("release_date_components", {})), | ||||||
|  |             ) | ||||||
|  |  | ||||||
|  |         if object_type == "song": | ||||||
|  |             self.add_to_artwork(artwork, data.get("song_art_image_thumbnail_url")) | ||||||
|  |             self.add_to_artwork(artwork, data.get("song_art_image_url")) | ||||||
|  |  | ||||||
|  |             main_artist_list = [] | ||||||
|  |             featured_artist_list = [] | ||||||
|  |  | ||||||
|  |             _artist_name = None | ||||||
|  |             primary_artist = self.parse_api_object(data.get("primary_artist")) | ||||||
|  |             if primary_artist is not None: | ||||||
|  |                 _artist_name = primary_artist.name | ||||||
|  |                 main_artist_list.append(primary_artist) | ||||||
|  |             for feature_artist in (*(data.get("featured_artists") or []), *(data.get("producer_artists") or []), *(data.get("writer_artists") or [])): | ||||||
|  |                 artist = self.parse_api_object(feature_artist) | ||||||
|  |                 if artist is not None: | ||||||
|  |                     featured_artist_list.append(artist) | ||||||
|  |  | ||||||
|  |             return Song( | ||||||
|  |                 title=clean_song_title(data.get("title"), artist_name=_artist_name), | ||||||
|  |                 source_list=[source], | ||||||
|  |                 artwork=artwork, | ||||||
|  |                 feature_artist_list=featured_artist_list, | ||||||
|  |                 artist_list=main_artist_list, | ||||||
|  |             ) | ||||||
|  |  | ||||||
|  |         return None | ||||||
|  |  | ||||||
|  |     def general_search(self, search_query: str, **kwargs) -> List[DatabaseObject]: | ||||||
|  |         results = [] | ||||||
|  |  | ||||||
|  |         search_params = { | ||||||
|  |             "q": search_query, | ||||||
|  |         } | ||||||
|  |  | ||||||
|  |         r = self.connection.get("https://genius.com/api/search/multi?" + urlencode(search_params), name=f"search_{search_query}") | ||||||
|  |         if r is None: | ||||||
|  |             return results | ||||||
|  |  | ||||||
|  |         dump_to_file("search_genius.json", r.text, is_json=True, exit_after_dump=False) | ||||||
|  |         data = r.json() | ||||||
|  |  | ||||||
|  |         for elements in traverse_json_path(data, "response.sections", default=[]): | ||||||
|  |             hits = elements.get("hits", []) | ||||||
|  |             for hit in hits: | ||||||
|  |                 parsed = self.parse_api_object(hit.get("result")) | ||||||
|  |                 if parsed is not None: | ||||||
|  |                     results.append(parsed) | ||||||
|  |  | ||||||
|  |         return results | ||||||
|  |  | ||||||
|  |     def fetch_artist(self, source: Source, stop_at_level: int = 1) -> Artist: | ||||||
|  |         artist: Artist = Artist() | ||||||
|  |         # https://genius.com/api/artists/24527/albums?page=1 | ||||||
|  |  | ||||||
|  |         r = self.connection.get(source.url, name=source.url) | ||||||
|  |         if r is None: | ||||||
|  |             return artist | ||||||
|  |         soup = self.get_soup_from_response(r) | ||||||
|  |  | ||||||
|  |         # find the content attribute in the meta tag which is contained in the head | ||||||
|  |         data_container = soup.find("meta", {"itemprop": "page_data"}) | ||||||
|  |         if data_container is not None: | ||||||
|  |             content = data_container["content"] | ||||||
|  |             dump_to_file("genius_itemprop_artist.json", content, is_json=True, exit_after_dump=False) | ||||||
|  |             data = json.loads(content) | ||||||
|  |  | ||||||
|  |             artist = self.parse_api_object(data.get("artist")) | ||||||
|  |              | ||||||
|  |             for e in (data.get("artist_albums") or []): | ||||||
|  |                 r = self.parse_api_object(e) | ||||||
|  |                 if not isinstance(r, Album): | ||||||
|  |                     continue | ||||||
|  |  | ||||||
|  |                 artist.album_collection.append(r) | ||||||
|  |              | ||||||
|  |             for e in (data.get("artist_songs") or []): | ||||||
|  |                 r = self.parse_api_object(e) | ||||||
|  |                 if not isinstance(r, Song): | ||||||
|  |                     continue | ||||||
|  |  | ||||||
|  |                 """ | ||||||
|  |                 TODO | ||||||
|  |                 fetch the album for these songs, because the api doesn't  | ||||||
|  |                 return them | ||||||
|  |                 """ | ||||||
|  |  | ||||||
|  |                 artist.album_collection.extend(r.album_collection) | ||||||
|  |  | ||||||
|  |         artist.source_collection.append(source) | ||||||
|  |  | ||||||
|  |         return artist | ||||||
|  |  | ||||||
|  |     def fetch_album(self, source: Source, stop_at_level: int = 1) -> Album: | ||||||
|  |         album: Album = Album() | ||||||
|  |         # https://genius.com/api/artists/24527/albums?page=1 | ||||||
|  |  | ||||||
|  |         r = self.connection.get(source.url, name=source.url) | ||||||
|  |         if r is None: | ||||||
|  |             return album | ||||||
|  |         soup = self.get_soup_from_response(r) | ||||||
|  |  | ||||||
|  |         # find the content attribute in the meta tag which is contained in the head | ||||||
|  |         data_container = soup.find("meta", {"itemprop": "page_data"}) | ||||||
|  |         if data_container is not None: | ||||||
|  |             content = data_container["content"] | ||||||
|  |             dump_to_file("genius_itemprop_album.json", content, is_json=True, exit_after_dump=False) | ||||||
|  |             data = json.loads(content) | ||||||
|  |  | ||||||
|  |             album = self.parse_api_object(data.get("album")) | ||||||
|  |  | ||||||
|  |             for e in data.get("album_appearances", []): | ||||||
|  |                 r = self.parse_api_object(e.get("song")) | ||||||
|  |                 if not isinstance(r, Song): | ||||||
|  |                     continue | ||||||
|  |  | ||||||
|  |                 album.song_collection.append(r) | ||||||
|  |  | ||||||
|  |         album.source_collection.append(source) | ||||||
|  |          | ||||||
|  |         return album | ||||||
|  |  | ||||||
|  |     def get_json_content_from_response(self, response, start: str, end: str) -> Optional[str]: | ||||||
|  |         content = response.text | ||||||
|  |         start_index = content.find(start) | ||||||
|  |         if start_index < 0: | ||||||
|  |             return None | ||||||
|  |         start_index += len(start) | ||||||
|  |         end_index = content.find(end, start_index) | ||||||
|  |         if end_index < 0: | ||||||
|  |             return None | ||||||
|  |         return content[start_index:end_index] | ||||||
|  |  | ||||||
|  |     def fetch_song(self, source: Source, stop_at_level: int = 1) -> Song: | ||||||
|  |         song: Song = Song() | ||||||
|  |  | ||||||
|  |         r = self.connection.get(source.url, name=source.url) | ||||||
|  |         if r is None: | ||||||
|  |             return song | ||||||
|  |  | ||||||
|  |         # get the contents that are between `JSON.parse('` and `');` | ||||||
|  |         content = self.get_json_content_from_response(r, start="window.__PRELOADED_STATE__ = JSON.parse('", end="');\n      window.__APP_CONFIG__ = ") | ||||||
|  |         if content is not None: | ||||||
|  |             content = content.replace("\\\\", "\\").replace('\\"', '"').replace("\\'", "'") | ||||||
|  |             data = json.loads(content) | ||||||
|  |  | ||||||
|  |             lyrics_html = traverse_json_path(data, "songPage.lyricsData.body.html", default=None) | ||||||
|  |             if lyrics_html is not None: | ||||||
|  |                 song.lyrics_collection.append(Lyrics(FormattedText(html=lyrics_html))) | ||||||
|  |  | ||||||
|  |             dump_to_file("genius_song_script_json.json", content, is_json=True, exit_after_dump=False) | ||||||
|  |  | ||||||
|  |         soup = self.get_soup_from_response(r) | ||||||
|  |         for lyrics in soup.find_all("div", {"data-lyrics-container": "true"}): | ||||||
|  |             lyrics_object = Lyrics(FormattedText(html=lyrics.prettify())) | ||||||
|  |             song.lyrics_collection.append(lyrics_object) | ||||||
|  |  | ||||||
|  |         song.source_collection.append(source) | ||||||
|  |         return song | ||||||
| @@ -1,34 +1,23 @@ | |||||||
| from collections import defaultdict | from collections import defaultdict | ||||||
| from dataclasses import dataclass | from dataclasses import dataclass | ||||||
| from enum import Enum | from enum import Enum | ||||||
| from typing import List, Optional, Type, Union, Generator, Dict, Any | from typing import Any, Dict, Generator, List, Optional, Type, Union | ||||||
| from urllib.parse import urlparse | from urllib.parse import urlparse | ||||||
| 
 | 
 | ||||||
| import pycountry | import pycountry | ||||||
| from bs4 import BeautifulSoup | from bs4 import BeautifulSoup | ||||||
| 
 | 
 | ||||||
| from ..connection import Connection | from ..connection import Connection | ||||||
| from .abstract import Page | from ..download import Page | ||||||
| from ..utils.enums import SourceType, ALL_SOURCE_TYPES | from ..objects import (Album, Artist, Artwork, DatabaseObject, FormattedText, | ||||||
| from ..utils.enums.album import AlbumType, AlbumStatus |                        ID3Timestamp, Label, Lyrics, Song, Source, Target) | ||||||
| from ..objects import ( | from ..utils import shared, string_processing | ||||||
|     Artist, |  | ||||||
|     Source, |  | ||||||
|     Song, |  | ||||||
|     Album, |  | ||||||
|     ID3Timestamp, |  | ||||||
|     FormattedText, |  | ||||||
|     Label, |  | ||||||
|     Target, |  | ||||||
|     DatabaseObject, |  | ||||||
|     Lyrics, |  | ||||||
|     Artwork |  | ||||||
| ) |  | ||||||
| from ..utils.config import logging_settings, main_settings | from ..utils.config import logging_settings, main_settings | ||||||
| from ..utils import string_processing, shared | from ..utils.enums import ALL_SOURCE_TYPES, SourceType | ||||||
|  | from ..utils.enums.album import AlbumStatus, AlbumType | ||||||
| from ..utils.string_processing import clean_song_title | from ..utils.string_processing import clean_song_title | ||||||
| from ..utils.support_classes.query import Query |  | ||||||
| from ..utils.support_classes.download_result import DownloadResult | from ..utils.support_classes.download_result import DownloadResult | ||||||
|  | from ..utils.support_classes.query import Query | ||||||
| 
 | 
 | ||||||
| """ | """ | ||||||
| https://musify.club/artist/ghost-bath-280348?_pjax=#bodyContent | https://musify.club/artist/ghost-bath-280348?_pjax=#bodyContent | ||||||
| @@ -1,29 +1,19 @@ | |||||||
| from typing import List, Optional, Type, Tuple |  | ||||||
| from urllib.parse import urlparse, urlunparse, parse_qs |  | ||||||
| from enum import Enum | from enum import Enum | ||||||
|  | from typing import List, Optional, Tuple, Type | ||||||
|  | from urllib.parse import parse_qs, urlparse, urlunparse | ||||||
| 
 | 
 | ||||||
| import python_sponsorblock | import python_sponsorblock | ||||||
| 
 | 
 | ||||||
| from ..objects import Source, DatabaseObject, Song, Target |  | ||||||
| from .abstract import Page |  | ||||||
| from ..objects import ( |  | ||||||
|     Artist, |  | ||||||
|     Source, |  | ||||||
|     Song, |  | ||||||
|     Album, |  | ||||||
|     Label, |  | ||||||
|     Target, |  | ||||||
|     FormattedText, |  | ||||||
|     ID3Timestamp |  | ||||||
| ) |  | ||||||
| from ..connection import Connection | from ..connection import Connection | ||||||
|  | from ..download import Page | ||||||
|  | from ..objects import (Album, Artist, DatabaseObject, FormattedText, | ||||||
|  |                        ID3Timestamp, Label, Song, Source, Target) | ||||||
|  | from ..utils.config import logging_settings, main_settings, youtube_settings | ||||||
|  | from ..utils.enums import ALL_SOURCE_TYPES, SourceType | ||||||
| from ..utils.string_processing import clean_song_title | from ..utils.string_processing import clean_song_title | ||||||
| from ..utils.enums import SourceType, ALL_SOURCE_TYPES |  | ||||||
| from ..utils.support_classes.download_result import DownloadResult | from ..utils.support_classes.download_result import DownloadResult | ||||||
| from ..utils.config import youtube_settings, main_settings, logging_settings | from ._youtube_music.super_youtube import (SuperYouTube, YouTubeUrl, | ||||||
| 
 |                                            YouTubeUrlType, get_invidious_url) | ||||||
| from .youtube_music.super_youtube import SuperYouTube, YouTubeUrl, get_invidious_url, YouTubeUrlType |  | ||||||
| 
 |  | ||||||
| 
 | 
 | ||||||
| """ | """ | ||||||
| - https://yt.artemislena.eu/api/v1/search?q=Zombiez+-+Topic&page=1&date=none&type=channel&duration=none&sort=relevance | - https://yt.artemislena.eu/api/v1/search?q=Zombiez+-+Topic&page=1&date=none&type=channel&duration=none&sort=relevance | ||||||
| @@ -38,7 +28,7 @@ def get_piped_url(path: str = "", params: str = "", query: str = "", fragment: s | |||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
| class YouTube(SuperYouTube): | class YouTube(SuperYouTube): | ||||||
|     # CHANGE |     REGISTER = youtube_settings["use_youtube_alongside_youtube_music"] | ||||||
|     SOURCE_TYPE = ALL_SOURCE_TYPES.YOUTUBE |     SOURCE_TYPE = ALL_SOURCE_TYPES.YOUTUBE | ||||||
| 
 | 
 | ||||||
|     def __init__(self, *args, **kwargs): |     def __init__(self, *args, **kwargs): | ||||||
| @@ -3,7 +3,6 @@ from enum import Enum | |||||||
| 
 | 
 | ||||||
| from ...utils.config import logging_settings | from ...utils.config import logging_settings | ||||||
| from ...objects import Source, DatabaseObject | from ...objects import Source, DatabaseObject | ||||||
| from ..abstract import Page |  | ||||||
| from ...objects import ( | from ...objects import ( | ||||||
|     Artist, |     Artist, | ||||||
|     Source, |     Source, | ||||||
| @@ -6,7 +6,6 @@ from ...utils.string_processing import clean_song_title | |||||||
| from ...utils.enums import SourceType, ALL_SOURCE_TYPES | from ...utils.enums import SourceType, ALL_SOURCE_TYPES | ||||||
| 
 | 
 | ||||||
| from ...objects import Source, DatabaseObject | from ...objects import Source, DatabaseObject | ||||||
| from ..abstract import Page |  | ||||||
| from ...objects import ( | from ...objects import ( | ||||||
|     Artist, |     Artist, | ||||||
|     Source, |     Source, | ||||||
| @@ -1,26 +1,17 @@ | |||||||
| from typing import List, Optional, Type, Tuple |  | ||||||
| from urllib.parse import urlparse, urlunparse, parse_qs |  | ||||||
| from enum import Enum | from enum import Enum | ||||||
| import requests | from typing import List, Optional, Tuple, Type | ||||||
|  | from urllib.parse import parse_qs, urlparse, urlunparse | ||||||
| 
 | 
 | ||||||
| import python_sponsorblock | import python_sponsorblock | ||||||
|  | import requests | ||||||
| 
 | 
 | ||||||
| from ...objects import Source, DatabaseObject, Song, Target |  | ||||||
| from ..abstract import Page |  | ||||||
| from ...objects import ( |  | ||||||
|     Artist, |  | ||||||
|     Source, |  | ||||||
|     Song, |  | ||||||
|     Album, |  | ||||||
|     Label, |  | ||||||
|     Target, |  | ||||||
|     FormattedText, |  | ||||||
|     ID3Timestamp |  | ||||||
| ) |  | ||||||
| from ...connection import Connection | from ...connection import Connection | ||||||
|  | from ...download import Page | ||||||
|  | from ...objects import (Album, Artist, DatabaseObject, FormattedText, | ||||||
|  |                         ID3Timestamp, Label, Song, Source, Target) | ||||||
|  | from ...utils.config import logging_settings, main_settings, youtube_settings | ||||||
|  | from ...utils.enums import ALL_SOURCE_TYPES, SourceType | ||||||
| from ...utils.support_classes.download_result import DownloadResult | from ...utils.support_classes.download_result import DownloadResult | ||||||
| from ...utils.config import youtube_settings, logging_settings, main_settings |  | ||||||
| from ...utils.enums import SourceType, ALL_SOURCE_TYPES |  | ||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
| def get_invidious_url(path: str = "", params: str = "", query: str = "", fragment: str = "") -> str: | def get_invidious_url(path: str = "", params: str = "", query: str = "", fragment: str = "") -> str: | ||||||
| @@ -1,46 +1,33 @@ | |||||||
| from __future__ import unicode_literals, annotations | from __future__ import annotations, unicode_literals | ||||||
| 
 | 
 | ||||||
| from typing import Dict, List, Optional, Set, Type | import json | ||||||
| from urllib.parse import urlparse, urlunparse, quote, parse_qs, urlencode |  | ||||||
| import logging | import logging | ||||||
| import random | import random | ||||||
| import json |  | ||||||
| from dataclasses import dataclass |  | ||||||
| import re | import re | ||||||
| from functools import lru_cache |  | ||||||
| from collections import defaultdict | from collections import defaultdict | ||||||
|  | from dataclasses import dataclass | ||||||
|  | from functools import lru_cache | ||||||
|  | from typing import Dict, List, Optional, Set, Type | ||||||
|  | from urllib.parse import parse_qs, quote, urlencode, urlparse, urlunparse | ||||||
| 
 | 
 | ||||||
| import youtube_dl | import youtube_dl | ||||||
| from youtube_dl.extractor.youtube import YoutubeIE | from youtube_dl.extractor.youtube import YoutubeIE | ||||||
| from youtube_dl.utils import DownloadError | from youtube_dl.utils import DownloadError | ||||||
| 
 | 
 | ||||||
|  | from ...connection import Connection | ||||||
|  | from ...download import Page | ||||||
|  | from ...objects import Album, Artist, Artwork | ||||||
|  | from ...objects import DatabaseObject as DataObject | ||||||
|  | from ...objects import (FormattedText, ID3Timestamp, Label, Lyrics, Song, | ||||||
|  |                         Source, Target) | ||||||
|  | from ...utils import dump_to_file, get_current_millis, traverse_json_path | ||||||
|  | from ...utils.config import logging_settings, main_settings, youtube_settings | ||||||
|  | from ...utils.enums import ALL_SOURCE_TYPES, SourceType | ||||||
|  | from ...utils.enums.album import AlbumType | ||||||
| from ...utils.exception.config import SettingValueError | from ...utils.exception.config import SettingValueError | ||||||
| from ...utils.config import main_settings, youtube_settings, logging_settings |  | ||||||
| from ...utils.shared import DEBUG, DEBUG_YOUTUBE_INITIALIZING | from ...utils.shared import DEBUG, DEBUG_YOUTUBE_INITIALIZING | ||||||
| from ...utils.string_processing import clean_song_title | from ...utils.string_processing import clean_song_title | ||||||
| from ...utils import get_current_millis, traverse_json_path |  | ||||||
| 
 |  | ||||||
| from ...utils import dump_to_file |  | ||||||
| 
 |  | ||||||
| from ..abstract import Page |  | ||||||
| from ...objects import ( |  | ||||||
|     DatabaseObject as DataObject, |  | ||||||
|     Source, |  | ||||||
|     FormattedText, |  | ||||||
|     ID3Timestamp, |  | ||||||
|     Artwork, |  | ||||||
|     Artist, |  | ||||||
|     Song, |  | ||||||
|     Album, |  | ||||||
|     Label, |  | ||||||
|     Target, |  | ||||||
|     Lyrics, |  | ||||||
| ) |  | ||||||
| from ...connection import Connection |  | ||||||
| from ...utils.enums import SourceType, ALL_SOURCE_TYPES |  | ||||||
| from ...utils.enums.album import AlbumType |  | ||||||
| from ...utils.support_classes.download_result import DownloadResult | from ...utils.support_classes.download_result import DownloadResult | ||||||
| 
 |  | ||||||
| from ._list_render import parse_renderer | from ._list_render import parse_renderer | ||||||
| from ._music_object_render import parse_run_element | from ._music_object_render import parse_run_element | ||||||
| from .super_youtube import SuperYouTube | from .super_youtube import SuperYouTube | ||||||
| @@ -549,6 +536,11 @@ class YoutubeMusic(SuperYouTube): | |||||||
|         return album |         return album | ||||||
| 
 | 
 | ||||||
|     def fetch_lyrics(self, video_id: str, playlist_id: str = None) -> str: |     def fetch_lyrics(self, video_id: str, playlist_id: str = None) -> str: | ||||||
|  |         """ | ||||||
|  |         1. fetches the tabs of a song, to get the browse id | ||||||
|  |         2. finds the browse id of the lyrics | ||||||
|  |         3. fetches the lyrics with the browse id | ||||||
|  |         """ | ||||||
|         request_data = { |         request_data = { | ||||||
|             "context": {**self.credentials.context, "adSignalsInfo": {"params": []}}, |             "context": {**self.credentials.context, "adSignalsInfo": {"params": []}}, | ||||||
|             "videoId": video_id, |             "videoId": video_id, | ||||||
| @@ -575,6 +567,7 @@ class YoutubeMusic(SuperYouTube): | |||||||
|             pageType = traverse_json_path(tab, "tabRenderer.endpoint.browseEndpoint.browseEndpointContextSupportedConfigs.browseEndpointContextMusicConfig.pageType", default="") |             pageType = traverse_json_path(tab, "tabRenderer.endpoint.browseEndpoint.browseEndpointContextSupportedConfigs.browseEndpointContextMusicConfig.pageType", default="") | ||||||
|             if pageType in ("MUSIC_TAB_TYPE_LYRICS", "MUSIC_PAGE_TYPE_TRACK_LYRICS") or "lyrics" in pageType.lower(): |             if pageType in ("MUSIC_TAB_TYPE_LYRICS", "MUSIC_PAGE_TYPE_TRACK_LYRICS") or "lyrics" in pageType.lower(): | ||||||
|                 browse_id = traverse_json_path(tab, "tabRenderer.endpoint.browseEndpoint.browseId", default=None) |                 browse_id = traverse_json_path(tab, "tabRenderer.endpoint.browseEndpoint.browseId", default=None) | ||||||
|  |                 if browse_id is not None: | ||||||
|                     break |                     break | ||||||
| 
 | 
 | ||||||
|         if browse_id is None: |         if browse_id is None: | ||||||
| @@ -721,7 +714,6 @@ class YoutubeMusic(SuperYouTube): | |||||||
| 
 | 
 | ||||||
|         self.download_values_by_url[source.url] = { |         self.download_values_by_url[source.url] = { | ||||||
|             "url": _best_format.get("url"), |             "url": _best_format.get("url"), | ||||||
|             "chunk_size": _best_format.get("downloader_options", {}).get("http_chunk_size", main_settings["chunk_size"]), |  | ||||||
|             "headers": _best_format.get("http_headers", {}), |             "headers": _best_format.get("http_headers", {}), | ||||||
|         } |         } | ||||||
| 
 | 
 | ||||||
| @@ -1,157 +0,0 @@ | |||||||
| import logging |  | ||||||
| import random |  | ||||||
| import re |  | ||||||
| from copy import copy |  | ||||||
| from pathlib import Path |  | ||||||
| from typing import Optional, Union, Type, Dict, Set, List, Tuple, TypedDict |  | ||||||
| from string import Formatter |  | ||||||
| from dataclasses import dataclass, field |  | ||||||
|  |  | ||||||
| import requests |  | ||||||
| from bs4 import BeautifulSoup |  | ||||||
|  |  | ||||||
| from ..connection import Connection |  | ||||||
| from ..objects import ( |  | ||||||
|     Song, |  | ||||||
|     Source, |  | ||||||
|     Album, |  | ||||||
|     Artist, |  | ||||||
|     Target, |  | ||||||
|     DatabaseObject, |  | ||||||
|     Options, |  | ||||||
|     Collection, |  | ||||||
|     Label, |  | ||||||
| ) |  | ||||||
| from ..utils.enums import SourceType |  | ||||||
| from ..utils.enums.album import AlbumType |  | ||||||
| from ..audio import write_metadata_to_target, correct_codec |  | ||||||
| from ..utils.config import main_settings |  | ||||||
| from ..utils.support_classes.query import Query |  | ||||||
| from ..utils.support_classes.download_result import DownloadResult |  | ||||||
| from ..utils.string_processing import fit_to_file_system |  | ||||||
| from ..utils import trace, output, BColors |  | ||||||
|  |  | ||||||
| INDEPENDENT_DB_OBJECTS = Union[Label, Album, Artist, Song] |  | ||||||
| INDEPENDENT_DB_TYPES = Union[Type[Song], Type[Album], Type[Artist], Type[Label]] |  | ||||||
|  |  | ||||||
| @dataclass |  | ||||||
| class FetchOptions: |  | ||||||
|     download_all: bool = False |  | ||||||
|     album_type_blacklist: Set[AlbumType] = field(default_factory=lambda: set(AlbumType(a) for a in main_settings["album_type_blacklist"])) |  | ||||||
|  |  | ||||||
| @dataclass |  | ||||||
| class DownloadOptions: |  | ||||||
|     download_all: bool = False |  | ||||||
|     album_type_blacklist: Set[AlbumType] = field(default_factory=lambda: set(AlbumType(a) for a in main_settings["album_type_blacklist"])) |  | ||||||
|  |  | ||||||
|     process_audio_if_found: bool = False |  | ||||||
|     process_metadata_if_found: bool = True |  | ||||||
|  |  | ||||||
| class Page: |  | ||||||
|     SOURCE_TYPE: SourceType |  | ||||||
|     LOGGER: logging.Logger |  | ||||||
|  |  | ||||||
|     def __new__(cls, *args, **kwargs): |  | ||||||
|         cls.LOGGER = logging.getLogger(cls.__name__) |  | ||||||
|  |  | ||||||
|         return super().__new__(cls) |  | ||||||
|  |  | ||||||
|     def __init__(self, download_options: DownloadOptions = None, fetch_options: FetchOptions = None): |  | ||||||
|         self.SOURCE_TYPE.register_page(self) |  | ||||||
|          |  | ||||||
|         self.download_options: DownloadOptions = download_options or DownloadOptions() |  | ||||||
|         self.fetch_options: FetchOptions = fetch_options or FetchOptions() |  | ||||||
|  |  | ||||||
|     def _search_regex(self, pattern, string, default=None, fatal=True, flags=0, group=None): |  | ||||||
|         """ |  | ||||||
|         Perform a regex search on the given string, using a single or a list of |  | ||||||
|         patterns returning the first matching group. |  | ||||||
|         In case of failure return a default value or raise a WARNING or a |  | ||||||
|         RegexNotFoundError, depending on fatal, specifying the field name. |  | ||||||
|         """ |  | ||||||
|  |  | ||||||
|         if isinstance(pattern, str): |  | ||||||
|             mobj = re.search(pattern, string, flags) |  | ||||||
|         else: |  | ||||||
|             for p in pattern: |  | ||||||
|                 mobj = re.search(p, string, flags) |  | ||||||
|                 if mobj: |  | ||||||
|                     break |  | ||||||
|  |  | ||||||
|         if mobj: |  | ||||||
|             if group is None: |  | ||||||
|                 # return the first matching group |  | ||||||
|                 return next(g for g in mobj.groups() if g is not None) |  | ||||||
|             elif isinstance(group, (list, tuple)): |  | ||||||
|                 return tuple(mobj.group(g) for g in group) |  | ||||||
|             else: |  | ||||||
|                 return mobj.group(group) |  | ||||||
|  |  | ||||||
|         return default |  | ||||||
|  |  | ||||||
|     def get_source_type(self, source: Source) -> Optional[Type[DatabaseObject]]: |  | ||||||
|         return None |  | ||||||
|  |  | ||||||
|     def get_soup_from_response(self, r: requests.Response) -> BeautifulSoup: |  | ||||||
|         return BeautifulSoup(r.content, "html.parser") |  | ||||||
|  |  | ||||||
|     # to search stuff |  | ||||||
|     def search(self, query: Query) -> List[DatabaseObject]: |  | ||||||
|         music_object = query.music_object |  | ||||||
|  |  | ||||||
|         search_functions = { |  | ||||||
|             Song: self.song_search, |  | ||||||
|             Album: self.album_search, |  | ||||||
|             Artist: self.artist_search, |  | ||||||
|             Label: self.label_search |  | ||||||
|         } |  | ||||||
|  |  | ||||||
|         if type(music_object) in search_functions: |  | ||||||
|             r = search_functions[type(music_object)](music_object) |  | ||||||
|             if r is not None and len(r) > 0: |  | ||||||
|                 return r |  | ||||||
|  |  | ||||||
|         r = [] |  | ||||||
|         for default_query in query.default_search: |  | ||||||
|             for single_option in self.general_search(default_query): |  | ||||||
|                 r.append(single_option) |  | ||||||
|  |  | ||||||
|         return r |  | ||||||
|  |  | ||||||
|     def general_search(self, search_query: str) -> List[DatabaseObject]: |  | ||||||
|         return [] |  | ||||||
|  |  | ||||||
|     def label_search(self, label: Label) -> List[Label]: |  | ||||||
|         return [] |  | ||||||
|  |  | ||||||
|     def artist_search(self, artist: Artist) -> List[Artist]: |  | ||||||
|         return [] |  | ||||||
|  |  | ||||||
|     def album_search(self, album: Album) -> List[Album]: |  | ||||||
|         return [] |  | ||||||
|  |  | ||||||
|     def song_search(self, song: Song) -> List[Song]: |  | ||||||
|         return [] |  | ||||||
|  |  | ||||||
|     # to fetch stuff |  | ||||||
|     def fetch_song(self, source: Source, stop_at_level: int = 1) -> Song: |  | ||||||
|         return Song() |  | ||||||
|  |  | ||||||
|     def fetch_album(self, source: Source, stop_at_level: int = 1) -> Album: |  | ||||||
|         return Album() |  | ||||||
|  |  | ||||||
|     def fetch_artist(self, source: Source, stop_at_level: int = 1) -> Artist: |  | ||||||
|         return Artist() |  | ||||||
|  |  | ||||||
|     def fetch_label(self, source: Source, stop_at_level: int = 1) -> Label: |  | ||||||
|         return Label() |  | ||||||
|  |  | ||||||
|     # to download stuff |  | ||||||
|     def get_skip_intervals(self, song: Song, source: Source) -> List[Tuple[float, float]]: |  | ||||||
|         return [] |  | ||||||
|  |  | ||||||
|     def post_process_hook(self, song: Song, temp_target: Target, **kwargs): |  | ||||||
|         pass |  | ||||||
|  |  | ||||||
|     def download_song_to_target(self, source: Source, target: Target, desc: str = None) -> DownloadResult: |  | ||||||
|         return DownloadResult() |  | ||||||
| @@ -17,6 +17,9 @@ class SourceType: | |||||||
|     def register_page(self, page: Page): |     def register_page(self, page: Page): | ||||||
|         self.page = page |         self.page = page | ||||||
|  |  | ||||||
|  |     def deregister_page(self): | ||||||
|  |         self.page = None | ||||||
|  |  | ||||||
|     def __hash__(self): |     def __hash__(self): | ||||||
|         return hash(self.name) |         return hash(self.name) | ||||||
|  |  | ||||||
|   | |||||||
| @@ -3,6 +3,9 @@ class MKBaseException(Exception): | |||||||
|         self.message = message |         self.message = message | ||||||
|         super().__init__(message, **kwargs) |         super().__init__(message, **kwargs) | ||||||
|  |  | ||||||
|  | # Compose exceptions. Those usually mean a bug on my side. | ||||||
|  | class MKComposeException(MKBaseException): | ||||||
|  |     pass | ||||||
|  |  | ||||||
| # Downloading | # Downloading | ||||||
| class MKDownloadException(MKBaseException): | class MKDownloadException(MKBaseException): | ||||||
|   | |||||||
| @@ -15,11 +15,11 @@ __stage__ = os.getenv("STAGE", "prod") | |||||||
| DEBUG = (__stage__ == "dev") and True | DEBUG = (__stage__ == "dev") and True | ||||||
| DEBUG_LOGGING = DEBUG and False | DEBUG_LOGGING = DEBUG and False | ||||||
| DEBUG_TRACE = DEBUG and True | DEBUG_TRACE = DEBUG and True | ||||||
| DEBUG_OBJECT_TRACE = DEBUG and True | DEBUG_OBJECT_TRACE = DEBUG and False | ||||||
| DEBUG_OBJECT_TRACE_CALLSTACK = DEBUG_OBJECT_TRACE and False | DEBUG_OBJECT_TRACE_CALLSTACK = DEBUG_OBJECT_TRACE and False | ||||||
| DEBUG_YOUTUBE_INITIALIZING = DEBUG and False | DEBUG_YOUTUBE_INITIALIZING = DEBUG and False | ||||||
| DEBUG_PAGES = DEBUG and False | DEBUG_PAGES = DEBUG and False | ||||||
| DEBUG_DUMP = DEBUG and False | DEBUG_DUMP = DEBUG and True | ||||||
| DEBUG_PRINT_ID = DEBUG and True | DEBUG_PRINT_ID = DEBUG and True | ||||||
|  |  | ||||||
| if DEBUG: | if DEBUG: | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user