music-kraken-core/src/music_kraken/__init__.py

import gc
import musicbrainzngs
import logging
import re
import os
from pathlib import Path
from typing import List

from . import objects, pages
from .utils.string_processing import fit_to_file_system
from .utils.shared import MUSIC_DIR, MODIFY_GC, NOT_A_GENRE_REGEX, get_random_message

if MODIFY_GC:
    # Let the garbage collector run less often, which should increase speed:
    # https://mkennedy.codes/posts/python-gc-settings-change-this-and-make-your-app-go-20pc-faster/

    # Collect everything that might already be garbage before changing the thresholds.
    gc.collect(2)

    # Start the GC sequence every 50K instead of every 700 allocations ...
    allocs = 50_000
    # ... and double the two remaining thresholds that are currently configured.
    gen1, gen2 = (threshold * 2 for threshold in gc.get_threshold()[1:])
    gc.set_threshold(allocs, gen1, gen2)

# Only let warnings (and worse) of the "musicbrainzngs" logger through.
logging.getLogger("musicbrainzngs").setLevel(logging.WARNING)
# Set the user agent of musicbrainzngs once, at import time of this package.
musicbrainzngs.set_useragent(
    "metadata receiver",
    "0.1",
    "https://github.com/HeIIow2/music-downloader",
)

# Matches the scheme and host at the beginning of a http(s) url.
# This has to be a raw string: "\w" and "\d" are meant for the regex engine
# and are invalid escape sequences inside a normal string literal.
URL_REGEX = r'https?://(?:[-\w.]|(?:%[\da-fA-F]{2}))+'
# Inputs which start the download of the current selection in the cli.
# They are compared literally (set membership), so "\\d" is the two
# characters backslash + d and not a regex.
DOWNLOAD_COMMANDS = {
    "ok",
    "download",
    "\\d",
    "hs"
}

# Inputs which end the cli.
EXIT_COMMANDS = {
    "exit",
    "quit"
}


def cli(genre: str = None):
    """
    Runs the interactive command line interface.

    If no genre is passed in, the user is asked to choose one of the existing
    genres or to create a new one. After that, queries are read from stdin and
    handled one by one, until a query requests to exit.

    :param genre: the genre to download to, if None it is asked for interactively
    """

    def get_existing_genre() -> List[str]:
        """
        gets the name of all subdirectories of shared.MUSIC_DIR,
        but filters out all directories, where the name matches with any pattern
        from shared.NOT_A_GENRE_REGEX.
        """
        existing_genres: List[str] = []

        # get all subdirectories of MUSIC_DIR, not the files in the dir.
        existing_subdirectories: List[Path] = [f for f in MUSIC_DIR.iterdir() if f.is_dir()]

        for subdirectory in existing_subdirectories:
            name: str = subdirectory.name

            if not any(re.match(regex_pattern, name) for regex_pattern in NOT_A_GENRE_REGEX):
                existing_genres.append(name)

        return existing_genres

    def get_genre():
        """
        Lists the existing genres with a 1-based id and asks the user
        until either a valid id is entered or the creation of a new genre is confirmed.

        :return: the name of the chosen or newly created genre
        """
        existing_genres = get_existing_genre()
        for i, genre_option in enumerate(existing_genres):
            print(f"{i+1:0>2}: {genre_option}")

        agree_inputs = {"y", "yes", "ok"}

        while True:
            user_input = input("Id or new genre: ")

            # isdecimal instead of isdigit, because isdigit is also true for
            # characters like "²", which int() can't convert.
            if user_input.isdecimal():
                genre_id = int(user_input) - 1
                # The lower bound matters as well: the input "0" results in the
                # index -1, which would silently select the last genre.
                if not 0 <= genre_id < len(existing_genres):
                    print(f"No genre under the id {genre_id+1}.")
                    continue

                return existing_genres[genre_id]

            new_genre = fit_to_file_system(user_input)

            verification = input(f"create new genre \"{new_genre}\"? (Y/N): ").lower()
            if verification in agree_inputs:
                return new_genre

    def next_search(_search: pages.Search, query: str, genre: str) -> bool:
        """
        Interprets one line of user input and applies it to the search.

        :param _search: the search the input is applied to
        :param query: the raw input of the user
        :param genre: the genre, which is passed on when downloading
        :return exit in the next step:
        """
        query: str = query.strip()
        parsed: str = query.lower()

        if parsed in EXIT_COMMANDS:
            return True

        # "." changes nothing, the caller just prints the search again.
        if parsed == ".":
            return False
        if parsed == "..":
            _search.goto_previous()
            return False

        # isdecimal instead of isdigit, so int() can't fail on input like "²".
        if parsed.isdecimal():
            _search.choose_index(int(parsed))
            return False

        if parsed in DOWNLOAD_COMMANDS:
            r = _search.download_chosen(genre=genre)

            print()
            print(r)
            print()

            # after a download the cli exits, unless the result is a mild failure
            return not r.is_mild_failure

        url = re.match(URL_REGEX, query)
        if url is not None:
            # url.string is the whole query, not only the part matched by the regex
            if not _search.search_url(url.string):
                print("The given url couldn't be found.")
            return False

        page = _search.get_page_from_query(parsed)
        if page is not None:
            _search.choose_page(page)
            return False

        # if everything else is not valid search
        _search.search(query)
        return False

    if genre is None:
        genre = get_genre()
        print()
    print(get_random_message())
    print()
    print(f"Downloading to: \"{genre}\"")
    print()

    search = pages.Search()

    while True:
        if next_search(search, input(">> "), genre):
            break
        print(search)

    print()
    print(get_random_message())
modified garbage collection to run a bit less often 2022-11-24 21:10:22 +00:00			`import gc`
refactored cli, removed switch case 2022-11-23 07:24:05 +00:00			`import musicbrainzngs`
			`import logging`
implemented direct download in the cli 2023-03-30 10:43:43 +00:00			`import re`
implemented genre in the cli 2023-04-04 20:30:14 +00:00			`import os`
drastically improved genre selection 2023-04-05 08:01:51 +00:00			`from pathlib import Path`
			`from typing import List`
refactored cli, removed switch case 2022-11-23 07:24:05 +00:00
cute messages 2023-04-04 18:19:29 +00:00			`from . import objects, pages`
drastically improved genre selection 2023-04-05 08:01:51 +00:00			`from .utils.string_processing import fit_to_file_system`
			`from .utils.shared import MUSIC_DIR, MODIFY_GC, NOT_A_GENRE_REGEX, get_random_message`
made gc modification optional 2023-04-04 20:07:56 +00:00
			`if MODIFY_GC:`
			`"""`
			`At the start I modify the garbage collector to run a bit fewer times.`
			`This should increase speed:`
			`https://mkennedy.codes/posts/python-gc-settings-change-this-and-make-your-app-go-20pc-faster/`
			`"""`
			`# Clean up what might be garbage so far.`
			`gc.collect(2)`

			`allocs, gen1, gen2 = gc.get_threshold()`
			`allocs = 50_000 # Start the GC sequence every 50K not 700 allocations.`
			`gen1 = gen1 * 2`
			`gen2 = gen2 * 2`
			`gc.set_threshold(allocs, gen1, gen2)`
modified garbage collection to run a bit less often 2022-11-24 21:10:22 +00:00
fixed dependency 2022-11-22 13:53:29 +00:00			`logging.getLogger("musicbrainzngs").setLevel(logging.WARNING)`
			`musicbrainzngs.set_useragent("metadata receiver", "0.1", "https://github.com/HeIIow2/music-downloader")`
implemented the ability to simply run the programm from terminal typing 'music-kraken' when installing with pip 2022-11-15 12:04:44 +00:00
small change 2023-04-04 19:27:27 +00:00			`URL_REGEX = 'https?://(?:[-\w.]\|(?:%[\da-fA-F]{2}))+'`
implemented downloading 2023-03-31 08:34:29 +00:00			`DOWNLOAD_COMMANDS = {`
			`"ok",`
			`"download",`
small change 2023-04-04 19:29:10 +00:00			`"\\d",`
implemented downloading 2023-03-31 08:34:29 +00:00			`"hs"`
			`}`
implemented direct download in the cli 2023-03-30 10:43:43 +00:00
cute messages 2023-04-04 18:19:29 +00:00			`EXIT_COMMANDS = {`
			`"exit",`
			`"quit"`
			`}`

ready for test build 2022-11-24 17:25:49 +00:00
implemented genre in the cli 2023-04-04 20:30:14 +00:00

drastically improved genre selection 2023-04-05 08:01:51 +00:00
cleaned up genre 2023-04-05 08:05:45 +00:00			`def cli(genre: str = None):`
drastically improved genre selection 2023-04-05 08:01:51 +00:00			`def get_existing_genre() -> List[str]:`
			`"""`
			`gets the name of all subdirectories of shared.MUSIC_DIR,`
			`but filters out all directories, where the name matches with any patern`
			`from shared.NOT_A_GENRE_REGEX.`
			`"""`
			`existing_genres: List[str] = []`

			`# get all subdirectories of MUSIC_DIR, not the files in the dir.`
			`existing_subdirectories: List[Path] = [f for f in MUSIC_DIR.iterdir() if f.is_dir()]`

			`for subdirectory in existing_subdirectories:`
			`name: str = subdirectory.name`

			`if not any(re.match(regex_pattern, name) for regex_pattern in NOT_A_GENRE_REGEX):`
			`existing_genres.append(name)`

			`return existing_genres`

			`def get_genre():`
implemented genre in the cli 2023-04-04 20:30:14 +00:00			`existing_genres = get_existing_genre()`
			`for i, genre_option in enumerate(existing_genres):`
drastically improved genre selection 2023-04-05 08:01:51 +00:00			`print(f"{i+1:0>2}: {genre_option}")`


			`while True:`
cleaned up genre 2023-04-05 08:05:45 +00:00			`genre = input("Id or new genre: ")`
drastically improved genre selection 2023-04-05 08:01:51 +00:00
			`if genre.isdigit():`
			`genre_id = int(genre) - 1`
			`if genre_id >= len(existing_genres):`
cleaned up genre 2023-04-05 08:05:45 +00:00			`print(f"No genre under the id {genre_id+1}.")`
drastically improved genre selection 2023-04-05 08:01:51 +00:00			`continue`

			`return existing_genres[genre_id]`

			`new_genre = fit_to_file_system(genre)`

			`agree_inputs = {"y", "yes", "ok"}`
			`verification = input(f"create new genre \"{new_genre}\"? (Y/N): ").lower()`
			`if verification in agree_inputs:`
			`return new_genre`

implemented genre in the cli 2023-04-04 20:30:14 +00:00			`def next_search(_search: pages.Search, query: str, genre: str) -> bool:`
cute messages 2023-04-04 18:19:29 +00:00			`"""`
small change 2023-04-04 19:26:37 +00:00			`:param _search:`
cute messages 2023-04-04 18:19:29 +00:00			`:param query:`
			`:return exit in the next step:`
			`"""`
moved cli to __init__.py 2023-03-30 08:49:17 +00:00			`query: str = query.strip()`
			`parsed: str = query.lower()`
cute messages 2023-04-04 18:19:29 +00:00
			`if parsed in EXIT_COMMANDS:`
			`return True`
implemented genre in the cli 2023-04-04 20:30:14 +00:00
moved cli to __init__.py 2023-03-30 08:49:17 +00:00			`if parsed == ".":`
cute messages 2023-04-04 18:19:29 +00:00			`return False`
moved cli to __init__.py 2023-03-30 08:49:17 +00:00			`if parsed == "..":`
small change 2023-04-04 19:26:37 +00:00			`_search.goto_previous()`
cute messages 2023-04-04 18:19:29 +00:00			`return False`
implemented genre in the cli 2023-04-04 20:30:14 +00:00
moved cli to __init__.py 2023-03-30 08:49:17 +00:00			`if parsed.isdigit():`
small change 2023-04-04 19:26:37 +00:00			`_search.choose_index(int(parsed))`
cute messages 2023-04-04 18:19:29 +00:00			`return False`
implemented genre in the cli 2023-04-04 20:30:14 +00:00
implemented downloading 2023-03-31 08:34:29 +00:00			`if parsed in DOWNLOAD_COMMANDS:`
implemented genre in the cli 2023-04-04 20:30:14 +00:00			`r = _search.download_chosen(genre=genre)`
improved 2023-04-04 19:18:56 +00:00
cute messages 2023-04-04 18:19:29 +00:00			`print()`
			`print(r)`
improved 2023-04-04 19:18:56 +00:00			`print()`

			`return not r.is_mild_failure`
changed download results and integrated them in the cli 2023-04-04 18:00:21 +00:00
small change 2023-04-04 19:27:27 +00:00			`url = re.match(URL_REGEX, query)`
implemented direct download in the cli 2023-03-30 10:43:43 +00:00			`if url is not None:`
small change 2023-04-04 19:26:37 +00:00			`if not _search.search_url(url.string):`
cute messages 2023-04-04 18:19:29 +00:00			`print("The given url couldn't be found.")`
			`return False`
implemented genre in the cli 2023-04-04 20:30:14 +00:00
small change 2023-04-04 19:26:37 +00:00			`page = _search.get_page_from_query(parsed)`
moved cli to __init__.py 2023-03-30 08:49:17 +00:00			`if page is not None:`
small change 2023-04-04 19:26:37 +00:00			`_search.choose_page(page)`
cute messages 2023-04-04 18:19:29 +00:00			`return False`
implemented genre in the cli 2023-04-04 20:30:14 +00:00
moved cli to __init__.py 2023-03-30 08:49:17 +00:00			`# if everything else is not valid search`
small change 2023-04-04 19:26:37 +00:00			`_search.search(query)`
cute messages 2023-04-04 18:19:29 +00:00			`return False`

cleaned up genre 2023-04-05 08:05:45 +00:00			`if genre is None:`
			`genre = get_genre()`
			`print()`
added message 2023-04-05 08:08:27 +00:00			`print(get_random_message())`
			`print()`
			`print(f"Downloading to: \"{genre}\"")`
			`print()`
implemented genre in the cli 2023-04-04 20:30:14 +00:00
moved cli to __init__.py 2023-03-30 08:49:17 +00:00			`search = pages.Search()`

added cli to __init__.py 2023-03-29 15:24:02 +00:00			`while True:`
implemented genre in the cli 2023-04-04 20:30:14 +00:00			`if next_search(search, input(">> "), genre):`
changed download results and integrated them in the cli 2023-04-04 18:00:21 +00:00			`break`
added cli to __init__.py 2023-03-29 15:24:02 +00:00			`print(search)`
cute messages 2023-04-04 18:19:29 +00:00
			`print()`
			`print(get_random_message())`