music-kraken-core/src/music_kraken/objects/source.py

from collections import defaultdict
from enum import Enum
from typing import List, Dict, Tuple

from .metadata import Mapping, MetadataAttribute
from .parents import DatabaseObject
from .collection import Collection


class SourceTypes(Enum):
    """
    The kinds of entity a Source can be tagged with through its type_enum.

    Source.get_metadata only branches on SONG and ARTIST.
    """
    SONG = "song"
    ALBUM = "album"
    ARTIST = "artist"
    LYRICS = "lyrics"


class SourcePages(Enum):
    """
    All pages a source can belong to.

    The value of every member is the lowercase name of the page.
    """
    YOUTUBE = "youtube"
    MUSIFY = "musify"
    GENIUS = "genius"
    MUSICBRAINZ = "musicbrainz"
    ENCYCLOPAEDIA_METALLUM = "encyclopaedia metallum"
    BANDCAMP = "bandcamp"
    DEEZER = "deezer"
    SPOTIFY = "spotify"

    # These pages are not about audio, but bands can have a profile there.
    INSTAGRAM = "instagram"
    FACEBOOK = "facebook"
    TWITTER = "twitter"  # the author intends to go through nitter instead

    @classmethod
    def get_homepage(cls, attribute) -> str:
        """
        Look up the homepage url of a page.

        :param attribute: the member of this enum the homepage is wanted for
        :return: the homepage url of the given page
        :raises KeyError: if attribute is not a member of this enum
        """
        page_homepage_pairs = (
            (cls.YOUTUBE, "https://www.youtube.com/"),
            (cls.MUSIFY, "https://musify.club/"),
            (cls.MUSICBRAINZ, "https://musicbrainz.org/"),
            (cls.ENCYCLOPAEDIA_METALLUM, "https://www.metal-archives.com/"),
            (cls.GENIUS, "https://genius.com/"),
            (cls.BANDCAMP, "https://bandcamp.com/"),
            (cls.DEEZER, "https://www.deezer.com/"),
            (cls.INSTAGRAM, "https://www.instagram.com/"),
            (cls.FACEBOOK, "https://www.facebook.com/"),
            (cls.SPOTIFY, "https://open.spotify.com/"),
            (cls.TWITTER, "https://twitter.com/"),
        )
        homepage_by_page = dict(page_homepage_pairs)
        return homepage_by_page[attribute]


class Source(DatabaseObject, MetadataAttribute):
    """
    A single url on one of the pages listed in SourcePages, optionally
    tagged with the kind of entity (SourceTypes) it points to.

    create somehow like that
    ```python
    # url won't be a valid one due to it being just an example
    Source(SourcePages.YOUTUBE, url="https://youtu.be/dfnsdajlhkjhsd")
    ```
    """

    def __init__(self, page_enum: SourcePages, url: str, id_: str = None, type_enum=None) -> None:
        """
        :param page_enum: the page the url belongs to
        :param url: the url of the source
        :param id_: handed on to DatabaseObject.__init__
        :param type_enum: a SourceTypes member or None; get_metadata uses it
            to decide which metadata is produced
        """
        DatabaseObject.__init__(self, id_=id_)

        self.type_enum = type_enum
        self.page_enum = page_enum

        self.url = url

    @classmethod
    def match_url(cls, url: str):
        """
        Builds a Source by guessing the page from the url.

        this shouldn't be used, unless you are not certain what page the
        source is for, the reason being that it is more inefficient

        The checks run in the order written below and the first hit wins.
        There is no check for musify, genius or musicbrainz urls.

        :param url: the url a Source should be created for
        :return: a new Source without id and type, or None if no page matches
        """
        if url.startswith("https://www.youtube"):
            return cls(SourcePages.YOUTUBE, url)

        if url.startswith("https://www.deezer"):
            return cls(SourcePages.DEEZER, url)

        if url.startswith("https://open.spotify.com"):
            return cls(SourcePages.SPOTIFY, url)

        # substring instead of prefix check, so any url containing
        # "bandcamp" which was not matched above ends up here
        if "bandcamp" in url:
            return cls(SourcePages.BANDCAMP, url)

        if url.startswith("https://www.metal-archives.com/"):
            return cls(SourcePages.ENCYCLOPAEDIA_METALLUM, url)

        # the less important ones
        if url.startswith("https://www.facebook"):
            return cls(SourcePages.FACEBOOK, url)

        if url.startswith("https://www.instagram"):
            return cls(SourcePages.INSTAGRAM, url)

        if url.startswith("https://twitter"):
            return cls(SourcePages.TWITTER, url)

        # no known page matched
        return None

    def get_song_metadata(self) -> MetadataAttribute.Metadata:
        """
        :return: metadata with the url of this source as file webpage and
            the homepage of its page as source webpage
        """
        return MetadataAttribute.Metadata({
            Mapping.FILE_WEBPAGE_URL: [self.url],
            Mapping.SOURCE_WEBPAGE_URL: [self.homepage]
        })

    def get_artist_metadata(self) -> MetadataAttribute.Metadata:
        """
        :return: metadata with the url of this source as artist webpage
        """
        return MetadataAttribute.Metadata({
            Mapping.ARTIST_WEBPAGE_URL: [self.url]
        })

    def get_metadata(self) -> MetadataAttribute.Metadata:
        """
        Picks the metadata matching type_enum.

        :return: the song metadata for SourceTypes.SONG, the artist metadata
            for SourceTypes.ARTIST, else whatever the parent implementation
            of get_metadata returns
        """
        if self.type_enum == SourceTypes.SONG:
            return self.get_song_metadata()

        if self.type_enum == SourceTypes.ARTIST:
            return self.get_artist_metadata()

        return super().get_metadata()

    @property
    def indexing_values(self) -> List[Tuple[str, object]]:
        """
        :return: the (name, value) pairs of the id and the url of this source
        """
        return [
            ('id', self.id),
            ('url', self.url)
        ]

    def __str__(self):
        return self.__repr__()

    def __repr__(self) -> str:
        return f"Src({self.page_enum.value}: {self.url})"

    @property
    def page_str(self):
        """the value of page_enum"""
        return self.page_enum.value

    @property
    def type_str(self):
        """
        the value of type_enum, or None if no type was set

        type_enum defaults to None in __init__, so it must not be
        dereferenced unconditionally.
        """
        if self.type_enum is None:
            return None
        return self.type_enum.value

    @property
    def homepage(self):
        """the homepage url of the page this source belongs to"""
        return SourcePages.get_homepage(self.page_enum)


class SourceCollection(Collection):
    """
    A Collection of Source objects, which additionally keeps the sources
    grouped by the page they belong to.
    """

    def __init__(self, source_list: List[Source]):
        """
        :param source_list: the sources handed to Collection.__init__ as data
        """
        # The page index has to exist before the parent constructor runs.
        # Presumably Collection.__init__ maps the initial data through
        # map_element (confirm in Collection); creating the index afterwards
        # would then either fail on the missing attribute or throw the
        # grouping of the initial sources away again.
        self._page_to_source_list: Dict[SourcePages, List[Source]] = defaultdict(list)

        super().__init__(data=source_list, element_type=Source)

    def map_element(self, source: Source):
        """
        Maps the source like the parent class does and additionally files it
        under its page.

        :param source: the source to map
        """
        super().map_element(source)

        self._page_to_source_list[source.page_enum].append(source)

    def get_sources_from_page(self, source_page: SourcePages) -> List[Source]:
        """
        getting the sources for a specific page like
        YouTube or musify

        :param source_page: the page the sources are wanted for
        :return: the list of sources mapped for that page; the index is a
            defaultdict, so asking for a page without sources returns (and
            stores) an empty list
        """
        return self._page_to_source_list[source_page]


class SourceAttribute(DatabaseObject):
    """
    This is a class that is meant to be inherited from.
    it adds the source_list attribute to a class

    The sources are stored twice: grouped by page in _source_dict and keyed
    by url in source_url_map. The url map is what is used to detect
    duplicates, so both containers always have to be changed together.
    """
    _source_dict: Dict[SourcePages, List[Source]]
    source_url_map: Dict[str, Source]

    def __new__(cls, **kwargs):
        """
        Creates the instance together with its own, empty source containers.

        Doing this in __new__ means the containers exist before any __init__
        runs and are never shared between instances.
        """
        new = object.__new__(cls)
        new._source_dict = {page_enum: list() for page_enum in SourcePages}
        new.source_url_map = dict()
        return new

    def match_source_with_url(self, url: str) -> bool:
        """
        this function returns true, if a source with this url exists,
        else it returns false
        :param url:
        :return source_with_url_exists:
        """
        return url in self.source_url_map

    def match_source(self, source: Source) -> bool:
        """
        :param source: the source to look for
        :return: True if a source with the same url was already added
        """
        return self.match_source_with_url(source.url)

    def add_source(self, source: Source):
        """
        adds a new Source to the sources

        A source whose url is already known is ignored.
        """
        if self.match_source(source):
            return
        self.source_url_map[source.url] = source
        self._source_dict[source.page_enum].append(source)

    def get_sources_from_page(self, page_enum) -> List[Source]:
        """
        getting the sources for a specific page like
        youtube or musify
        """
        return self._source_dict[page_enum]

    def get_source_list(self) -> List[Source]:
        """
        gets all sources

        :return: a new flat list of all sources, ordered by page
        """
        return [source for page_list in self._source_dict.values() for source in page_list]

    def set_source_list(self, source_list: List[Source]):
        """
        Replaces all current sources with the given ones.

        :param source_list: the sources to store; duplicates by url are
            dropped by add_source
        """
        self._source_dict = {page_enum: list() for page_enum in SourcePages}
        # The url map has to be emptied as well. Otherwise add_source would
        # skip every source whose url was known before the reset, and
        # match_source_with_url would keep reporting the removed sources.
        self.source_url_map = dict()

        for source in source_list:
            self.add_source(source)

    def get_source_dict(self) -> Dict[object, List[Source]]:
        """
        gets a dictionary of all Sources,
        where the key is a page enum,
        and the value is a List with all sources of according page

        The dictionary returned is the internal one, not a copy.
        """
        return self._source_dict

    source_list: List[Source] = property(fget=get_source_list, fset=set_source_list)
    source_dict: Dict[object, List[Source]] = property(fget=get_source_dict)
refactorings 2023-03-09 21:14:39 +00:00			`from collections import defaultdict`
dasfh 2023-01-12 15:25:50 +00:00			`from enum import Enum`
implemented DatabaseObject.indexing_values for each data objects 2023-03-09 18:53:28 +00:00			`from typing import List, Dict, Tuple`
dasfh 2023-01-12 15:25:50 +00:00
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`from .metadata import Mapping, MetadataAttribute`
refactorings 2023-03-09 21:14:39 +00:00			`from .parents import DatabaseObject`
			`from .collection import Collection`
dasfh 2023-01-12 15:25:50 +00:00
added source to artist 2023-01-20 22:05:15 +00:00
			`class SourceTypes(Enum):`
daffasf 2023-01-16 14:37:04 +00:00			`SONG = "song"`
			`ALBUM = "album"`
			`ARTIST = "artist"`
			`LYRICS = "lyrics"`

added source to artist 2023-01-20 22:05:15 +00:00
			`class SourcePages(Enum):`
dasfh 2023-01-12 15:25:50 +00:00			`YOUTUBE = "youtube"`
added source to artist 2023-01-20 22:05:15 +00:00			`MUSIFY = "musify"`
daffasf 2023-01-16 14:37:04 +00:00			`GENIUS = "genius"`
			`MUSICBRAINZ = "musicbrainz"`
			`ENCYCLOPAEDIA_METALLUM = "encyclopaedia metallum"`
started implementation of fetching from ma artis sources 2023-01-31 23:07:13 +00:00			`BANDCAMP = "bandcamp"`
			`DEEZER = "deezer"`
			`SPOTIFY = "spotify"`

			`# This has nothing to do with audio, but bands can be here`
			`INSTAGRAM = "instagram"`
			`FACEBOOK = "facebook"`
			`TWITTER = "twitter" # I will use nitter though lol`
dasfh 2023-01-12 15:25:50 +00:00
			`@classmethod`
			`def get_homepage(cls, attribute) -> str:`
			`homepage_map = {`
added source to artist 2023-01-20 22:05:15 +00:00			`cls.YOUTUBE: "https://www.youtube.com/",`
			`cls.MUSIFY: "https://musify.club/",`
			`cls.MUSICBRAINZ: "https://musicbrainz.org/",`
daffasf 2023-01-16 14:37:04 +00:00			`cls.ENCYCLOPAEDIA_METALLUM: "https://www.metal-archives.com/",`
started implementation of fetching from ma artis sources 2023-01-31 23:07:13 +00:00			`cls.GENIUS: "https://genius.com/",`
			`cls.BANDCAMP: "https://bandcamp.com/",`
			`cls.DEEZER: "https://www.deezer.com/",`
			`cls.INSTAGRAM: "https://www.instagram.com/",`
			`cls.FACEBOOK: "https://www.facebook.com/",`
			`cls.SPOTIFY: "https://open.spotify.com/",`
			`cls.TWITTER: "https://twitter.com/"`
dasfh 2023-01-12 15:25:50 +00:00			`}`
			`return homepage_map[attribute]`


tried fixing shit 2023-03-02 06:59:53 +00:00			`class Source(DatabaseObject, MetadataAttribute):`
dasfh 2023-01-12 15:25:50 +00:00			`"""`
			`create somehow like that`
			```python
			`# url won't be a valid one due to it being just an example`
			`Source(src="youtube", url="https://youtu.be/dfnsdajlhkjhsd")`
			```
			`"""`

Update source.py 2023-03-03 06:52:13 +00:00			`def __init__(self, page_enum: SourcePages, url: str, id_: str = None, type_enum=None) -> None:`
dasfh 2023-01-12 15:25:50 +00:00			`DatabaseObject.__init__(self, id_=id_)`

added type to src 2023-01-20 09:56:40 +00:00			`self.type_enum = type_enum`
added source to artist 2023-01-20 22:05:15 +00:00			`self.page_enum = page_enum`

dasfh 2023-01-12 15:25:50 +00:00			`self.url = url`

added the fetching of the sources from ma regarding artists 2023-02-01 08:10:05 +00:00			`@classmethod`
			`def match_url(cls, url: str):`
			`"""`
			`this shouldn't be used, unlesse you are not certain what the source is for`
			`the reason is that it is more inefficient`
			`"""`
			`if url.startswith("https://www.youtube"):`
			`return cls(SourcePages.YOUTUBE, url)`

			`if url.startswith("https://www.deezer"):`
			`return cls(SourcePages.DEEZER, url)`

			`if url.startswith("https://open.spotify.com"):`
			`return cls(SourcePages.SPOTIFY, url)`

			`if "bandcamp" in url:`
			`return cls(SourcePages.BANDCAMP, url)`

			`if url.startswith("https://www.metal-archives.com/"):`
			`return cls(SourcePages.ENCYCLOPAEDIA_METALLUM, url)`

			`# the less important once`
			`if url.startswith("https://www.facebook"):`
			`return cls(SourcePages.FACEBOOK, url)`

			`if url.startswith("https://www.instagram"):`
			`return cls(SourcePages.INSTAGRAM, url)`

			`if url.startswith("https://twitter"):`
			`return cls(SourcePages.TWITTER, url)`

finished refactoring metadata 2023-01-30 13:41:02 +00:00			`def get_song_metadata(self) -> MetadataAttribute.Metadata:`
			`return MetadataAttribute.Metadata({`
			`Mapping.FILE_WEBPAGE_URL: [self.url],`
			`Mapping.SOURCE_WEBPAGE_URL: [self.homepage]`
			`})`

			`def get_artist_metadata(self) -> MetadataAttribute.Metadata:`
			`return MetadataAttribute.Metadata({`
			`Mapping.ARTIST_WEBPAGE_URL: [self.url]`
			`})`

			`def get_metadata(self) -> MetadataAttribute.Metadata:`
added source to artist 2023-01-20 22:05:15 +00:00			`if self.type_enum == SourceTypes.SONG:`
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`return self.get_song_metadata()`
added source to artist 2023-01-20 22:05:15 +00:00
			`if self.type_enum == SourceTypes.ARTIST:`
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`return self.get_artist_metadata()`
added artist attribute 2023-01-20 10:01:18 +00:00
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`return super().get_metadata()`
dfsa 2023-01-12 16:14:21 +00:00
implemented DatabaseObject.indexing_values for each data objects 2023-03-09 18:53:28 +00:00			`@property`
			`def indexing_values(self) -> List[Tuple[str, object]]:`
			`return [`
			`('id', self.id),`
			`('url', self.url)`
			`]`

dasfh 2023-01-12 15:25:50 +00:00			`def __str__(self):`
added the fetching of the sources from ma regarding artists 2023-02-01 08:10:05 +00:00			`return self.__repr__()`
dasfh 2023-01-12 15:25:50 +00:00
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`def __repr__(self) -> str:`
			`return f"Src({self.page_enum.value}: {self.url})"`

added source to artist 2023-01-20 22:05:15 +00:00			`page_str = property(fget=lambda self: self.page_enum.value)`
added type to src 2023-01-20 09:56:40 +00:00			`type_str = property(fget=lambda self: self.type_enum.value)`
added source to artist 2023-01-20 22:05:15 +00:00			`homepage = property(fget=lambda self: SourcePages.get_homepage(self.page_enum))`
source 2023-01-25 13:14:15 +00:00

refactorings 2023-03-09 21:14:39 +00:00			`class SourceCollection(Collection):`
			`def __init__(self, source_list: List[Source]):`
			`super().__init__(data=source_list, element_type=Source)`

			`self._page_to_source_list: Dict[SourcePages, List[Source]] = defaultdict(list)`

			`def map_element(self, source: Source):`
			`super().map_element(source)`

			`self._page_to_source_list[source.page_enum].append(source)`

			`def get_sources_from_page(self, source_page: SourcePages) -> List[Source]:`
			`"""`
			`getting the sources for a specific page like`
			`YouTube or musify`
			`"""`
			`return self._page_to_source_list[source_page]`


cvyxv 2023-03-06 14:20:26 +00:00			`class SourceAttribute(DatabaseObject):`
source 2023-01-25 13:14:15 +00:00			`"""`
			`This is a class that is meant to be inherited from.`
			`it adds the source_list attribute to a class`
			`"""`
refactored and cleaned up data objects 2023-02-25 21:16:32 +00:00			`_source_dict: Dict[SourcePages, List[Source]]`
started implementation of fetching from ma artis sources 2023-01-31 23:07:13 +00:00			`source_url_map: Dict[str, Source]`
fixed mutable argument bug in the source dict of SourceAttribute 2023-01-31 12:18:52 +00:00
renamed a var to follow more the python defaults 2023-01-31 12:28:27 +00:00			`def __new__(cls, **kwargs):`
fixed mutable argument bug in the source dict of SourceAttribute 2023-01-31 12:18:52 +00:00			`new = object.__new__(cls)`
			`new._source_dict = {page_enum: list() for page_enum in SourcePages}`
started implementation of fetching from ma artis sources 2023-01-31 23:07:13 +00:00			`new.source_url_map = dict()`
fixed mutable argument bug in the source dict of SourceAttribute 2023-01-31 12:18:52 +00:00			`return new`
source 2023-01-25 13:14:15 +00:00
started implementation of fetching from ma artis sources 2023-01-31 23:07:13 +00:00			`def match_source_with_url(self, url: str) -> bool:`
			`"""`
			`this function returns true, if a source with this url exists,`
			`else it returns false`
			`:param url:`
			`:return source_with_url_exists:`
			`"""`
			`return url in self.source_url_map`

			`def match_source(self, source: Source) -> bool:`
			`return self.match_source_with_url(source.url)`

source 2023-01-25 13:14:15 +00:00			`def add_source(self, source: Source):`
			`"""`
			`adds a new Source to the sources`
			`"""`
started implementation of fetching from ma artis sources 2023-01-31 23:07:13 +00:00			`if self.match_source(source):`
			`return`
			`self.source_url_map[source.url] = source`
metadata 2023-01-27 11:56:59 +00:00			`self._source_dict[source.page_enum].append(source)`
source 2023-01-25 13:14:15 +00:00
			`def get_sources_from_page(self, page_enum) -> List[Source]:`
			`"""`
			`getting the sources for a specific page like`
			`youtube or musify`
			`"""`
			`return self._source_dict[page_enum]`

			`def get_source_list(self) -> List[Source]:`
			`"""`
			`gets all sources`
			`"""`
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`return [item for _, page_list in self._source_dict.items() for item in page_list]`
metadata 2023-01-27 11:56:59 +00:00
			`def set_source_list(self, source_list: List[Source]):`
			`self._source_dict = {page_enum: list() for page_enum in SourcePages}`

			`for source in source_list:`
			`self.add_source(source)`
source 2023-01-25 13:14:15 +00:00
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`def get_source_dict(self) -> Dict[object, List[Source]]:`
source 2023-01-25 13:14:15 +00:00			`"""`
			`gets a dictionary of all Sources,`
			`where the key is a page enum,`
			`and the value is a List with all sources of according page`
			`"""`
			`return self._source_dict`

metadata 2023-01-27 11:56:59 +00:00			`source_list: List[Source] = property(fget=get_source_list, fset=set_source_list)`
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`source_dict: Dict[object, List[Source]] = property(fget=get_source_dict)`