music-kraken-core/src/music_kraken/objects/source.py

from collections import defaultdict
from enum import Enum
from typing import List, Dict, Tuple, Optional
from urllib.parse import urlparse

from .metadata import Mapping, Metadata
from .parents import DatabaseObject
from .collection import Collection


class SourceTypes(Enum):
    """
    The kinds of things the url of a source can point at.

    `Source.metadata` compares `Source.type_enum` against these members
    to decide which metadata it builds.
    """
    SONG = "song"
    ALBUM = "album"
    ARTIST = "artist"
    LYRICS = "lyrics"


class SourcePages(Enum):
    """
    Every website a source can belong to.

    The value of each member is the lowercase name of the page.
    """
    YOUTUBE = "youtube"
    MUSIFY = "musify"
    GENIUS = "genius"
    MUSICBRAINZ = "musicbrainz"
    ENCYCLOPAEDIA_METALLUM = "encyclopaedia metallum"
    BANDCAMP = "bandcamp"
    DEEZER = "deezer"
    SPOTIFY = "spotify"

    # Not audio related, but bands tend to have a profile on these pages.
    INSTAGRAM = "instagram"
    FACEBOOK = "facebook"
    TWITTER = "twitter"     # nitter is going to be used for the access though
    MYSPACE = "myspace"     # ancient, yet it is still linked everywhere

    @classmethod
    def get_homepage(cls, attribute) -> str:
        """
        Look up the homepage url of a page.

        :param attribute: the member of this enum to get the homepage of
        :return: the url of the homepage, ending with a slash
        :raises KeyError: if `attribute` is not a member of this enum
        """
        # The table has to live inside the method: a dict assigned in the
        # body of an Enum class would be turned into an enum member.
        homepages = {
            cls.YOUTUBE: "https://www.youtube.com/",
            cls.MUSIFY: "https://musify.club/",
            cls.GENIUS: "https://genius.com/",
            cls.MUSICBRAINZ: "https://musicbrainz.org/",
            cls.ENCYCLOPAEDIA_METALLUM: "https://www.metal-archives.com/",
            cls.BANDCAMP: "https://bandcamp.com/",
            cls.DEEZER: "https://www.deezer.com/",
            cls.SPOTIFY: "https://open.spotify.com/",
            cls.INSTAGRAM: "https://www.instagram.com/",
            cls.FACEBOOK: "https://www.facebook.com/",
            cls.TWITTER: "https://twitter.com/",
            cls.MYSPACE: "https://myspace.com/",
        }
        return homepages[attribute]


class Source(DatabaseObject):
    """
    A url on one of the known pages (see SourcePages).

    Create it somehow like this:
    ```python
    # the url won't be a valid one due to it being just an example
    Source(SourcePages.YOUTUBE, "https://youtu.be/dfnsdajlhkjhsd")
    ```

    Attributes:
        type_enum: what the url points at; `metadata` compares it against
            SourceTypes.SONG and SourceTypes.ARTIST. None if not given.
        page_enum: the SourcePages member of the page the url belongs to.
        url: the url itself.
    """
    COLLECTION_ATTRIBUTES = tuple()
    SIMPLE_ATTRIBUTES = {
        "type_enum": None,
        "page_enum": None,
        "url": None
    }

    def __init__(self, page_enum: SourcePages, url: str, id_: str = None, type_enum=None) -> None:
        """
        :param page_enum: the page the url belongs to
        :param url: the url of the source
        :param id_: passed on unchanged to DatabaseObject.__init__
        :param type_enum: what the url points at (optional)
        """
        DatabaseObject.__init__(self, id_=id_)

        self.type_enum = type_enum
        self.page_enum = page_enum

        self.url = url

    @classmethod
    def match_url(cls, url: str) -> Optional["Source"]:
        """
        Guess the page from nothing but the url and build a source from it.

        This shouldn't be used unless you are not certain what page the url
        belongs to, because it is more inefficient than passing the page.

        :param url: the url to create the source for
        :return: the source with the matched page, or None if the url
            belongs to none of the pages known by this method
        """
        parsed = urlparse(url)
        url = parsed.geturl()

        if url.startswith("https://www.youtube"):
            return cls(SourcePages.YOUTUBE, url)

        if url.startswith("https://www.deezer"):
            return cls(SourcePages.DEEZER, url)

        if url.startswith("https://open.spotify.com"):
            return cls(SourcePages.SPOTIFY, url)

        # Artists have their own sub-domain (https://<artist>.bandcamp.com),
        # thus a prefix can't be used here. Only the host is searched though:
        # searching the whole url would claim e.g. https://twitter.com/bandcamp
        # for bandcamp, because this check runs before the checks below.
        host = parsed.hostname
        if host is None:
            # without a scheme urlparse puts the host into the path
            host = parsed.path.split("/", 1)[0]
        if "bandcamp" in host.lower():
            return cls(SourcePages.BANDCAMP, url)

        if url.startswith("https://www.metal-archives.com/"):
            return cls(SourcePages.ENCYCLOPAEDIA_METALLUM, url)

        # the less important ones
        if url.startswith("https://www.facebook"):
            return cls(SourcePages.FACEBOOK, url)

        if url.startswith("https://www.instagram"):
            return cls(SourcePages.INSTAGRAM, url)

        if url.startswith("https://twitter"):
            return cls(SourcePages.TWITTER, url)

        if url.startswith("https://myspace.com"):
            return cls(SourcePages.MYSPACE, url)

        return None

    def get_song_metadata(self) -> Metadata:
        """
        :return: metadata holding the url of this source as the webpage of
            the file and the homepage of its page as the webpage of the source
        """
        return Metadata({
            Mapping.FILE_WEBPAGE_URL: [self.url],
            Mapping.SOURCE_WEBPAGE_URL: [self.homepage]
        })

    def get_artist_metadata(self) -> Metadata:
        """
        :return: metadata holding the url of this source as the webpage of the artist
        """
        return Metadata({
            Mapping.ARTIST_WEBPAGE_URL: [self.url]
        })

    @property
    def metadata(self) -> Metadata:
        """
        The metadata matching the type of this source.

        Only song and artist sources build their own metadata, everything
        else falls back to the `metadata` of the parent class.
        """
        if self.type_enum == SourceTypes.SONG:
            return self.get_song_metadata()

        if self.type_enum == SourceTypes.ARTIST:
            return self.get_artist_metadata()

        return super().metadata

    @property
    def indexing_values(self) -> List[Tuple[str, object]]:
        """
        :return: the (name, value) pairs of the id and the url of this source
        """
        return [
            ('id', self.id),
            ('url', self.url)
        ]

    def __str__(self):
        return self.__repr__()

    def __repr__(self) -> str:
        return f"Src({self.page_enum.value}: {self.url})"

    @property
    def page_str(self):
        """The value of `page_enum`, e.g. "youtube"."""
        return self.page_enum.value

    @property
    def type_str(self):
        """
        The value of `type_enum`, e.g. "song".

        NOTE: `type_enum` defaults to None, which has no `value`, so this
        fails with an AttributeError for sources created without a type.
        """
        return self.type_enum.value

    @property
    def homepage(self):
        """The homepage of the page this source belongs to."""
        return SourcePages.get_homepage(self.page_enum)


class SourceCollection(Collection):
    """
    A collection of sources which additionally keeps them grouped by the
    page they belong to.
    """

    def __init__(self, source_list: List[Source]):
        """
        :param source_list: the sources the collection starts with
        """
        # Created before the parent constructor is called, because
        # map_element needs it.
        # NOTE(review): presumably Collection.__init__ maps every element of
        # `data` through map_element - confirm against collection.py
        self._page_to_source_list: Dict[SourcePages, List[Source]] = defaultdict(list)

        super().__init__(data=source_list, element_type=Source)

    def map_element(self, source: Source):
        """
        Does the mapping of the parent class and additionally files the
        source under its page.
        """
        super().map_element(source)

        self._page_to_source_list[source.page_enum].append(source)

    def get_sources_from_page(self, source_page: SourcePages) -> List[Source]:
        """
        getting the sources for a specific page like
        YouTube or musify

        :param source_page: the page to get the sources of
        :return: a new list with the sources of that page, which is empty
            if there are none; changing it doesn't change the collection
        """
        # .get instead of [...]: indexing a defaultdict inserts an empty list
        # for every page which is merely asked for, a lookup shouldn't do that
        return list(self._page_to_source_list.get(source_page, ()))
refactorings 2023-03-09 21:14:39 +00:00			`from collections import defaultdict`
dasfh 2023-01-12 15:25:50 +00:00			`from enum import Enum`
added fetching of linked sources to musify 2023-03-18 12:01:27 +00:00			`from typing import List, Dict, Tuple, Optional`
			`from urllib.parse import urlparse`
dasfh 2023-01-12 15:25:50 +00:00
refactor 2023-03-10 08:09:35 +00:00			`from .metadata import Mapping, Metadata`
refactorings 2023-03-09 21:14:39 +00:00			`from .parents import DatabaseObject`
			`from .collection import Collection`
dasfh 2023-01-12 15:25:50 +00:00
added source to artist 2023-01-20 22:05:15 +00:00
			`class SourceTypes(Enum):`
daffasf 2023-01-16 14:37:04 +00:00			`SONG = "song"`
			`ALBUM = "album"`
			`ARTIST = "artist"`
			`LYRICS = "lyrics"`

added source to artist 2023-01-20 22:05:15 +00:00
			`class SourcePages(Enum):`
dasfh 2023-01-12 15:25:50 +00:00			`YOUTUBE = "youtube"`
added source to artist 2023-01-20 22:05:15 +00:00			`MUSIFY = "musify"`
daffasf 2023-01-16 14:37:04 +00:00			`GENIUS = "genius"`
			`MUSICBRAINZ = "musicbrainz"`
			`ENCYCLOPAEDIA_METALLUM = "encyclopaedia metallum"`
started implementation of fetching from ma artis sources 2023-01-31 23:07:13 +00:00			`BANDCAMP = "bandcamp"`
			`DEEZER = "deezer"`
			`SPOTIFY = "spotify"`

			`# This has nothing to do with audio, but bands can be here`
			`INSTAGRAM = "instagram"`
			`FACEBOOK = "facebook"`
added fetching of linked sources to musify 2023-03-18 12:01:27 +00:00			`TWITTER = "twitter" # I will use nitter though lol`
			`MYSPACE = "myspace" # Yes somehow this ancient site is linked EVERYWHERE`
dasfh 2023-01-12 15:25:50 +00:00
			`@classmethod`
			`def get_homepage(cls, attribute) -> str:`
			`homepage_map = {`
added source to artist 2023-01-20 22:05:15 +00:00			`cls.YOUTUBE: "https://www.youtube.com/",`
			`cls.MUSIFY: "https://musify.club/",`
			`cls.MUSICBRAINZ: "https://musicbrainz.org/",`
daffasf 2023-01-16 14:37:04 +00:00			`cls.ENCYCLOPAEDIA_METALLUM: "https://www.metal-archives.com/",`
started implementation of fetching from ma artis sources 2023-01-31 23:07:13 +00:00			`cls.GENIUS: "https://genius.com/",`
			`cls.BANDCAMP: "https://bandcamp.com/",`
			`cls.DEEZER: "https://www.deezer.com/",`
			`cls.INSTAGRAM: "https://www.instagram.com/",`
			`cls.FACEBOOK: "https://www.facebook.com/",`
			`cls.SPOTIFY: "https://open.spotify.com/",`
added fetching of linked sources to musify 2023-03-18 12:01:27 +00:00			`cls.TWITTER: "https://twitter.com/",`
			`cls.MYSPACE: "https://myspace.com/"`
dasfh 2023-01-12 15:25:50 +00:00			`}`
			`return homepage_map[attribute]`


fixed exceptions 2023-03-10 09:13:35 +00:00			`class Source(DatabaseObject):`
dasfh 2023-01-12 15:25:50 +00:00			`"""`
			`create somehow like that`
			```python
			`# url won't be a valid one due to it being just an example`
			`Source(src="youtube", url="https://youtu.be/dfnsdajlhkjhsd")`
			```
			`"""`
attribute 2023-03-13 13:33:17 +00:00			`COLLECTION_ATTRIBUTES = tuple()`
refactored merging function to take default values other than None into account parents.py 2023-03-18 11:36:53 +00:00			`SIMPLE_ATTRIBUTES = {`
			`"type_enum": None,`
			`"page_enum": None,`
			`"url": None`
			`}`
dasfh 2023-01-12 15:25:50 +00:00
Update source.py 2023-03-03 06:52:13 +00:00			`def __init__(self, page_enum: SourcePages, url: str, id_: str = None, type_enum=None) -> None:`
dasfh 2023-01-12 15:25:50 +00:00			`DatabaseObject.__init__(self, id_=id_)`

added type to src 2023-01-20 09:56:40 +00:00			`self.type_enum = type_enum`
added source to artist 2023-01-20 22:05:15 +00:00			`self.page_enum = page_enum`

dasfh 2023-01-12 15:25:50 +00:00			`self.url = url`

added the fetching of the sources from ma regarding artists 2023-02-01 08:10:05 +00:00			`@classmethod`
added fetching of linked sources to musify 2023-03-18 12:01:27 +00:00			`def match_url(cls, url: str) -> Optional["Source"]:`
added the fetching of the sources from ma regarding artists 2023-02-01 08:10:05 +00:00			`"""`
			`this shouldn't be used, unlesse you are not certain what the source is for`
			`the reason is that it is more inefficient`
			`"""`
added fetching of linked sources to musify 2023-03-18 12:01:27 +00:00			`parsed = urlparse(url)`
			`url = parsed.geturl()`

added the fetching of the sources from ma regarding artists 2023-02-01 08:10:05 +00:00			`if url.startswith("https://www.youtube"):`
			`return cls(SourcePages.YOUTUBE, url)`

			`if url.startswith("https://www.deezer"):`
			`return cls(SourcePages.DEEZER, url)`

			`if url.startswith("https://open.spotify.com"):`
			`return cls(SourcePages.SPOTIFY, url)`

			`if "bandcamp" in url:`
			`return cls(SourcePages.BANDCAMP, url)`

			`if url.startswith("https://www.metal-archives.com/"):`
			`return cls(SourcePages.ENCYCLOPAEDIA_METALLUM, url)`

			`# the less important once`
			`if url.startswith("https://www.facebook"):`
			`return cls(SourcePages.FACEBOOK, url)`

			`if url.startswith("https://www.instagram"):`
			`return cls(SourcePages.INSTAGRAM, url)`

			`if url.startswith("https://twitter"):`
			`return cls(SourcePages.TWITTER, url)`

added fetching of linked sources to musify 2023-03-18 12:01:27 +00:00			`if url.startswith("https://myspace.com"):`
			`return cls(SourcePages.MYSPACE, url)`

fixed exceptions 2023-03-10 09:13:35 +00:00			`def get_song_metadata(self) -> Metadata:`
			`return Metadata({`
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`Mapping.FILE_WEBPAGE_URL: [self.url],`
			`Mapping.SOURCE_WEBPAGE_URL: [self.homepage]`
			`})`

fixed exceptions 2023-03-10 09:13:35 +00:00			`def get_artist_metadata(self) -> Metadata:`
			`return Metadata({`
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`Mapping.ARTIST_WEBPAGE_URL: [self.url]`
			`})`

refactor 2023-03-10 08:09:35 +00:00			`@property`
			`def metadata(self) -> Metadata:`
added source to artist 2023-01-20 22:05:15 +00:00			`if self.type_enum == SourceTypes.SONG:`
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`return self.get_song_metadata()`
added source to artist 2023-01-20 22:05:15 +00:00
			`if self.type_enum == SourceTypes.ARTIST:`
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`return self.get_artist_metadata()`
added artist attribute 2023-01-20 10:01:18 +00:00
refactor 2023-03-10 08:09:35 +00:00			`return super().metadata`
dfsa 2023-01-12 16:14:21 +00:00
implemented DatabaseObject.indexing_values for each data objects 2023-03-09 18:53:28 +00:00			`@property`
			`def indexing_values(self) -> List[Tuple[str, object]]:`
			`return [`
			`('id', self.id),`
			`('url', self.url)`
			`]`

dasfh 2023-01-12 15:25:50 +00:00			`def __str__(self):`
added the fetching of the sources from ma regarding artists 2023-02-01 08:10:05 +00:00			`return self.__repr__()`
dasfh 2023-01-12 15:25:50 +00:00
finished refactoring metadata 2023-01-30 13:41:02 +00:00			`def __repr__(self) -> str:`
			`return f"Src({self.page_enum.value}: {self.url})"`

added source to artist 2023-01-20 22:05:15 +00:00			`page_str = property(fget=lambda self: self.page_enum.value)`
added type to src 2023-01-20 09:56:40 +00:00			`type_str = property(fget=lambda self: self.type_enum.value)`
added source to artist 2023-01-20 22:05:15 +00:00			`homepage = property(fget=lambda self: SourcePages.get_homepage(self.page_enum))`
source 2023-01-25 13:14:15 +00:00

refactorings 2023-03-09 21:14:39 +00:00			`class SourceCollection(Collection):`
			`def __init__(self, source_list: List[Source]):`
			`self._page_to_source_list: Dict[SourcePages, List[Source]] = defaultdict(list)`

fixed exceptions 2023-03-10 09:13:35 +00:00			`super().__init__(data=source_list, element_type=Source)`


refactorings 2023-03-09 21:14:39 +00:00			`def map_element(self, source: Source):`
			`super().map_element(source)`

			`self._page_to_source_list[source.page_enum].append(source)`

			`def get_sources_from_page(self, source_page: SourcePages) -> List[Source]:`
			`"""`
			`getting the sources for a specific page like`
			`YouTube or musify`
			`"""`
added fetching of linked sources to musify 2023-03-18 12:01:27 +00:00			`return self._page_to_source_list[source_page].copy()`