feat: implemented downloading from bandcamp

This commit is contained in:
Hellow 2023-09-12 23:39:22 +02:00
parent a3934a384e
commit 8091a9ffb0
2 changed files with 37 additions and 6 deletions

View File

@ -31,7 +31,8 @@ if __name__ == "__main__":
youtube_music_test = [
"s: #a Only Smile #r Your best friend",
"8",
"2"
"2",
"d: 2"
]
music_kraken.cli.download(genre="test", command_list=youtube_music_test, process_metadata_anyway=True)

View File

@ -3,6 +3,8 @@ from urllib.parse import urlparse
import json
from enum import Enum
from bs4 import BeautifulSoup
import pycountry
import demjson3
from ..objects import Source, DatabaseObject
from .abstract import Page
@ -15,7 +17,9 @@ from ..objects import (
Label,
Target,
Contact,
ID3Timestamp
ID3Timestamp,
Lyrics,
FormattedText
)
from ..connection import Connection
from ..utils.support_classes import DownloadResult
@ -254,6 +258,17 @@ class Bandcamp(Page):
return album
def _fetch_lyrics(self, soup: BeautifulSoup) -> List[Lyrics]:
track_lyrics = soup.find("div", {"class": "lyricsText"})
if track_lyrics:
self.LOGGER.debug(" Lyrics retrieved..")
return [Lyrics(FormattedText(
html=track_lyrics.prettify()
), pycountry.languages.get(alpha_2="en"))]
return []
def fetch_song(self, source: Source, stop_at_level: int = 1) -> Song:
print(source)
@ -264,17 +279,28 @@ class Bandcamp(Page):
soup = self.get_soup_from_response(r)
data_container = soup.find("script", {"type": "application/ld+json"})
other_data = {}
other_data_list = soup.select("script[data-tralbum]")
if len(other_data_list) > 0:
other_data = json.loads(other_data_list[0]["data-tralbum"])
if DEBUG:
dump_to_file("bandcamp_song_data.json", data_container.text, is_json=True, exit_after_dump=False)
dump_to_file("bandcamp_song_data_other.json", json.dumps(other_data), is_json=True, exit_after_dump=False)
dump_to_file("bandcamp_song_page.html", r.text, exit_after_dump=False)
data = json.loads(data_container.text)
album_data = data["inAlbum"]
artist_data = data["byArtist"]
mp3_url = None
for key, value in other_data.get("trackinfo", [{}])[0].get("file", {"": None}).items():
mp3_url = value
song = Song(
title=data["name"],
source_list=[Source(self.SOURCE_TYPE, data.get("mainEntityOfPage", data["@id"]))],
source_list=[Source(self.SOURCE_TYPE, data.get("mainEntityOfPage", data["@id"]), adio_url=mp3_url)],
album_list=[Album(
title=album_data["name"],
date=ID3Timestamp.strptime(data["datePublished"], "%d %b %Y %H:%M:%S %Z"),
@ -283,10 +309,14 @@ class Bandcamp(Page):
main_artist_list=[Artist(
name=artist_data["name"],
source_list=[Source(self.SOURCE_TYPE, artist_data["@id"])]
)]
)],
lyrics_list=self._fetch_lyrics(soup=soup)
)
return song
def download_song_to_target(self, source: Source, target: Target, desc: str = None) -> DownloadResult:
return DownloadResult()
if source.audio_url is None:
return DownloadResult(error_message="Couldn't find download link.")
return self.connection.stream_into(url=source.audio_url, target=target, description=desc)