finished fetching of artist details
This commit is contained in:
parent
05c9610683
commit
5d0f9814c8
@ -550,8 +550,106 @@ class Musify(Page):
|
|||||||
:param url:
|
:param url:
|
||||||
:return:
|
:return:
|
||||||
"""
|
"""
|
||||||
return Artist(
|
|
||||||
|
r = cls.get_request(f"https://musify.club/{url.source_type.value}/{url.name_with_id}?_pjax=#bodyContent")
|
||||||
|
if r is None:
|
||||||
|
return Artist(_id=url.musify_id, name="")
|
||||||
|
|
||||||
|
soup = BeautifulSoup(r.content, "html.parser")
|
||||||
|
|
||||||
|
"""
|
||||||
|
<ol class="breadcrumb" itemscope="" itemtype="http://schema.org/BreadcrumbList">
|
||||||
|
<li class="breadcrumb-item" itemprop="itemListElement" itemscope="" itemtype="http://schema.org/ListItem"><a href="/" itemprop="item"><span itemprop="name">Главная</span><meta content="1" itemprop="position"/></a></li>
|
||||||
|
<li class="breadcrumb-item" itemprop="itemListElement" itemscope="" itemtype="http://schema.org/ListItem"><a href="/artist" itemprop="item"><span itemprop="name">Исполнители</span><meta content="2" itemprop="position"/></a></li>
|
||||||
|
<li class="breadcrumb-item active">Ghost Bath</li>
|
||||||
|
</ol>
|
||||||
|
|
||||||
|
<ul class="nav nav-tabs nav-fill">
|
||||||
|
<li class="nav-item"><a class="active nav-link" href="/artist/ghost-bath-280348">песни (41)</a></li>
|
||||||
|
<li class="nav-item"><a class="nav-link" href="/artist/ghost-bath-280348/releases">альбомы (12)</a></li>
|
||||||
|
<li class="nav-item"><a class="nav-link" href="/artist/ghost-bath-280348/clips">видеоклипы (23)</a></li>
|
||||||
|
<li class="nav-item"><a class="nav-link" href="/artist/ghost-bath-280348/photos">фото (38)</a></li>
|
||||||
|
</ul>
|
||||||
|
|
||||||
|
<header class="content__title">
|
||||||
|
<h1>Ghost Bath</h1>
|
||||||
|
<div class="actions">
|
||||||
|
...
|
||||||
|
</div>
|
||||||
|
</header>
|
||||||
|
|
||||||
|
<ul class="icon-list">
|
||||||
|
<li>
|
||||||
|
<i class="zmdi zmdi-globe zmdi-hc-fw" title="Страна"></i>
|
||||||
|
<i class="flag-icon US shadow"></i>
|
||||||
|
Соединенные Штаты
|
||||||
|
</li>
|
||||||
|
</ul>
|
||||||
|
"""
|
||||||
name = ""
|
name = ""
|
||||||
|
source_list: List[Source] = []
|
||||||
|
county = None
|
||||||
|
|
||||||
|
breadcrumbs: BeautifulSoup = soup.find("ol", {"class": "breadcrumb"})
|
||||||
|
if breadcrumbs is not None:
|
||||||
|
breadcrumb_list: List[BeautifulSoup] = breadcrumbs.find_all("li", {"class": "breadcrumb"}, recursive=False)
|
||||||
|
if len(breadcrumb_list) == 3:
|
||||||
|
name = breadcrumb_list[-1].get_text(strip=True)
|
||||||
|
else:
|
||||||
|
LOGGER.debug("breadcrumb layout on artist page changed")
|
||||||
|
|
||||||
|
nav_tabs: BeautifulSoup = soup.find("ul", {"class": "nav-tabs"})
|
||||||
|
if nav_tabs is not None:
|
||||||
|
list_item: BeautifulSoup
|
||||||
|
for list_item in nav_tabs.find_all("li", {"class": "nav-item"}, recursive=False):
|
||||||
|
if not list_item.get_text(strip=True).startswith("песни"):
|
||||||
|
# "песни" translates to "songs"
|
||||||
|
continue
|
||||||
|
|
||||||
|
anchor: BeautifulSoup = list_item.find("a")
|
||||||
|
if anchor is None:
|
||||||
|
continue
|
||||||
|
href = anchor.get("href")
|
||||||
|
if href is None:
|
||||||
|
continue
|
||||||
|
|
||||||
|
source_list.append(Source(
|
||||||
|
cls.SOURCE_TYPE,
|
||||||
|
cls.HOST + href
|
||||||
|
))
|
||||||
|
|
||||||
|
content_title: BeautifulSoup = soup.find("header", {"class": "content__title"})
|
||||||
|
if content_title is not None:
|
||||||
|
h1_name: BeautifulSoup = soup.find("h1", recursive=False)
|
||||||
|
if h1_name is not None:
|
||||||
|
name = h1_name.get_text(strip=True)
|
||||||
|
|
||||||
|
icon_list: BeautifulSoup = soup.find("ul", {"class": "icon-list"})
|
||||||
|
if icon_list is not None:
|
||||||
|
country_italic: BeautifulSoup = icon_list.find("i", {"class", "flag-icon"})
|
||||||
|
if country_italic is not None:
|
||||||
|
style_classes: set = {'flag-icon', 'shadow'}
|
||||||
|
classes: set = set(country_italic.get("class"))
|
||||||
|
|
||||||
|
country_set: set = classes.difference(style_classes)
|
||||||
|
if len(country_set) != 1:
|
||||||
|
LOGGER.debug("the country set contains multiple values")
|
||||||
|
if len(country_set) != 0:
|
||||||
|
"""
|
||||||
|
This is the css file, where all flags that can be used on musify
|
||||||
|
are laid out and styled.
|
||||||
|
Every flag has two upper case letters, thus I assume they follow the alpha_2
|
||||||
|
standard, though I haven't checked.
|
||||||
|
https://musify.club/content/flags.min.css
|
||||||
|
"""
|
||||||
|
|
||||||
|
country = pycountry.countries.get(alpha_2=list(country_set)[0])
|
||||||
|
|
||||||
|
return Artist(
|
||||||
|
_id=url.musify_id,
|
||||||
|
name=name,
|
||||||
|
country=county,
|
||||||
|
source_list=source_list
|
||||||
)
|
)
|
||||||
|
|
||||||
@classmethod
|
@classmethod
|
||||||
@ -560,8 +658,8 @@ class Musify(Page):
|
|||||||
fetches artist from source
|
fetches artist from source
|
||||||
|
|
||||||
[x] discography
|
[x] discography
|
||||||
[] attributes
|
[x] attributes *(name and country... wooooow and I waste one request for this)*
|
||||||
[] picture galery
|
[] picture gallery
|
||||||
|
|
||||||
Args:
|
Args:
|
||||||
source (Source): the source to fetch
|
source (Source): the source to fetch
|
||||||
|
Loading…
Reference in New Issue
Block a user