From 7ae7aa87fd744d8dbe8d0400996e26bd94b12589 Mon Sep 17 00:00:00 2001 From: Hellow Date: Mon, 27 Mar 2023 20:02:17 +0200 Subject: [PATCH] fixed a bit of the scraping --- documentation/html/metal-archives/artist.html | 537 ++++++++++++++++++ documentation/html/metal-archives/overview.md | 4 + .../pages/encyclopaedia_metallum.py | 49 +- 3 files changed, 588 insertions(+), 2 deletions(-) create mode 100644 documentation/html/metal-archives/artist.html create mode 100644 documentation/html/metal-archives/overview.md diff --git a/documentation/html/metal-archives/artist.html b/documentation/html/metal-archives/artist.html new file mode 100644 index 0000000..51b024d --- /dev/null +++ b/documentation/html/metal-archives/artist.html @@ -0,0 +1,537 @@ + + + + + Ghost Bath - Encyclopaedia Metallum: The Metal Archives + + + +
+ + +
+ +
+
+ + + +
+
+ +
+ +
+ Ghost Bath - Photo +
+ + +
+ +
+
+

+ Ghost Bath +

+ +
+
+
+
Country of origin:
+
United States
+
Location:
+
Minot, North Dakota
+
Status:
+
Active
+
Formed in:
+
2012
+
+
+
Genre:
+
Depressive/Post-Black Metal
+
Themes:
+
Depression, Loneliness, Death
+
Current label:
+
+ + Nuclear Blast Entertainment + +
+
+
+
Years active:
+
+ 2012-present +
+
+
+ +
+ +
+
+ +
+
+
+ +
+
+ +
+
+
+
+ + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ Current +
+ Nameless + + Vocals (lead), Guitars, Piano (2012-present) +
+ See also: + If + I Could Kill Myself, Electric Specter 電妖怪, ex-I, Apparatus +
+ Josh Jaye + + Bass (2016-present) +
+ See also: + Stone + Marrow, Alistair Hennessey, Death House +
+ Jason Hirt + + Drums (2016-present) +
+ See also: + Nothingness, + Conduit, ex-StillBreather +
+ Tim Church + + Guitars (2016-present) +
+ See also: + Stone + Marrow, Death House, ex-Alistair Hennessey +
+ John Olivier + + Guitars (2016-present) +
+ See also: + Stone + Marrow, Death House, ex-Lungs, + ex-Alistair Hennessey +
+ Past +
+ 杰米 + + Bass +
+ 泰勒 + + Drums +
+ 多诺万 + + Guitars, Vocals (backing) +
+ D.J. Gunnarson + + Vocals +
+ See also: + ex-Thee + Massacre, Buried Above Ground, ex-White + Empress
+ Current (Live) +
+ Chris Piette + + Drums (2022-present) +
+ See also: + Amiensus, + Choke, + ex-Thee + Massacre, ex-McNally Smith Extreme Metal Ensemble (live) +
+ Caleb Cheslock + + Guitars (2022-present) +
+ See also: + Cavernlight, + Choke, + Christopher Gold and The New Old Things, Servare +
+
+
+ +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ Nameless + + Vocals (lead), Guitars, Piano (2012-present) +
+ See also: + If + I Could Kill Myself, Electric Specter 電妖怪, ex-I, Apparatus +
+ Josh Jaye + + Bass (2016-present) +
+ See also: + Stone + Marrow, Alistair Hennessey, Death House +
+ Jason Hirt + + Drums (2016-present) +
+ See also: + Nothingness, + Conduit, ex-StillBreather +
+ Tim Church + + Guitars (2016-present) +
+ See also: + Stone + Marrow, Death House, ex-Alistair Hennessey +
+ John Olivier + + Guitars (2016-present) +
+ See also: + Stone + Marrow, Death House, ex-Lungs, + ex-Alistair Hennessey +
+
+
+ +
+
+ + + + + + + + + + + + + + + + + + + + +
+ 杰米 + + Bass +
+ 泰勒 + + Drums +
+ 多诺万 + + Guitars, Vocals (backing) +
+ D.J. Gunnarson + + Vocals +
+ See also: + ex-Thee + Massacre, Buried Above Ground, ex-White + Empress
+
+
+ +
+
+ + + + + + + + + + + + + + + + + + +
+ Current +
+ Chris Piette + + Drums (2022-present) +
+ See also: + Amiensus, + Choke, + ex-Thee + Massacre, ex-McNally Smith Extreme Metal Ensemble (live) +
+ Caleb Cheslock + + Guitars (2022-present) +
+ See also: + Cavernlight, + Choke, + Christopher Gold and The New Old Things, Servare +
+
+
+
+
+
+ +
+ + + + + + + + + + + + + +
Added by: Teglement + Modified by: Mole666
Added on: 2013-11-06 23:08:16Last modified on: 2023-02-11 04:24:36
+   + +
+
+
+
+
+
+ + + + diff --git a/documentation/html/metal-archives/overview.md b/documentation/html/metal-archives/overview.md new file mode 100644 index 0000000..28dec97 --- /dev/null +++ b/documentation/html/metal-archives/overview.md @@ -0,0 +1,4 @@ +# Metal Archives +https://www.metal-archives.com/ + +- [Artist page (https://www.metal-archives.com/)](artist.html) \ No newline at end of file diff --git a/src/music_kraken/pages/encyclopaedia_metallum.py b/src/music_kraken/pages/encyclopaedia_metallum.py index f8f4450..9210deb 100644 --- a/src/music_kraken/pages/encyclopaedia_metallum.py +++ b/src/music_kraken/pages/encyclopaedia_metallum.py @@ -300,12 +300,56 @@ class EncyclopaediaMetallum(Page): @classmethod def _parse_artist_attributes(cls, artist_soup: BeautifulSoup) -> Artist: + name: str = None country: pycountry.Countrie = None formed_in_year: int = None genre: str = None lyrical_themes: List[str] = [] label_name: str = None label_url: str = None + source_list: List[Source] = [] + + title_soup: BeautifulSoup = artist_soup.find("title") + if title_soup is not None: + bad_name_substring = " - Encyclopaedia Metallum: The Metal Archives" + title_text = title_soup.get_text() + if title_text.count(bad_name_substring) == 1: + name = title_text.replace(bad_name_substring, "") + else: + LOGGER.debug(f"the title of the page is \"{title_text}\"") + + """ + TODO + Implement the bandpictures and logos that can be gotten with the elements + Artist: - print(url) r = cls.get_request(url) if r is None: return Artist()