2022-10-27 12:15:18 +00:00
|
|
|
import sqlite3
|
|
|
|
import os
|
|
|
|
import logging
|
2022-10-30 15:29:42 +00:00
|
|
|
import json
|
2022-10-27 12:15:18 +00:00
|
|
|
|
2022-10-27 17:53:12 +00:00
|
|
|
|
2022-10-27 12:15:18 +00:00
|
|
|
def get_temp_dir():
    """Return the application's scratch directory, creating it if needed.

    The directory is a folder named ``music-downloader`` inside the system
    temporary directory reported by ``tempfile.gettempdir()``.

    Returns:
        The path of the directory as a string.

    Raises:
        OSError: If the directory cannot be created (for example because a
            regular file with the same name already exists).
    """
    import tempfile

    temp_folder = "music-downloader"
    temp_dir = os.path.join(tempfile.gettempdir(), temp_folder)

    # makedirs(exist_ok=True) replaces the former exists()/mkdir() pair: it
    # does not fail when another process creates the folder in between the
    # check and the creation, and it also creates missing parent directories.
    os.makedirs(temp_dir, exist_ok=True)

    return temp_dir
|
|
|
|
|
2022-10-27 17:53:12 +00:00
|
|
|
|
2022-10-30 15:29:42 +00:00
|
|
|
# Name of the SQL script that init_db() reads and executes to create or reset
# the schema. It is a relative path, so open() resolves it against the
# current working directory.
DATABASE_STRUCTURE_FILE = "database_structure.sql"
# Alternative location kept for reference — presumably meant for running from
# the repository root; TODO confirm.
# DATABASE_STRUCTURE_FILE = "src/metadata/database_structure.sql"

# Directory returned by get_temp_dir(); the database file is placed in it.
TEMP_DIR = get_temp_dir()
DATABASE_FILE = "metadata.db"
db_path = os.path.join(TEMP_DIR, DATABASE_FILE)

# Module-level connection and cursor. They are opened when the module is
# imported and are used by the functions defined further down in this file.
connection = sqlite3.connect(db_path)
# connection.row_factory = sqlite3.Row
cursor = connection.cursor()
|
2022-10-27 12:15:18 +00:00
|
|
|
|
2022-10-27 17:53:12 +00:00
|
|
|
|
2022-10-27 13:00:24 +00:00
|
|
|
def init_db(cursor, connection, reset_anyways: bool = False):
    """Create the database schema if it is missing, or reset it on request.

    The schema counts as present when the ``track`` table can be queried.
    When it is missing, or when *reset_anyways* is true, the SQL script named
    by ``DATABASE_STRUCTURE_FILE`` is executed and the result is committed.

    Args:
        cursor: sqlite3 cursor used for the probe and to run the script.
        connection: sqlite3 connection that is committed after the script ran.
        reset_anyways: Run the structure script even if the schema exists.

    Raises:
        OSError: If the structure file cannot be opened.
    """
    # Probe for the table without reading its contents. A constant column and
    # LIMIT 1 raise the same OperationalError when the table is missing, but
    # avoid loading every row of a populated table into memory.
    try:
        cursor.execute("SELECT 1 FROM track LIMIT 1;")
        cursor.fetchall()
    except sqlite3.OperationalError:
        exists = False
    else:
        exists = True

    if not exists:
        logging.info("Database does not exist yet.")

    if reset_anyways or not exists:
        # reset the database if reset_anyways is true or if the probe failed.
        logging.info("Creating/Reseting Database.")

        # read the structure script; the encoding is explicit so the result
        # does not depend on the platform's locale
        with open(DATABASE_STRUCTURE_FILE, "r", encoding="utf-8") as database_structure_file:
            query = database_structure_file.read()

        cursor.executescript(query)
        connection.commit()
|
2022-10-27 12:15:18 +00:00
|
|
|
|
2022-10-27 13:00:24 +00:00
|
|
|
|
|
|
|
def add_artist(
        musicbrainz_artistid: str,
        artist: str = None
):
    """Write one row into the ``artist`` table and commit it.

    The statement is ``INSERT OR REPLACE``, so a conflicting existing row is
    replaced instead of raising an error.

    Args:
        musicbrainz_artistid: Value stored in the ``id`` column.
        artist: Value stored in the ``name`` column.
    """
    cursor.execute(
        "INSERT OR REPLACE INTO artist (id, name) VALUES (?, ?);",
        (musicbrainz_artistid, artist),
    )
    connection.commit()
|
|
|
|
|
2022-10-27 17:53:12 +00:00
|
|
|
|
2022-10-27 13:00:24 +00:00
|
|
|
def add_release_group(
        musicbrainz_releasegroupid: str,
        artist_ids: list,
        albumartist: str = None,
        albumsort: int = None,
        musicbrainz_albumtype: str = None,
        compilation: str = None,
        album_artist_id: str = None
):
    """Store a release group together with its links to artists.

    One row per entry of *artist_ids* is written to ``artist_release_group``
    and one row is written to ``release_group``. Both statements use
    ``INSERT OR REPLACE``.

    Args:
        musicbrainz_releasegroupid: Value of ``release_group.id``; also the
            ``release_group_id`` of every link row.
        artist_ids: Artist ids to link to the release group.
        albumartist: Value of the ``albumartist`` column.
        albumsort: Value of the ``albumsort`` column.
        musicbrainz_albumtype: Value of the ``musicbrainz_albumtype`` column.
        compilation: Value of the ``compilation`` column.
        album_artist_id: Value of the ``album_artist_id`` column.
    """
    # add adjacency
    adjacency_query = "INSERT OR REPLACE INTO artist_release_group (artist_id, release_group_id) VALUES (?, ?);"
    adjacency_values = [(artist_id, musicbrainz_releasegroupid) for artist_id in artist_ids]

    # add release group
    query = "INSERT OR REPLACE INTO release_group (id, albumartist, albumsort, musicbrainz_albumtype, compilation, album_artist_id) VALUES (?, ?, ?, ?, ?, ?);"
    values = musicbrainz_releasegroupid, albumartist, albumsort, musicbrainz_albumtype, compilation, album_artist_id

    # Run both writes in a single transaction: the connection context manager
    # commits when the block succeeds and rolls back when it raises, so a
    # failing release-group insert no longer leaves committed link rows behind.
    with connection:
        cursor.executemany(adjacency_query, adjacency_values)
        cursor.execute(query, values)
|
|
|
|
|
2022-10-27 17:53:12 +00:00
|
|
|
|
2022-10-27 13:27:57 +00:00
|
|
|
def add_release(
        musicbrainz_albumid: str,
        release_group_id: str,
        title: str = None,
        copyright_: str = None,
        album_status: str = None,
        language: str = None,
        year: str = None,
        date: str = None,
        country: str = None,
        barcode: str = None
):
    """Write one row into the ``release_`` table and commit it.

    The statement is ``INSERT OR REPLACE``, so a conflicting existing row is
    replaced instead of raising an error.

    Args:
        musicbrainz_albumid: Value of the ``id`` column.
        release_group_id: Value of the ``release_group_id`` column.
        title: Value of the ``title`` column.
        copyright_: Value of the ``copyright`` column.
        album_status: Value of the ``album_status`` column.
        language: Value of the ``language`` column.
        year: Value of the ``year`` column.
        date: Value of the ``date`` column.
        country: Value of the ``country`` column.
        barcode: Value of the ``barcode`` column.
    """
    # The order of this tuple has to match the column list of the statement.
    row = (
        musicbrainz_albumid,
        release_group_id,
        title,
        copyright_,
        album_status,
        language,
        year,
        date,
        country,
        barcode,
    )
    cursor.execute(
        "INSERT OR REPLACE INTO release_ (id, release_group_id, title, copyright, album_status, language, year, date, country, barcode) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?);",
        row,
    )
    connection.commit()
|
2022-10-27 12:15:18 +00:00
|
|
|
|
2022-10-27 17:53:12 +00:00
|
|
|
|
2022-10-27 13:55:16 +00:00
|
|
|
def add_track(
        musicbrainz_releasetrackid: str,
        musicbrainz_albumid: str,
        feature_aritsts: list,
        track: str = None,
        isrc: str = None
):
    """Store a track together with its links to artists.

    One row per entry of *feature_aritsts* is written to ``artist_track`` and
    one row is written to ``track``. Both statements use
    ``INSERT OR REPLACE``.

    Args:
        musicbrainz_releasetrackid: Value of ``track.id``; also the
            ``track_id`` of every link row.
        musicbrainz_albumid: Value of the ``release_id`` column.
        feature_aritsts: Artist ids to link to the track.
        track: Value of the ``track`` column.
        isrc: Value of the ``isrc`` column.
    """
    # add adjacency
    adjacency_query = "INSERT OR REPLACE INTO artist_track (artist_id, track_id) VALUES (?, ?);"
    adjacency_values = [(artist_id, musicbrainz_releasetrackid) for artist_id in feature_aritsts]

    # add track
    query = "INSERT OR REPLACE INTO track (id, release_id, track, isrc) VALUES (?, ?, ?, ?);"
    values = musicbrainz_releasetrackid, musicbrainz_albumid, track, isrc

    # Run both writes in a single transaction: the connection context manager
    # commits when the block succeeds and rolls back when it raises, so a
    # failing track insert no longer leaves committed link rows behind.
    with connection:
        cursor.executemany(adjacency_query, adjacency_values)
        cursor.execute(query, values)
|
|
|
|
|
2022-10-30 15:29:42 +00:00
|
|
|
|
2022-10-28 10:35:26 +00:00
|
|
|
def get_custom_track_querry(custom_where: list) -> str:
    """Build the SELECT statement that returns tracks as JSON objects.

    The statement joins ``track``, ``release_``, ``release_group``,
    ``artist`` and ``artist_track`` through fixed conditions, appends the
    conditions from *custom_where* with ``AND`` and groups by ``track.id``.
    Each result row holds a single ``json_object`` with an ``artists`` array
    plus the track, release and release-group columns.

    Args:
        custom_where: SQL conditions that are inserted into the statement
            verbatim, so they must come from trusted code.

    Returns:
        The SQL text of the query.
    """
    join_conditions = (
        "track.release_id == release_.id",
        "release_group.id == release_.release_group_id",
        "artist_track.artist_id == artist.id",
        "artist_track.track_id == track.id",
    )
    where_arg = " AND ".join([*join_conditions, *custom_where])

    return f"""
SELECT DISTINCT
    json_object(
        'artists', json_group_array(
            (
            SELECT DISTINCT json_object(
                'id', artist.id,
                'name', artist.name
                )
            )
        ),
        'musicbrainz_releasetrackid', track.id,
        'musicbrainz_albumid', release_.id,
        'track', track.track,
        'isrc', track.isrc,
        'title', release_.title,
        'copyright', release_.copyright,
        'album_status', release_.album_status,
        'language', release_.language,
        'year', release_.year,
        'date', release_.date,
        'country', release_.country,
        'barcode', release_.barcode,
        'albumartist', release_group.albumartist,
        'albumsort', release_group.albumsort,
        'musicbrainz_albumtype', release_group.musicbrainz_albumtype,
        'compilation', release_group.compilation,
        'album_artist_id', release_group.album_artist_id
    )
FROM track, release_, release_group,artist, artist_track
WHERE
    {where_arg}
GROUP BY track.id;
    """
|
2022-10-27 21:09:37 +00:00
|
|
|
|
2022-10-30 15:29:42 +00:00
|
|
|
|
2022-10-28 10:35:26 +00:00
|
|
|
def get_custom_track(custom_where: list):
    """Run the track query with extra conditions and decode the result.

    Args:
        custom_where: SQL conditions handed to get_custom_track_querry().

    Returns:
        A list with one decoded JSON value per result row, taken from the
        first column of each row.
    """
    rows = cursor.execute(get_custom_track_querry(custom_where=custom_where))

    decoded_tracks = []
    for row in rows:
        decoded_tracks.append(json.loads(row[0]))
    return decoded_tracks
|
|
|
|
|
2022-10-28 10:35:26 +00:00
|
|
|
|
|
|
|
def get_track_metadata(musicbrainz_releasetrackid: str):
    """Return the metadata of the track with the given id.

    Args:
        musicbrainz_releasetrackid: Id compared against ``track.id``.

    Returns:
        The decoded metadata of the track, or ``-1`` when the query does not
        yield exactly one result.
    """
    # get_custom_track() only accepts ready-made SQL conditions, so the id has
    # to be embedded in the statement text. It is written as a single-quoted
    # literal with embedded quotes doubled: a double-quoted token is an
    # identifier in SQL and SQLite reads it as a string only as a legacy
    # fallback, and an unescaped quote inside the id would break the statement.
    escaped_id = str(musicbrainz_releasetrackid).replace("'", "''")
    resulting_tracks = get_custom_track([f"track.id == '{escaped_id}'"])

    if len(resulting_tracks) != 1:
        return -1

    return resulting_tracks[0]
|
|
|
|
|
2022-10-27 21:09:37 +00:00
|
|
|
|
2022-10-28 10:35:26 +00:00
|
|
|
def get_tracks_to_download():
    """Return the metadata of every track whose ``downloaded`` column is 0."""
    not_downloaded = "track.downloaded == 0"
    return get_custom_track(custom_where=[not_downloaded])
|
|
|
|
|
2022-10-30 15:29:42 +00:00
|
|
|
|
2022-10-28 10:35:26 +00:00
|
|
|
def get_tracks_without_isrc():
    """Return the metadata of every track whose ``isrc`` column is NULL."""
    missing_isrc = "track.isrc IS NULL"
    return get_custom_track(custom_where=[missing_isrc])
|
2022-10-27 21:09:37 +00:00
|
|
|
|
2022-10-30 15:29:42 +00:00
|
|
|
|
2022-10-27 17:53:12 +00:00
|
|
|
# Runs on import: make sure the schema exists before any query is issued.
init_db(cursor=cursor, connection=connection, reset_anyways=False)

if __name__ == "__main__":
    logging.basicConfig(level=logging.DEBUG)

    # get_track(["track.downloaded == 0", "track.isrc IS NOT NULL"])
    #
    # Print the track value and the artist names of every track without ISRC.
    for track in get_tracks_without_isrc():
        artist_names = [artist['name'] for artist in track['artists']]
        print(track['track'], artist_names)

    # print(get_track_metadata("a85d5ed5-20e5-4f95-8034-d204d81a36dd"))
|