music-kraken-core/src/music_kraken/connection/connection.py

import time
from typing import List, Dict, Callable, Optional, Set
from urllib.parse import urlparse, urlunsplit, ParseResult
import logging

import threading
import requests
from tqdm import tqdm

from .rotating import RotatingProxy
from ..utils.shared import PROXIES_LIST, CHUNK_SIZE
from ..utils.support_classes import DownloadResult
from ..objects import Target


class Connection:
    def __init__(
            self,
            host: str,
            proxies: List[dict] = None,
            tries: int = (len(PROXIES_LIST) + 1) * 4,
            timeout: int = 7,
            logger: logging.Logger = logging.getLogger("connection"),
            header_values: Dict[str, str] = None,
            accepted_response_codes: Set[int] = None,
            semantic_not_found: bool = True,
            sleep_after_404: float = 0.0,
            hearthbeat_interval = 0,
    ):
        """
        Create a connection bound to ``host`` with its own ``requests`` session.

        :param host: url of the host; it is parsed and used to build the default Referer.
        :param proxies: proxy configurations to rotate through, defaults to ``PROXIES_LIST``.
        :param tries: upper bound of attempts a single request gets.
        :param timeout: timeout handed to the request if the caller passes none.
        :param logger: logger receiving all messages of this connection.
        :param header_values: extra headers merged over the default session headers.
        :param accepted_response_codes: status codes treated as success, defaults to ``{200}``.
        :param semantic_not_found: if true, a 404 ends the request immediately instead of being retried.
        :param sleep_after_404: seconds to wait after an unaccepted response before the next attempt.
        :param hearthbeat_interval: seconds between two heartbeats, used by ``start_hearthbeat``.
        """
        # plain configuration values
        self.HEADER_VALUES = dict() if header_values is None else header_values
        self.LOGGER = logger
        self.HOST = urlparse(host)
        self.TRIES = tries
        self.TIMEOUT = timeout
        self.ACCEPTED_RESPONSE_CODES = accepted_response_codes or {200}
        self.SEMANTIC_NOT_FOUND = semantic_not_found
        self.sleep_after_404 = sleep_after_404

        # proxy rotation, falling back to the globally configured proxies
        proxy_list = PROXIES_LIST if proxies is None else proxies
        self.rotating_proxy = RotatingProxy(proxy_list=proxy_list)

        # the session is shared by every request of this connection
        self.session = requests.Session()
        self.session.headers = self.get_header(**self.HEADER_VALUES)
        self.session.proxies = self.rotating_proxy.current_proxy

        # heartbeat state; the flag is set while the heartbeat thread uses the session
        self.session_is_occupied: bool = False
        self.hearthbeat_interval = hearthbeat_interval
        self.hearthbeat_thread = None

    @property
    def user_agent(self) -> str:
        """Return the user agent stored in the session headers, or a Chrome default if none is set."""
        fallback_agent = "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/112.0.0.0 Safari/537.36"
        session_headers = self.session.headers
        return session_headers.get("user-agent", fallback_agent)


    def start_hearthbeat(self):
        """
        Start the daemon thread that periodically calls ``hearthbeat``.

        Nothing is started if ``hearthbeat_interval`` is not positive: an interval
        of 0 would hammer the host in a tight loop, and ``time.sleep`` rejects
        negative values, which would kill the thread right after its first beat.
        """
        if self.hearthbeat_interval <= 0:
            self.LOGGER.warning(f"Can't start a hearthbeat with {self.hearthbeat_interval}s in between.")
            return

        self.hearthbeat_thread = threading.Thread(
            target=self._hearthbeat_loop,
            args=(self.hearthbeat_interval, ),
            daemon=True
        )
        self.hearthbeat_thread.start()

    def hearthbeat_failed(self):
        """Write a warning to the logger saying that the heartbeat failed."""
        message = "I just died... (The hearthbeat failed)"
        self.LOGGER.warning(message)


    def hearthbeat(self):
        """
        Send one heartbeat request. This base implementation is only a placeholder.

        It is called by the heartbeat thread once per interval. Connections that
        need a heartbeat are expected to override it; the placeholder only logs a
        warning through the connection's logger, so a missing override is visible
        without crashing the heartbeat thread.
        """
        self.LOGGER.warning(
            "Connection.hearthbeat() is not implemented; "
            "override it when using a hearthbeat_interval greater than 0."
        )

    def _hearthbeat_loop(self, interval: float):
        """
        Call ``hearthbeat`` forever, sleeping ``interval`` seconds between two calls.

        While a heartbeat is running ``session_is_occupied`` is set, which makes
        ordinary requests wait. The flag is always reset, even if the heartbeat
        raises; otherwise every later request would wait forever for a heartbeat
        that will never finish. The exception itself is not swallowed.

        :param interval: seconds to sleep after each heartbeat.
        """
        def hearthbeat_wrapper():
            self.session_is_occupied = True
            try:
                self.LOGGER.info("I am living. (sending a hearthbeat)")
                self.hearthbeat()
                self.LOGGER.debug("finished the hearthbeat")
            finally:
                # release the session no matter how the heartbeat ended
                self.session_is_occupied = False

        while True:
            hearthbeat_wrapper()
            time.sleep(interval)


    def base_url(self, url: ParseResult = None):
        """
        Reduce a parsed url to ``scheme://netloc``.

        :param url: parsed url to reduce; the host of this connection is used if omitted.
        :return: the url consisting only of scheme and network location.
        """
        origin = self.HOST if url is None else url

        # path, query and fragment are deliberately left empty
        parts = (origin.scheme, origin.netloc, "", "", "")
        return urlunsplit(parts)

    def get_header(self, **header_values) -> Dict[str, str]:
        """
        Build the default headers of the session.

        :param header_values: additional headers; they override a default with the same key.
        :return: the default headers merged with ``header_values``.
        """
        merged_headers = {
            "user-agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/112.0.0.0 Safari/537.36",
            "Connection": "keep-alive",
            # no explicit "Host" header is sent (it used to be self.HOST.netloc and was disabled)
            "Referer": self.base_url(),
        }
        merged_headers.update(header_values)
        return merged_headers

    def rotate(self):
        """Advance the rotating proxy and make the session use whatever it returns."""
        next_proxy = self.rotating_proxy.rotate()
        self.session.proxies = next_proxy

    def _update_headers(
            self,
            headers: Optional[dict],
            refer_from_origin: bool,
            url: ParseResult
    ) -> Dict[str, str]:
        """
        Prepare the per-request headers.

        The passed dict is copied, so a dict owned by the caller is never modified.

        :param headers: headers of this request, may be ``None``.
        :param refer_from_origin: if false, the Referer is set to the base url of ``url``;
            if true, no Referer is added here.
        :param url: parsed url of the request.
        :return: a new dict with the headers to send.
        """
        headers = dict() if headers is None else dict(headers)

        if not refer_from_origin:
            headers["Referer"] = self.base_url(url=url)

        return headers

    def _request(
            self,
            request: Callable,
            try_count: int,
            accepted_response_codes: set,
            url: str,
            timeout: float,
            headers: dict,
            refer_from_origin: bool = True,
            raw_url: bool = False,
            sleep_after_404: float = None,
            is_hearthbeat: bool = False,
            **kwargs
    ) -> Optional[requests.Response]:
        """
        Send a request and retry it, rotating the proxy after every failed attempt.

        Every attempt uses the same url, so ``raw_url`` stays in effect for the
        retries as well.

        :param request: callable doing the request, e.g. ``self.session.get``.
        :param try_count: number of attempts already used up; attempts stop at ``self.TRIES``.
        :param accepted_response_codes: status codes for which the response is returned.
        :param url: url to request.
        :param timeout: timeout of a single attempt, ``self.TIMEOUT`` if ``None``.
        :param headers: headers of this request, may be ``None``.
        :param refer_from_origin: passed to ``_update_headers``.
        :param raw_url: if true ``url`` is sent as given, else it is parsed and re-serialised first.
        :param sleep_after_404: seconds to sleep after any unaccepted response that is
            retried (not only 404), ``self.sleep_after_404`` if ``None``.
        :param is_hearthbeat: requests of the heartbeat itself don't wait for the heartbeat to finish.
        :param kwargs: passed on to ``request``.
        :return: the accepted response, or ``None`` if the attempts ran out or the
            host answered 404 while ``SEMANTIC_NOT_FOUND`` is set.
        """
        if try_count >= self.TRIES:
            return None

        if sleep_after_404 is None:
            sleep_after_404 = self.sleep_after_404
        if timeout is None:
            timeout = self.TIMEOUT

        parsed_url = urlparse(url)

        headers = self._update_headers(
            headers=headers,
            refer_from_origin=refer_from_origin,
            url=parsed_url
        )

        request_url = url if raw_url else parsed_url.geturl()

        for attempt in range(try_count, self.TRIES):
            if self.session_is_occupied and not is_hearthbeat:
                self.LOGGER.info("Waiting for the hearthbeat to finish.")
                while self.session_is_occupied:
                    # yield to the heartbeat thread instead of spinning at full speed
                    time.sleep(0.01)

            try:
                r: requests.Response = request(request_url, timeout=timeout, headers=headers, **kwargs)
            except requests.exceptions.Timeout:
                self.LOGGER.warning(f"Request timed out at \"{request_url}\": ({attempt}-{self.TRIES})")
            except requests.exceptions.ConnectionError:
                self.LOGGER.warning(f"Couldn't connect to \"{request_url}\": ({attempt}-{self.TRIES})")
            else:
                if r.status_code in accepted_response_codes:
                    return r

                if self.SEMANTIC_NOT_FOUND and r.status_code == 404:
                    # a 404 is taken as a final answer, retrying wouldn't change it
                    self.LOGGER.warning(f"Couldn't find url (404): {request_url}")
                    return None

                self.LOGGER.warning(f"{self.HOST.netloc} responded wit {r.status_code} "
                                    f"at {url}. ({attempt}-{self.TRIES})")
                self.LOGGER.debug(r.content)
                if sleep_after_404 != 0:
                    self.LOGGER.warning(f"Waiting for {sleep_after_404} seconds.")
                    time.sleep(sleep_after_404)

            # the attempt failed, try the next one through another proxy
            self.rotate()

        return None

    def get(
            self,
            url: str,
            refer_from_origin: bool = True,
            stream: bool = False,
            accepted_response_codes: set = None,
            timeout: float = None,
            headers: dict = None,
            raw_url: bool = False,
            **kwargs
    ) -> Optional[requests.Response]:
        """
        Send a GET request through the session, with the retry behaviour of ``_request``.

        :param url: url to fetch.
        :param refer_from_origin: passed to ``_request``.
        :param stream: passed on to the session's ``get``.
        :param accepted_response_codes: status codes counting as success,
            ``self.ACCEPTED_RESPONSE_CODES`` if ``None``.
        :param timeout: timeout of a single attempt.
        :param headers: headers of this request.
        :param raw_url: passed to ``_request``.
        :param kwargs: passed on to the session's ``get``.
        :return: the response, or ``None`` (after logging a warning) if ``_request`` gave none.
        """
        codes = self.ACCEPTED_RESPONSE_CODES if accepted_response_codes is None else accepted_response_codes

        response = self._request(
            request=self.session.get,
            try_count=0,
            accepted_response_codes=codes,
            url=url,
            timeout=timeout,
            headers=headers,
            raw_url=raw_url,
            refer_from_origin=refer_from_origin,
            stream=stream,
            **kwargs
        )

        if response is not None:
            return response

        self.LOGGER.warning(f"Max attempts ({self.TRIES}) exceeded for: GET:{url}")
        return None

    def post(
            self,
            url: str,
            json: dict,
            refer_from_origin: bool = True,
            stream: bool = False,
            accepted_response_codes: set = None,
            timeout: float = None,
            headers: dict = None,
            raw_url: bool = False,
            **kwargs
    ) -> Optional[requests.Response]:
        """
        Send a POST request with a json payload, with the retry behaviour of ``_request``.

        :param url: url to post to.
        :param json: payload, passed as ``json`` to the session's ``post``.
        :param refer_from_origin: passed to ``_request``.
        :param stream: passed on to the session's ``post``.
        :param accepted_response_codes: status codes counting as success,
            ``self.ACCEPTED_RESPONSE_CODES`` if none are given.
        :param timeout: timeout of a single attempt.
        :param headers: headers of this request.
        :param raw_url: passed to ``_request``.
        :param kwargs: passed on to the session's ``post``.
        :return: the response, or ``None`` (after logging the url and payload) if ``_request`` gave none.
        """
        r = self._request(
            request=self.session.post,
            try_count=0,
            accepted_response_codes=accepted_response_codes or self.ACCEPTED_RESPONSE_CODES,
            url=url,
            timeout=timeout,
            headers=headers,
            refer_from_origin=refer_from_origin,
            raw_url=raw_url,
            json=json,
            stream=stream,
            **kwargs
        )
        if r is None:
            # name the actual method, so the log can't be mistaken for a failed GET
            self.LOGGER.warning(f"Max attempts ({self.TRIES}) exceeded for: POST:{url}")
            self.LOGGER.warning(f"payload: {json}")
        return r

    def stream_into(
            self,
            url: str,
            target: Target,
            description: str = "download",
            refer_from_origin: bool = True,
            accepted_response_codes: set = None,
            timeout: float = None,
            headers: dict = None,
            raw_url: bool = False,
            chunk_size: int = CHUNK_SIZE,
            try_count: int = 0,
            progress: int = 0,
            **kwargs
    ) -> DownloadResult:
        """
        Download ``url`` and append its content to ``target``, showing a progress bar.

        If the stream breaks, or delivers fewer bytes than the ``content-length``
        announced, the download is retried with a ``Range`` header starting at the
        current size of the target. At most ``self.TRIES`` retries are made.

        :param url: url to download.
        :param target: target the content is appended to.
        :param description: description shown by the progress bar.
        :param refer_from_origin: passed to ``_request``.
        :param accepted_response_codes: status codes counting as success,
            ``self.ACCEPTED_RESPONSE_CODES`` if ``None``. Retries additionally accept 206.
        :param timeout: timeout of a single attempt.
        :param headers: headers of this request; the dict is not modified.
        :param raw_url: passed to ``_request``.
        :param chunk_size: chunk size the content is read with.
        :param try_count: number of retries already done, used internally.
        :param progress: bytes written by earlier attempts, used internally;
            a value above 0 makes this attempt a range request.
        :param kwargs: passed on to ``_request``.
        :return: an empty ``DownloadResult`` on success, one with an error message otherwise.
        """
        # work on a copy, the Range header must not leak into the caller's dict
        headers = dict() if headers is None else dict(headers)
        if progress > 0:
            headers["Range"] = f"bytes={target.size}-"

        if accepted_response_codes is None:
            accepted_response_codes = self.ACCEPTED_RESPONSE_CODES

        r = self._request(
            request=self.session.get,
            try_count=0,
            accepted_response_codes=accepted_response_codes,
            url=url,
            timeout=timeout,
            headers=headers,
            raw_url=raw_url,
            refer_from_origin=refer_from_origin,
            stream=True,
            **kwargs
        )

        if r is None:
            return DownloadResult(error_message=f"Could not establish connection to: {url}")

        target.create_path()

        # the header is missing for e.g. chunked responses; then completeness can't be checked
        content_length = r.headers.get('content-length')
        total_size = None if content_length is None else int(content_length)

        received = 0
        interrupted = False

        try:
            with target.open("ab") as f:
                # https://en.wikipedia.org/wiki/Kilobyte
                # > The internationally recommended unit symbol for the kilobyte is kB.
                #
                # content-length describes the body of this very response, so it is
                # the total of this attempt (for a range request: the remaining bytes).
                with tqdm(total=total_size, unit='B', unit_scale=True, unit_divisor=1024, desc=description) as t:
                    try:
                        for chunk in r.iter_content(chunk_size=chunk_size):
                            size = f.write(chunk)
                            received += size
                            t.update(size)
                    except requests.exceptions.ConnectionError:
                        interrupted = True
        finally:
            # give the connection back, even if the body wasn't read to the end
            r.close()

        incomplete = total_size is not None and total_size > received
        if not (interrupted or incomplete):
            return DownloadResult()

        # From here on the file is closed and flushed, so target.size is up to
        # date when the retry computes its Range header.
        # NOTE(review): a host that ignores the Range header and answers 200 with
        # the full body would still get appended to the partial file.
        if try_count >= self.TRIES:
            self.LOGGER.warning(f"Stream timed out at \"{url}\": to many retries, aborting.")
            return DownloadResult(error_message=f"Stream timed out from {url}, reducing the chunksize might help.")

        if interrupted:
            self.LOGGER.warning(f"Stream timed out at \"{url}\": ({try_count}-{self.TRIES})")

        self.LOGGER.warning("Retrying stream...")
        return self.stream_into(
            url=url,
            target=target,
            description=description,
            try_count=try_count+1,
            progress=progress+received,
            # a new set: neither the caller's set nor self.ACCEPTED_RESPONSE_CODES may gain 206
            accepted_response_codes=set(accepted_response_codes) | {206},
            timeout=timeout,
            headers=headers,
            raw_url=raw_url,
            refer_from_origin=refer_from_origin,
            chunk_size=chunk_size,
            **kwargs
        )
completely implemented downloading from youtube 2023-06-13 18:10:11 +00:00			`import time`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`from typing import List, Dict, Callable, Optional, Set`
sda 2023-04-22 12:20:19 +00:00			`from urllib.parse import urlparse, urlunsplit, ParseResult`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`import logging`

implemented the hearthbeat of youtube music 2023-07-17 19:19:19 +00:00			`import threading`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`import requests`
connection 2023-06-15 16:22:00 +00:00			`from tqdm import tqdm`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00
			`from .rotating import RotatingProxy`
connection 2023-06-15 16:22:00 +00:00			`from ..utils.shared import PROXIES_LIST, CHUNK_SIZE`
updated conecting behaviour 2023-06-16 10:26:02 +00:00			`from ..utils.support_classes import DownloadResult`
connection 2023-06-15 16:22:00 +00:00			`from ..objects import Target`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00

			`class Connection:`
			`def __init__(`
			`self,`
			`host: str,`
			`proxies: List[dict] = None,`
made streaming more stable 2023-06-16 21:27:08 +00:00			`tries: int = (len(PROXIES_LIST) + 1) * 4,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`timeout: int = 7,`
theoretically implemented the request partially 2023-04-20 17:37:41 +00:00			`logger: logging.Logger = logging.getLogger("connection"),`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`header_values: Dict[str, str] = None,`
			`accepted_response_codes: Set[int] = None,`
added the config option how long to wait after yt returns 404 2023-06-22 12:30:26 +00:00			`semantic_not_found: bool = True,`
implemented the hearthbeat of youtube music 2023-07-17 19:19:19 +00:00			`sleep_after_404: float = 0.0,`
implemented the automated fetching of the api key 2023-07-19 19:40:23 +00:00			`hearthbeat_interval = 0,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`):`
			`if proxies is None:`
			`proxies = PROXIES_LIST`
			`if header_values is None:`
			`header_values = dict()`

sda 2023-04-22 12:20:19 +00:00			`self.HEADER_VALUES = header_values`

theoretically implemented the request partially 2023-04-20 17:37:41 +00:00			`self.LOGGER = logger`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`self.HOST = urlparse(host)`
			`self.TRIES = tries`
			`self.TIMEOUT = timeout`
			`self.rotating_proxy = RotatingProxy(proxy_list=proxies)`

			`self.ACCEPTED_RESPONSE_CODES = accepted_response_codes or {200}`
			`self.SEMANTIC_NOT_FOUND = semantic_not_found`
added the config option how long to wait after yt returns 404 2023-06-22 12:30:26 +00:00			`self.sleep_after_404 = sleep_after_404`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00
failed attempts 2023-04-23 10:08:39 +00:00			`self.session = requests.Session()`
			`self.session.headers = self.get_header(**self.HEADER_VALUES)`
			`self.session.proxies = self.rotating_proxy.current_proxy`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00
implemented the hearthbeat of youtube music 2023-07-17 19:19:19 +00:00			`self.session_is_occupied: bool = False`

			`self.hearthbeat_thread = None`
implemented the automated fetching of the api key 2023-07-19 19:40:23 +00:00			`self.hearthbeat_interval = hearthbeat_interval`
implemented the hearthbeat of youtube music 2023-07-17 19:19:19 +00:00
layed out api request 2023-07-26 22:27:08 +00:00			`@property`
			`def user_agent(self) -> str:`
			`return self.session.headers.get("user-agent", "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/112.0.0.0 Safari/537.36")`

implemented the hearthbeat of youtube music 2023-07-17 19:19:19 +00:00
implemented the automated fetching of the api key 2023-07-19 19:40:23 +00:00			`def start_hearthbeat(self):`
			`if self.hearthbeat_interval <= 0:`
			`self.LOGGER.warning(f"Can't start a hearthbeat with {self.hearthbeat_interval}s in between.")`

			`self.hearthbeat_thread = threading.Thread(target=self._hearthbeat_loop, args=(self.hearthbeat_interval, ), daemon=True)`
			`self.hearthbeat_thread.start()`

implemented the hearthbeat of youtube music 2023-07-17 19:19:19 +00:00			`def hearthbeat_failed(self):`
			`self.LOGGER.warning(f"I just died... (The hearthbeat failed)")`


			`def hearthbeat(self):`
			`# Your code to send heartbeat requests goes here`
			`print("the hearth is beating, but it needs to be implemented ;-;\nFuck youuuu for setting hearthbeat in the constructor to true, but not implementing the method Connection.hearbeat()")`

			`def _hearthbeat_loop(self, interval: float):`
			`def hearthbeat_wrapper():`
			`self.session_is_occupied = True`
			`self.LOGGER.info(f"I am living. (sending a hearthbeat)")`
			`self.hearthbeat()`
			`self.LOGGER.debug(f"finished the hearthbeat")`
			`self.session_is_occupied = False`

			`while True:`
			`hearthbeat_wrapper()`
			`time.sleep(interval)`



sda 2023-04-22 12:20:19 +00:00			`def base_url(self, url: ParseResult = None):`
			`if url is None:`
			`url = self.HOST`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00
sda 2023-04-22 12:20:19 +00:00			`return urlunsplit((url.scheme, url.netloc, "", "", ""))`

improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`def get_header(self, **header_values) -> Dict[str, str]:`
			`return {`
failed attempts 2023-04-23 10:08:39 +00:00			`"user-agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/112.0.0.0 Safari/537.36",`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`"Connection": "keep-alive",`
fixed nasty bug, where musify just returned 404 al lthe time 2023-05-03 14:14:03 +00:00			`# "Host": self.HOST.netloc,`
sda 2023-04-22 12:20:19 +00:00			`"Referer": self.base_url(),`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`**header_values`
			`}`

			`def rotate(self):`
failed attempts 2023-04-23 10:08:39 +00:00			`self.session.proxies = self.rotating_proxy.rotate()`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00
failed attempts 2023-04-23 10:08:39 +00:00			`def _update_headers(`
			`self,`
			`headers: Optional[dict],`
			`refer_from_origin: bool,`
			`url: ParseResult`
			`) -> Dict[str, str]:`
			`if headers is None:`
			`headers = dict()`
sda 2023-04-22 12:20:19 +00:00
failed attempts 2023-04-23 10:08:39 +00:00			`if not refer_from_origin:`
			`headers["Referer"] = self.base_url(url=url)`
sda 2023-04-22 12:20:19 +00:00
failed attempts 2023-04-23 10:08:39 +00:00			`return headers`
sda 2023-04-22 12:20:19 +00:00
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`def _request(`
			`self,`
			`request: Callable,`
			`try_count: int,`
made streaming more stable 2023-06-16 21:27:08 +00:00			`accepted_response_codes: set,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`url: str,`
theoretically implemented the request partially 2023-04-20 17:37:41 +00:00			`timeout: float,`
failed attempts 2023-04-23 10:08:39 +00:00			`headers: dict,`
			`refer_from_origin: bool = True,`
dsf 2023-05-03 13:16:01 +00:00			`raw_url: bool = False,`
added the config option how long to wait after yt returns 404 2023-06-22 12:30:26 +00:00			`sleep_after_404: float = None,`
implemented the hearthbeat of youtube music 2023-07-17 19:19:19 +00:00			`is_hearthbeat: bool = False,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`**kwargs`
			`) -> Optional[requests.Response]:`
added the config option how long to wait after yt returns 404 2023-06-22 12:30:26 +00:00			`if sleep_after_404 is None:`
			`sleep_after_404 = self.sleep_after_404`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`if try_count >= self.TRIES:`
			`return`

theoretically implemented the request partially 2023-04-20 17:37:41 +00:00			`if timeout is None:`
			`timeout = self.TIMEOUT`

failed attempts 2023-04-23 10:08:39 +00:00			`parsed_url = urlparse(url)`

			`headers = self._update_headers(`
			`headers=headers,`
			`refer_from_origin=refer_from_origin,`
			`url=parsed_url`
			`)`

dsf 2023-05-03 13:16:01 +00:00			`request_url = parsed_url.geturl() if not raw_url else url`

fixed nasty bug, where musify just returned 404 al lthe time 2023-05-03 14:14:03 +00:00			`connection_failed = False`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`try:`
implemented the automated fetching of the api key 2023-07-19 19:40:23 +00:00			`if self.session_is_occupied and not is_hearthbeat:`
			`self.LOGGER.info(f"Waiting for the hearthbeat to finish.")`
			`while self.session_is_occupied and not is_hearthbeat:`
			`pass`
implemented the hearthbeat of youtube music 2023-07-17 19:19:19 +00:00
fixed nasty bug, where musify just returned 404 al lthe time 2023-05-03 14:14:03 +00:00			`r: requests.Response = request(request_url, timeout=timeout, headers=headers, **kwargs)`

made streaming more stable 2023-06-16 21:27:08 +00:00			`if r.status_code in accepted_response_codes:`
fixed nasty bug, where musify just returned 404 al lthe time 2023-05-03 14:14:03 +00:00			`return r`

			`if self.SEMANTIC_NOT_FOUND and r.status_code == 404:`
			`self.LOGGER.warning(f"Couldn't find url (404): {request_url}")`
			`return None`

improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`except requests.exceptions.Timeout:`
dsf 2023-05-03 13:16:01 +00:00			`self.LOGGER.warning(f"Request timed out at \"{request_url}\": ({try_count}-{self.TRIES})")`
fixed nasty bug, where musify just returned 404 al lthe time 2023-05-03 14:14:03 +00:00			`connection_failed = True`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`except requests.exceptions.ConnectionError:`
dsf 2023-05-03 13:16:01 +00:00			`self.LOGGER.warning(f"Couldn't connect to \"{request_url}\": ({try_count}-{self.TRIES})")`
fixed nasty bug, where musify just returned 404 al lthe time 2023-05-03 14:14:03 +00:00			`connection_failed = True`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00
fixed nasty bug, where musify just returned 404 al lthe time 2023-05-03 14:14:03 +00:00			`if not connection_failed:`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`self.LOGGER.warning(f"{self.HOST.netloc} responded wit {r.status_code} "`
			`f"at {url}. ({try_count}-{self.TRIES})")`
			`self.LOGGER.debug(r.content)`
added the config option how long to wait after yt returns 404 2023-06-22 12:30:26 +00:00			`if sleep_after_404 != 0:`
			`self.LOGGER.warning(f"Waiting for {sleep_after_404} seconds.")`
			`time.sleep(sleep_after_404)`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00
			`self.rotate()`

			`return self._request(`
			`request=request,`
completely implemented downloading from youtube 2023-06-13 18:10:11 +00:00			`try_count=try_count+1,`
made streaming more stable 2023-06-16 21:27:08 +00:00			`accepted_response_codes=accepted_response_codes,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`url=url,`
sda 2023-04-22 12:20:19 +00:00			`timeout=timeout,`
continued download 2023-06-12 15:40:54 +00:00			`headers=headers,`
added the config option how long to wait after yt returns 404 2023-06-22 12:30:26 +00:00			`sleep_after_404=sleep_after_404,`
implemented the hearthbeat of youtube music 2023-07-17 19:19:19 +00:00			`is_hearthbeat=is_hearthbeat,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`**kwargs`
			`)`

			`def get(`
			`self,`
			`url: str,`
sda 2023-04-22 12:20:19 +00:00			`refer_from_origin: bool = True,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`stream: bool = False,`
			`accepted_response_codes: set = None,`
theoretically implemented the request partially 2023-04-20 17:37:41 +00:00			`timeout: float = None,`
failed attempts 2023-04-23 10:08:39 +00:00			`headers: dict = None,`
dsf 2023-05-03 13:16:01 +00:00			`raw_url: bool = False,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`**kwargs`
			`) -> Optional[requests.Response]:`
made streaming more stable 2023-06-16 21:27:08 +00:00			`if accepted_response_codes is None:`
			`accepted_response_codes = self.ACCEPTED_RESPONSE_CODES`

improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`r = self._request(`
failed attempts 2023-04-23 10:08:39 +00:00			`request=self.session.get,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`try_count=0,`
made streaming more stable 2023-06-16 21:27:08 +00:00			`accepted_response_codes=accepted_response_codes,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`url=url,`
theoretically implemented the request partially 2023-04-20 17:37:41 +00:00			`timeout=timeout,`
failed attempts 2023-04-23 10:08:39 +00:00			`headers=headers,`
dsf 2023-05-03 13:16:01 +00:00			`raw_url=raw_url,`
fixed nasty bug, where musify just returned 404 al lthe time 2023-05-03 14:14:03 +00:00			`refer_from_origin=refer_from_origin,`
			`stream=stream,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`**kwargs`
			`)`
			`if r is None:`
			`self.LOGGER.warning(f"Max attempts ({self.TRIES}) exceeded for: GET:{url}")`
			`return r`

			`def post(`
			`self,`
			`url: str,`
			`json: dict,`
sda 2023-04-22 12:20:19 +00:00			`refer_from_origin: bool = True,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`stream: bool = False,`
			`accepted_response_codes: set = None,`
theoretically implemented the request partially 2023-04-20 17:37:41 +00:00			`timeout: float = None,`
failed attempts 2023-04-23 10:08:39 +00:00			`headers: dict = None,`
dsf 2023-05-03 13:16:01 +00:00			`raw_url: bool = False,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`**kwargs`
			`) -> Optional[requests.Response]:`
			`r = self._request(`
failed attempts 2023-04-23 10:08:39 +00:00			`request=self.session.post,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`try_count=0,`
made streaming more stable 2023-06-16 21:27:08 +00:00			`accepted_response_codes=accepted_response_codes or self.ACCEPTED_RESPONSE_CODES,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`url=url,`
theoretically implemented the request partially 2023-04-20 17:37:41 +00:00			`timeout=timeout,`
failed attempts 2023-04-23 10:08:39 +00:00			`headers=headers,`
			`refer_from_origin=refer_from_origin,`
fixed nasty bug, where musify just returned 404 al lthe time 2023-05-03 14:14:03 +00:00			`raw_url=raw_url,`
improved function to connect to the internet 2023-04-20 16:47:47 +00:00			`json=json,`
			`stream=stream,`
			`**kwargs`
			`)`
			`if r is None:`
			`self.LOGGER.warning(f"Max attempts ({self.TRIES}) exceeded for: GET:{url}")`
			`self.LOGGER.warning(f"payload: {json}")`
			`return r`
connection 2023-06-15 16:22:00 +00:00
			`def stream_into(`
			`self,`
			`url: str,`
			`target: Target,`
			`description: str = "download",`
			`refer_from_origin: bool = True,`
			`accepted_response_codes: set = None,`
			`timeout: float = None,`
			`headers: dict = None,`
			`raw_url: bool = False,`
updated conecting behaviour 2023-06-16 10:26:02 +00:00			`chunk_size: int = CHUNK_SIZE,`
			`try_count: int = 0,`
			`progress: int = 0,`
connection 2023-06-15 16:22:00 +00:00			`**kwargs`
updated conecting behaviour 2023-06-16 10:26:02 +00:00			`) -> DownloadResult:`
made streaming more stable 2023-06-16 21:27:08 +00:00
			`if progress > 0:`
			`if headers is None:`
			`headers = dict()`
			`headers["Range"] = f"bytes={target.size}-"`

			`if accepted_response_codes is None:`
			`accepted_response_codes = self.ACCEPTED_RESPONSE_CODES`
updated conecting behaviour 2023-06-16 10:26:02 +00:00
connection 2023-06-15 16:22:00 +00:00			`r = self._request(`
			`request=self.session.get,`
			`try_count=0,`
made streaming more stable 2023-06-16 21:27:08 +00:00			`accepted_response_codes=accepted_response_codes,`
connection 2023-06-15 16:22:00 +00:00			`url=url,`
			`timeout=timeout,`
			`headers=headers,`
			`raw_url=raw_url,`
			`refer_from_origin=refer_from_origin,`
			`stream=True,`
			`**kwargs`
			`)`

			`if r is None:`
updated conecting behaviour 2023-06-16 10:26:02 +00:00			`return DownloadResult(error_message=f"Could not establish connection to: {url}")`
connection 2023-06-15 16:22:00 +00:00
			`target.create_path()`
			`total_size = int(r.headers.get('content-length'))`
updated conecting behaviour 2023-06-16 10:26:02 +00:00			`progress = 0`

			`retry = False`
connection 2023-06-15 16:22:00 +00:00
made streaming more stable 2023-06-16 21:27:08 +00:00			`with target.open("ab") as f:`
			`"""`
			`https://en.wikipedia.org/wiki/Kilobyte`
			`> The internationally recommended unit symbol for the kilobyte is kB.`
			`"""`
updated conecting behaviour 2023-06-16 10:26:02 +00:00
made streaming more stable 2023-06-16 21:27:08 +00:00			`with tqdm(total=total_size-target.size, unit='B', unit_scale=True, unit_divisor=1024, desc=description) as t:`
			`try:`
updated conecting behaviour 2023-06-16 10:26:02 +00:00			`for chunk in r.iter_content(chunk_size=chunk_size):`
connection 2023-06-15 16:22:00 +00:00			`size = f.write(chunk)`
updated conecting behaviour 2023-06-16 10:26:02 +00:00			`progress += size`
connection 2023-06-15 16:22:00 +00:00			`t.update(size)`

made streaming more stable 2023-06-16 21:27:08 +00:00			`except requests.exceptions.ConnectionError:`
			`if try_count >= self.TRIES:`
			`self.LOGGER.warning(f"Stream timed out at \"{url}\": to many retries, aborting.")`
			`return DownloadResult(error_message=f"Stream timed out from {url}, reducing the chunksize might help.")`

			`self.LOGGER.warning(f"Stream timed out at \"{url}\": ({try_count}-{self.TRIES})")`
			`retry = True`

			`if total_size > progress:`
updated conecting behaviour 2023-06-16 10:26:02 +00:00			`retry = True`


made streaming more stable 2023-06-16 21:27:08 +00:00			`if retry:`
			`self.LOGGER.warning(f"Retrying stream...")`
			`accepted_response_codes.add(206)`
			`return self.stream_into(`
			`url = url,`
			`target = target,`
			`description = description,`
			`try_count=try_count+1,`
			`progress=progress,`
			`accepted_response_codes=accepted_response_codes,`
			`timeout=timeout,`
			`headers=headers,`
			`raw_url=raw_url,`
			`refer_from_origin=refer_from_origin,`
			`chunk_size=chunk_size,`
			`**kwargs`
			`)`

			`return DownloadResult()`