# Hoshpak / stov
#
#        This file is part of stov, written by Helmut Pozimski 2012-2017.
#
#       stov is free software: you can redistribute it and/or modify
#       it under the terms of the GNU General Public License as published by
#       the Free Software Foundation, version 2 of the License.
#
#       stov is distributed in the hope that it will be useful,
#       but WITHOUT ANY WARRANTY; without even the implied warranty of
#       MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#       GNU General Public License for more details.
#
#       You should have received a copy of the GNU General Public License
#       along with stov.  If not, see <http://www.gnu.org/licenses/>.


# -*- coding: utf8 -*-

"""This module provides all classes and methods that were provided by the
youtubeAPI module earlier."""

import subprocess
import urllib.parse
import urllib.request
import urllib.error
import logging

import lxml.html
from lib_stov import stov_exceptions
from lib_stov import youtubedl_wrapper

# Module-level logger, obtained under the name "stov".
LOGGER = logging.getLogger("stov")


class YtChannel(object):
    """Plain container holding what is known about a youtube channel.

    A new instance starts out empty; both attributes are meant to be
    assigned after construction.
    """

    def __init__(self):
        # videos: list of the channel's videos, title: the channel's title
        self.videos = list()
        self.title = str()


class YtVideo(object):
    """Plain container holding the title and the ID of one youtube video.

    :param title: title of the video
    :param ytid: ID of the video
    """

    def __init__(self, title, ytid):
        self.ytid, self.title = ytid, title


class Connector(object):
    """Retrieves all the necessary data from youtube using youtube-dl,
    thus bypassing the API.

    :param subscription_type: one of "user", "channel", "search" or
        "playlist"; any other value leaves the URL empty
    :param name: name of the user, channel or playlist
    :param conf: configuration object handed through unchanged to the
        youtubedl_wrapper functions
    :param search: optional search string
    """
    def __init__(self, subscription_type, name, conf, search=""):
        """Populates the object with all necessary data."""
        self._type = subscription_type
        self._name = name
        self._search = search
        self._conf = conf
        self._title = ""
        self._url = ""
        self._construct_url()

    def _construct_url(self):
        """Constructs the URL to request from youtube-dl according to the
        subscription type and the given parameters.

        The URL is left untouched when the subscription type is not one of
        the known types.
        """
        # Maps each known type to its URL template and the value that gets
        # quoted into it (searches use the search string, the rest the name).
        templates = {
            "user": ("https://www.youtube.com/user/%s", self._name),
            "channel": ("https://www.youtube.com/channel/%s", self._name),
            "search": ("https://www.youtube.com/results?search_query=%s",
                       self._search),
            "playlist": ("https://www.youtube.com/playlist?list=%s",
                         self._name),
        }
        if self._type in templates:
            template, value = templates[self._type]
            self._url = template % urllib.parse.quote(value)

    def _fetch_title(self):
        """Retrieves the title of the HTML page to use as a title for the
        subscription.

        If a "user" URL answers with HTTP 404, the subscription is switched
        to type "channel" and the request is repeated once with the channel
        URL.

        :raises stov_exceptions.ChannelNotFound: if the page can not be
            retrieved because of a HTTP error
        """
        try:
            data = urllib.request.urlopen(self._url)
        except urllib.error.HTTPError as err:
            if err.code != 404 or self._type != "user":
                raise stov_exceptions.ChannelNotFound() from err
            # The name might refer to a channel instead of a user, retry.
            self._type = "channel"
            self._construct_url()
            try:
                data = urllib.request.urlopen(self._url)
            except urllib.error.HTTPError as retry_err:
                raise stov_exceptions.ChannelNotFound() from retry_err
        self._parse_title(data)

    def _parse_title(self, data):
        """ Parses the title from a HTML document

        The text of the first <title> element becomes the title; the title
        is left unchanged when the document contains no such element. The
        connection is closed even if parsing fails.

        :param data: HTTP connection to the document
        :type data: http.client.HTTPResponse
        """
        try:
            parsed_html = lxml.html.parse(data)
        finally:
            # Release the connection no matter whether parsing succeeded.
            data.close()
        first_title = next(iter(parsed_html.iter("title")), None)
        if first_title is not None:
            self._title = first_title.text_content().strip().replace("\n", "")
        if self._search != "" and self._type == "user":
            # NOTE(review): `_` is not defined in this module; presumably
            # the gettext translation function installed elsewhere - confirm.
            self._title += _(" search %s") % self._search

    @staticmethod
    def _filter_new_ids(video_ids, existing_videos):
        """Returns the video IDs which do not belong to an existing video.

        Order and duplicates of video_ids are preserved.

        :param video_ids: IDs to filter, may be None or empty
        :param existing_videos: objects with a ytid attribute, may be None
            or empty
        :return: list of the IDs not found among the existing videos
        """
        if not video_ids:
            return []
        # Build the lookup set once instead of scanning the existing videos
        # for every single ID.
        known_ids = {video.ytid for video in existing_videos or ()}
        return [video_id for video_id in video_ids
                if video_id not in known_ids]

    def _fetch_videos(self, existing_videos):
        """Retrieves all the relevant videos in a subscription.

        :param existing_videos: already known videos (objects with a ytid
            attribute); their IDs are skipped
        :return: list of YtVideo objects for all videos not known yet
        :raises stov_exceptions.YoutubeDlCallFailed: if retrieving the title
            of a video fails with subprocess.CalledProcessError
        """
        if self._type == "user" and self._search:
            video_ids = youtubedl_wrapper.get_ids(self._conf, self._url,
                                                  self._search)
        else:
            video_ids = youtubedl_wrapper.get_ids(self._conf, self._url)
        LOGGER.debug("Got video IDs: %s", video_ids)
        videos_list = []
        for video_id in self._filter_new_ids(video_ids, existing_videos):
            try:
                video_title = youtubedl_wrapper.get_title(
                    self._conf,
                    "https://www.youtube.com/watch?v=%s" % video_id)
            except subprocess.CalledProcessError as err:
                raise stov_exceptions.YoutubeDlCallFailed() from err
            videos_list.append(YtVideo(video_title, video_id))
        return videos_list

    def parse_api_data(self, existing_videos):
        """This method calls all necessary methods to retrieve the data
        and assembles them into a Channel object. The naming of this
        method was set according to the method in youtubeAPI to be
        compatible.

        :param existing_videos: already known videos, passed on to
            _fetch_videos
        :return: YtChannel carrying the fetched title and the new videos
        """
        self._fetch_title()
        videos = self._fetch_videos(existing_videos)
        channel = YtChannel()
        channel.title = self._title
        channel.videos = videos
        return channel