#   Copyright 2011-2016 Josh Kearney
#
#   Licensed under the Apache License, Version 2.0 (the "License");
#   you may not use this file except in compliance with the License.
#   You may obtain a copy of the License at
#
#       http://www.apache.org/licenses/LICENSE-2.0
#
#   Unless required by applicable law or agreed to in writing, software
#   distributed under the License is distributed on an "AS IS" BASIS,
#   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#   See the License for the specific language governing permissions and
#   limitations under the License.

"""Pyhole URL Plugin"""

from BeautifulSoup import BeautifulSoup

from pyhole.core import plugin
from pyhole.core import request
from pyhole.core import utils


class Url(plugin.Plugin):
    """Provide access to URL data."""

    def __init__(self, session):
        self.session = session
        self.name = self.__class__.__name__
        self.url = None

    @plugin.hook_add_command("title")
    def title(self, message, params=None, **kwargs):
        """Display the title of the a URL (ex: .title [<url>])"""
        if params:
            self.url = params.split(" ", 1)[0]

        if not _matches_host(self.url):
            self._find_title(message, self.url)

    @plugin.hook_add_msg_regex("(https?://|www.)[^\> ]+")
    def regex_match_url(self, message, match, **kwargs):
        """Watch and keep track of the latest URL."""
        try:
            # NOTE(jk0): Slack does some weird things with URLs.
            self.url = match.group(0).split("|", 1)[0]

            if _matches_host(self.url):
                self._find_title(message, self.url)
        except TypeError:
            return

    @utils.spawn
    def _find_title(self, message, url):
        """Find the title of a given URL."""
        # NOTE(jk0): Slack does some weird things with URLs.
        url = url.replace("<", "").replace(">", "").split("|")[0]
        if not url.startswith(("http://", "https://")):
            url = "http://" + url

        try:
            response = request.get(url)
        except Exception:
            return

        soup = BeautifulSoup(response.content)
        if soup.head:
            title = utils.decode_entities(soup.head.title.string)
            content_type = response.headers.get("Content-Type")
            message.dispatch("%s (%s)" % (title, content_type))
        else:
            message.dispatch("No title found: %s" % url)


def _matches_host(url):
    """Watch for certain websites."""
    try:
        host = url.split("/")[2]
    except IndexError:
        host = url

    lookup_sites = ("open.spotify.com", "www.youtube.com", "youtu.be")
    if host.startswith(lookup_sites):
        return True