doxygen/mevio__api_8py_source.html

# -*- coding: UTF-8 -*-


# ----------------------

# Name: mevio_api - XPath and XSLT functions for the Mevio RSS/HTML items

# Python Script

# Author:   R.D. Vaughan

# Purpose:  This python script is intended to perform a variety of utility functions

#           for the conversion of data to the MNV standard RSS output format.

#           See this link for the specifications:

#           http://www.mythtv.org/wiki/MythNetvision_Grabber_Script_Format

#

# License:Creative Commons GNU GPL v2

# (http://creativecommons.org/licenses/GPL/2.0/)

#-------------------------------------

# Module metadata: a descriptive title, the author, a free-text statement of
# purpose and the version string. The version history follows in the comments
# after __version__.
__title__ ="mevio_api - XPath and XSLT functions for the www.mevio.com RSS/HTML"

__author__="R.D. Vaughan"

# NOTE: the text between the triple quotes is a runtime string, so its line
# breaks and blank lines are part of the value.
__purpose__='''

This python script is intended to perform a variety of utility functions

for the conversion of data to the MNV standard RSS output format.

See this link for the specifications:

http://www.mythtv.org/wiki/MythNetvision_Grabber_Script_Format

'''


__version__="v0.1.1"

# 0.1.0 Initial development

# 0.1.1 Fixed a bug when an autoplay link cannot be created

#       Added MP4 as an acceptable downloadable video file type

#       Added checking to see if the item is already in the database


# Specify the names of the classes in this module that provide XPath extension
# functions. NOTE(review): presumably read by the code that loads this module
# to discover the classes -- confirm against the loader.

__xpathClassList__ = ['xpathFunctions', ]


# Specify the XSLT extension class names. Each class is a standalone extension
# function. The commented-out line below shows the expected form; this module
# registers no XSLT extension classes (the list is empty).

#__xsltExtentionList__ = ['xsltExtExample', ]

__xsltExtentionList__ = []


import os, sys, re, time, datetime, shutil, urllib.request, urllib.parse, urllib.error, string

from copy import deepcopy

import io


class OutStreamEncoder(object):
    """Wrap a text stream so that str output is encoded before it is written.

    ``write()`` encodes str objects with the configured encoding and sends the
    resulting bytes to the wrapped stream's ``buffer`` attribute. Every other
    attribute is looked up on the wrapped stream itself.
    """

    def __init__(self, outstream, encoding=None):
        """Store the stream to wrap and the encoding to use.

        outstream -- the stream being wrapped; write() requires it to expose a
                     binary ``buffer`` attribute.
        encoding  -- codec name used by write(); when empty or None the value
                     of sys.getfilesystemencoding() is used instead.
        """
        self.out = outstream
        if not encoding:
            self.encoding = sys.getfilesystemencoding()
        else:
            self.encoding = encoding

    def write(self, obj):
        """Wraps the output stream, encoding Unicode strings with the specified encoding

        str objects are encoded first; any other object (e.g. bytes) is passed
        to the underlying binary buffer unchanged.
        """
        if isinstance(obj, str):
            obj = obj.encode(self.encoding)
        try:
            self.out.buffer.write(obj)
        except OSError:
            # Deliberate best effort kept from the original: a failed write is
            # ignored (presumably so a closed pipe does not abort the script).
            pass

    def __getattr__(self, attr):
        """Delegate everything but write to the stream

        __getattr__ only runs when normal lookup fails. If ``out`` itself is
        missing (instance created without __init__, e.g. while being copied or
        unpickled), reading ``self.out`` here would call __getattr__ again and
        recurse until RecursionError, which hasattr() does not swallow. Raise
        AttributeError for that case instead.
        """
        if attr == 'out':
            raise AttributeError(attr)
        return getattr(self.out, attr)


# When stdout is a regular text wrapper, route both stdout and stderr through
# UTF-8 encoding wrappers. Only stdout is inspected; stderr is wrapped along
# with it.
if isinstance(sys.stdout, io.TextIOWrapper):
    sys.stdout, sys.stderr = (
        OutStreamEncoder(sys.stdout, 'utf8'),
        OutStreamEncoder(sys.stderr, 'utf8'),
    )


try:

    from io import StringIO

    from lxml import etree

except Exception as e:

    sys.stderr.write('\n! Error - Importing the "lxml" and "StringIO" python libraries failed on error(%s)\n' % e)

    sys.exit(1)


class xpathFunctions(object):
    """XPath extension functions for the Mevio RSS/HTML items.

    The methods named in ``self.functList`` take the XPath evaluation context
    as their first argument followed by the values passed from the XPath
    expression (see the "Call example" in each method).

    NOTE(review): ``common`` is used by mevioLinkGeneration() and
    mevioCheckIfDBItem() but is neither defined nor imported in the visible
    source; presumably the loader injects it into this module -- confirm.
    """

    def __init__(self):
        # Names of the methods offered as XPath extension functions.
        self.functList = ['mevioLinkGeneration', 'mevioTitle', 'mevioEpisode', 'mevioCheckIfDBItem', ]
        # Patterns tried in order by mevioEpisode(); each one captures the
        # digits of the episode number in the named group 'episodeno'.
        self.episodeRegex = [
            # Episode 224
            re.compile('''^.+?Episode\\ (?P<episodeno>[0-9]+).*$''', re.UNICODE),
            # CrankyGeeks 136:
            re.compile('''^.+?(?P<episodeno>[0-9]+)\\:.*$''', re.UNICODE),
            ]
        # Prefix to namespace URI map handed to the compiled XPath expressions.
        self.namespaces = {
            'atom10': "http://www.w3.org/2005/Atom",
            'media': "http://search.yahoo.com/mrss/",
            'itunes':"http://www.itunes.com/dtds/podcast-1.0.dtd",
            'xhtml': "http://www.w3.org/1999/xhtml",
            'feedburner': "http://rssnamespace.org/feedburner/ext/1.0",
            'mythtv': "http://www.mythtv.org/wiki/MythNetvision_Grabber_Script_Format",
            'dc': "http://purl.org/dc/elements/1.1/",
            'fb': "http://www.facebook.com/2008/fbml/",
            }
        # Pairs of [XPath locating a candidate string in the web page, regex
        # capturing the numeric media id from it as 'videocode'], tried in order.
        self.mediaIdFilters = [
            [etree.XPath(".//embed/@flashvars", namespaces=self.namespaces), re.compile('''^.+?MediaId=(?P<videocode>[0-9]+).*$''', re.UNICODE)],
            [etree.XPath(".//div[@class='player_wrapper']/a/@href", namespaces=self.namespaces), re.compile('''^.+?\\'(?P<videocode>[0-9]+)\\'\\)\\;.*$''', re.UNICODE)]
            ]
    # end __init__()

    @staticmethod
    def _firstText(arg):
        '''Return the first item of an XPath result sequence, or an empty string
        when the sequence is empty (e.g. the item has no title text), so callers
        do not fail with IndexError.
        '''
        return arg[0] if arg else ''
    # end _firstText()

    def mevioLinkGeneration(self, context, *arg):
        '''Generate a link for the video.
        Call example: 'mnvXpath:mevioLinkGeneration(string(link))'
        The page at the given URL is parsed as HTML and searched with each
        entry of self.mediaIdFilters for a media id.
        return a local 'file://' player link carrying the media id when one is found
        return the unchanged web page URL if the page cannot be read or no
        media id is found
        '''
        webURL = arg[0]
        try:
            tmpHTML = etree.parse(webURL, etree.HTMLParser())
        except Exception as errmsg:
            # Best effort: report the problem and fall back to the original link.
            sys.stderr.write("Error reading url(%s) error(%s)\n" % (webURL, errmsg))
            return webURL

        for xpathFilter, codeRegex in self.mediaIdFilters:
            mediaId = xpathFilter(tmpHTML)
            if not mediaId:
                continue
            match = codeRegex.match(mediaId[0])
            if match:
                return 'file://%s/nv_python_libs/configs/HTML/mevio.html?videocode=%s' % (common.baseProcessingDir, match.group('videocode'))

        # No filter produced a media id, so an autoplay link cannot be built.
        return webURL
    # end mevioLinkGeneration()

    def mevioTitle(self, context, arg):
        '''Parse the title string extract only the title text removing the redundant show name
        Call example: 'mnvXpath:mevioTitle(./title/text())'
        The separators ' | ', ': ' and ' - ' are tried in that order; the text
        before the last ' | ' or ' - ', or after the first ': ', is kept. When
        an episode number is found it is prepended as 'Ep <number>: '.
        return the title text (an empty string when no title text was passed)
        '''
        title = self._firstText(arg)
        epText = self.mevioEpisode('dummy', arg).text
        epText = 'Ep %s: ' % epText if epText else ''

        seperatorStrs = ((' | ', 'before'), (': ', 'after'), (' - ', 'before'))
        for separator, keep in seperatorStrs:
            if keep == 'after':
                index = title.find(separator)
                if index != -1:
                    return '%s%s' % (epText, title[index+len(separator):].strip())
            else:
                index = title.rfind(separator)
                if index != -1:
                    return '%s%s' % (epText, title[:index].strip())

        # No separator present: the episode prefix alone, else the bare title.
        if epText:
            return epText
        return title.strip()
    # end mevioTitle()

    def mevioEpisode(self, context, arg):
        '''Parse the title string and extract an episode number
        Call example: 'mnvXpath:mevioEpisode(./title/text())'
        The patterns in self.episodeRegex are tried in order and the first
        match wins.
        return an episode element whose text is the episode number; the element
        is empty when no number is found
        '''
        title = self._firstText(arg)
        episodeNumber = ''
        for regex in self.episodeRegex:
            match = regex.match(title)
            if match:
                # Use the named group rather than formatting the groups() tuple.
                episodeNumber = match.group('episodeno')
                break
        return etree.XML('<episode>%s</episode>' % episodeNumber)
    # end mevioEpisode()

    def mevioCheckIfDBItem(self, context, *arg):
        '''Use a unique key value pairing to find out if the 'internetcontentarticles' table already
        has a matching item. This is done to save accessing the Internet when not required.
        Call example: 'mnvXpath:mevioCheckIfDBItem(title, description)'
        The lookup is delegated to common.checkIfDBItem() with the feed title
        fixed to 'Technology'; its result is returned unchanged.
        return True if a match was found
        return False if a match was not found
        '''
        return common.checkIfDBItem('dummy', {'feedtitle': 'Technology', 'title': arg[0], 'description': arg[1]})
    # end mevioCheckIfDBItem()


nv_python_libs.xsltfunctions.mevio_api.OutStreamEncoder
Definition: mevio_api.py:41

nv_python_libs.xsltfunctions.mevio_api.OutStreamEncoder.write
def write(self, obj)
Definition: mevio_api.py:50

nv_python_libs.xsltfunctions.mevio_api.OutStreamEncoder.__init__
def __init__(self, outstream, encoding=None)
Definition: mevio_api.py:43

nv_python_libs.xsltfunctions.mevio_api.OutStreamEncoder.encoding
encoding
Definition: mevio_api.py:46

nv_python_libs.xsltfunctions.mevio_api.OutStreamEncoder.out
out
Definition: mevio_api.py:44

nv_python_libs.xsltfunctions.mevio_api.OutStreamEncoder.__getattr__
def __getattr__(self, attr)
Definition: mevio_api.py:59

nv_python_libs.xsltfunctions.mevio_api.xpathFunctions
Definition: mevio_api.py:75

nv_python_libs.xsltfunctions.mevio_api.xpathFunctions.mevioCheckIfDBItem
def mevioCheckIfDBItem(self, context, *arg)
Definition: mevio_api.py:174

nv_python_libs.xsltfunctions.mevio_api.xpathFunctions.mevioTitle
def mevioTitle(self, context, arg)
Definition: mevio_api.py:132

nv_python_libs.xsltfunctions.mevio_api.xpathFunctions.mevioLinkGeneration
def mevioLinkGeneration(self, context, *arg)
Start of XPath extension functions.
Definition: mevio_api.py:108

nv_python_libs.xsltfunctions.mevio_api.xpathFunctions.functList
functList
Definition: mevio_api.py:79

nv_python_libs.xsltfunctions.mevio_api.xpathFunctions.namespaces
namespaces
Definition: mevio_api.py:86

nv_python_libs.xsltfunctions.mevio_api.xpathFunctions.mevioEpisode
def mevioEpisode(self, context, arg)
Definition: mevio_api.py:160

nv_python_libs.xsltfunctions.mevio_api.xpathFunctions.episodeRegex
episodeRegex
Definition: mevio_api.py:80

nv_python_libs.xsltfunctions.mevio_api.xpathFunctions.mediaIdFilters
mediaIdFilters
Definition: mevio_api.py:96

nv_python_libs.xsltfunctions.mevio_api.xpathFunctions.__init__
def __init__(self)
Definition: mevio_api.py:78

find
static pid_list_t::iterator find(const PIDInfoMap &map, pid_list_t &list, pid_list_t::iterator begin, pid_list_t::iterator end, bool find_open)
Definition: dvbstreamhandler.cpp:363

urllib.request