Context Navigation

Back to Ticket #2734

Ticket #2734: metadata_script_improvements_against_trunk_07-03-03.patch

File metadata_script_improvements_against_trunk_07-03-03.patch, 31.4 KB (added by visit0r, 17 years ago)
Changes against trunk (note: the scripts are NOT tested with MythVideo on trunk, only with 0.20).

mythvideo/mythvideo/scripts/find_meta.py

-                      old
+                      new
 directory with multiple video files. Perform movie data lookups using the
 imdbpy.py script.
 Written by Pekka Jääskeläinen (gmail: pekka.jaaskelainen) 2006.
+Written by Pekka Jääskeläinen (gmail: pekka.jaaskelainen) 2006-2007.
 The metadata is searched with following steps:
 …
 In case it's a video directory (a directory with 2 or more video files for the same title,
 or a DVD directory) the file name is video.metadata.
+Includes an interactive mode which makes the script ask user for input in case there are
+titles for which IMDb queries cannot be done unambiguously.
+A crontab entry that makes the script automatically insert the data of new video
+files into MythDB every hour:
+0 * * * * find_meta.py -r /videos
+where /videos is the root of your MythVideo files.
 """
 import sys
 …
 import glob
 import fileinput
 import imdbpy
+import shlex
+import socket
+import urllib
 try:
+        # If loaded, get neater input prompt for interactive questions.
+        import readline
+        # If found, we can insert data directly to MythDB
+        import MySQLdb
+        db_support = True
 except:
+        pass
+        print "MySQLdb (python-mysqldb) not installed, MythDB importing disabled."
+        db_support = False
 from stat import *
 verbose=False
+overwrite=False
 interactive=False
 recursive=False
+dbimport=False
+# Import metadata from .metadata files if found.
+import_from_files=False
+# Overwrite the old metadata if found.
+overwrite=False
+# Create the *.metadata files.
+metafiles=False
 videoExtensions = ["avi", "mpg", "wmv"]
+videoExtensions = ["avi", "mpg", "wmv", "mkv"]
 # The file name for storing metadata for videos that occupy the whole
 # directory and might consist of multiple video files for the same
 …
 # Directories to skip in the recursive scan (matched to the rightmost
 # part of the directory).
+skipDirs = ["/Sample", "/Sub"]
+skipDirs = ["/Sample", "/Sub", "/VIDEO_TS"]
+# The directory to store the poster files in (this will be fetched from the
+# MythTV settings table).
+poster_dir = "./"
 def print_verbose(string):
         global verbose
 …
                 print string
         return
+# The MythDB connection shared by all the database helpers; set by init_db().
+db = None
+def init_db():
+        """
+        Opens the connection to the MythTV database ("mythconverg").
+        The host name, user name and password are read from the DBHostName,
+        DBUserName and DBPassword entries of ~/.mythtv/mysql.txt.
+        On success stores the connection to the global db and returns True.
+        Returns False if the configuration file cannot be opened. Errors
+        raised by MySQLdb.connect() are not caught here.
+        """
+        global db
+        try:
+                config_file = open(os.path.expanduser('~/.mythtv/mysql.txt'))
+        except IOError:
+                print "Error opening ~/.mythtv/mysql.txt"
+                return False
+        db_host = db_user = db_password = None
+        try:
+                # shlex reads the stream lazily, so the file has to stay open
+                # until all the needed tokens have been consumed.
+                config = shlex.shlex(config_file)
+                token = config.get_token()
+                while token != config.eof and (db_host is None or db_user is None or db_password is None):
+                        # Each setting is expected in the form NAME = value.
+                        if token == "DBHostName":
+                                if config.get_token() == "=":
+                                        db_host = config.get_token()
+                        elif token == "DBUserName":
+                                if config.get_token() == "=":
+                                        db_user = config.get_token()
+                        elif token == "DBPassword":
+                                if config.get_token() == "=":
+                                        db_password = config.get_token()
+                        token = config.get_token()
+        finally:
+                # Close the configuration file also when the parsing fails.
+                config_file.close()
+        db = MySQLdb.connect(user=db_user, host=db_host, passwd=db_password,
+                db="mythconverg")
+        print_verbose("Database connection successful.")
+        return True
 def find_imdb_id_from_text_file(textFile):
         if os.access(textFile, os.R_OK):
 …
                 return path[0: suffix_pos]
         else:
                 return path
 def cleanup_title(title):
         title = title.replace("_", " ").replace(".", " ")
         cut_point_strings = ["hdtv", "xvid", "dvd", "proper"]
+        cut_point_strings = ["hdtv", "xvid", "dvd", "proper", "720p"]
         lowest_cutpoint = len(title)
         for string in cut_point_strings:
                 pos = title.lower().rfind(string)
 …
         title = title[0:lowest_cutpoint]
         return title.strip()
+def save_metadata(fileName, metadata):
+def get_genre_id(genre_name):
+        """
+        Find the id of the given genre from MythDB.
+        If the genre does not exist, insert it and return its id.
+        The lookup ignores letter case and surrounding whitespace; a new genre
+        is stored capitalized.
+        """
+        global db
+        # Genre lists are split at commas, which can leave blanks around a name.
+        genre_name = genre_name.strip()
+        c = db.cursor()
+        # The column is lowercased in the query, so the searched name has to be
+        # lowercased too or a mixed-case genre never matches an existing row.
+        c.execute("SELECT intid FROM videocategory WHERE lower(category) = %s", (genre_name.lower(),))
+        row = c.fetchone()
+        c.close()
+        if row is not None:
+                return row[0]
+        # Insert a new genre.
+        c = db.cursor()
+        c.execute("INSERT INTO videocategory(category) VALUES (%s)", (genre_name.capitalize(),))
+        newid = c.lastrowid
+        c.close()
+        return newid
+def parse_meta(variable, oldvalue, emptyvalue="", meta=""):
+        """
+        Extracts the value of one "Name:value" line from a metadata string
+        (as returned by imdbpy.py, etc.).
+        variable   the name of the metadata to look for
+        oldvalue   the current value of the metadata, if any
+        emptyvalue the value that counts as "not set" (e.g. "None", "")
+        meta       the metadata string, one "Name:value" entry per line
+        Returns oldvalue when it is set and overwriting is disabled, otherwise
+        the stripped value of the first matching line, or None if no line matches.
+        """
+        global overwrite
+        has_old_value = oldvalue is not None and oldvalue != emptyvalue
+        if has_old_value and not overwrite:
+                return oldvalue
+        prefix = variable + ":"
+        matches = [line for line in meta.split("\n") if line.startswith(prefix)]
+        if matches:
+                # Only the first occurrence counts.
+                return matches[0][len(prefix):].strip()
+        return None
+def detect_disc_number(allfiles, file):
+        """
+        Works out which disc of a multi-file title the given file is by
+        comparing its name to the names of all the files of the title.
+        allfiles the names of all the files of the title
+        file     the name whose disc number is wanted (must be in allfiles)
+        Returns the disc number, or None if it cannot be detected.
+        """
+        if len(allfiles) < 2 or file not in allfiles:
+                return None
+        # All the names have to be equally long (i.e. no more than 9 discs per
+        # title is assumed) and at least one has to differ from the given one.
+        width = len(allfiles[0])
+        if [name for name in allfiles if len(name) != width]:
+                return None
+        if not [name for name in allfiles if name != file]:
+                return None
+        reference = allfiles[0]
+        def column_differs(pos):
+                # True if the names do not all share the same character at pos.
+                for name in allfiles:
+                        if name[pos] != reference[pos]:
+                                return True
+                return False
+        # Find the range of characters that is not equal in all the names.
+        # For example:
+        # "Rambo III disc 1.avi"
+        # "Rambo III disc 2.avi"
+        #  ===============!====
+        first = 0
+        while first < width - 1 and not column_differs(first):
+                first += 1
+        last = width - 1
+        while last > 0 and not column_differs(last):
+                last -= 1
+        # The differing part is the disc identifier.
+        token = file[first:last + 1].lower()
+        try:
+                number = int(token)
+        except:
+                # Not an integer, maybe the discs are lettered instead.
+                letters = ["a", "b", "c", "d", "e"]
+                if token in letters:
+                        return letters.index(token) + 1 # a == disc 1, b == disc 2, ...
+                return None
+        if number == -1:
+                return None
+        return number
+def save_metadata_to_mythdb(videopath, metadata):
+        """
+        Updates the given metadata for the given video path.
+        Detects if the given title is a dvd-rip dir with multiple videos (the
+        metadata has a "Files:" entry listing more than one file) and adds
+        metadata for all the videos separately, and chains the videos together.
+        Returns the id of the stored metadata for a single video and None for
+        a dvd-rip dir.
+        """
+        files_str = parse_meta("Files", "", "", metadata)
+        if files_str is not None:
+                files = files_str.split(",")
+                if len(files) > 1:
+                        # It's a dvd-rip dir.
+                        # Set the first video's childid to -1, which denotes no childs.
+                        child = -1
+                        # Add the last file in chain first so we can set it as a child
+                        # to the next one, etc.
+                        for file in reversed(files):
+                                child = save_video_metadata_to_mythdb(
+                                        videopath + "/" + file, metadata,
+                                        child, disc = detect_disc_number(files, file))
+                                if child is None:
+                                        # Nothing was stored for this file, so there is
+                                        # no id to chain to; do not pass None on as the
+                                        # childid of the next file.
+                                        child = -1
+                        return
+        return save_video_metadata_to_mythdb(videopath, metadata)
+def mythvideo_metadata_id(videopath):
+        """
+        Looks up the videometadata row whose filename equals the given video path.
+        Returns its intid, or None if MythDB has no such row.
+        """
+        global db
+        cursor = db.cursor()
+        cursor.execute("""
+                SELECT intid
+                FROM videometadata
+                WHERE filename = %s""", (videopath,))
+        found = cursor.fetchone()
+        cursor.close()
+        if found is None:
+                return None
+        return found[0]
+def mythtv_setting(value, hostname = '%'):
+        """
+        Reads one MythTV setting from the settings table.
+        value    the name of the setting (matched with LIKE)
+        hostname the host whose setting is wanted (matched with LIKE, the
+                 default '%' matches any host)
+        Returns the data of the first matching row, or None if there is none.
+        """
+        global db
+        cursor = db.cursor()
+        cursor.execute("""
+                SELECT data
+                FROM settings
+                WHERE value LIKE(%s) AND hostname LIKE(%s) LIMIT 1""",
+                (value, hostname))
+        found = cursor.fetchone()
+        cursor.close()
+        if found is None:
+                return None
+        return found[0]
+def save_video_metadata_to_mythdb(videopath, metadata, child=-1, disc=None):
+        """
+        Updates the given metadata for the given video file.
+        child can be set to the id of the child video (video to be played after this one).
+        disc can be set to the disc number in case of multifile title (the disc number
+             is appended to the title string to enable differentiating the titles in
+             file browse mode).
+        Returns the id of the inserted metadata, or None if nothing was stored:
+        the entry already exists and overwriting is off, or the metadata has
+        no title, year or genres.
+        """
+        global overwrite, db, poster_dir
+        # Drop the trailing '/' from the path
+        if videopath.endswith('/'):
+                videopath = videopath[0:-1]
+        videopath = os.path.abspath(videopath)
+        print_verbose("Inserting metadata to MythDB for %s." % videopath)
+        # Initial ("empty") values of the columns.
+        (intid, title, category, director, plot, rating, inetref, year,
+         userrating, length, filename, coverfile, childid, playcommand) = \
+                 (None, None, 0, None, None, None, None,
+                  0, None, 0, None, None, child, "")
+        intid = mythvideo_metadata_id(videopath)
+        if intid is not None:
+                if not overwrite:
+                        print_verbose("Metadata already exist in MythDB, not overwriting it.")
+                        return None
+        else:
+                print_verbose("No metadata in MythDB, creating a new one.")
+                # Create a new empty entry at this point so we can use the common UPDATE code
+                # to actually insert the data.
+                # NOTE(review): the early returns below leave this empty row in the
+                # table when the metadata turns out to be incomplete.
+                c = db.cursor()
+                c.execute("""INSERT INTO videometadata(filename) VALUES(%s)""", (videopath,))
+                intid = c.lastrowid
+                c.close()
+        def parse_metadata(variable, oldvalue, emptyvalue="", meta=metadata):
+                return parse_meta(variable, oldvalue, emptyvalue, meta)
+        title = parse_metadata('Title', title)
+        year = parse_metadata('Year', year, 0)
+        # Check for the missing title before touching it: appending the disc
+        # number to None would raise a TypeError.
+        if title is None or year is None:
+                return
+        if disc is not None:
+                title += " (disc " + str(disc) + ")"
+        director = parse_metadata('Director', director, 'Unknown')
+        if director is None:
+                director = "Unknown"
+        plot = parse_metadata('Plot', plot, "None")
+        userrating = parse_metadata('UserRating', userrating, 0.0)
+        try:
+                # Only checks that the rating is numeric; the parsed value is
+                # stored as it is.
+                float(userrating)
+        except:
+                userrating = 0.0
+        rating = parse_metadata('MovieRating', rating, "Unknown")
+        if rating is None:
+                rating = "Unknown"
+        length = parse_metadata('Runtime', length, 0)
+        try:
+                # Use only the first one of comma separated runtimes.
+                length = length.split(",")[0]
+                length = int(length)
+        except:
+                length = 0
+        inetref = parse_metadata('IMDb', inetref, '00000000')
+        if inetref is None:
+                inetref = '00000000'
+        filename = videopath
+        genrestring = parse_metadata('Genres', "", "")
+        genres = []
+        if genrestring is not None and len(genrestring) > 0:
+                genres = genrestring.split(",")
+        if len(genres) < 1:
+                print_verbose("No genres.")
+                return
+        else:
+                # Only one genre supported?
+                category = get_genre_id(genres[0])
+        coverfile = find_poster_image(inetref)
+        if coverfile is None:
+                coverfile = "No cover"
+        else:
+                # TODO: should enter only the filename to allow reusing
+                # the same cover file from multiple hosts where the
+                # poster image directory is mounted to different directories.
+                # This needs to be fixed in MythVideo first.
+                coverfile = poster_dir + "/" + coverfile
+        c = db.cursor()
+        c.execute("""
+                UPDATE videometadata
+                SET showlevel = 1, browse = 1, childid = %s, playcommand = %s, title = %s,
+                    director = %s, plot = %s, rating = %s, inetref = %s, category = %s,
+                    year = %s, userrating = %s, length = %s, filename = %s, coverfile = %s
+                WHERE intid = %s""",
+                (childid, playcommand, title, director, plot, rating, inetref, category,
+                 year, userrating, length, filename, coverfile, intid))
+        c.close()
+        return intid
+def find_poster_image(imdb_id):
+        """
+        Finds the poster image of the title with the given IMDb id.
+        An image named <imdb_id>.png/.jpg/.bmp in the poster directory is used
+        if there is one; otherwise the poster URL is asked from imdbpy.py and
+        the image is downloaded to the poster directory.
+        Returns the base name of the poster image file, or None if no poster
+        could be found.
+        """
+        global poster_dir
+        existing = []
+        for ext in ("png", "jpg", "bmp"):
+                existing.extend(glob.glob("%s/%s.%s" % (poster_dir, imdb_id, ext)))
+        if existing:
+                print_verbose("Found existing cover image.")
+                # TODO: if multiple poster images available, pick the one with largest
+                # dimensions.
+                # Now just pick the first found.
+                return os.path.basename(existing[0])
+        # Nothing stored locally, try to fetch the poster image from the web.
+        poster_url = imdbpy.find_poster_url(imdb_id)
+        if poster_url is None:
+                return None
+        print_verbose("Found poster at '%s', downloading it..." % poster_url)
+        # Store the image under the IMDb id, keeping the extension of the
+        # remote file.
+        extension = os.path.splitext(poster_url.split("/")[-1])[1]
+        local_filename = poster_dir + "/" + imdb_id + extension
+        urllib.urlretrieve(poster_url, local_filename)
+        return os.path.basename(local_filename)
+def save_metadata_to_file(fileName, metadata):
+        global overwrite
         if os.path.exists(fileName) and not overwrite:
                 print_verbose("Metadata already exists, not overwriting.")
+                return
         if metadata is not None:
                 print_verbose("Writing metadata to '%s'" % fileName)
                 f = open(fileName, 'w')
                 f.write(metadata.encode("utf8"))
                 f.close()
+                print_verbose("Metadata:")
+                print_verbose(metadata)
+def save_metadata(videopath, metadata_filename, metadata):
+        """
+        Stores the metadata (a single string) of the given video path to the
+        enabled targets: to the file metadata_filename when metadata files are
+        wanted, and to MythDB when the database import is on.
+        """
+        global dbimport, metafiles
+        for text in ("Metadata:", metadata):
+                print_verbose(text)
+        if metafiles:
+                save_metadata_to_file(metadata_filename, metadata)
+        if dbimport:
+                save_metadata_to_mythdb(videopath, metadata)
 def find_metadata_for_video_path(pathName):
         global interactive
         fileName = os.path.basename(pathName)
 …
                         dirName + "/imdb.url",
                         dirName + "/" + file_body + ".nfo",
                         dirName + "/" + file_body + ".imdb"]
+        # Add rest of the .nfos to the list of the scanned ones.
+        # Add rest of the .nfos to the end of the list.
         for nfo in glob.glob(dirName + "/*.nfo"):
                 if nfo not in nfos:
                         nfos.append(nfo)
 …
         if imdb_id is None:
                 # A title search
                 title = cleanup_title(title)
+                title = unicode(cleanup_title(title), "utf8", "ignore")
                 print_verbose("Title search '%s'" % title)
                 candidates = imdbpy.title_search(title.decode("utf8"))
+                candidates = imdbpy.title_search(title)
                 if candidates is None or len(candidates) == 0:
                         # Try with the dirname
+                        # TODO: Try with the dirname
                         pass
                 if candidates is not None and len(candidates) > 0:
                         index = 0
                         if len(candidates) > 1:
+                                print "Got multiple candidates for title search '%s'. " % title
+                                print "Use the '-a' switch to choose the correct one."
+                                for candidate in candidates:
+                                        print "%s) %s (%d)" % (candidate[0], candidate[1], candidate[2])
                                 if interactive:
-                                        print "Got multiple candidates for the title search '%s'. " % title
-                                        print "Which one is the correct title?"
-                                        for i in range(len(candidates)):
-                                                print "%d) %s (%d)" % (i, candidates[i][1], candidates[i][2])
-                                        print "N) None of the above"
                                         answer = raw_input("?)")
                                         if answer is None or len(answer) == 0:
                                                 return [None, None]
+                                                return None
+                                        if answer.lower() == "n":
+                                                return [None, None]
+                                        else:
+                                                try:
+                                                        ans = int(answer)
+                                                        if 0 <= ans < len(candidates):
+                                                                index = ans
+                                                        else:
+                                                                return [None, None]
+                                                except:
+                                                        print_verbose("Illegal index.")
+                                                        return [None, None]
+                                        print_verbose("Chose %d" % index)
+                                        print_verbose("Chose %s" % answer)
+                                        imdb_id = answer
                                 else:
+                                        print "Multiple candidates found for the movie and not in interactive mode."
+                                        return [None, None]
+                        imdb_id = candidates[index][0]
+                                        return None
+                        else:
+                                imdb_id = candidates[0][0]
                 else:
                         print "Couldn't find IMDb ID for '%s'" % pathName
                         return [None, None]
+                        return None
         print_verbose("Querying IMDb for meta data for ID %s..." % imdb_id)
         metadata = imdbpy.metadata_search(imdb_id)
         if metadata is not None:
                 metadata += "IMDb:%s" % imdb_id + "\n"
+        return [source_nfo, metadata]
+        # Save the metadata
+        return metadata
 def video_file_list_metadata(videoPaths):
         videoPaths = [os.path.basename(v) for v in videoPaths]
 …
         return "Files:%s" % (",".join(videoPaths)) + "\n"
+def load_metadata_file(metadata_filename):
+        """
+        Loads a metadata file if found, returns None otherwise.
+        The content of the file is returned as a single string. None is also
+        returned when the file cannot be opened or read.
+        """
+        try:
+                f = open(metadata_filename)
+        except (IOError, OSError):
+                return None
+        try:
+                try:
+                        return f.read()
+                except (IOError, OSError):
+                        return None
+        finally:
+                # Close the file also when reading it fails.
+                f.close()
 def detect_dvd_backup(dirName):
         """
         If the given directory is detected as a directory with a dvd backup, meta data is
         searched for the directory title name (in addition to the directory-wide imdb files).
         """
+        global import_from_files
         videoTs = dirName + "/VIDEO_TS"
         if not (os.path.exists(videoTs) and os.path.isdir(videoTs)):
                 return False
         print_verbose('A DVD backup directory (with DVD directory structure) detected.')
+        print_verbose('A DVD backup directory with DVD directory structure detected.')
         metadata_target = dirName + "/" + dirMetadataFileName
+        if os.path.exists(metadata_target) and not overwrite:
+                print_verbose("Metadata already exists, not overwriting.")
+                return True
+        [src_nfo, metadata] = find_metadata_for_video_path(dirName + "/VIDEO_TS")
+        metadata = None
+        if import_from_files:
+                metadata = load_metadata_file(metadata_target)
+        if metadata is None:
+                if should_be_skipped(dirName, metadata_target):
+                        return True
+                metadata = find_metadata_for_video_path(dirName + "/VIDEO_TS")
         if metadata is not None:
                 save_metadata(metadata_target, metadata)
+                save_metadata(dirName, metadata_target, metadata)
         return True
 def detect_compressed_dvd_backup_dir(dirName):
         """
         If the given directory is detected as a directory with one or more files of
         a single title, fetched the meta data and returns true.
+        a single title, fetches the meta data and returns true.
         """
         global videoExtensions
+        global videoExtensions, import_from_files
         maxFilesPerTitle = 3
         foundVideos = None
 …
         # a collection of videos in a directory (e.g., a backup of a tv-series).
         for ext in videoExtensions:
                 videos = glob.glob(dirName + "/*." + ext)
                 # TODO: ensure that the filenames are almost exactly the same (CD1, CD2, etc.)
                 if 1 < len(videos) <= maxFilesPerTitle:
                         if foundVideos is not None:
                                 # Already found a set of videos, this cannot be a dvdrip dir
                                 return False
+                        # Ensure that file names are of the same length:
+                        # moviename.cd1.avi moviename.cd2.avi, etc.
+                        # in addition, detect that the file names don't look like series episodes
+                        # Detect that the file names don't look like series episodes
                         filename_length = len(videos[0])
                         for video in videos:
                                 if imdbpy.detect_series_query(cleanup_title(video)) != (None, None, None):
                                         print_verbose("'%s' looks like a TV-series episode." % video)
                                         return False
+                                if len(video) != filename_length:
+                        # Detect the disc numbers from file names.
+                        # If cannot detect, assume it's not a dvd rip dir.
+                        for video in videos:
+                                disc = detect_disc_number(videos, video)
+                                if disc is None:
+                                        print_verbose("Did not detect disc number for %s." % video)
                                         return False
+                                else:
+                                        print_verbose("Found disc %d." % disc)
                         foundVideos = videos
                 elif len(videos) > maxFilesPerTitle:
                         return False                    # Too many videos for a dvdrip dir.
         metadata_target = dirName + "/" + dirMetadataFileName
         if foundVideos is not None:
+                print_verbose('Compressed DVD backup directory (a.k.a. DVD rip) detected.')
+                if os.path.exists(metadata_target) and not overwrite:
+                        print_verbose("Metadata already exists, not overwriting.")
+                        return True
+                print_verbose('DVD rip directory detected.')
+                # Check if the video search should be skipped (because of existing data).
+                first_file = foundVideos[0]
+                if should_be_skipped(first_file, metadata_target):
+                        print_verbose("Skipping '%s'." % dirName)
+                        return True # DVD rip was detected, but no data should be inserted
                 # Scan for the IMDb ID as usual, but store the
                 # metadata to video.metadata file instead, i.e., do not create .metadata for
                 # all videos in the directory.
+                [src_nfo, metadata] = find_metadata_for_video_path(foundVideos[0])
+                metadata = None
+                if import_from_files:
+                        metadata = load_metadata_file(metadata_target)
+                if metadata is None:
+                        metadata = find_metadata_for_video_path(foundVideos[0])
                 if metadata is not None:
                         # Add the Files: metadata which lists the videos in correct playing order
                         metadata += video_file_list_metadata(foundVideos)
                         save_metadata(metadata_target, metadata)
+                        save_metadata(dirName, metadata_target, metadata)
                 return True
         return False
+def scan_file(pathName):
+        metadata_target = strip_extension(pathName) + ".metadata";
+        if os.path.exists(metadata_target) and not overwrite:
+                print_verbose("Metadata already exists, not overwriting.")
+        else:
+                [src_nfo, metadata] = find_metadata_for_video_path(pathName)
+                save_metadata(metadata_target, metadata)
+def scan_file(pathName, imdb_id = None):
+        """
+        Finds and saves the metadata of a single video file.
+        pathName the path of the video file
+        imdb_id  if given, the metadata is fetched for this IMDb id instead of
+                 searching the id using the file name
+        The metadata is taken, in this order of preference, from an IMDb
+        query with the given imdb_id, from the existing .metadata file (if
+        importing from files is on) or from the normal metadata search.
+        """
+        global import_from_files
+        metadata_target = strip_extension(pathName) + ".metadata"
+        if should_be_skipped(pathName, metadata_target):
+                print_verbose("Skipping '%s'." % pathName)
+                return
+        metadata = None
+        if import_from_files:
+                metadata = load_metadata_file(metadata_target)
+        if imdb_id is not None:
+                found = imdbpy.metadata_search(imdb_id)
+                # The query can come back empty; appending to None would raise
+                # a TypeError, so fall back to the other sources instead.
+                if found is not None:
+                        metadata = found + "IMDb:%s" % imdb_id + "\n"
+        if metadata is None:
+                metadata = find_metadata_for_video_path(pathName)
+        if metadata is not None:
+                save_metadata(pathName, metadata_target, metadata)
 def scan_directory(dirName):
+def scan_directory(dirName, imdb_id = None):
         global videoExtensions
         print_verbose("Scanning directory %s..." % dirName)
         if detect_compressed_dvd_backup_dir(dirName):
                 return
+        if imdb_id is not None:
+                metadata = imdbpy.metadata_search(imdb_id)
+                if metadata is not None:
+                        metadata += "IMDb:%s" % imdb_id + "\n"
+                        save_metadata(dirName, dirName + "/video.metadata", metadata)
+                        return
         if detect_dvd_backup(dirName):
                 return
 …
         for video in foundVideos:
                 scan_file(video)
+def scan(pathName):
+def should_be_skipped(path, meta_file = None):
+        """
+        Tells whether the scan should pass over the given path.
+        path      the file or directory about to be scanned
+        meta_file the metadata file of the path, if known
+        Returns True if the path ends with one of the ignored directory names,
+        or if overwriting is off and none of the enabled targets (MythDB,
+        metadata file) lacks data for the path. Returns False otherwise.
+        """
+        global skipDirs, overwrite, dbimport, metafiles
+        if path.endswith("/"):
+                path = path[0:-1]
+        # Ignored filename patterns are skipped no matter what.
+        if [skip for skip in skipDirs if path.endswith(skip)]:
+                return True
+        if overwrite:
+                # Existing data does not matter when it gets replaced anyway.
+                return False
+        # Find out which of the wanted targets still lack data for the path.
+        db_missing = dbimport and mythvideo_metadata_id(path) is None
+        file_missing = metafiles
+        if file_missing and meta_file is not None:
+                file_missing = not os.path.exists(meta_file)
+        # Skip the path only if nothing is missing.
+        return not (db_missing or file_missing)
+def scan(pathName, imdb_id = None):
         global recursive
         metadata = None
         metadata_target = None
         if os.path.isdir(pathName):
                 if recursive:
                         for root, dirs, files in os.walk(pathName):
+                                if should_be_skipped(root): continue
+                                if should_be_skipped(root):
+                                        print_verbose("Skipping '%s'." % root)
+                                        continue
                                 scan_directory(root)
                 else:
+                        scan_directory(pathName)
+                        if should_be_skipped(pathName):
+                                print_verbose("Skipping '%s'." % pathName)
+                                return
+                        scan_directory(pathName, imdb_id)
         elif os.path.isfile(pathName):
+                scan_file(pathName)
+                if should_be_skipped(pathName):
+                        print_verbose("Skipping '%s'." % pathName)
+                        return
+                scan_file(pathName, imdb_id)
         else:
                 raise IOError("File not found")
         return
 def main():
+        global verbose,overwrite,interactive,recursive
+        global verbose,overwrite,interactive,recursive,dbimport
+        global import_from_files,metafiles,poster_dir
+        p = optparse.OptionParser()
+        usage = "usage: %prog [options] videopath1 [videopath2 videopath3...]"
+        p = optparse.OptionParser(usage=usage)
         p.add_option('--version', '-v', action="store_true", default=False,
                 help="display 1-line describing name, version, author etc")
+                help="Display 1-line describing name, version, author etc.")
         p.add_option('--overwrite', '-o', action="store_true", default=False,
                 help="overwrite existing metadata file(s)")
+                help="Overwrite existing metadata.")
         p.add_option('--wordy', '-w', action="store_true", default=False,
                 help="verbose mode, be wordy while scanning for the info")
+                help="Verbose mode, be wordy while scanning for the info.")
         p.add_option('--interactive', '-i', action="store_true", default=False,
                 help="allow the script to ask questions from the user to find the meta data")
+                help="Allow the script to ask questions from the user to find the meta data.")
         p.add_option('--recursive', '-r', action="store_true", default=False,
+                help="traverse sub directories of the given directory recursively")
+                help="Traverse sub directories of the given directory recursively.")
+        p.add_option('--no_dbimport', '-n', action="store_true", default=False,
+                help="Do not import metadata directly to MythDB.")
+        p.add_option('--fromfiles', '-f', action="store_true", default=False,
+                help="Import data to MythDB from .metadata files if found. Requires -d.")
+        p.add_option('--metafiles', '-m', action="store_true", default=False,
+                help="Write metadata to *.metadata ascii files.")
+        p.add_option('--answer', '-a', action="store", type="string", dest="imdb_id",
+                help="Fetch metadata with the given IMDb ID for the path (must be a single path).")
         options, arguments = p.parse_args()
         if options.version:
                 print "MythVideo Metadata Finder (c) Pekka Jääskeläinen 2006-2007"
+                print "MythVideo Metadata Finder (c) Pekka Jääskeläinen 2006-2007"
                 sys.exit(0)
         verbose = options.wordy
         overwrite = options.overwrite
         interactive = options.interactive
         recursive = options.recursive
+        dbimport = not options.no_dbimport
+        import_from_files = options.fromfiles and dbimport
+        metafiles = options.metafiles
+        if not (metafiles or dbimport):
+                print "You must define writing to either MythDB import (-d) or metadata files (-m)."
+                sys.exit(1)
         if len(arguments) < 1:
                 print "Please give the file/directory to be scanned as argument."
+                print "Please give the paths to be scanned as argument."
                 sys.exit(1)
+        paths = arguments
+        pathName = " ".join(arguments)
+        if not os.path.exists(pathName):
+                print "Given file does not exist."
+                sys.exit(1)
+        if options.imdb_id is not None:
+                if recursive:
+                        print "Manual IMDb ID must be given in recursive mode."
+                        sys.exit(1)
+                if len(arguments) > 1:
+                        print "Manual IMDb ID must be given for a single path only (%d given)." % len(arguments)
+                        sys.exit(1)
+                print_verbose("IMDb ID %s given manually." % options.imdb_id)
+        if dbimport:
+                if not db_support:
+                        print "You must install MySQLdb module to make direct DB importing to work"
+                        sys.exit(1)
+                if not init_db():
+                        print "Database connection failed."
+                        sys.exit(1)
+                poster_dir = mythtv_setting("VideoArtworkDir", socket.gethostname())
+        scan(pathName)
+        for path in paths:
+                if not os.path.exists(path):
+                        print "'%s' does not exist." % path
+                        sys.exit(1)
+                scan(path, options.imdb_id)
         sys.exit(0)

mythvideo/mythvideo/scripts/imdbpy.py

-                      old
+                      new
 it to make this script work.
 This wrapper script is written by
+Pekka Jääskeläinen (pekka jaaskelainen gmail).
+Changes:
+-02-21:[AW] Inserted plot outline as potential plot pick, now prints
+                genre and country.
+-11-26:[PJ] Modified some of the functions to be suitable for using as a
+                Python API (from find_meta.py).
+-10-05:[PJ] Improved poster searching and Runtime metadata finding for
+                TV-series episodes.
+                Better detection for an episode search.
+-10-04:[PJ] The first version.
+Pekka Jääskeläinen (gmail: pekka.jaaskelainen).
 """
 import sys
 …
 try:
         import imdb
 except ImportError:
         print "You need to install the IMDbPy library from "\
                         "http://imdbpy.sourceforge.net/"
+        print "You need to install the IMDbPy library "\
+                "from (http://imdbpy.sourceforge.net/?page=download)"
         sys.exit(1)
 def detect_series_query(search_string):
 …
                                         # Probably indexing exception in case the episode/season
                                         # is not found.
                                         continue
+                                # Found an exact episode match, return that match only.
+                                matches = []
                                 matches.append([imdb_access.get_imdbID(ep),
                                                 title.title().strip() + ", S" + season + " E" +
                                                 episode, int(serie['year'])])
+                                return matches
                         else:
                                 matches.append([imdb_access.get_imdbID(serie),
                                         serie['title'], int(serie['year'])])
 …
         imdb_access = imdb.IMDb()
         #print "Search:",search_string
         movies = imdb_access.search_movie(search_string.encode("ascii", 'replace'))
+        movies = imdb_access.search_movie(search_string.encode("ascii", 'ignore'))
         if movies is None or len(movies) == 0:
                 return None
 …
                 movies.append([imdb_access.get_imdbID(m), m['title'], int(m['year'])])
         return movies
+def poster_search(imdb_id):
+def find_poster_url(imdb_id):
         imdb_access = imdb.IMDb()
         movie = imdb_access.get_movie(imdb_id)
         imdb_access.update(movie)
         url = None
         if 'cover url' in movie.keys():
                 url = movie['cover url']
+        if url is not None:
+                print url
+        elif movie['kind'] == 'episode':
+        if url is None and movie['kind'] == 'episode':
                 series = movie['episode of']
                 imdb_access.update(series)
                 if 'cover url' in series.keys():
                         url = series['cover url']
+                if url is not None:
+                        print url
+        return url
+def poster_search(imdb_id):
+        url = find_poster_url(imdb_id)
+        if url is not None:
+                print url
 def metadata_search(imdb_id):
         metadata = unicode()
 …
         if 'plot' in movie.keys():
                 plots = movie['plot']
                 if movie['plot outline'] is not None and len(movie['plot outline']):
+                if 'plot outline' in movie and len(movie['plot outline']):
                         plots.append("Outline::" + movie['plot outline'])
                 if plots is not None:
                         # Find the shortest plot.
 …
         elif options.poster_search is not None:
                 poster_search(options.poster_search)
         elif options.metadata_search is not None:
                 print metadata_search(options.metadata_search)
+                print metadata_search(options.metadata_search).encode("utf8")
         else:
                 p.print_help()
         sys.exit(0)

Download in other formats:

Original Format