#!/usr/bin/env python # # VideoSort post-processing script for NZBGet. # # Copyright (C) 2013-2020 Andrey Prygunkov # # This program is free software; you can redistribute it and/or modify it # under the terms of the GNU Lesser General Public License as published by # the Free Software Foundation; either version 3 of the License, or # (at your option) any later version. # # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU Lesser General Public License for more details. # # You should have received a copy of the GNU Lesser General Public License # along with the program. If not, see . # ############################################################################## ### NZBGET POST-PROCESSING SCRIPT ### # Sort movies and tv shows. # # This is a script for downloaded TV shows and movies. It uses scene-standard # naming conventions to match TV shows and movies and rename/move/sort/organize # them as you like. # # The script relies on python library "guessit" (http://guessit.readthedocs.org) # to extract information from file names and includes portions of code from # "SABnzbd+" (http://sabnzbd.org). # # Info about pp-script: # Author: Andrey Prygunkov (nzbget@gmail.com). # Web-site: http://nzbget.net/VideoSort. # License: GPLv3 (http://www.gnu.org/licenses/gpl.html). # PP-Script Version: 9.0. # # NOTE: This script requires Python 2.x or 3.x to be installed on your system. ############################################################################## ### OPTIONS ### # Destination directory for movies. # # The option can be left empty to use global DestDir or CategoryX.DestDir # as destination. #MoviesDir=${DestDir}/movies # Destination directory for seasoned TV shows. # # The option can be left empty to use global DestDir or CategoryX.DestDir # as destination. #SeriesDir=${DestDir}/series # Destination directory for dated TV shows. # # The option can be left empty to use global DestDir or CategoryX.DestDir # as destination. #DatedDir=${DestDir}/tv # Destination directory for other TV shows. # # The option can be left empty to use global DestDir or CategoryX.DestDir # as destination. #OtherTvDir=${DestDir}/tv # List of TV categories. # # Comma separated list of categories for TV. VideoSort automatically # distinguishes movies from series and dated TV shows. But it needs help # to distinguish movies from other TV shows because they are named # using same conventions. If a download has associated category listed in # option , VideoSort uses this information. # # Category names must match categories defined in NZBGet. #TvCategories=tv # File extensions for video files. # # Only files with these extensions are processed. Extensions must # be separated with commas. # Example=.mkv,.avi,.divx,.xvid,.mov,.wmv,.mp4,.mpg,.mpeg,.vob,.iso #VideoExtensions=.mkv,.avi,.divx,.xvid,.mov,.wmv,.mp4,.mpg,.mpeg,.vob,.iso # File extensions for satellite files. # # Move satellite files such as subtitles to the destination along with # the files they are related to. Extensions must be separated with commas. # Example=.srt,.nfo #SatelliteExtensions=.srt,.sub # Minimum video file size (Megabytes). # # Smaller files are ignored. #MinSize=100 # Formatting rules for movies. # # Specifiers for movies: # %t, %.t, %_t - movie title with words separated with spaces, dots # or underscores (case-adjusted); # %tT, %t.T, %t_T - movie title (original letter case); # %y - year; # %decade - two-digits decade (90, 00, 10); # %0decade - four-digits decade (1990, 2000, 2010). # %imdb - IMDb ID; # %cpimdb - IMDb ID (formatted for CouchPotato); # # Common specifiers (for movies, series and dated tv shows): # %dn - original directory name (nzb-name); # %^dn, %.dn, %_dn - directory name with words separated with spaces, dots # or underscores (case-adjusted); # %^dN, %.dN, %_dN - directory name with words separated with spaces, dots # or underscores (original letter case); # %fn - original filename; # %^fn, %.fn, %_fn - filename with words separated with spaces, dots # or underscores (case-adjusted); # %^fN, %.fN, %_fN - filename with words separated with spaces, dots # or underscores (original letter case); # %cat, %.cat, %_cat - category with words separated with spaces, dots # or underscores (case-adjusted); # %cAt, %.cAt, %_cAt - category (original letter case); # %ext - file extension; # %Ext - file extension (case-adjusted); # %qf - video format (HTDV, BluRay, WEB-DL); # %qss - screen size (720p, 1080i); # %qvc - video codec (x264); # %qac - audio codec (DTS); # %qah - audio channels (5.1); # %qrg - release group; # {{text}} - uppercase the text; # {TEXT} - lowercase the text. #MoviesFormat=%t (%y) # Formatting rules for seasoned TV shows. # # Specifiers: # %sn, %s.n, %s_n - show name with words separated with spaces, dots # or underscores (case-adjusted); # %sN, %s.N, %s_N - show name (original letter case); # %s - season number (1, 2); # %0s - two-digits season number (01, 02); # %e - episode number (1, 2); # %0e - two-digits episode number (01, 02); # %en, %e.n, %e_n - episode name (case-adjusted); # %eN, %e.N, %e_N - episode name (original letter case); # %y - year; # %decade - two-digits decade (90, 00, 10); # %0decade - four-digits decade (1990, 2000, 2010). # # For a list of common specifiers see option . #SeriesFormat=%sn/Season %s/%sn - S%0sE%0e - %en # Multiple Episodes (list, range). # # This option is used for seasoned TV shows when the video file includes multiple episodes. For example: the formatting # string "S%0sE%0e", combined with "MultipleEpisode=list" and "EpisodeSeparator=E" will result in a file named # "My.Show.S01E01E02E03". "MultipleEpisode=range" and "EpisodeSeparator=-E" will result in a file named # "My.Show.S01E01-E03.mkv". The "range" option is useful to follow the TV episode naming conventions of popular media # management software, such as Plex. # #MultipleEpisodes=range # Separator for multi episodes. # # The option is used for seasoned TV shows when video file includes # multiple episodes, e. g. "My.Show.S01E02-03.mkv". The option defines # a character (or a string) which must be insterted between episode # numbers. For example, if "EpisodeSeparator=E", the specifier "%0e" # will expand to "02E03". Giving formatting string "%sN - S%0sE%0e" the # resulting filename will be "My Show - S01E02E03.mkv". #EpisodeSeparator=E # Treat year following title as part of title (yes, no). # # For seasoned TV shows: if year in the file name goes directly after # show name, it will be added to show name. This may be necessary for # media players like XBMC, Boxee or Plex (or anyone using TheTVDB) to # properly index TV show. #SeriesYear=yes # Formatting rules for dated TV shows. # # Specifiers: # %sn, %s.n, %s_n - show name with words separated with spaces, dots # or underscores (case-adjusted); # %sN, %s.N, %s_N - show name (original letter case); # %en, %e.n, %e_n - episode name (case-adjusted); # %eN, %e.N, %e_N - episode name (original letter case); # %y - year; # %decade - two-digits decade (90, 00, 10); # %0decade - four-digits decade (1990, 2000, 2010). # %m - month (1-12); # %0m - two-digits month (01-12); # %d - day (1-31); # %0d - two-digits day (01-31). # # For a list of common specifiers see option . #DatedFormat=%sn/%sn - %en - %y-%0m-%0d # Formatting rules for other TV shows. # # All specifiers are same as in option . #OtherTvFormat=%t # List of words to keep in lower case. # # This option has effect on "case-adjusted"-specifiers. #LowerWords=the,of,and,at,vs,a,an,but,nor,for,on,so,yet # List of words to keep in upper case. # # This option has effect on "case-adjusted"-specifiers. #UpperWords=III,II,IV # Use information from Direct-NZB headers (yes, no). # # NZB-sites may provide extended information about videos, # which is usually more confident than the information extracted # from file names. #DNZBHeaders=yes # Use name of nzb-file instead of name of video file (yes, no). # # Good indexer nzb-sites do renaming and cleanup of nzb-file # names making them a better choice to extract name information # than the original video file names. # # NOTE: If download contains more than one video file suitable # for renaming (having correct extension and bigger than ) # this option is ignored and the names of video files are always used. #PreferNZBName=no # Overwrite files at destination (yes, no). # # If not active the files are still moved into destination but # unique suffixes are added at the end of file names, e.g. My.Show.(2).mkv. #Overwrite=no # Delete download directory after renaming (yes, no). # # If after successful sorting all remaining files in the download directory # are smaller than "MinSize" the directory with all files is removed. If no # files could be processed, the directory remains untouched. #Cleanup=yes # Preview mode (yes, no). # # When active no changes to file system are made but the destination # file names are logged. Useful to test formating rules; to restart # the script use "Post-Process-Again" on history tab in NZBGet web-interface. #Preview=no # Print more logging messages (yes, no). # # For debugging or if you need to report a bug. #Verbose=no ### NZBGET POST-PROCESSING SCRIPT ### ############################################################################## import sys from os.path import dirname sys.path.insert(0, dirname(__file__) + '/lib') import os import traceback import re import shutil import guessit import difflib try: unicode except NameError: unicode = str # Exit codes used by NZBGet POSTPROCESS_SUCCESS=93 POSTPROCESS_NONE=95 POSTPROCESS_ERROR=94 # Check if the script is called from nzbget 11.0 or later if not 'NZBOP_SCRIPTDIR' in os.environ: print('*** NZBGet post-processing script ***') print('This script is supposed to be called from nzbget (11.0 or later).') sys.exit(POSTPROCESS_ERROR) # Check if directory still exist (for post-process again) if not os.path.exists(os.environ['NZBPP_DIRECTORY']): print('[INFO] Destination directory %s doesn\'t exist, exiting' % os.environ['NZBPP_DIRECTORY']) sys.exit(POSTPROCESS_NONE) # Check par and unpack status for errors if os.environ['NZBPP_PARSTATUS'] == '1' or os.environ['NZBPP_PARSTATUS'] == '4' or os.environ['NZBPP_UNPACKSTATUS'] == '1': print('[WARNING] Download of "%s" has failed, exiting' % (os.environ['NZBPP_NZBNAME'])) sys.exit(POSTPROCESS_NONE) # Check if all required script config options are present in config file required_options = ('NZBPO_MoviesDir', 'NZBPO_SeriesDir', 'NZBPO_DatedDir', 'NZBPO_OtherTvDir', 'NZBPO_VideoExtensions', 'NZBPO_SatelliteExtensions', 'NZBPO_MinSize', 'NZBPO_MoviesFormat', 'NZBPO_SeriesFormat', 'NZBPO_OtherTvFormat', 'NZBPO_DatedFormat', 'NZBPO_EpisodeSeparator', 'NZBPO_Overwrite', 'NZBPO_Cleanup', 'NZBPO_LowerWords', 'NZBPO_UpperWords', 'NZBPO_TvCategories', 'NZBPO_Preview', 'NZBPO_Verbose') for optname in required_options: if (not optname.upper() in os.environ): print('[ERROR] Option %s is missing in configuration file. Please check script settings' % optname[6:]) sys.exit(POSTPROCESS_ERROR) # Init script config options nzb_name=os.environ['NZBPP_NZBNAME'] download_dir=os.environ['NZBPP_DIRECTORY'] movies_format=os.environ['NZBPO_MOVIESFORMAT'] series_format=os.environ['NZBPO_SERIESFORMAT'] dated_format=os.environ['NZBPO_DATEDFORMAT'] othertv_format=os.environ['NZBPO_OTHERTVFORMAT'] multiple_episodes=os.environ['NZBPO_MULTIPLEEPISODES'] episode_separator=os.environ['NZBPO_EPISODESEPARATOR'] movies_dir=os.environ['NZBPO_MOVIESDIR'] series_dir=os.environ['NZBPO_SERIESDIR'] dated_dir=os.environ['NZBPO_DATEDDIR'] othertv_dir=os.environ['NZBPO_OTHERTVDIR'] video_extensions=os.environ['NZBPO_VIDEOEXTENSIONS'].replace(' ', '').lower().split(',') satellite_extensions=os.environ['NZBPO_SATELLITEEXTENSIONS'].replace(' ', '').lower().split(',') min_size=int(os.environ['NZBPO_MINSIZE']) min_size <<= 20 overwrite=os.environ['NZBPO_OVERWRITE'] == 'yes' cleanup=os.environ['NZBPO_CLEANUP'] == 'yes' preview=os.environ['NZBPO_PREVIEW'] == 'yes' verbose=os.environ['NZBPO_VERBOSE'] == 'yes' satellites=len(satellite_extensions)>0 lower_words=os.environ['NZBPO_LOWERWORDS'].replace(' ', '').split(',') upper_words=os.environ['NZBPO_UPPERWORDS'].replace(' ', '').split(',') series_year=os.environ.get('NZBPO_SERIESYEAR', 'yes') == 'yes' tv_categories=os.environ['NZBPO_TVCATEGORIES'].lower().split(',') category=os.environ.get('NZBPP_CATEGORY', '') force_tv=category.lower() in tv_categories dnzb_headers=os.environ.get('NZBPO_DNZBHEADERS', 'yes') == 'yes' dnzb_proper_name=os.environ.get('NZBPR__DNZB_PROPERNAME', '') dnzb_episode_name=os.environ.get('NZBPR__DNZB_EPISODENAME', '') dnzb_movie_year=os.environ.get('NZBPR__DNZB_MOVIEYEAR', '') dnzb_more_info=os.environ.get('NZBPR__DNZB_MOREINFO', '') prefer_nzb_name=os.environ.get('NZBPO_PREFERNZBNAME', '') == 'yes' use_nzb_name=False # NZBPO_DNZBHEADERS must also be enabled deep_scan = dnzb_headers # difflib match threshold. Anything below is not considered a match deep_scan_ratio = 0.60 if preview: print('[WARNING] *** PREVIEW MODE ON - NO CHANGES TO FILE SYSTEM ***') if verbose and force_tv: print('[INFO] Forcing TV sorting (category: %s)' % category) # List of moved files (source path) moved_src_files = [] # List of moved files (destination path) moved_dst_files = [] # Separator character used between file name and opening brace # for duplicate files such as "My Movie (2).mkv" dupe_separator = ' ' class deprecation_support: """Class implementing iterator for deprecation message support""" def __init__(self, mapping): self.iter = iter(mapping) def __iter__(self): return self def __next__(self): map_entry = next(self.iter) return map_entry if len(map_entry) >= 3 else list(map_entry) + [None] def next(self): return self.__next__() def guess_dupe_separator(format): """ Find out a char most suitable as dupe_separator """ global dupe_separator dupe_separator = ' ' format_fname = os.path.basename(format) for x in ('%.t', '%s.n', '%s.N'): if (format_fname.find(x) > -1): dupe_separator = '.' return for x in ('%_t', '%s_n', '%s_N'): if (format_fname.find(x) > -1): dupe_separator = '_' return def unique_name(new): """ Adds unique numeric suffix to destination file name to avoid overwriting such as "filename.(2).ext", "filename.(3).ext", etc. If existing file was created by the script it is renamed to "filename.(1).ext". """ fname, fext = os.path.splitext(new) suffix_num = 2 while True: new_name = fname + dupe_separator + '(' + str(suffix_num) + ')' + fext if not os.path.exists(new_name) and new_name not in moved_dst_files: break suffix_num += 1 return new_name def optimized_move(old, new): try: os.rename(old, new) except OSError as ex: print('[DETAIL] Rename failed ({}), performing copy: {}'.format(ex, new)) shutil.copyfile(old, new) os.remove(old) def rename(old, new): """ Moves the file to its sorted location. It creates any necessary directories to place the new file and moves it. """ if os.path.exists(new) or new in moved_dst_files: if overwrite and new not in moved_dst_files: os.remove(new) optimized_move(old, new) print('[INFO] Overwrote: %s' % new) else: # rename to filename.(2).ext, filename.(3).ext, etc. new = unique_name(new) rename(old, new) else: if not preview: if not os.path.exists(os.path.dirname(new)): os.makedirs(os.path.dirname(new)) optimized_move(old, new) print('[INFO] Moved: %s' % new) moved_src_files.append(old) moved_dst_files.append(new) return new def move_satellites(videofile, dest): """ Moves satellite files such as subtitles that are associated with base and stored in root to the correct dest. """ if verbose: print('Move satellites for %s' % videofile) root = os.path.dirname(videofile) destbasenm = os.path.splitext(dest)[0] base = os.path.basename(os.path.splitext(videofile)[0]) for (dirpath, dirnames, filenames) in os.walk(root): for filename in filenames: fbase, fext = os.path.splitext(filename) fextlo = fext.lower() fpath = os.path.join(dirpath, filename) if fextlo in satellite_extensions: # Handle subtitles and nfo files subpart = '' # We support GuessIt supported subtitle extensions if fextlo[1:] in ['srt', 'idx', 'sub', 'ssa', 'ass']: guess = guessit.guessit(filename) if guess and 'subtitle_language' in guess: fbase = fbase[:fbase.rfind('.')] # Use alpha2 subtitle language from GuessIt (en, es, de, etc.) subpart = '.' + guess['subtitle_language'][0].alpha2 if verbose: if subpart != '': print('Satellite: %s is a subtitle [%s]' % (filename, guess['subtitle_language'][0])) else: # English (or undetermined) print('Satellite: %s is a subtitle' % filename) elif (fbase.lower() != base.lower()) and fextlo == '.nfo': # Aggressive match attempt if deep_scan: guess = deep_scan_nfo(fpath) if guess is not None: # Guess details are not important, just that there was a match fbase = base if fbase.lower() == base.lower(): old = fpath new = destbasenm + subpart + fext if verbose: print('Satellite: %s' % os.path.basename(new)) rename(old, new) def deep_scan_nfo(filename, ratio=deep_scan_ratio): if verbose: print('Deep scanning satellite: %s (ratio=%.2f)' % (filename, ratio)) best_guess = None best_ratio = 0.00 try: nfo = open(filename) # Convert file content into iterable words for word in ''.join([item for item in nfo.readlines()]).split(): try: guess = guessit.guessit(word + '.nfo') # Series = TV, Title = Movie if any(item in guess for item in ('title')): # Compare word against NZB name diff = difflib.SequenceMatcher(None, word, nzb_name) # Evaluate ratio against threshold and previous matches if verbose: print('Tested: %s (ratio=%.2f)' % (word, diff.ratio())) if diff.ratio() >= ratio and diff.ratio() > best_ratio: if verbose: print('Possible match found: %s (ratio=%.2f)' % (word, diff.ratio())) best_guess = guess best_ratio = diff.ratio() except UnicodeDecodeError: # Ignore non-unicode words (common in nfo "artwork") pass nfo.close() except IOError as e: print('[ERROR] %s' % str(e)) return best_guess def cleanup_download_dir(): """ Remove the download directory if it (or any subfodler) does not contain "important" files (important = size >= min_size) """ if verbose: print('Cleanup') # Check if there are any big files remaining for root, dirs, files in os.walk(download_dir): for filename in files: path = os.path.join(root, filename) # Check minimum file size if os.path.getsize(path) >= min_size and (not preview or path not in moved_src_files): print('[WARNING] Skipping clean up due to large files remaining in the directory') return # Now delete all files with nice logging for root, dirs, files in os.walk(download_dir): for filename in files: path = os.path.join(root, filename) if not preview or path not in moved_src_files: if not preview: os.remove(path) print('[INFO] Deleted: %s' % path) if not preview: shutil.rmtree(download_dir) print('[INFO] Deleted: %s' % download_dir) STRIP_AFTER = ('_', '.', '-') # * From SABnzbd+ (with modifications) * REPLACE_AFTER = { '()': '', '..': '.', '__': '_', ' ': ' ', '//': '/', ' - - ': ' - ', '--': '-' } def path_subst(path, mapping): """ Replace the sort sting elements by real values. Non-elements are copied literally. path = the sort string mapping = array of tuples that maps all elements to their values """ newpath = [] plen = len(path) n = 0 # Sort list of mapping tuples by their first elements. First ascending by element, # then descending by element length. # Preparation to replace elements from longest to shortest in alphabetical order. # # >>> m = [('bb', 4), ('aa', 3), ('b', 6), ('aaa', 2), ('zzzz', 1), ('a', 5)] # >>> m.sort(key=lambda t: t[0]) # >>> m # [('a', 5), ('aa', 3), ('aaa', 2), ('b', 6), ('bb', 4), ('zzzz', 1)] # >>> m.sort(key=lambda t: len(t[0]), reverse=True) # >>> m # [('zzzz', 1), ('aaa', 2), ('aa', 3), ('bb', 4), ('a', 5), ('b', 6)] mapping.sort(key=lambda t: t[0]) mapping.sort(key=lambda t: len(t[0]), reverse=True) while n < plen: result = path[n] if result == '%': for key, value, msg in deprecation_support(mapping): if path.startswith(key, n): n += len(key)-1 result = value if msg: print('[WARNING] specifier %s is deprecated, %s' % (key, msg)) break newpath.append(result) n += 1 return ''.join(map(lambda x: '.'.join(x) if isinstance(x, list) else str(x), newpath)) def get_titles(name, titleing=False): ''' The title will be the part before the match Clean it up and title() it ''.title() isn't very good under python so this contains a lot of little hacks to make it better and for more control ''' #make valid filename title = re.sub('[\"\:\?\*\\\/\<\>\|]', ' ', name) if titleing: title = titler(title) # title the show name so it is in a consistant letter case #title applied uppercase to 's Python bug? title = title.replace("'S", "'s") # Make sure some words such as 'and' or 'of' stay lowercased. for x in lower_words: xtitled = titler(x) title = replace_word(title, xtitled, x) # Make sure some words such as 'III' or 'IV' stay uppercased. for x in upper_words: xtitled = titler(x) title = replace_word(title, xtitled, x) # Make sure the first letter of the title is always uppercase if title: title = titler(title[0]) + title[1:] # The title with spaces replaced by dots dots = title.replace(" - ", "-").replace(' ','.').replace('_','.') dots = dots.replace('(', '.').replace(')','.').replace('..','.').rstrip('.') # The title with spaces replaced by underscores underscores = title.replace(' ','_').replace('.','_').replace('__','_').rstrip('_') return title, dots, underscores def titler(p): """ title() replacement Python's title() fails with Latin-1, so use Unicode detour. """ if isinstance(p, unicode): return p.title() elif gUTF: try: return p.decode('utf-8').title().encode('utf-8') except: return p.decode('latin-1', 'replace').title().encode('latin-1', 'replace') else: return p.decode('latin-1', 'replace').title().encode('latin-1', 'replace') def replace_word(input, one, two): ''' Regex replace on just words ''' regex = re.compile(r'\W(%s)(\W|$)' % one, re.I) matches = regex.findall(input) if matches: for m in matches: input = input.replace(one, two) return input def get_decades(year): """ Return 4 digit and 2 digit decades given 'year' """ if year: try: decade = year[2:3]+'0' decade2 = year[:3]+'0' except: decade = '' decade2 = '' else: decade = '' decade2 = '' return decade, decade2 _RE_LOWERCASE = re.compile(r'{([^{]*)}') def to_lowercase(path): ''' Lowercases any characters enclosed in {} ''' while True: m = _RE_LOWERCASE.search(path) if not m: break path = path[:m.start()] + m.group(1).lower() + path[m.end():] # just incase path = path.replace('{', '') path = path.replace('}', '') return path _RE_UPPERCASE = re.compile(r'{{([^{]*)}}') def to_uppercase(path): ''' Lowercases any characters enclosed in {{}} ''' while True: m = _RE_UPPERCASE.search(path) if not m: break path = path[:m.start()] + m.group(1).upper() + path[m.end():] return path def strip_folders(path): """ Return 'path' without leading and trailing strip-characters in each element """ f = path.strip('/').split('/') # For path beginning with a slash, insert empty element to prevent loss if len(path.strip()) > 0 and path.strip()[0] in '/\\': f.insert(0, '') def strip_all(x): """ Strip all leading/trailing underscores and hyphens also dots for Windows """ old_name = '' while old_name != x: old_name = x for strip_char in STRIP_AFTER: x = x.strip().strip(strip_char) return x return os.path.normpath('/'.join([strip_all(x) for x in f])) gUTF = False try: if sys.platform == 'darwin': gUTF = True else: gUTF = locale.getdefaultlocale()[1].lower().find('utf') >= 0 except: # Incorrect locale implementation, assume the worst gUTF = False # END * From SABnzbd+ * END def add_common_mapping(old_filename, guess, mapping): # Original dir name, file name and extension original_dirname = os.path.basename(download_dir) original_fname, original_fext = os.path.splitext(os.path.split(os.path.basename(old_filename))[1]) original_category = os.environ.get('NZBPP_CATEGORY', '') # Directory name title_name = original_dirname.replace("-", " ").replace('.',' ').replace('_',' ') fname_tname, fname_tname_two, fname_tname_three = get_titles(title_name, True) fname_name, fname_name_two, fname_name_three = get_titles(title_name, False) mapping.append(('%dn', original_dirname)) mapping.append(('%^dn', fname_tname)) mapping.append(('%.dn', fname_tname_two)) mapping.append(('%_dn', fname_tname_three)) mapping.append(('%^dN', fname_name)) mapping.append(('%.dN', fname_name_two)) mapping.append(('%_dN', fname_name_three)) # File name title_name = original_fname.replace("-", " ").replace('.',' ').replace('_',' ') fname_tname, fname_tname_two, fname_tname_three = get_titles(title_name, True) fname_name, fname_name_two, fname_name_three = get_titles(title_name, False) mapping.append(('%fn', original_fname)) mapping.append(('%^fn', fname_tname)) mapping.append(('%.fn', fname_tname_two)) mapping.append(('%_fn', fname_tname_three)) mapping.append(('%^fN', fname_name)) mapping.append(('%.fN', fname_name_two)) mapping.append(('%_fN', fname_name_three)) # File extension mapping.append(('%ext', original_fext)) mapping.append(('%EXT', original_fext.upper())) mapping.append(('%Ext', original_fext.title())) # Category category_tname, category_tname_two, category_tname_three = get_titles(original_category, True) category_name, category_name_two, category_name_three = get_titles(original_category, False) mapping.append(('%cat', category_tname)) mapping.append(('%.cat', category_tname_two)) mapping.append(('%_cat', category_tname_three)) mapping.append(('%cAt', category_name)) mapping.append(('%.cAt', category_name_two)) mapping.append(('%_cAt', category_name_three)) # Video information mapping.append(('%qf', guess.get('format', ''))) mapping.append(('%qss', guess.get('screen_size', ''))) mapping.append(('%qvc', guess.get('video_codec', ''))) mapping.append(('%qac', guess.get('audio_codec', ''))) mapping.append(('%qah', guess.get('audio_channels', ''))) mapping.append(('%qrg', guess.get('release_group', ''))) def add_series_mapping(guess, mapping): # Show name series = guess.get('title', '') show_tname, show_tname_two, show_tname_three = get_titles(series, True) show_name, show_name_two, show_name_three = get_titles(series, False) mapping.append(('%sn', show_tname)) mapping.append(('%s.n', show_tname_two)) mapping.append(('%s_n', show_tname_three)) mapping.append(('%sN', show_name)) mapping.append(('%s.N', show_name_two)) mapping.append(('%s_N', show_name_three)) # season number season_num = str(guess.get('season', '')) mapping.append(('%s', season_num)) mapping.append(('%0s', season_num.rjust(2,'0'))) # episode names title = guess.get('episode_title') if title: ep_tname, ep_tname_two, ep_tname_three = get_titles(title, True) ep_name, ep_name_two, ep_name_three = get_titles(title, False) mapping.append(('%en', ep_tname)) mapping.append(('%e.n', ep_tname_two)) mapping.append(('%e_n', ep_tname_three)) mapping.append(('%eN', ep_name)) mapping.append(('%e.N', ep_name_two)) mapping.append(('%e_N', ep_name_three)) else: mapping.append(('%en', '')) mapping.append(('%e.n', '')) mapping.append(('%e_n', '')) mapping.append(('%eN', '')) mapping.append(('%e.N', '')) mapping.append(('%e_N', '')) # episode number if not isinstance(guess.get('episode'), list): episode_num = str(guess.get('episode', '')) mapping.append(('%e', episode_num)) mapping.append(('%0e', episode_num.rjust(2,'0'))) else: # multi episodes episodes = [str(item) for item in guess.get('episode')] episode_num_all = '' episode_num_just = '' if multiple_episodes == 'range': episode_num_all = episodes[0] + episode_separator + episodes[-1] episode_num_just = episodes[0].rjust(2, '0') + episode_separator + episodes[-1].rjust(2, '0') else: # if multiple_episodes == 'list': for episode_num in episodes: ep_prefix = episode_separator if episode_num_all != '' else '' episode_num_all += ep_prefix + episode_num episode_num_just += ep_prefix + episode_num.rjust(2,'0') mapping.append(('%e', episode_num_all)) mapping.append(('%0e', episode_num_just)) # year year = str(guess.get('year', '')) mapping.append(('%y', year)) # decades decade, decade_two = get_decades(year) mapping.append(('%decade', decade)) mapping.append(('%0decade', decade_two)) def add_movies_mapping(guess, mapping): # title name = guess.get('title', '') ttitle, ttitle_two, ttitle_three = get_titles(name, True) title, title_two, title_three = get_titles(name, False) mapping.append(('%title', ttitle)) mapping.append(('%.title', ttitle_two)) mapping.append(('%_title', ttitle_three)) # title (short forms) mapping.append(('%t', ttitle)) mapping.append(('%.t', ttitle_two)) mapping.append(('%_t', ttitle_three)) mapping.append(('%tT', title)) mapping.append(('%t.T', title_two)) mapping.append(('%t_T', title_three)) # year year = str(guess.get('year', '')) mapping.append(('%y', year)) # decades decade, decade_two = get_decades(year) mapping.append(('%decade', decade)) mapping.append(('%0decade', decade_two)) # imdb mapping.append(('%imdb', guess.get('imdb', ''))) mapping.append(('%cpimdb', guess.get('cpimdb', ''))) def add_dated_mapping(guess, mapping): # title name = guess.get('title', '') ttitle, ttitle_two, ttitle_three = get_titles(name, True) title, title_two, title_three = get_titles(name, True) mapping.append(('%title', title)) mapping.append(('%.title', title_two)) mapping.append(('%_title', title_three)) # title (short forms) mapping.append(('%t', title, 'consider using %sn')) mapping.append(('%.t', title_two, 'consider using %s.n')) mapping.append(('%_t', title_three, 'consider using %s_n')) # Show name series = guess.get('title', '') show_tname, show_tname_two, show_tname_three = get_titles(series, True) show_name, show_name_two, show_name_three = get_titles(series, False) mapping.append(('%sn', show_tname)) mapping.append(('%s.n', show_tname_two)) mapping.append(('%s_n', show_tname_three)) mapping.append(('%sN', show_name)) mapping.append(('%s.N', show_name_two)) mapping.append(('%s_N', show_name_three)) # Some older code at this point stated: # "Guessit doesn't provide episode names for dated tv shows" # but was referring to the invalid field '%desc' # In my researches I couldn't find such a case, but just to be sure ep_title = guess.get('episode_title') if ep_title: ep_tname, ep_tname_two, ep_tname_three = get_titles(ep_title, True) ep_name, ep_name_two, ep_name_three = get_titles(ep_title, False) mapping.append(('%en', ep_tname)) mapping.append(('%e.n', ep_tname_two)) mapping.append(('%e_n', ep_tname_three)) mapping.append(('%eN', ep_name)) mapping.append(('%e.N', ep_name_two)) mapping.append(('%e_N', ep_name_three)) else: mapping.append(('%en', '')) mapping.append(('%e.n', '')) mapping.append(('%e_n', '')) mapping.append(('%eN', '')) mapping.append(('%e.N', '')) mapping.append(('%e_N', '')) # date date = guess.get('date') # year year = str(date.year) mapping.append(('%year', year)) mapping.append(('%y', year)) # decades decade, decade_two = get_decades(year) mapping.append(('%decade', decade)) mapping.append(('%0decade', decade_two)) # month month = str(date.month) mapping.append(('%m', month)) mapping.append(('%0m', month.rjust(2, '0'))) # day day = str(date.day) mapping.append(('%d', day)) mapping.append(('%0d', day.rjust(2, '0'))) def os_path_split(path): parts = [] while True: newpath, tail = os.path.split(path) if newpath == path: if path: parts.append(path) break parts.append(tail) path = newpath parts.reverse() return parts def deobfuscate_path(filename): start = os.path.dirname(download_dir) new_name = filename[len(start)+1:] if verbose: print('stripped filename: %s' % new_name) parts = os_path_split(new_name) if verbose: print(parts) part_removed = 0 for x in range(0, len(parts)-1): fn = parts[x] if fn.find('.')==-1 and fn.find('_')==-1 and fn.find(' ')==-1: print('Detected obfuscated directory name %s, removing from guess path' % fn) parts[x] = None part_removed += 1 fn = os.path.splitext(parts[len(parts)-1])[0] if fn.find('.')==-1 and fn.find('_')==-1 and fn.find(' ')==-1: print('Detected obfuscated filename %s, removing from guess path' % os.path.basename(filename)) parts[len(parts)-1] = '-' + os.path.splitext(filename)[1] part_removed += 1 if part_removed < len(parts): new_name = '' for x in range(0, len(parts)): if parts[x] != None: new_name = os.path.join(new_name, parts[x]) else: print("All file path parts are obfuscated, using obfuscated NZB-Name") new_name = os.path.basename(download_dir) + os.path.splitext(filename)[1] return new_name def remove_year(title): """ Removes year from series name (if exist) """ m = re.compile('..*($(19|20)\d\d$)').search(title) if not m: m = re.compile('..*((19|20)\d\d)').search(title) if m: if verbose: print('Removing year from series name') title = title.replace(m.group(1), '').strip() return title def apply_dnzb_headers(guess): """ Applies DNZB headers (if exist) """ dnzb_used = False if dnzb_proper_name != '': dnzb_used = True if verbose: print('Using DNZB-ProperName') if guess['vtype'] == 'series': proper_name = dnzb_proper_name if not series_year: proper_name = remove_year(proper_name) guess['title'] = proper_name else: guess['title'] = dnzb_proper_name if dnzb_episode_name != '' and guess['vtype'] == 'series': dnzb_used = True if verbose: print('Using DNZB-EpisodeName') guess['episode_title'] = dnzb_episode_name if dnzb_movie_year != '': dnzb_used = True if verbose: print('Using DNZB-MovieYear') guess['year'] = dnzb_movie_year if dnzb_more_info != '': dnzb_used = True if verbose: print('Using DNZB-MoreInfo') if guess['type'] == 'movie': regex = re.compile(r'^http://www.imdb.com/title/(tt[0-9]+)/$', re.IGNORECASE) matches = regex.match(dnzb_more_info) if matches: guess['imdb'] = matches.group(1) guess['cpimdb'] = 'cp(' + guess['imdb'] + ')' if verbose and dnzb_used: print(guess) def guess_info(filename): """ Parses the filename using guessit-library """ if use_nzb_name: if verbose: print("Using NZB-Name") guessfilename = os.path.basename(download_dir) + os.path.splitext(filename)[1] else: guessfilename = deobfuscate_path(filename) # workaround for titles starting with numbers (which guessit has problems with) (part 1) path, tmp_filename = os.path.split(guessfilename) pad_start_digits = tmp_filename[0].isdigit() if pad_start_digits: guessfilename = os.path.join(path, 'T' + tmp_filename) if verbose: print('Guessing: %s' % guessfilename) guess = guessit.api.guessit(unicode(guessfilename), {'allowed_languages': [], 'allowed_countries': []}) if verbose: print(guess) # workaround for titles starting with numbers (part 2) if pad_start_digits: guess['title'] = guess['title'][1:] if guess['title'] == '': guess['title'] = os.path.splitext(os.path.basename(guessfilename))[0][1:] if verbose: print('use filename as title for recovery') # fix some strange guessit guessing: # if guessit doesn't find a year in the file name it thinks it is episode, # but we prefer it to be handled as movie instead if guess.get('type') == 'episode' and guess.get('episode', '') == '': guess['type'] = 'movie' guess['year'] = '1900' if verbose: print('episode without episode-number is a movie') # treat parts as episodes ("Part.2" or "Part.II") if guess.get('type') == 'movie' and guess.get('part') != None: guess['type'] = 'episode' guess['episode'] = guess.get('part') if verbose: print('treat parts as episodes') # add season number if not present if guess['type'] == 'episode' and (guess.get('season') == None): guess['season'] = 1 if verbose: print('force season 1') # detect if year is part of series name if guess['type'] == 'episode': if series_year: if guess.get('year') != None and guess.get('title') != None and \ guess.get('season') != guess.get('year') and \ guess['title'] == remove_year(guess['title']): guess['title'] += ' ' + str(guess['year']) if verbose: print('year is part of title') else: guess['title'] = remove_year(guess['title']) if guess['type'] == 'movie': date = guess.get('date') if date: guess['vtype'] = 'dated' elif force_tv: guess['vtype'] = 'othertv' else: guess['vtype'] = 'movie' elif guess['type'] == 'episode': guess['vtype'] = 'series' else: guess['vtype'] = guess['type'] if dnzb_headers: apply_dnzb_headers(guess) if verbose: print('Type: %s' % guess['vtype']) if verbose: print(guess) return guess def construct_path(filename): """ Parses the filename and generates new name for renaming """ if verbose: print("filename: %s" % filename) guess = guess_info(filename) type = guess.get('vtype') mapping = [] add_common_mapping(filename, guess, mapping) if type == 'movie': dest_dir = movies_dir format = movies_format add_movies_mapping(guess, mapping) elif type == 'series': dest_dir = series_dir format = series_format add_series_mapping(guess, mapping) elif type == 'dated': dest_dir = dated_dir format = dated_format add_dated_mapping(guess, mapping) elif type == 'othertv': dest_dir = othertv_dir format = othertv_format add_movies_mapping(guess, mapping) else: if verbose: print('Could not determine video type for %s' % filename) return None if dest_dir == '': dest_dir = os.path.dirname(download_dir) # Find out a char most suitable as dupe_separator guess_dupe_separator(format) # Add extension specifier if the format string doesn't end with it if format.rstrip('}')[-5:] != '.%ext': format += '.%ext' sorter = format.replace('\\', '/') if verbose: print('format: %s' % sorter) # Replace elements path = path_subst(sorter, mapping) if verbose: print('path after subst: %s' % path) # Cleanup file name old_path = '' while old_path != path: old_path = path for key, name in REPLACE_AFTER.items(): path = path.replace(key, name) path = path.replace('%up', '..') # Uppercase all characters encased in {{}} path = to_uppercase(path) # Lowercase all characters encased in {} path = to_lowercase(path) # Strip any extra strippable characters around foldernames and filename path, ext = os.path.splitext(path) path = strip_folders(path) path = path + ext path = os.path.normpath(path) if verbose: print('path after cleanup: %s' % path) new_path = os.path.join(dest_dir, path) if verbose: print('destination path: %s' % new_path) if filename.upper() == new_path.upper(): if verbose: print('Destination path equals filename - return None') return None return new_path # Flag indicating that anything was moved. Cleanup possible. files_moved = False # Flag indicating any error. Cleanup is disabled. errors = False # Process all the files in download_dir and its subdirectories video_files = [] for root, dirs, files in os.walk(download_dir): for old_filename in files: try: old_path = os.path.join(root, old_filename) # Check extension ext = os.path.splitext(old_filename)[1].lower() if ext not in video_extensions: continue # Check minimum file size if os.path.getsize(old_path) < min_size: print('[INFO] Skipping small: %s' % old_filename) continue # This is our video file, we should process it video_files.append(old_path) except Exception as e: errors = True print('[ERROR] Failed: %s' % old_filename) print('[ERROR] %s' % e) traceback.print_exc() use_nzb_name = prefer_nzb_name and len(video_files) == 1 for old_path in video_files: try: new_path = construct_path(old_path) # Move video file if new_path: new_path = rename(old_path, new_path) files_moved = True # Move satellite files if satellites: move_satellites(old_path, new_path) except Exception as e: errors = True print('[ERROR] Failed: %s' % old_filename) print('[ERROR] %s' % e) traceback.print_exc() # Inform NZBGet about new destination path finaldir = '' uniquedirs = [] for filename in moved_dst_files: dir = os.path.dirname(filename) if dir not in uniquedirs: uniquedirs.append(dir) finaldir += '|' if finaldir != '' else '' finaldir += dir if finaldir != '': print('[NZB] FINALDIR=%s' % finaldir) # Cleanup if: # 1) files were moved AND # 2) no errors happen AND # 3) all remaining files are smaller than if cleanup and files_moved and not errors: cleanup_download_dir() # Returing status to NZBGet if errors: sys.exit(POSTPROCESS_ERROR) elif files_moved: sys.exit(POSTPROCESS_SUCCESS) else: sys.exit(POSTPROCESS_NONE)