public
Description: Simple to use TVDB (thetvdb.com) API in Python, and automatic TV episode namer
Homepage: http://dbr.lighthouseapp.com/projects/13342-tvdb_api/tickets
Clone URL: git://github.com/dbr/tvdb_api.git
tvdb_api / tvnamer.py
100755 339 lines (290 sloc) 11.694 kb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
#!/usr/bin/env python
#encoding:utf-8
#author:dbr/Ben
#project:tvdb_api
#repository:http://github.com/dbr/tvdb_api
#license:Creative Commons GNU GPL v2
# (http://creativecommons.org/licenses/GPL/2.0/)
 
"""
tvnamer.py
Automatic TV episode namer.
Uses data from www.thetvdb.com via tvdb_api
"""
 
__author__ = "dbr/Ben"
__version__ = "1.2.2"
 
import os, sys, re
from optparse import OptionParser
 
from tvdb_api import (tvdb_error, tvdb_shownotfound, tvdb_seasonnotfound,
    tvdb_episodenotfound, tvdb_episodenotfound, tvdb_attributenotfound, tvdb_userabort)
from tvdb_api import Tvdb
 
# Module-wide settings, read by formatName, cleanName and processSingleName
config = {}

### Start user config

# Templates for the renamed files. They are filled in with the %-operator from
# the per-file dict, so the available keys are seriesname, seasno, epno,
# epname and ext. 'with_ep_name' is used when an episode name is available,
# 'without_ep_name' otherwise.
config['with_ep_name'] = '%(seriesname)s - [%(seasno)02dx%(epno)02d] - %(epname)s.%(ext)s'
config['without_ep_name'] = '%(seriesname)s - [%(seasno)02dx%(epno)02d].%(ext)s'

# Whitelist of valid filename characters. cleanName drops every character of a
# new filename that does not appear in this string.
config['valid_filename_chars'] = """0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ!@£$%^&*()_+=-[]{}"'.,<>`~? """

# Force the stripping of invalid Windows characters, even if the current
# platform is not detected as Windows
config['force_windows_compliant_filenames'] = False

### End user config

# On Windows (or when forced above) narrow the whitelist further
if sys.platform == "win32" or config['force_windows_compliant_filenames']:
    # " * : < > ? | \ are all invalid on Windows
    config['valid_filename_chars'] = "".join([x for x in config['valid_filename_chars'] if x not in "\"*:<>?|\\"])

# Regexes used to parse filenames (without directory or extension). They are
# tried in the order listed and the first one that matches is used.
# Each must have exactly 3 capturing groups: series name, season number and
# episode number. Use (?:optional) non-capturing groups if you need others.
# NOTE(review): these are not raw strings, so "\\/" reaches the regex engine as
# "\/" and the trailing [^\\/] class only excludes "/" - confirm whether
# backslash was meant to be excluded as well.
config['name_parse'] = [
    # foo_[s01]_[e01]
    re.compile('''^(.+?)[ \._\-]\[[Ss]([0-9]+?)\]_\[[Ee]([0-9]+?)\]?[^\\/]*$'''),
    # foo.1x09*
    re.compile('''^(.+?)[ \._\-]\[?([0-9]+)x([0-9]+)[^\\/]*$'''),
    # foo.s01.e01, foo.s01_e01
    re.compile('''^(.+?)[ \._\-][Ss]([0-9]+)[\.\- ]?[Ee]([0-9]+)[^\\/]*$'''),
    # foo.103* (1 digit season, 2 digit episode, must be followed by a separator)
    re.compile('''^(.+)[ \._\-]([0-9]{1})([0-9]{2})[\._ -][^\\/]*$'''),
    # foo.0103* (2 digit season, 2-3 digit episode, must be followed by a separator)
    re.compile('''^(.+)[ \._\-]([0-9]{2})([0-9]{2,3})[\._ -][^\\/]*$'''),
]
 
 
def findFiles(args, recursive = False, verbose = False):
    """
    Collects the files named by, or contained in, a list of paths.

    args is a list of file and/or directory paths. A path to a file is
    returned as-is. For a directory, the files directly inside it are
    returned; its sub-directories are only descended into when recursive
    is True. Paths that are neither an existing file nor a directory are
    silently ignored.

    Directory entries are visited in sorted order, so the result (and the
    order in which files are later processed) does not depend on the
    arbitrary ordering of os.listdir.

    If verbose is True, every sub-directory that is descended into is
    printed.

    Returns a list of file paths.
    """
    allfiles = []
    for cfile in args:
        if os.path.isdir(cfile):
            for sf in sorted(os.listdir(cfile)):
                newpath = os.path.join(cfile, sf)
                if os.path.isfile(newpath):
                    allfiles.append(newpath)
                elif recursive:
                    if verbose:
                        # Single-argument form prints the same text on
                        # Python 2 and Python 3
                        print("Recursively scanning %s" % (newpath))
                    allfiles.extend(
                        findFiles([newpath], recursive = recursive, verbose = verbose)
                    )
                #end if isfile
            #end for sf
        elif os.path.isfile(cfile):
            allfiles.append(cfile)
        #end if isdir
    #end for cfile
    return allfiles
#end findFiles
 
def processSingleName(name, verbose=False):
    filepath, filename = os.path.split(name)
    filename, ext = os.path.splitext(filename)
 
    # Remove leading . from extension
    ext = ext.replace(".", "", 1)
 
    for r in config['name_parse']:
        match = r.match(filename)
        if match:
            seriesname, seasno, epno = match.groups()
 
            #remove ._- characters from name (- removed only if next to end of line)
            seriesname = re.sub("[\._]|\-(?=$)", " ", seriesname).strip()
 
            seasno, epno = int(seasno), int(epno)
 
            if verbose:
                print "*"*20
                print "File:", filename
                print "Pattern:", r.pattern
                print "Seriesname:", seriesname
                print "Seas:", seasno
                print "Ep:", epno
                print "*"*20
 
            return{'file_seriesname':seriesname,
                   'seasno':seasno,
                   'epno':epno,
                   'filepath':filepath,
                   'filename':filename,
                   'ext':ext
            }
    else:
        print "Invalid name: %s" % (name)
    #end for r
 
def processNames(names, verbose=False):
    """
    Parses every path in names with processSingleName.

    Paths that could not be parsed (processSingleName returned None) are
    left out. Returns the list of parsed-file dicts, in input order.
    """
    # Generator keeps the calls lazy, so names are still parsed one by one
    # in order
    parsed = (processSingleName(path, verbose=verbose) for path in names)
    return [info for info in parsed if info is not None]
#end processNames
 
def formatName(cfile):
    """
    Builds the new file name for a file dict using the configured templates.

    Uses config['with_ep_name'] when cfile['epname'] is set, and
    config['without_ep_name'] when it is empty or None. Nothing is renamed
    here, only the formatted name is returned.
    """
    if not cfile['epname']:
        return config['without_ep_name'] % (cfile)
    return config['with_ep_name'] % (cfile)
#end formatName
 
def cleanName(name, valid_chars=None):
    """
    Cleans the supplied filename for renaming-to.

    Non-ASCII characters are dropped, then every character that is not in
    the whitelist is removed.

    name may be a unicode string or a byte string. Byte strings are decoded
    permissively first: calling .encode() directly on a Python 2 byte string
    containing non-ASCII bytes triggers an implicit strict ASCII decode and
    raises UnicodeDecodeError.

    valid_chars is the whitelist of allowed characters; when None (the
    default) config['valid_filename_chars'] is used.

    Returns the cleaned name as a native str.
    """
    if valid_chars is None:
        valid_chars = config['valid_filename_chars']

    if isinstance(name, bytes):
        name = name.decode('ascii', 'ignore')

    # Drop non-ASCII characters, then convert to the native str type so the
    # membership test below compares like with like on both Python 2 and 3
    ascii_name = str(name.encode('ascii', 'ignore').decode('ascii'))

    return ''.join( [c for c in ascii_name if c in valid_chars] )
#end cleanName
 
def renameFile(oldfile, newfile, force=False):
    """
    Renames oldfile to newfile, does not overwrite files unless forced.

    If newfile already exists a notice is written to stderr; the rename is
    then skipped unless force is True.

    Returns True when the file was renamed (including a forced overwrite)
    and False when it was skipped. Errors from os.rename are not caught.
    """
    if os.access(newfile, os.F_OK):
        sys.stderr.write("New filename already exists.. ")
        if not force:
            sys.stderr.write("skipping\n")
            return False
        #end if not force
        sys.stderr.write("overwriting\n")
    #end if new exists

    # NOTE(review): the os.rename documentation states that on Windows the
    # call raises OSError when the destination exists, so a forced overwrite
    # may still fail there - confirm on that platform.
    os.rename(oldfile, newfile)
    return True
 
def processFile(t, opts, cfile):
    try:
        # Ask for episode name from tvdb_api
        epname = t[ cfile['file_seriesname'] ][ cfile['seasno'] ][ cfile['epno'] ]['episodename']
    except tvdb_shownotfound:
        # No such show found.
        # Use the show-name from the files name, and None as the ep name
        sys.stderr.write("! Warning: Show \"%s\" not found (for file %s.%s)\n" % (
            cfile['file_seriesname'],
            cfile['filename'],
            cfile['ext'])
        )
 
        cfile['seriesname'] = cfile['file_seriesname']
        cfile['epname'] = None
    except (tvdb_seasonnotfound, tvdb_episodenotfound, tvdb_attributenotfound):
        # The season, episode or name wasn't found, but the show was.
        # Use the corrected show-name, but no episode name.
        sys.stderr.write("! Warning: Episode name not found for %s (in %s)\n" % (
            cfile['file_seriesname'],
            cfile['filepath'] )
        )
 
        cfile['seriesname'] = t[ cfile['file_seriesname'] ]['seriesname']
        cfile['epname'] = None
    except tvdb_error, errormsg:
        # Error communicating with thetvdb.com
        sys.stderr.write(
            "! Warning: Error contacting www.thetvdb.com:\n%s\n" % (errormsg)
        )
 
        cfile['seriesname'] = cfile['file_seriesname']
        cfile['epname'] = None
    except tvdb_userabort, errormsg:
        # User aborted selection (q or ^c)
        print "\n", errormsg
        sys.exit(1)
    else:
        cfile['epname'] = epname
        cfile['seriesname'] = t[ cfile['file_seriesname'] ]['seriesname'] # get the corrected seriesname
 
    # Format new filename, strip unwanted characters
    newname = formatName(cfile)
    newname = cleanName(newname)
 
    # Append new filename (with extension) to path
    oldfile = os.path.join(
        cfile['filepath'],
        cfile['filename'] + "." + cfile['ext']
    )
    # Join path to new file name
    newfile = os.path.join(
        cfile['filepath'],
        newname
    )
 
    # Show new/old filename
    print "#"*20
    print "Old name: %s" % ( cfile['filename'] + "." + cfile['ext'] )
    print "New name: %s" % ( newname )
 
    # Either always rename, or prompt user
    if opts.always or (not opts.interactive):
        rename_result = renameFile(oldfile, newfile, force=opts.force)
        if rename_result:
            print "..auto-renaming"
        else:
            print "..not renamed"
        #end if rename_result
 
        return # next filename!
    #end if always
 
    ans = None
    while ans not in ['y', 'n', 'a', 'q', '']:
        print "Rename?"
        print "([y]/n/a/q)",
        try:
            ans = raw_input().strip()
        except KeyboardInterrupt, errormsg:
            print "\n", errormsg
            sys.exit(1)
        #end try
    #end while
 
    if len(ans) == 0:
        print "Renaming (default)"
        rename_result = renameFile(oldfile, newfile, force=opts.force)
    elif ans[0] == "a":
        opts.always = True
        rename_result = renameFile(oldfile, newfile, force=opts.force)
    elif ans[0] == "q":
        print "Aborting"
        sys.exit(1)
    elif ans[0] == "y":
        rename_result = renameFile(oldfile, newfile, force=opts.force)
    elif ans[0] == "n":
        print "Skipping"
        return
    else:
        print "Invalid input, skipping"
    #end if ans
    if rename_result:
        print "..renamed"
    else:
        print "..not renamed"
    #end if rename_result
#end processFile
 
def main():
    parser = OptionParser(usage="%prog [options] <file or directories>")
 
    parser.add_option( "-d", "--debug", action="store_true", default=False, dest="debug",
                        help="show debugging info")
    parser.add_option( "-b", "--batch", action="store_false", dest="interactive",
                        help="selects first search result, requires no human intervention once launched", default=False)
    parser.add_option( "-i", "--interactive", action="store_true", dest="interactive", default=True,
                        help="interactivly select correct show from search results [default]")
    parser.add_option( "-s", "--selectfirst", action="store_true", dest="selectfirst", default = False,
                        help = "automatically select first series search result (instead of showing the select-series interface)")
    parser.add_option( "-r", "--recursive", action="store_true", dest="recursive", default=True,
                        help="recursivly search supplied directories for files to rename")
    parser.add_option( "-a", "--always", action="store_true", default=False, dest="always",
                        help="always renames files (but still lets user select correct show). Can be changed during runtime with the 'a' prompt-option")
    parser.add_option( "-f", "--force", action="store_true", default=False, dest="force",
                        help="forces file to be renamed, even if it will overwrite an existing file")
 
    opts, args = parser.parse_args()
 
    if len(args) == 0:
        parser.error("No filenames or directories supplied")
    #end if len(args)
 
    allFiles = findFiles(args, opts.recursive, verbose = opts.debug)
    validFiles = processNames(allFiles, verbose = opts.debug)
 
    if len(validFiles) == 0:
        sys.stderr.write("No valid files found\n")
        sys.exit(2)
 
    print "#"*20
    print "# Starting tvnamer"
    print "# Processing %d files" % ( len(validFiles) )
 
    t = Tvdb(debug = opts.debug, interactive = opts.interactive, select_first = opts.selectfirst)
 
    print "# ..got tvdb mirrors"
    print "# Starting to process files"
    print "#"*20
 
    for cfile in validFiles:
        print "# Processing %(file_seriesname)s (season: %(seasno)d, episode %(epno)d)" % (cfile)
        processFile(t, opts, cfile)
    print "# Done"
#end main
 
# Only run the renamer when executed as a script, not when imported as a module
if __name__ == "__main__":
    main()