Merge remote-tracking branch 'epitron/metadata-pp'
Conflicts: youtube_dl/PostProcessor.py
This commit is contained in:
commit
5f263296ea
@ -193,7 +193,9 @@ which means you can modify it, redistribute it or use it however you like.
|
|||||||
processed files are overwritten by default
|
processed files are overwritten by default
|
||||||
--embed-subs embed subtitles in the video (only for mp4
|
--embed-subs embed subtitles in the video (only for mp4
|
||||||
videos)
|
videos)
|
||||||
--add-metadata add metadata to the files
|
--add-metadata write metadata to the video file
|
||||||
|
--xattrs write metadata to the video file's xattrs (using
|
||||||
|
dublin core and xdg standards)
|
||||||
|
|
||||||
# CONFIGURATION
|
# CONFIGURATION
|
||||||
|
|
||||||
|
@ -63,6 +63,7 @@ class FFmpegPostProcessorError(PostProcessingError):
|
|||||||
class AudioConversionError(PostProcessingError):
|
class AudioConversionError(PostProcessingError):
|
||||||
pass
|
pass
|
||||||
|
|
||||||
|
|
||||||
class FFmpegPostProcessor(PostProcessor):
|
class FFmpegPostProcessor(PostProcessor):
|
||||||
def __init__(self,downloader=None):
|
def __init__(self,downloader=None):
|
||||||
PostProcessor.__init__(self, downloader)
|
PostProcessor.__init__(self, downloader)
|
||||||
@ -108,6 +109,7 @@ class FFmpegPostProcessor(PostProcessor):
|
|||||||
return u'./' + fn
|
return u'./' + fn
|
||||||
return fn
|
return fn
|
||||||
|
|
||||||
|
|
||||||
class FFmpegExtractAudioPP(FFmpegPostProcessor):
|
class FFmpegExtractAudioPP(FFmpegPostProcessor):
|
||||||
def __init__(self, downloader=None, preferredcodec=None, preferredquality=None, nopostoverwrites=False):
|
def __init__(self, downloader=None, preferredcodec=None, preferredquality=None, nopostoverwrites=False):
|
||||||
FFmpegPostProcessor.__init__(self, downloader)
|
FFmpegPostProcessor.__init__(self, downloader)
|
||||||
@ -236,6 +238,7 @@ class FFmpegExtractAudioPP(FFmpegPostProcessor):
|
|||||||
information['filepath'] = new_path
|
information['filepath'] = new_path
|
||||||
return self._nopostoverwrites,information
|
return self._nopostoverwrites,information
|
||||||
|
|
||||||
|
|
||||||
class FFmpegVideoConvertor(FFmpegPostProcessor):
|
class FFmpegVideoConvertor(FFmpegPostProcessor):
|
||||||
def __init__(self, downloader=None,preferedformat=None):
|
def __init__(self, downloader=None,preferedformat=None):
|
||||||
super(FFmpegVideoConvertor, self).__init__(downloader)
|
super(FFmpegVideoConvertor, self).__init__(downloader)
|
||||||
@ -519,3 +522,119 @@ class FFmpegMergerPP(FFmpegPostProcessor):
|
|||||||
args = ['-c', 'copy']
|
args = ['-c', 'copy']
|
||||||
self.run_ffmpeg_multiple_files(info['__files_to_merge'], filename, args)
|
self.run_ffmpeg_multiple_files(info['__files_to_merge'], filename, args)
|
||||||
return True, info
|
return True, info
|
||||||
|
|
||||||
|
class XAttrMetadataPP(PostProcessor):
|
||||||
|
|
||||||
|
#
|
||||||
|
# More info about extended attributes for media:
|
||||||
|
# http://freedesktop.org/wiki/CommonExtendedAttributes/
|
||||||
|
# http://www.freedesktop.org/wiki/PhreedomDraft/
|
||||||
|
# http://dublincore.org/documents/usageguide/elements.shtml
|
||||||
|
#
|
||||||
|
# TODO:
|
||||||
|
# * capture youtube keywords and put them in 'user.dublincore.subject' (comma-separated)
|
||||||
|
# * figure out which xattrs can be used for 'duration', 'thumbnail', 'resolution'
|
||||||
|
#
|
||||||
|
|
||||||
|
def run(self, info):
|
||||||
|
""" Set extended attributes on downloaded file (if xattr support is found). """
|
||||||
|
|
||||||
|
from .utils import hyphenate_date
|
||||||
|
|
||||||
|
# This mess below finds the best xattr tool for the job and creates a
|
||||||
|
# "write_xattr" function.
|
||||||
|
try:
|
||||||
|
# try the pyxattr module...
|
||||||
|
import xattr
|
||||||
|
def write_xattr(path, key, value):
|
||||||
|
return xattr.setxattr(path, key, value)
|
||||||
|
|
||||||
|
except ImportError:
|
||||||
|
|
||||||
|
if os.name == 'posix':
|
||||||
|
def which(bin):
|
||||||
|
for dir in os.environ["PATH"].split(":"):
|
||||||
|
path = os.path.join(dir, bin)
|
||||||
|
if os.path.exists(path):
|
||||||
|
return path
|
||||||
|
|
||||||
|
user_has_setfattr = which("setfattr")
|
||||||
|
user_has_xattr = which("xattr")
|
||||||
|
|
||||||
|
if user_has_setfattr or user_has_xattr:
|
||||||
|
|
||||||
|
def write_xattr(path, key, value):
|
||||||
|
import errno
|
||||||
|
potential_errors = {
|
||||||
|
# setfattr: /tmp/blah: Operation not supported
|
||||||
|
"Operation not supported": errno.EOPNOTSUPP,
|
||||||
|
# setfattr: ~/blah: No such file or directory
|
||||||
|
# xattr: No such file: ~/blah
|
||||||
|
"No such file": errno.ENOENT,
|
||||||
|
}
|
||||||
|
|
||||||
|
if user_has_setfattr:
|
||||||
|
cmd = ['setfattr', '-n', key, '-v', value, path]
|
||||||
|
elif user_has_xattr:
|
||||||
|
cmd = ['xattr', '-w', key, value, path]
|
||||||
|
|
||||||
|
try:
|
||||||
|
output = subprocess.check_output(cmd, stderr=subprocess.STDOUT)
|
||||||
|
except subprocess.CalledProcessError as e:
|
||||||
|
errorstr = e.output.strip().decode()
|
||||||
|
for potential_errorstr, potential_errno in potential_errors.items():
|
||||||
|
if errorstr.find(potential_errorstr) > -1:
|
||||||
|
e = OSError(potential_errno, potential_errorstr)
|
||||||
|
e.__cause__ = None
|
||||||
|
raise e
|
||||||
|
raise # Reraise unhandled error
|
||||||
|
|
||||||
|
else:
|
||||||
|
# On Unix, and can't find pyxattr, setfattr, or xattr.
|
||||||
|
if sys.platform.startswith('linux'):
|
||||||
|
self._downloader.report_error("Couldn't find a tool to set the xattrs. Install either the python 'pyxattr' or 'xattr' modules, or the GNU 'attr' package (which contains the 'setfattr' tool).")
|
||||||
|
elif sys.platform == 'darwin':
|
||||||
|
self._downloader.report_error("Couldn't find a tool to set the xattrs. Install either the python 'xattr' module, or the 'xattr' binary.")
|
||||||
|
else:
|
||||||
|
# Write xattrs to NTFS Alternate Data Streams: http://en.wikipedia.org/wiki/NTFS#Alternate_data_streams_.28ADS.29
|
||||||
|
def write_xattr(path, key, value):
|
||||||
|
assert(key.find(":") < 0)
|
||||||
|
assert(path.find(":") < 0)
|
||||||
|
assert(os.path.exists(path))
|
||||||
|
|
||||||
|
f = open(path+":"+key, "w")
|
||||||
|
f.write(value)
|
||||||
|
f.close()
|
||||||
|
|
||||||
|
# Write the metadata to the file's xattrs
|
||||||
|
self._downloader.to_screen('[metadata] Writing metadata to file\'s xattrs...')
|
||||||
|
|
||||||
|
filename = info['filepath']
|
||||||
|
|
||||||
|
try:
|
||||||
|
xattr_mapping = {
|
||||||
|
'user.xdg.referrer.url': 'webpage_url',
|
||||||
|
# 'user.xdg.comment': 'description',
|
||||||
|
'user.dublincore.title': 'title',
|
||||||
|
'user.dublincore.date': 'upload_date',
|
||||||
|
'user.dublincore.description': 'description',
|
||||||
|
'user.dublincore.contributor': 'uploader',
|
||||||
|
'user.dublincore.format': 'format',
|
||||||
|
}
|
||||||
|
|
||||||
|
for xattrname, infoname in xattr_mapping.items():
|
||||||
|
|
||||||
|
value = info.get(infoname)
|
||||||
|
|
||||||
|
if value:
|
||||||
|
if infoname == "upload_date":
|
||||||
|
value = hyphenate_date(value)
|
||||||
|
|
||||||
|
write_xattr(filename, xattrname, value)
|
||||||
|
|
||||||
|
return True, info
|
||||||
|
|
||||||
|
except OSError:
|
||||||
|
self._downloader.report_error("This filesystem doesn't support extended attributes. (You may have to enable them in your /etc/fstab)")
|
||||||
|
return False, info
|
||||||
|
|
||||||
|
@ -38,6 +38,7 @@ __authors__ = (
|
|||||||
'Takuya Tsuchida',
|
'Takuya Tsuchida',
|
||||||
'Sergey M.',
|
'Sergey M.',
|
||||||
'Michael Orlitzky',
|
'Michael Orlitzky',
|
||||||
|
'Chris Gahan',
|
||||||
)
|
)
|
||||||
|
|
||||||
__license__ = 'Public Domain'
|
__license__ = 'Public Domain'
|
||||||
@ -79,6 +80,7 @@ from .PostProcessor import (
|
|||||||
FFmpegVideoConvertor,
|
FFmpegVideoConvertor,
|
||||||
FFmpegExtractAudioPP,
|
FFmpegExtractAudioPP,
|
||||||
FFmpegEmbedSubtitlePP,
|
FFmpegEmbedSubtitlePP,
|
||||||
|
XAttrMetadataPP,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
@ -415,7 +417,9 @@ def parseOpts(overrideArguments=None):
|
|||||||
postproc.add_option('--embed-subs', action='store_true', dest='embedsubtitles', default=False,
|
postproc.add_option('--embed-subs', action='store_true', dest='embedsubtitles', default=False,
|
||||||
help='embed subtitles in the video (only for mp4 videos)')
|
help='embed subtitles in the video (only for mp4 videos)')
|
||||||
postproc.add_option('--add-metadata', action='store_true', dest='addmetadata', default=False,
|
postproc.add_option('--add-metadata', action='store_true', dest='addmetadata', default=False,
|
||||||
help='add metadata to the files')
|
help='write metadata to the video file')
|
||||||
|
postproc.add_option('--xattrs', action='store_true', dest='xattrs', default=False,
|
||||||
|
help='write metadata to the video file\'s xattrs (using dublin core and xdg standards)')
|
||||||
|
|
||||||
|
|
||||||
parser.add_option_group(general)
|
parser.add_option_group(general)
|
||||||
@ -717,6 +721,8 @@ def _real_main(argv=None):
|
|||||||
ydl.add_post_processor(FFmpegVideoConvertor(preferedformat=opts.recodevideo))
|
ydl.add_post_processor(FFmpegVideoConvertor(preferedformat=opts.recodevideo))
|
||||||
if opts.embedsubtitles:
|
if opts.embedsubtitles:
|
||||||
ydl.add_post_processor(FFmpegEmbedSubtitlePP(subtitlesformat=opts.subtitlesformat))
|
ydl.add_post_processor(FFmpegEmbedSubtitlePP(subtitlesformat=opts.subtitlesformat))
|
||||||
|
if opts.xattrs:
|
||||||
|
ydl.add_post_processor(XAttrMetadataPP())
|
||||||
|
|
||||||
# Update version
|
# Update version
|
||||||
if opts.update_self:
|
if opts.update_self:
|
||||||
|
@ -818,6 +818,15 @@ def date_from_str(date_str):
|
|||||||
return today + delta
|
return today + delta
|
||||||
return datetime.datetime.strptime(date_str, "%Y%m%d").date()
|
return datetime.datetime.strptime(date_str, "%Y%m%d").date()
|
||||||
|
|
||||||
|
def hyphenate_date(date_str):
|
||||||
|
"""
|
||||||
|
Convert a date in 'YYYYMMDD' format to 'YYYY-MM-DD' format"""
|
||||||
|
match = re.match(r'^(\d\d\d\d)(\d\d)(\d\d)$', date_str)
|
||||||
|
if match is not None:
|
||||||
|
return '-'.join(match.groups())
|
||||||
|
else:
|
||||||
|
return date_str
|
||||||
|
|
||||||
class DateRange(object):
|
class DateRange(object):
|
||||||
"""Represents a time interval between two dates"""
|
"""Represents a time interval between two dates"""
|
||||||
def __init__(self, start=None, end=None):
|
def __init__(self, start=None, end=None):
|
||||||
|
Loading…
Reference in New Issue
Block a user