pandora/pandora/archive/extract.py

520 lines
16 KiB
Python
Raw Normal View History

2010-09-04 12:59:09 +00:00
# -*- coding: utf-8 -*-
# vi:si:et:sw=4:sts=4:ts=4
from __future__ import division, with_statement
import os
2011-01-01 11:44:42 +00:00
from os.path import exists
2010-09-04 12:59:09 +00:00
import fractions
import subprocess
import tempfile
import time
import math
from glob import glob
import numpy as np
import Image
2011-01-25 15:14:25 +00:00
import ox
2011-02-22 16:09:13 +00:00
import ox.image
2012-05-17 09:38:59 +00:00
from ox.utils import json
2010-09-04 12:59:09 +00:00
img_extension='jpg'
AVCONV = 'avconv'
2012-03-06 20:18:29 +00:00
MAX_DISTANCE = math.sqrt(3 * pow(255, 2))
2010-09-04 12:59:09 +00:00
2011-01-01 11:44:42 +00:00
2010-09-04 12:59:09 +00:00
class AspectRatio(fractions.Fraction):
2011-01-01 11:44:42 +00:00
2010-09-04 12:59:09 +00:00
def __new__(cls, numerator, denominator=None):
if not denominator:
ratio = map(int, numerator.split(':'))
2011-01-01 11:44:42 +00:00
if len(ratio) == 1:
ratio.append(1)
2010-09-04 12:59:09 +00:00
numerator = ratio[0]
denominator = ratio[1]
#if its close enough to the common aspect ratios rather use that
if abs(numerator/denominator - 4/3) < 0.03:
numerator = 4
denominator = 3
elif abs(numerator/denominator - 16/9) < 0.02:
numerator = 16
denominator = 9
return super(AspectRatio, cls).__new__(cls, numerator, denominator)
@property
def ratio(self):
return "%d:%d" % (self.numerator, self.denominator)
def supported_formats():
p = subprocess.Popen(['which', AVCONV],
stdout=subprocess.PIPE, stderr=subprocess.PIPE)
stdout, stderr = p.communicate()
if not stdout.strip():
return None
p = subprocess.Popen([AVCONV, '-codecs'],
stdout=subprocess.PIPE, stderr=subprocess.PIPE)
stdout, stderr = p.communicate()
return {
'ogg': 'libtheora' in stdout and 'libvorbis' in stdout,
'webm': 'libvpx' in stdout and 'libvorbis' in stdout,
'mp4': 'libx264' in stdout and 'libvo_aacenc' in stdout,
}
2011-01-01 11:44:42 +00:00
def stream(video, target, profile, info, avconv=None):
2010-09-04 12:59:09 +00:00
if not os.path.exists(target):
ox.makedirs(os.path.dirname(target))
2010-09-04 12:59:09 +00:00
'''
WebM look into
lag
mb_static_threshold
qmax/qmin
rc_buf_aggressivity=0.95
token_partitions=4
level / speedlevel
bt?
H264, should bitrates be a bit lower? other stuff possible?
'''
profile, format = profile.split('.')
2011-12-28 12:35:10 +00:00
bpp = 0.17
2010-09-04 12:59:09 +00:00
if profile == '1080p':
height = 1080
audiorate = 48000
audioquality = 6
audiobitrate = None
audiochannels = None
if profile == '720p':
height = 720
audiorate = 48000
audioquality = 5
audiobitrate = None
audiochannels = None
if profile == '480p':
height = 480
audiorate = 44100
2012-04-19 16:14:43 +00:00
audioquality = 3
2010-09-04 12:59:09 +00:00
audiobitrate = None
audiochannels = 2
2012-04-19 16:06:38 +00:00
elif profile == '432p':
height = 432
audiorate = 44100
2012-04-19 16:14:43 +00:00
audioquality = 3
2012-04-19 16:06:38 +00:00
audiobitrate = None
audiochannels = 2
2010-09-04 12:59:09 +00:00
elif profile == '360p':
height = 360
audiorate = 44100
audioquality = 1
audiobitrate = None
audiochannels = 1
2012-04-19 16:06:38 +00:00
elif profile == '288p':
height = 288
audiorate = 44100
audioquality = 0
audiobitrate = None
audiochannels = 1
2010-12-28 10:15:45 +00:00
elif profile == '240p':
height = 240
audiorate = 44100
2010-09-04 12:59:09 +00:00
audioquality = 0
audiobitrate = None
audiochannels = 1
2012-04-19 16:06:38 +00:00
elif profile == '144p':
height = 144
audiorate = 22050
audioquality = -1
audiobitrate = '22k'
audiochannels = 1
2010-09-04 12:59:09 +00:00
else:
height = 96
audiorate = 22050
audioquality = -1
audiobitrate = '22k'
audiochannels = 1
if info['video'] and 'display_aspect_ratio' in info['video'][0]:
fps = AspectRatio(info['video'][0]['framerate'])
fps = min(30, float(fps))
2010-09-04 12:59:09 +00:00
dar = AspectRatio(info['video'][0]['display_aspect_ratio'])
width = int(dar * height)
width += width % 2
2010-09-04 12:59:09 +00:00
bitrate = height*width*fps*bpp/1000
aspect = dar.ratio
#use 1:1 pixel aspect ratio if dar is close to that
if abs(width/height - dar) < 0.02:
aspect = '%s:%s' % (width, height)
2010-09-04 12:59:09 +00:00
video_settings = [
'-vb', '%dk'%bitrate,
2010-09-04 12:59:09 +00:00
'-aspect', aspect,
#'-vf', 'yadif',
'-vf', 'hqdn3d,scale=%s:%s'%(width, height),
2012-01-05 15:41:42 +00:00
'-g', '%d' % int(fps*5),
2010-09-04 12:59:09 +00:00
]
2012-01-07 10:48:05 +00:00
if format == 'webm':
video_settings += [
'-deadline', 'good',
'-cpu-used', '0',
'-lag-in-frames', '16',
'-auto-alt-ref', '1',
]
2010-09-04 12:59:09 +00:00
if format == 'mp4':
#quicktime does not support bpyramid
'''
2010-09-04 12:59:09 +00:00
video_settings += [
'-vcodec', 'libx264',
'-flags', '+loop+mv4',
'-cmp', '256',
'-partitions', '+parti4x4+parti8x8+partp4x4+partp8x8+partb8x8',
'-me_method', 'hex',
'-subq', '7',
'-trellis', '1',
'-refs', '5',
'-bf', '3',
'-flags2', '+bpyramid+wpred+mixed_refs+dct8x8',
'-coder', '1',
'-me_range', '16',
'-keyint_min', '25', #FIXME: should this be related to fps?
'-sc_threshold','40',
'-i_qfactor', '0.71',
'-qmin', '10', '-qmax', '51',
'-qdiff', '4'
]
'''
video_settings += [
'-vcodec', 'libx264',
'-flags', '+loop+mv4',
'-cmp', '256',
'-partitions', '+parti4x4+parti8x8+partp4x4+partp8x8+partb8x8',
'-me_method', 'hex',
'-subq', '7',
'-trellis', '1',
'-refs', '5',
'-bf', '0',
'-flags2', '+mixed_refs',
'-coder', '0',
'-me_range', '16',
2011-01-01 11:44:42 +00:00
'-sc_threshold', '40',
'-i_qfactor', '0.71',
'-qmin', '10', '-qmax', '51',
'-qdiff', '4'
]
2010-09-04 12:59:09 +00:00
else:
video_settings = ['-vn']
if info['audio']:
audio_settings = ['-ar', str(audiorate), '-aq', str(audioquality)]
2013-05-10 14:17:15 +00:00
if audiochannels and 'channels' in info['audio'][0] \
and info['audio'][0]['channels'] > audiochannels:
audio_settings += ['-ac', str(audiochannels)]
if audiobitrate:
audio_settings += ['-ab', audiobitrate]
if format == 'mp4':
audio_settings += ['-acodec', 'libvo_aacenc']
else:
audio_settings += ['-acodec', 'libvorbis']
else:
audio_settings = ['-an']
if not avconv:
avconv = AVCONV
cmd = [avconv, '-y', '-i', video, '-threads', '4'] \
2010-09-04 12:59:09 +00:00
+ audio_settings \
+ video_settings
2011-02-06 12:40:28 +00:00
if format == 'webm':
cmd += ['-f', 'webm', target]
elif format == 'mp4':
2011-02-06 12:40:28 +00:00
#mp4 needs postprocessing(qt-faststart), write to temp file
cmd += ["%s.mp4" % target]
else:
2011-02-06 12:40:28 +00:00
cmd += [target]
2010-09-04 12:59:09 +00:00
#print cmd
p = subprocess.Popen(cmd, stdin=subprocess.PIPE,
stdout=open('/dev/null', 'w'),
stderr=subprocess.STDOUT)
2010-09-15 13:03:00 +00:00
p.communicate()
if p.returncode != 0:
t = "%s.mp4" % target if format == 'mp4' else target
if os.path.exists(t):
os.unlink(t)
return False
2010-09-04 12:59:09 +00:00
if format == 'mp4':
cmd = ['qt-faststart', "%s.mp4" % target, target]
#print cmd
p = subprocess.Popen(cmd, stdin=subprocess.PIPE,
stdout=open('/dev/null', 'w'),
stderr=subprocess.STDOUT)
2010-09-15 13:03:00 +00:00
p.communicate()
os.unlink("%s.mp4" % target)
2010-09-15 13:03:00 +00:00
return True
2010-09-04 12:59:09 +00:00
2011-01-01 11:44:42 +00:00
2010-09-04 12:59:09 +00:00
def run_command(cmd, timeout=10):
#print cmd
p = subprocess.Popen(cmd, stdout=open('/dev/null', 'w'),
stderr=subprocess.STDOUT)
2010-09-04 12:59:09 +00:00
while timeout > 0:
time.sleep(0.2)
timeout -= 0.2
if p.poll() != None:
return p.returncode
if p.poll() == None:
os.kill(p.pid, 9)
killedpid, stat = os.waitpid(p.pid, os.WNOHANG)
return p.returncode
2011-01-01 11:44:42 +00:00
def frame(video, frame, position, height=128, redo=False):
2010-09-04 12:59:09 +00:00
'''
params:
video input
frame output
2010-09-04 12:59:09 +00:00
position as float in seconds
2012-02-17 07:32:04 +00:00
height of frame
2010-09-04 12:59:09 +00:00
redo boolean to extract file even if it exists
'''
if exists(video):
folder = os.path.dirname(frame)
2010-09-04 12:59:09 +00:00
if redo or not exists(frame):
ox.makedirs(folder)
if video.endswith('.mp4'):
cmd = [
AVCONV, '-y',
'-ss', str(position),
'-i', video,
'-an', '-vframes', '1',
'-vf', 'scale=-1:%s' % height
]
if not frame.endswith('.png'):
cmd += ['-f', 'mjpeg']
cmd += [frame]
else:
cmd = ['oxframe', '-i', video, '-o', frame,
'-p', str(position), '-y', str(height)]
2010-09-04 12:59:09 +00:00
run_command(cmd)
2011-01-01 11:44:42 +00:00
2010-09-07 14:05:38 +00:00
def resize_image(image_source, image_output, width=None, size=None):
2010-09-04 12:59:09 +00:00
if exists(image_source):
source = Image.open(image_source).convert('RGB')
2010-09-04 12:59:09 +00:00
source_width = source.size[0]
source_height = source.size[1]
2010-09-07 14:05:38 +00:00
if size:
if source_width > source_height:
width = size
height = int(width / (float(source_width) / source_height))
height = height - height % 2
else:
height = size
width = int(height * (float(source_width) / source_height))
width = width - width % 2
2011-01-01 11:44:42 +00:00
2010-09-07 14:05:38 +00:00
else:
height = int(width / (float(source_width) / source_height))
height = height - height % 2
2010-09-04 12:59:09 +00:00
2011-10-27 22:19:58 +00:00
width = max(width, 1)
height = max(height, 1)
2011-10-27 14:31:23 +00:00
2010-09-04 12:59:09 +00:00
if width < source_width:
resize_method = Image.ANTIALIAS
else:
resize_method = Image.BICUBIC
output = source.resize((width, height), resize_method)
output.save(image_output)
2011-01-01 11:44:42 +00:00
2012-05-21 12:46:48 +00:00
def timeline(video, prefix, modes=None, size=None):
if modes is None:
modes = ['antialias', 'slitscan', 'keyframes', 'audio', 'data']
if size is None:
2012-05-17 09:38:59 +00:00
size=[64, 16]
if isinstance(video, basestring):
video = [video]
cmd = ['../bin/oxtimelines',
'-s', ','.join(map(str, reversed(sorted(size)))),
'-m', ','.join(modes),
'-o', prefix,
'-c', os.path.join(prefix, 'cuts.json'),
] + video
2013-05-10 14:17:15 +00:00
p = subprocess.Popen(cmd, stdin=subprocess.PIPE,
stdout=subprocess.PIPE, stderr=subprocess.PIPE)
2012-05-17 09:40:44 +00:00
#print cmd
#p = subprocess.Popen(cmd)
2010-09-04 12:59:09 +00:00
p.wait()
2011-01-01 11:44:42 +00:00
2012-05-17 09:38:59 +00:00
def average_color(prefix, start=0, end=0, mode='antialias'):
2010-09-04 12:59:09 +00:00
height = 64
frames = 0
pixels = []
color = np.asarray([0, 0, 0], dtype=np.float32)
2011-09-28 00:29:40 +00:00
if end:
start = int(start * 25)
end = int(end * 25)
2012-05-17 09:38:59 +00:00
mode = 'timeline' + mode
2013-03-23 14:52:54 +00:00
timelines = ox.sorted_strings(filter(lambda t: t!= '%s%s%sp.jpg'%(prefix, mode, height),
2012-05-17 09:38:59 +00:00
glob("%s%s%sp*.jpg"%(prefix, mode, height))))
2011-10-21 18:12:09 +00:00
for image in timelines:
2011-09-28 00:29:40 +00:00
start_offset = 0
2011-11-07 11:31:20 +00:00
if start and frames + 1500 <= start:
frames += 1500
2011-09-28 00:29:40 +00:00
continue
timeline = Image.open(image)
frames += timeline.size[0]
if start and frames > start > frames-timeline.size[0]:
2011-09-28 00:29:40 +00:00
start_offset = start - (frames-timeline.size[0])
box = (start_offset, 0, timeline.size[0], height)
timeline = timeline.crop(box)
if end and frames > end:
end_offset = timeline.size[0] - (frames - end)
box = (0, 0, end_offset, height)
timeline = timeline.crop(box)
p = np.asarray(timeline.convert('RGB'), dtype=np.float32)
2010-09-04 12:59:09 +00:00
p = np.sum(p, axis=0) / height #average color per frame
pixels.append(p)
2011-09-28 00:29:40 +00:00
if end and frames >= end:
break
if end:
frames = end - start
2011-11-07 11:09:38 +00:00
if frames:
for i in range(0, len(pixels)):
p = np.sum(pixels[i], axis=0) / frames
color += p
2011-01-25 15:14:25 +00:00
color = list(map(float, color))
return ox.image.getHSL(color)
2010-09-04 12:59:09 +00:00
2012-03-06 19:59:44 +00:00
2011-10-02 18:16:28 +00:00
def average_volume(prefix, start=0, end=0):
2012-05-17 09:38:59 +00:00
return average_color(prefix, start, end, 'audio')[2]
2011-01-01 11:44:42 +00:00
2012-03-06 19:59:44 +00:00
2010-09-04 12:59:09 +00:00
def get_distance(rgb0, rgb1):
2012-03-06 19:59:44 +00:00
# rgb distance, normalized so that black/white equals 1
2012-03-06 17:40:21 +00:00
dst = math.sqrt(pow(rgb0[0] - rgb1[0], 2) + pow(rgb0[1] - rgb1[1], 2) + pow(rgb0[2] - rgb1[2], 2))
2012-03-06 20:18:29 +00:00
return dst / MAX_DISTANCE
2010-09-04 12:59:09 +00:00
2011-01-01 11:44:42 +00:00
2010-09-04 12:59:09 +00:00
def cuts(prefix):
2012-05-17 09:38:59 +00:00
fname = os.path.join(prefix, 'cuts.json')
if not os.path.exists(fname):
return []
with open(fname) as f:
cuts = json.load(f)
2010-09-04 12:59:09 +00:00
return cuts
2011-01-01 11:44:42 +00:00
2010-09-08 13:38:44 +00:00
def divide(num, by):
# >>> divide(100, 3)
# [33, 33, 34]
arr = []
div = int(num / by)
mod = num % by
2010-09-08 17:14:01 +00:00
for i in range(int(by)):
2010-09-08 13:38:44 +00:00
arr.append(div + (i > by - 1 - mod))
return arr
2011-01-01 11:44:42 +00:00
2010-09-23 16:01:48 +00:00
def timeline_strip(item, cuts, info, prefix):
2010-09-08 13:38:44 +00:00
_debug = False
2011-01-01 11:44:42 +00:00
duration = info['duration']
2010-09-08 13:38:44 +00:00
video_height = info['video'][0]['height']
video_width = info['video'][0]['width']
video_ratio = video_width / video_height
line_image = []
timeline_height = 64
timeline_width = 1500
fps = 25
2010-09-08 17:14:01 +00:00
frames = int(duration * fps)
2010-09-08 13:38:44 +00:00
if cuts[0] != 0:
cuts.insert(0, 0)
cuts = map(lambda x: int(round(x * fps)), cuts)
for frame in range(frames):
i = int(frame / timeline_width)
x = frame % timeline_width
if x == 0:
timeline_width = min(timeline_width, frames - frame)
timeline_image = Image.new('RGB', (timeline_width, timeline_height))
if frame in cuts:
c = cuts.index(frame)
2010-09-08 17:14:01 +00:00
if c +1 < len(cuts):
duration = cuts[c + 1] - cuts[c]
2010-09-23 16:01:48 +00:00
frames = math.ceil(duration / (video_width * timeline_height / video_height))
widths = divide(duration, frames)
frame = frame
2010-09-08 13:38:44 +00:00
if _debug:
2010-09-23 16:01:48 +00:00
print widths, duration, frames, cuts[c], cuts[c + 1]
for s in range(int(frames)):
frame_ratio = widths[s] / timeline_height
if video_ratio > frame_ratio:
width = int(round(video_height * frame_ratio))
2010-09-08 17:14:01 +00:00
left = int((video_width - width) / 2)
box = (left, 0, left + width, video_height)
else:
2010-09-23 16:01:48 +00:00
height = int(round(video_width / frame_ratio))
2010-09-08 17:14:01 +00:00
top = int((video_height - height) / 2)
box = (0, top, video_width, top + height)
if _debug:
2010-09-23 16:01:48 +00:00
print frame, 'cut', c, 'frame', s, frame, 'width', widths[s], box
#FIXME: why does this have to be frame+1?
frame_image = Image.open(item.frame((frame+1)/fps))
2010-09-08 17:14:01 +00:00
frame_image = frame_image.crop(box).resize((widths[s], timeline_height), Image.ANTIALIAS)
for x_ in range(widths[s]):
line_image.append(frame_image.crop((x_, 0, x_ + 1, timeline_height)))
2010-09-23 16:01:48 +00:00
frame += widths[s]
2010-09-08 17:14:01 +00:00
if len(line_image) > frame:
timeline_image.paste(line_image[frame], (x, 0))
2010-09-08 13:38:44 +00:00
if x == timeline_width - 1:
2011-10-21 18:10:24 +00:00
timeline_file = '%sStrip64p%04d.png' % (prefix, i)
2010-09-08 13:38:44 +00:00
if _debug:
print 'writing', timeline_file
timeline_image.save(timeline_file)
2011-01-01 11:44:42 +00:00
def chop(video, start, end):
t = end - start
tmp = tempfile.mkdtemp()
ext = os.path.splitext(video)[1]
choped_video = '%s/tmp%s' % (tmp, ext)
cmd = [
'ffmpeg',
'-y',
'-i', video,
'-ss', '%.3f'%start,
2011-01-01 11:44:42 +00:00
'-t', '%.3f'%t,
'-vcodec', 'copy',
'-acodec', 'copy',
'-f', ext[1:],
choped_video
]
p = subprocess.Popen(cmd, stdin=subprocess.PIPE,
stdout=open('/dev/null', 'w'),
stderr=open('/dev/null', 'w'))
p.wait()
f = open(choped_video, 'r')
os.unlink(choped_video)
os.rmdir(tmp)
return f