python-ox/ox/file.py

# -*- coding: utf-8 -*-
# vi:si:et:sw=4:sts=4:ts=4
# GPL 2008
from __future__ import division, print_function
from glob import glob
import hashlib
import os
import re
import shutil
import sqlite3
import struct
import subprocess

from .utils import json

# Names exported by a star import of this module; the other helpers defined
# below stay reachable through explicit attribute access or import.
__all__ = ['sha1sum', 'oshash', 'avinfo', 'makedirs', 'iexists']

# Known file extensions grouped by media kind. Entries are lowercase and
# carry no leading dot; fix_coverart() below consults the 'audio' and
# 'image' lists.
EXTENSIONS = {
    'audio': [
        'aac', 'aif', 'aiff', 'amr',
        'flac', 'm4a', 'mp3', 'oga', 'ogg', 'wav', 'wma', 'opus',
        'ra',  # Real Audio
    ],
    'image': [
        'bmp', 'gif', 'jpeg', 'jpg', 'png', 'svg', 'webp'
    ],
    'subtitle': [
        'idx', 'srt', 'sub', 'vtt'
    ],
    'video': [
        '3gp',
        'avi', 'divx', 'dv', 'flv', 'm2t', 'm2ts', 'm2v', 'm4v', 'mkv', 'mov', 'mp4',
        'mpeg', 'mpg', 'mts', 'ogm', 'ogv', 'vob', 'webm', 'wmv', 'asf',
        'mod', 'tod',  # http://en.wikipedia.org/wiki/MOD_and_TOD
        'mxf', 'ts',
        'dat',  # VOD files
        'rm', 'rmvb',  # Real Media
    ],
}

def is_exe(fpath):
    """Tell whether ``fpath`` is a regular file the current user may execute.

    Returns False when the path does not name a regular file; otherwise
    returns the outcome of the ``os.X_OK`` access check.
    """
    if not os.path.isfile(fpath):
        return False
    return os.access(fpath, os.X_OK)

def which(program):
    """Locate an executable, similar to the shell's ``which``.

    If ``program`` contains a directory component it is checked as given.
    Otherwise every entry of the ``PATH`` environment variable is tried in
    order. Returns the first executable path found, or None.
    """
    if os.path.split(program)[0]:
        # explicit location: accept or reject it, never search PATH
        return program if is_exe(program) else None
    for directory in os.environ.get("PATH", "").split(os.pathsep):
        candidate = os.path.join(directory, program)
        if is_exe(candidate):
            return candidate
    return None

def cmd(program):
    """Return the command to run for ``program``.

    A file of that name under ``~/.ox/bin`` takes precedence; when no such
    file exists the bare program name is returned unchanged.
    """
    override = os.path.expanduser('~/.ox/bin/%s' % program)
    return override if os.path.exists(override) else program

def _get_file_cache():
    """Return the path of the sqlite database used by cache().

    The directory comes from ``ox.cache.cache_path()``; a leading ``fs:``
    prefix on that value is stripped before ``files.sqlite`` is appended.
    """
    # imported lazily, inside the function, exactly as before
    import ox.cache
    prefix = 'fs:'
    base = ox.cache.cache_path()
    if base.startswith(prefix):
        base = base[len(prefix):]
    return os.path.join(base, 'files.sqlite')

def cache(filename, type='oshash', update=False):
    """Return a cached per-file value, computing and storing it if needed.

    Values live in the sqlite database named by _get_file_cache(), keyed by
    path. A stored row is only trusted while the file's size and (integer)
    mtime still match the values recorded with it.

    filename -- path of the file to look up
    type     -- 'oshash', 'sha1' or 'info' (the parsed avinfo() dict)
    update   -- if true, ignore a stored value and recompute it

    Returns the hash string, or for 'info' the decoded dict.
    Raises ValueError if a value has to be computed for an unknown ``type``,
    and whatever os.stat() raises if the file is missing.
    """
    conn = sqlite3.connect(_get_file_cache(), timeout=10)
    # try/finally so the connection is released on every path, including the
    # early return below and errors such as a missing file
    try:
        conn.row_factory = sqlite3.Row

        if not cache.init:
            # create the schema once per process
            c = conn.cursor()
            c.execute('CREATE TABLE IF NOT EXISTS cache (path varchar(1024) unique, oshash varchar(16), sha1 varchar(42), size int, mtime int, info text)')
            c.execute('CREATE INDEX IF NOT EXISTS cache_oshash ON cache (oshash)')
            c.execute('CREATE INDEX IF NOT EXISTS cache_sha1 ON cache (sha1)')
            conn.commit()
            cache.init = True
        c = conn.cursor()
        c.execute('SELECT oshash, sha1, info, size, mtime FROM cache WHERE path = ?', (filename, ))
        stat = os.stat(filename)
        h = None
        sha1 = None
        info = ''
        for row in c:
            if stat.st_size == row['size'] and int(stat.st_mtime) == int(row['mtime']):
                if not update:
                    value = row[type]
                    if value:
                        if type == 'info':
                            value = json.loads(value)
                        return value
                # row is still valid: keep its other columns when rewriting it
                h = row['oshash']
                sha1 = row['sha1']
                info = row['info']
        if type == 'oshash':
            value = h = oshash(filename, cached=False)
        elif type == 'sha1':
            value = sha1 = sha1sum(filename, cached=False)
        elif type == 'info':
            value = avinfo(filename, cached=False)
            info = json.dumps(value)
            if not h:
                # avinfo() already computed (and cached) the oshash; carry it
                # over so the REPLACE below does not reset that column
                h = value.get('oshash')
        else:
            raise ValueError('unknown cache type: %r' % (type, ))
        t = (filename, h, sha1, stat.st_size, int(stat.st_mtime), info)
        with conn:
            sql = u'INSERT OR REPLACE INTO cache values (?, ?, ?, ?, ?, ?)'
            c.execute(sql, t)
        return value
    finally:
        conn.close()
cache.init = None

def cleanup_cache():
    """Drop cache rows whose file no longer exists, then VACUUM the database.

    Operates on the sqlite file named by _get_file_cache(). The connection
    is always closed, even if a statement fails.
    """
    conn = sqlite3.connect(_get_file_cache(), timeout=10)
    try:
        conn.row_factory = sqlite3.Row
        c = conn.cursor()
        c.execute('SELECT path FROM cache')
        # read all paths first so the cursor is free before deleting
        paths = [r[0] for r in c]
        missing = [(path, ) for path in paths if not os.path.exists(path)]
        if missing:
            c.executemany('DELETE FROM cache WHERE path = ?', missing)
        # the deletes are committed before VACUUM is issued
        conn.commit()
        c.execute('VACUUM')
        conn.commit()
    finally:
        conn.close()

def sha1sum(filename, cached=False):
    """Return the SHA-1 hex digest of the file at ``filename``.

    With ``cached`` true the value is looked up through cache() instead.
    The file is read in chunks of 128 hash blocks, so it is never held in
    memory as a whole.
    """
    if cached:
        return cache(filename, 'sha1')
    digest = hashlib.sha1()
    chunk_size = 128 * digest.block_size
    with open(filename, 'rb') as fd:
        while True:
            data = fd.read(chunk_size)
            if data == b'':
                break
            digest.update(data)
    return digest.hexdigest()

def oshash(filename, cached=True):
    """Return the 16-digit hex "os hash" of a file.

    Algorithm: http://trac.opensubtitles.org/projects/opensubtitles/wiki/HashSourceCodes
    The hash is the file size plus the sum of the first and the last 64 KiB,
    read as native ``long long`` words, truncated to 64 bits.

    Modification for files smaller than 64 KiB: only the whole words that
    fit into the file are summed (once); trailing bytes that do not fill a
    complete word are ignored.

    filename -- path of the file to hash
    cached   -- if true, go through cache() instead of reading the file

    Returns the hash as a string, or the literal string "IOError" if the
    file cannot be opened or read.
    """
    if cached:
        return cache(filename, 'oshash')
    longlongformat = 'q'  # long long
    bytesize = struct.calcsize(longlongformat)
    blocksize = 65536

    def words_sum(f, nbytes):
        # sum the whole words contained in the next nbytes bytes of f
        count = nbytes // bytesize
        if not count:
            return 0
        data = f.read(count * bytesize)
        return sum(struct.unpack('%d%s' % (count, longlongformat), data))

    try:
        # the with-block closes the file on every path, including errors
        with open(filename, "rb") as f:
            filesize = os.path.getsize(filename)
            total = filesize
            if filesize < blocksize:
                total += words_sum(f, filesize)
            else:
                total += words_sum(f, blocksize)
                f.seek(max(0, filesize - blocksize), 0)
                total += words_sum(f, blocksize)
    except IOError:
        return "IOError"
    # masking once at the end equals masking after every addition
    return "%016x" % (total & 0xFFFFFFFFFFFFFFFF)

def avinfo(filename, cached=True):
    """Return media information about ``filename`` as a dict.

    filename -- path of the file to inspect
    cached   -- if true, go through cache() instead of probing the file

    Empty files are not probed; they yield ``{'path': filename, 'size': 0}``.
    Raises EnvironmentError if no executable ffprobe can be found.
    """
    if cached:
        return cache(filename, 'info')
    if os.path.getsize(filename):
        # check the same binary ffprobe() will run: cmd() prefers a copy in
        # ~/.ox/bin, which a plain PATH lookup would miss
        if which(cmd('ffprobe')):
            return ffprobe(filename)
        raise EnvironmentError('could not find ffprobe. please install ffmpeg')
    return {'path': filename, 'size': 0}

def ffprobe(filename):
    """Run ffprobe on ``filename`` and return its output as a normalized dict.

    The result always contains 'path', 'size' and 'oshash'. If ffprobe
    reports no 'format' section the only other key is ``'error': 'badfile'``.
    Otherwise it also contains:

    duration, bitrate -- from the format section, when present
                         (bitrate is the reported bit_rate divided by 1000)
    metadata          -- format tags merged with stream tags (except
                         'language') and stream side data
    audio, video      -- lists of stream dicts with renamed keys
                         (codec, bitrate, id, framerate, samplerate, ...)
    subtitles         -- list of subtitle stream dicts, only if any exist
    chapters          -- list of {'in', 'out', 'value'} for titled chapters

    Video width/height (and display_aspect_ratio) are swapped when the
    metadata carries a quarter-turn rotation. fix_coverart() is applied to
    the result before it is returned.
    """
    p = subprocess.Popen([
        cmd('ffprobe'),
        '-show_format',
        '-show_chapters',
        '-show_streams',
        '-print_format',
        'json',
        '-i', filename
    ], stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    # stderr is piped and discarded; only the JSON on stdout is used
    stdout, _ = p.communicate()
    ffinfo = json.loads(stdout.decode('utf-8'))

    def fix_value(key, value):
        # convert ffprobe's string values into the types used in the result
        if key == 'r_frame_rate':
            value = value.replace('/', ':')
        elif key == 'bit_rate':
            value = float(value) / 1000
        elif key == 'duration':
            value = float(value)
        elif key == 'size':
            value = int(value)
        return value

    def swaps_dimensions(metadata):
        # rotation may show up under either key (stream tag or side data);
        # any odd multiple of 90 degrees (90, -90, 270, ...) swaps the axes
        for tag in ('rotate', 'rotation'):
            if tag in metadata and int(metadata[tag]) % 180 == 90:
                return True
        return False

    # ffprobe key -> key used in the returned dicts
    format_names = {
        'bit_rate': 'bitrate'
    }
    stream_names = {
        'codec_name': 'codec',
        'bit_rate': 'bitrate',
        'index': 'id',
        'r_frame_rate': 'framerate',
        'sample_rate': 'samplerate',
        'pix_fmt': 'pixel_format',
        'sample_aspect_ratio': 'pixel_aspect_ratio',
    }
    subtitle_names = {
        'codec_name': 'codec',
    }

    info = {}
    if 'format' not in ffinfo:
        info['error'] = 'badfile'
    else:
        container = ffinfo['format']
        for key in ('duration', 'size', 'bit_rate'):
            if key in container:
                info[format_names.get(key, key)] = fix_value(key, container[key])
        info['audio'] = []
        info['video'] = []
        info['metadata'] = container.get('tags', {})
        chapters = ffinfo.get('chapters', [])
        if chapters:
            # chapters without a title tag are dropped
            info['chapters'] = [
                {
                    'in': float(chapter['start_time']),
                    'out': float(chapter['end_time']),
                    'value': chapter.get('tags', {}).get('title')
                }
                for chapter in chapters if chapter.get('tags', {}).get('title')
            ]
        # a format section without streams is treated as "no streams"
        for s in ffinfo.get('streams', []):
            tags = s.pop('tags', {})
            side_data_list = s.pop('side_data_list', [])
            language = None
            for t in tags:
                if t == 'language':
                    language = tags[t]
                else:
                    info['metadata'][t] = tags[t]
            for side_data in side_data_list:
                for name, data in side_data.items():
                    info['metadata'][name] = data
            if s.get('codec_type') in ('audio', 'video'):
                stream = {}
                if language and language != 'und':
                    stream['language'] = language
                keys = [
                    'codec_name',
                    'width',
                    'height',
                    'bit_rate',
                    'index',
                    'display_aspect_ratio',
                    'sample_rate',
                    'channels',
                ]
                if s['codec_type'] == 'video':
                    keys += [
                        'sample_aspect_ratio',
                        'r_frame_rate',
                        'pix_fmt',
                    ]

                for key in keys:
                    if key in s:
                        stream[stream_names.get(key, key)] = fix_value(key, s[key])
                # r_frame_rate of 90000/1 is replaced by the average frame
                # rate and the stream is flagged accordingly
                if 'avg_frame_rate' in s and stream.get('framerate') == "90000:1":
                    stream['framerate'] = fix_value('r_frame_rate', s['avg_frame_rate'])
                    stream['force_framerate'] = True
                info[s['codec_type']].append(stream)
            elif s.get('codec_type') == 'subtitle':
                info['subtitles'] = info.get('subtitles', [])
                stream = {}
                if language and language != 'und':
                    stream['language'] = language
                for key in (
                    'codec_name',
                    'language',
                    'width',
                    'height',
                ):
                    if key in s:
                        stream[subtitle_names.get(key, key)] = s[key]
                info['subtitles'].append(stream)
            # streams of any other codec_type are ignored
        for v in info['video']:
            k = 'display_aspect_ratio'
            # streams lacking width/height can neither be rotated nor get a
            # computed aspect ratio
            has_size = 'width' in v and 'height' in v
            if has_size and swaps_dimensions(info['metadata']):
                v['width'], v['height'] = v['height'], v['width']
                if k in v:
                    v[k] = ':'.join(reversed(v[k].split(':')))
            if has_size and (k not in v or v[k] == '0:1'):
                # no usable aspect ratio reported: derive it from the size
                v[k] = '%d:%d' % (v['width'], v['height'])
                v['pixel_aspect_ratio'] = '1:1'
    info['oshash'] = oshash(filename)
    info['path'] = filename
    if 'size' not in info:
        info['size'] = os.path.getsize(filename)

    fix_coverart(info)
    return info

def fix_coverart(info):
    """Move embedded cover art of audio files from 'video' to 'cover'.

    If ``info['path']`` has an audio extension (compared case-insensitively)
    and the first video stream's codec is an image codec or 'mjpeg', the
    whole 'video' list is moved to ``info['cover']`` and 'video' is reset to
    an empty list. ``info`` is modified in place and also returned.
    """
    video = info.get('video')
    if video:
        extension = info['path'].split('.')[-1].lower()
        # a stream without a codec entry is simply not treated as cover art
        codec = video[0].get('codec')
        if extension in EXTENSIONS['audio'] \
                and codec in EXTENSIONS['image'] + ['mjpeg']:
            info['cover'] = info.pop('video')
            info['video'] = []
    return info

def makedirs(path):
    """Create ``path`` and any missing parents; do nothing if it exists.

    An "already exists" error raised by os.makedirs (the path appeared
    between the check and the call) is ignored; any other OSError is
    re-raised.
    """
    import errno
    if not os.path.exists(path):
        try:
            os.makedirs(path)
        except OSError as e:
            if e.errno != errno.EEXIST:
                raise

def copy_file(source, target, verbose=False):
    """Copy the contents of ``source`` to ``target``.

    The directory that will hold ``target`` is created first if needed.
    With ``verbose`` true a progress line is printed before copying.
    """
    if verbose:
        print('copying', source, 'to', target)
    # make sure the destination folder is there before shutil writes into it
    write_path(target)
    shutil.copyfile(source, target)

def read_file(file, verbose=False):
    """Return the complete contents of ``file`` as bytes.

    With ``verbose`` true a progress line is printed first.
    """
    if verbose:
        print('reading', file)
    # the with-block closes the handle even if read() fails
    with open(file, 'rb') as f:
        return f.read()

def read_json(file, verbose=False):
    """Parse ``file`` as JSON and return the decoded object.

    The file is opened in text mode and handed to ``json.load`` directly.
    With ``verbose`` true a progress line is printed first.
    """
    if verbose:
        print('reading', file)
    with open(file) as fd:
        return json.load(fd)

def write_file(file, data, verbose=False):
    """Write ``data`` to ``file`` and return the number of bytes written.

    Data that is not already ``bytes`` is encoded as UTF-8. The parent
    directory is created if needed. With ``verbose`` true a progress line
    is printed first.
    """
    if verbose:
        print('writing', file)
    if not isinstance(data, bytes):
        data = data.encode('utf-8')
    write_path(file)
    # the with-block closes the handle even if write() fails
    with open(file, 'wb') as f:
        f.write(data)
    return len(data)

def write_image(file, image, verbose=False):
    """Save ``image`` to ``file`` by calling ``image.save(file)``.

    The parent directory is created first if needed. With ``verbose`` true
    a progress line is printed before anything is written.
    """
    if verbose:
        print('writing', file)
    # the target folder has to exist before the image object writes to it
    write_path(file)
    image.save(file)

def write_json(file, data, ensure_ascii=True, indent=0, sort_keys=False, verbose=False):
    """Serialize ``data`` as JSON and write it to ``file`` via write_file().

    ``ensure_ascii``, ``indent`` and ``sort_keys`` are passed to
    ``json.dumps``. When ``ensure_ascii`` is false the serialized text is
    encoded as UTF-8 here, before it is handed on.
    """
    serialized = json.dumps(data, ensure_ascii=ensure_ascii, indent=indent, sort_keys=sort_keys)
    if not ensure_ascii:
        serialized = serialized.encode('utf-8')
    write_file(file, serialized, verbose=verbose)

def write_link(source, target, verbose=False):
    """Create a symlink at ``target`` pointing to ``source``.

    The parent directory of ``target`` is created if needed and anything
    already present at ``target`` is unlinked first. With ``verbose`` true
    a progress line is printed.
    """
    if verbose:
        print('linking', source, 'to', target)
    write_path(target)
    # lexists, not exists: a dangling symlink at target must be removed too,
    # otherwise os.symlink fails because the name is taken
    if os.path.lexists(target):
        os.unlink(target)
    os.symlink(source, target)

def write_path(file):
    """Make sure the directory that will contain ``file`` exists.

    Nothing happens when ``file`` has no directory component or the
    directory is already there.
    """
    path = os.path.split(file)[0]
    if path and not os.path.exists(path):
        try:
            os.makedirs(path)
        except OSError:
            # like makedirs() in this module: tolerate the directory having
            # been created between the check and the call
            if not os.path.isdir(path):
                raise

def iexists(path):
    """Case-insensitive existence check for the last component of ``path``.

    Only the final name is compared case-insensitively; the containing
    folder is used as given ('.' when ``path`` has no folder part).
    Returns False if that folder does not exist or is not a directory.
    """
    folder, name = os.path.split(path)
    try:
        entries = os.listdir(folder or '.')
    except (FileNotFoundError, NotADirectoryError):
        return False
    # listdir already yields bare names, so they can be compared directly
    return name.lower() in {entry.lower() for entry in entries}
add some functions 2008-04-27 16:54:37 +00:00			`# -- coding: utf-8 --`
vi:si:et:sw=4:sts=4:ts=4 2008-06-19 09:21:21 +00:00			`# vi:si:et:sw=4:sts=4:ts=4`
move and rename some 2008-07-06 13:00:06 +00:00			`# GPL 2008`
remove with_statement(for 2.5) from __future__ 2016-08-23 16:12:46 +00:00			`from __future__ import division, print_function`
iexists 2017-01-07 11:11:05 +00:00			`from glob import glob`
use hashlib instead of sha 2009-03-16 17:15:14 +00:00			`import hashlib`
iexists 2017-01-07 11:11:05 +00:00			`import os`
work around ffmpeg2theora problems with some metadata output 2010-11-15 16:35:07 +00:00			`import re`
saner copyfile method (that works for files > max python str len) 2012-12-26 20:26:43 +00:00			`import shutil`
iexists 2017-01-07 11:11:05 +00:00			`import sqlite3`
deal with files < 64k in oshash 2009-06-14 19:22:47 +00:00			`import struct`
avinfo, get info about file 2009-08-07 11:35:28 +00:00			`import subprocess`

use six to support python 2 and 3 2014-09-30 19:04:46 +00:00			`from .utils import json`
add oshash 2009-05-28 17:00:30 +00:00
iexists 2017-01-07 11:11:05 +00:00			`__all__ = ['sha1sum', 'oshash', 'avinfo', 'makedirs', 'iexists']`
add some functions 2008-04-27 16:54:37 +00:00
move EXTENSIONS to ox.file and add image type 2013-10-14 18:07:05 +00:00			`EXTENSIONS = {`
			`'audio': [`
add amr 2016-08-06 11:17:10 +00:00			`'aac', 'aif', 'aiff', 'amr',`
detect add real media files 2021-11-14 13:35:26 +00:00			`'flac', 'm4a', 'mp3', 'oga', 'ogg', 'wav', 'wma', 'opus',`
			`'ra', # Real Audio`
move EXTENSIONS to ox.file and add image type 2013-10-14 18:07:05 +00:00			`],`
			`'image': [`
			`'bmp', 'gif', 'jpeg', 'jpg', 'png', 'svg', 'webp'`
			`],`
			`'subtitle': [`
add vtt as subtitle extension 2016-07-01 16:02:42 +00:00			`'idx', 'srt', 'sub', 'vtt'`
move EXTENSIONS to ox.file and add image type 2013-10-14 18:07:05 +00:00			`],`
			`'video': [`
			`'3gp',`
add m2v 2021-09-22 16:56:25 +00:00			`'avi', 'divx', 'dv', 'flv', 'm2t', 'm2ts', 'm2v', 'm4v', 'mkv', 'mov', 'mp4',`
split real media 2022-01-01 13:31:33 +00:00			`'mpeg', 'mpg', 'mts', 'ogm', 'ogv', 'vob', 'webm', 'wmv', 'asf',`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`'mod', 'tod', # http://en.wikipedia.org/wiki/MOD_and_TOD`
support dat 2021-02-23 08:09:35 +00:00			`'mxf', 'ts',`
			`'dat', # VOD files`
split real media 2022-01-01 13:31:33 +00:00			`'rm', 'rmvb', # Real Media`
move EXTENSIONS to ox.file and add image type 2013-10-14 18:07:05 +00:00			`],`
			`}`
add cache for file functions: oshash/sha1sum/avinfo 2012-08-21 07:35:37 +00:00
avoid distutils, no longer in python 3.12 2024-08-29 18:22:37 +00:00			`def is_exe(fpath):`
			`return os.path.isfile(fpath) and os.access(fpath, os.X_OK)`

			`def which(program):`
			`fpath, fname = os.path.split(program)`
			`if fpath:`
			`if is_exe(program):`
			`return program`
			`else:`
			`for path in os.environ.get("PATH", "").split(os.pathsep):`
			`exe_file = os.path.join(path, program)`
			`if is_exe(exe_file):`
			`return exe_file`
			`return None`

add ffprobe wrapper 2012-06-11 10:11:06 +00:00			`def cmd(program):`
			`local = os.path.expanduser('~/.ox/bin/%s' % program)`
			`if os.path.exists(local):`
			`program = local`
			`return program`

add cache for file functions: oshash/sha1sum/avinfo 2012-08-21 07:35:37 +00:00			`def _get_file_cache():`
			`import ox.cache`
work around thread issues with ox.cache 2014-05-17 09:25:19 +00:00			`path = ox.cache.cache_path()`
			`if path.startswith('fs:'):`
			`path = path[3:]`
			`return os.path.join(path, 'files.sqlite')`
add cache for file functions: oshash/sha1sum/avinfo 2012-08-21 07:35:37 +00:00
force cache update 2015-05-23 19:44:37 +00:00			`def cache(filename, type='oshash', update=False):`
add cache for file functions: oshash/sha1sum/avinfo 2012-08-21 07:35:37 +00:00			`conn = sqlite3.connect(_get_file_cache(), timeout=10)`
			`conn.row_factory = sqlite3.Row`

			`if not cache.init:`
			`c = conn.cursor()`
			`c.execute('CREATE TABLE IF NOT EXISTS cache (path varchar(1024) unique, oshash varchar(16), sha1 varchar(42), size int, mtime int, info text)')`
			`c.execute('CREATE INDEX IF NOT EXISTS cache_oshash ON cache (oshash)')`
			`c.execute('CREATE INDEX IF NOT EXISTS cache_sha1 ON cache (sha1)')`
			`conn.commit()`
			`cache.init = True`
			`c = conn.cursor()`
			`c.execute('SELECT oshash, sha1, info, size, mtime FROM cache WHERE path = ?', (filename, ))`
			`stat = os.stat(filename)`
			`row = None`
			`h = None`
			`sha1 = None`
			`info = ''`
			`for row in c:`
			`if stat.st_size == row['size'] and int(stat.st_mtime) == int(row['mtime']):`
force cache update 2015-05-23 19:44:37 +00:00			`if not update:`
			`value = row[type]`
			`if value:`
			`if type == 'info':`
			`value = json.loads(value)`
			`return value`
add cache for file functions: oshash/sha1sum/avinfo 2012-08-21 07:35:37 +00:00			`h = row['oshash']`
			`sha1 = row['sha1']`
			`info = row['info']`
			`if type == 'oshash':`
			`value = h = oshash(filename, cached=False)`
			`elif type == 'sha1':`
			`value = sha1 = sha1sum(filename, cached=False)`
			`elif type == 'info':`
			`value = avinfo(filename, cached=False)`
			`info = json.dumps(value)`
			`t = (filename, h, sha1, stat.st_size, int(stat.st_mtime), info)`
			`with conn:`
			`sql = u'INSERT OR REPLACE INTO cache values (?, ?, ?, ?, ?, ?)'`
			`c.execute(sql, t)`
			`return value`
			`cache.init = None`

			`def cleanup_cache():`
			`conn = sqlite3.connect(_get_file_cache(), timeout=10)`
			`conn.row_factory = sqlite3.Row`
			`c = conn.cursor()`
			`c.execute('SELECT path FROM cache')`
			`paths = [r[0] for r in c]`
			`for path in paths:`
			`if not os.path.exists(path):`
			`c.execute('DELETE FROM cache WHERE path = ?', (path, ))`
			`conn.commit()`
			`c.execute('VACUUM')`
			`conn.commit()`

			`def sha1sum(filename, cached=False):`
			`if cached:`
			`return cache(filename, 'sha1')`
use hashlib instead of sha 2009-03-16 17:15:14 +00:00			`sha1 = hashlib.sha1()`
fix ox.file 2014-09-30 19:30:25 +00:00			`with open(filename, 'rb') as f:`
			`for chunk in iter(lambda: f.read(128*sha1.block_size), b''):`
use iter to read file with a multiple of hash block_size(sha1sum) 2013-10-14 10:35:07 +00:00			`sha1.update(chunk)`
vi:si:et:sw=4:sts=4:ts=4 2008-06-19 09:21:21 +00:00			`return sha1.hexdigest()`
add some functions 2008-04-27 16:54:37 +00:00
add oshash 2009-05-28 17:00:30 +00:00			`'''`
			`os hash - http://trac.opensubtitles.org/projects/opensubtitles/wiki/HashSourceCodes`
deal with files < 64k in oshash 2009-06-14 19:22:47 +00:00			`plus modification for files < 64k, buffer is filled with file data and padded with 0`
add oshash 2009-05-28 17:00:30 +00:00			`'''`
add cache for file functions: oshash/sha1sum/avinfo 2012-08-21 07:35:37 +00:00			`def oshash(filename, cached=True):`
			`if cached:`
			`return cache(filename, 'oshash')`
deal with files < 64k in oshash 2009-06-14 19:22:47 +00:00			`try:`
			`longlongformat = 'q' # long long`
			`bytesize = struct.calcsize(longlongformat)`
add oshash 2009-05-28 17:00:30 +00:00
deal with files < 64k in oshash 2009-06-14 19:22:47 +00:00			`f = open(filename, "rb")`

			`filesize = os.path.getsize(filename)`
			`hash = filesize`
			`if filesize < 65536:`
			`for x in range(int(filesize/bytesize)):`
			`buffer = f.read(bytesize)`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`(l_value,) = struct.unpack(longlongformat, buffer)`
deal with files < 64k in oshash 2009-06-14 19:22:47 +00:00			`hash += l_value`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`hash = hash & 0xFFFFFFFFFFFFFFFF # to remain as 64bit number`
deal with files < 64k in oshash 2009-06-14 19:22:47 +00:00			`else:`
			`for x in range(int(65536/bytesize)):`
			`buffer = f.read(bytesize)`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`(l_value,) = struct.unpack(longlongformat, buffer)`
deal with files < 64k in oshash 2009-06-14 19:22:47 +00:00			`hash += l_value`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`hash = hash & 0xFFFFFFFFFFFFFFFF # to remain as 64bit number`
			`f.seek(max(0, filesize-65536), 0)`
deal with files < 64k in oshash 2009-06-14 19:22:47 +00:00			`for x in range(int(65536/bytesize)):`
			`buffer = f.read(bytesize)`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`(l_value,) = struct.unpack(longlongformat, buffer)`
deal with files < 64k in oshash 2009-06-14 19:22:47 +00:00			`hash += l_value`
			`hash = hash & 0xFFFFFFFFFFFFFFFF`
			`f.close()`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`returnedhash = "%016x" % hash`
deal with files < 64k in oshash 2009-06-14 19:22:47 +00:00			`return returnedhash`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`except IOError:`
add oshash 2009-05-28 17:00:30 +00:00			`return "IOError"`
add some functions 2008-04-27 16:54:37 +00:00
add cache for file functions: oshash/sha1sum/avinfo 2012-08-21 07:35:37 +00:00			`def avinfo(filename, cached=True):`
			`if cached:`
			`return cache(filename, 'info')`
avinfo should not fail for emptpy files 2010-02-27 11:47:13 +00:00			`if os.path.getsize(filename):`
avoid distutils, no longer in python 3.12 2024-08-29 18:22:37 +00:00			`if which('ffprobe'):`
use ffprobe in avinfo if installed 2015-01-03 09:58:21 +00:00			`return ffprobe(filename)`
don't fall back to ffmpeg2theora 2019-12-21 18:29:44 +00:00			`raise EnvironmentError('could to find ffprobe. please install ffmpeg')`
avinfo should not fail for emptpy files 2010-02-27 11:47:13 +00:00			`return {'path': filename, 'size': 0}`
ox.makedirs 2011-04-06 13:24:32 +00:00
add ffprobe wrapper 2012-06-11 10:11:06 +00:00			`def ffprobe(filename):`
			`p = subprocess.Popen([`
			`cmd('ffprobe'),`
			`'-show_format',`
include chapters in avinfo 2016-06-16 13:55:12 +00:00			`'-show_chapters',`
add ffprobe wrapper 2012-06-11 10:11:06 +00:00			`'-show_streams',`
			`'-print_format',`
			`'json',`
			`'-i', filename`

			`], stdout=subprocess.PIPE, stderr=subprocess.PIPE)`
			`info, error = p.communicate()`
decode stdout 2016-08-23 16:11:20 +00:00			`info = info.decode('utf-8')`
add ffprobe wrapper 2012-06-11 10:11:06 +00:00			`ffinfo = json.loads(info)`

			`def fix_value(key, value):`
			`if key == 'r_frame_rate':`
			`value = value.replace('/', ':')`
			`elif key == 'bit_rate':`
			`value = float(value) / 1000`
			`elif key == 'duration':`
			`value = float(value)`
			`elif key == 'size':`
			`value = int(value)`
			`return value`

			`info = {}`
iexists 2017-01-07 11:11:05 +00:00			`if 'format' not in ffinfo:`
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`info['error'] = 'badfile'`
			`else:`
			`for key in ('duration', 'size', 'bit_rate'):`
dont fail if files dont have all format keys 2015-01-22 10:01:36 +00:00			`if key in ffinfo['format']:`
			`info[{`
			`'bit_rate': 'bitrate'`
			`}.get(key, key)] = fix_value(key, ffinfo['format'][key])`
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`info['audio'] = []`
			`info['video'] = []`
			`info['metadata'] = ffinfo['format'].get('tags', {})`
include chapters in avinfo 2016-06-16 13:55:12 +00:00			`chapters = ffinfo.get('chapters', [])`
			`if chapters:`
			`info['chapters'] = [`
			`{`
			`'in': float(chapter['start_time']),`
			`'out': float(chapter['end_time']),`
			`'value': chapter.get('tags', {}).get('title')`
			`}`
			`for chapter in chapters if chapter.get('tags', {}).get('title')`
			`]`
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`for s in ffinfo['streams']:`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`tags = s.pop('tags', {})`
the many ways of tagging video rotation 2023-08-25 10:13:01 +00:00			`side_data_list = s.pop('side_data_list', [])`
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`language = None`
			`for t in tags:`
			`if t == 'language':`
			`language = tags[t]`
			`else:`
			`info['metadata'][t] = tags[t]`
the many ways of tagging video rotation 2023-08-25 10:13:01 +00:00			`for kv in side_data_list:`
			`for k, v in kv.items():`
			`info['metadata'][k] = v`
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`if s.get('codec_type') in ('audio', 'video'):`
			`stream = {}`
			`if language and language != 'und':`
			`stream['language'] = language`
			`keys = [`
			`'codec_name',`
			`'width',`
			`'height',`
			`'bit_rate',`
			`'index',`
			`'display_aspect_ratio',`
			`'sample_rate',`
			`'channels',`
add ffprobe wrapper 2012-06-11 10:11:06 +00:00			`]`
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`if s['codec_type'] == 'video':`
			`keys += [`
			`'sample_aspect_ratio',`
			`'r_frame_rate',`
			`'pix_fmt',`
			`]`
add ffprobe wrapper 2012-06-11 10:11:06 +00:00
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`for key in keys:`
			`if key in s:`
			`stream[{`
			`'codec_name': 'codec',`
			`'bit_rate': 'bitrate',`
			`'index': 'id',`
			`'r_frame_rate': 'framerate',`
			`'sample_rate': 'samplerate',`
			`'pix_fmt': 'pixel_format',`
			`'sample_aspect_ratio': 'pixel_aspect_ratio',`
			`}.get(key, key)] = fix_value(key, s[key])`
use avg_frame_rate if video is 90k 2024-06-08 10:22:25 +00:00			`if 'avg_frame_rate' in s and stream.get('framerate') == "90000:1":`
			`stream['framerate'] = fix_value('r_frame_rate', s['avg_frame_rate'])`
add force_framerate flag 2024-06-08 10:37:47 +00:00			`stream['force_framerate'] = True`
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`info[s['codec_type']].append(stream)`
load subtitle info 2019-08-01 14:28:00 +00:00			`elif s.get('codec_type') == 'subtitle':`
			`info['subtitles'] = info.get('subtitles', [])`
			`stream = {}`
fix subtitle language 2019-08-01 18:54:04 +00:00			`if language and language != 'und':`
			`stream['language'] = language`
load subtitle info 2019-08-01 14:28:00 +00:00			`for key in (`
fix subtitle language 2019-08-01 18:54:04 +00:00			`'codec_name',`
			`'language',`
			`'width',`
			`'height',`
load subtitle info 2019-08-01 14:28:00 +00:00			`):`
			`if key in s:`
			`stream[{`
			`'codec_name': 'codec',`
			`}.get(key, key)] = s[key]`
			`info['subtitles'].append(stream)`
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`else:`
			`pass`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`# print s`
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`for v in info['video']:`
fix aspect ratio 2022-10-22 09:50:46 +00:00			`k = 'display_aspect_ratio'`
180/-180 rotation does not change width/height 2023-07-06 11:37:11 +00:00			`if 'rotate' in info.get('metadata', {}) and int(info['metadata']['rotate']) in (-90, 90):`
rotate width/height 2017-01-07 11:11:21 +00:00			`v['width'], v['height'] = v['height'], v['width']`
fix aspect ratio 2022-10-22 09:50:46 +00:00			`if k in v:`
			`v[k] = ':'.join(reversed(v[k].split(':')))`
the many ways of tagging video rotation 2023-08-25 10:13:01 +00:00			`elif 'rotation' in info.get('metadata', {}) and int(info['metadata']['rotation']) in (-90, 90):`
			`v['width'], v['height'] = v['height'], v['width']`
			`if k in v:`
			`v[k] = ':'.join(reversed(v[k].split(':')))`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`if k not in v and 'width' in v \`
dont throw exception for invalid files 2014-12-24 22:18:29 +00:00			`or (k in v and v[k] == '0:1'):`
			`v[k] = '%d:%d' % (v['width'], v['height'])`
			`v['pixel_aspect_ratio'] = '1:1'`
use iter to read file with a multiple of hash block_size(sha1sum) 2013-10-14 10:35:07 +00:00			`info['oshash'] = oshash(filename)`
fix ox.ffprobe output to match ox.avinfo 2014-12-19 11:57:38 +00:00			`info['path'] = filename`
cleanup pylint errors and py2/3 issues 2016-06-08 13:32:46 +00:00			`if 'size' not in info:`
include size for unknown formats 2015-04-24 14:09:31 +00:00			`info['size'] = os.path.getsize(filename)`
dont treat coverart as video 2017-05-21 09:19:43 +00:00
			`fix_coverart(info)`
			`return info`

			`def fix_coverart(info):`
			`if info.get('video') \`
			`and info['path'].split('.')[-1] in EXTENSIONS['audio'] \`
			`and info['video'][0]['codec'] in EXTENSIONS['image'] + ['mjpeg']:`
			`info['cover'] = info.pop('video')`
			`info['video'] = []`
add ffprobe wrapper 2012-06-11 10:11:06 +00:00			`return info`

ox.makedirs 2011-04-06 13:24:32 +00:00			`def makedirs(path):`
			`if not os.path.exists(path):`
			`try:`
			`os.makedirs(path)`
use six to support python 2 and 3 2014-09-30 19:04:46 +00:00			`except OSError as e:`
ox.makedirs 2011-04-06 13:24:32 +00:00			`if e.errno != 17:`
			`raise`
update file module, add get_sort_name and get_sort_title to text module 2011-10-11 14:14:29 +00:00
			`def copy_file(source, target, verbose=False):`
			`if verbose:`
use six to support python 2 and 3 2014-09-30 19:04:46 +00:00			`print('copying', source, 'to', target)`
saner copyfile method (that works for files > max python str len) 2012-12-26 20:26:43 +00:00			`write_path(target)`
			`shutil.copyfile(source, target)`
update file module, add get_sort_name and get_sort_title to text module 2011-10-11 14:14:29 +00:00
			`def read_file(file, verbose=False):`
			`if verbose:`
use six to support python 2 and 3 2014-09-30 19:04:46 +00:00			`print('reading', file)`
better performances of ox.js.minify 2014-09-30 21:19:19 +00:00			`f = open(file, 'rb')`
update file module, add get_sort_name and get_sort_title to text module 2011-10-11 14:14:29 +00:00			`data = f.read()`
			`f.close()`
			`return data`

			`def read_json(file, verbose=False):`
no need to load json string into ram 2013-11-15 15:16:21 +00:00			`if verbose:`
use six to support python 2 and 3 2014-09-30 19:04:46 +00:00			`print('reading', file)`
no need to load json string into ram 2013-11-15 15:16:21 +00:00			`with open(file) as fd:`
			`data = json.load(fd)`
			`return data`
update file module, add get_sort_name and get_sort_title to text module 2011-10-11 14:14:29 +00:00
			`def write_file(file, data, verbose=False):`
			`if verbose:`
use six to support python 2 and 3 2014-09-30 19:04:46 +00:00			`print('writing', file)`
better performances of ox.js.minify 2014-09-30 21:19:19 +00:00			`if not isinstance(data, bytes):`
			`data = data.encode('utf-8')`
update file module, add get_sort_name and get_sort_title to text module 2011-10-11 14:14:29 +00:00			`write_path(file)`
better performances of ox.js.minify 2014-09-30 21:19:19 +00:00			`f = open(file, 'wb')`
update file module, add get_sort_name and get_sort_title to text module 2011-10-11 14:14:29 +00:00			`f.write(data)`
			`f.close()`
			`return len(data)`

ox.file: add ensure_ascii parameter to write_json; add write_image method (write_path + image.save) 2013-06-09 14:45:26 +00:00			`def write_image(file, image, verbose=False):`
			`if verbose:`
use six to support python 2 and 3 2014-09-30 19:04:46 +00:00			`print('writing', file)`
ox.file: add ensure_ascii parameter to write_json; add write_image method (write_path + image.save) 2013-06-09 14:45:26 +00:00			`write_path(file)`
			`image.save(file)`

			`def write_json(file, data, ensure_ascii=True, indent=0, sort_keys=False, verbose=False):`
			`data = json.dumps(data, ensure_ascii=ensure_ascii, indent=indent, sort_keys=sort_keys)`
			`write_file(file, data if ensure_ascii else data.encode('utf-8'), verbose=verbose)`
update file module, add get_sort_name and get_sort_title to text module 2011-10-11 14:14:29 +00:00
			`def write_link(source, target, verbose=False):`
			`if verbose:`
use six to support python 2 and 3 2014-09-30 19:04:46 +00:00			`print('linking', source, 'to', target)`
update file module, add get_sort_name and get_sort_title to text module 2011-10-11 14:14:29 +00:00			`write_path(target)`
			`if os.path.exists(target):`
			`os.unlink(target)`
			`os.symlink(source, target)`

			`def write_path(file):`
			`path = os.path.split(file)[0]`
			`if path and not os.path.exists(path):`
			`os.makedirs(path)`
iexists 2017-01-07 11:11:05 +00:00
			`def iexists(path):`
			`parts = path.split(os.sep)`
			`name = parts[-1].lower()`
			`if len(parts) == 1:`
			`folder = '.'`
			`else:`
			`folder = os.path.dirname(path)`
folder might not exist 2017-06-14 11:00:44 +00:00			`try:`
			`files = os.listdir(folder)`
			`except FileNotFoundError:`
			`return False`
iexists 2017-01-07 11:11:05 +00:00			`files = {os.path.basename(f).lower() for f in files}`
			`return name in files`