pandora_t_for_time/management/commands/generate_clips.py

import json
import os
import re
from collections import defaultdict

from django.core.management.base import BaseCommand
from django.conf import settings

import item.models
import itemlist.models

from ...render import get_srt


def resolve_roman(s):
    """Replace a roman-numeral suffix after leading digits with arabic digits.

    ``s`` is expected to look like ``<digits><suffix>``. When the suffix,
    compared case-insensitively, is one of the roman numerals i..x, it is
    replaced by its decimal value (``'3iv'`` -> ``'34'``). Any other input,
    including strings that do not start with a digit, is returned unchanged.
    """
    match = re.match(r'^(\d+)(.*?)$', s)
    if not match:
        return s
    roman = {
        'i': '1', 'ii': '2', 'iii': '3', 'iv': '4', 'v': '5',
        'vi': '6', 'vii': '7', 'viii': '8', 'ix': '9', 'x': '10',
    }
    new = roman.get(match.group(2).lower())
    if new is None:
        return s
    # Splice by position instead of str.replace so that upper-case numerals
    # are substituted too and nothing outside the suffix can be touched.
    return s[:match.start(2)] + new + s[match.end(2):]

def format_duration(duration, fps):
    """Snap ``duration`` to the nearest whole frame at ``fps``.

    The duration is converted to a rounded frame count, converted back to
    seconds, and finally limited to five decimal places.
    """
    frame_count = round(duration * fps)
    snapped = frame_count / fps
    return float('%0.5f' % snapped)


class Command(BaseCommand):
    """Build the symlink tree plus ``clips.json`` / ``voice_over.json``.

    For every item whose sort type is ``original`` and that shares its title
    with at least one other item, the selected file of each same-titled item
    is symlinked to ``<prefix>/<type>/<title><ext>`` and a clip record is
    collected. Voice-over items are symlinked to
    ``<prefix>/voice_over/<batch>/<fragment_id>.wav`` and recorded together
    with their subtitles.
    """
    help = 'generate symlinks to clips and clips.json'

    def add_arguments(self, parser):
        """Register the ``--lang`` and ``--prefix`` command line options."""
        parser.add_argument('--lang', action='store', dest='lang', default=None, help='subtitle language')
        parser.add_argument('--prefix', action='store', dest='prefix', default="/srv/t_for_time", help='prefix to build clips in')

    def handle(self, **options):
        """Create the symlinks and write both JSON files below the prefix.

        ``--lang`` may be a comma separated list: the first entry selects the
        subtitle annotations, the remaining entries are handed to ``get_srt``.
        """
        prefix = options['prefix']
        lang = options["lang"]
        if lang:
            lang = lang.split(',')
            tlang = lang[1:]
            lang = lang[0]
        else:
            tlang = None
        # "en" is queried as languages=None.
        # NOTE(review): presumably English subtitles carry no language value
        # -- confirm against the annotation model.
        if lang == "en":
            lang = None

        clips = self._collect_clips(prefix)
        # ensure_ascii=False emits non-ASCII characters verbatim, so the file
        # encoding must not depend on the process locale.
        with open(os.path.join(prefix, 'clips.json'), 'w', encoding='utf-8') as fd:
            json.dump(clips, fd, indent=2, ensure_ascii=False)

        print("using", len(clips), "clips")

        voice_over = self._collect_voice_over(prefix, lang, tlang)
        with open(os.path.join(prefix, 'voice_over.json'), 'w', encoding='utf-8') as fd:
            json.dump(voice_over, fd, indent=2, ensure_ascii=False)

    @staticmethod
    def _replace_symlink(source, target):
        """Point ``target`` at ``source``, replacing an existing symlink."""
        os.makedirs(os.path.dirname(target), exist_ok=True)
        # islink (not exists) so that dangling links are replaced as well.
        if os.path.islink(target):
            os.unlink(target)
        os.symlink(source, target)

    @staticmethod
    def _parse_seqid(name):
        """Derive the integer sequence id from an original clip file name.

        The first two ``_``-separated parts of the (normalised) name are used.
        A part starting with ``B`` or ``S`` contributes the text after that
        letter, any other part contributes ``0``. The second part is reduced
        to its digits after roman numerals are resolved. Both parts are
        zero-padded to six digits and concatenated.

        Any failure is reported together with the offending name and then
        re-raised.
        """
        seqid = re.sub(r"Hotel Aporia_(\d+)", r"S\1_", name)
        seqid = re.sub(r"Night March_(\d+)", r"S\1_", seqid)
        seqid = re.sub(r"_(\d+)H_(\d+)", r"_S\1\2_", seqid)
        parts = seqid.split('_')[:2]
        # p[:1] instead of p[0]: an empty part must not raise IndexError.
        parts = [p[1:] if p[:1] in ('B', 'S') else '0' for p in parts]
        try:
            parts[1] = resolve_roman(parts[1])
            parts[1] = ''.join(c for c in parts[1] if c.isdigit()) or '0'
            return int(''.join('%06d' % int(p) for p in parts))
        except Exception:
            print(name, parts, 'failed')
            raise

    def _collect_clips(self, prefix):
        """Symlink all clip files and return the list of complete clip records."""
        clips = []
        for i in item.models.Item.objects.filter(sort__type='original'):
            title = i.data['title']
            same_title = item.models.Item.objects.filter(data__title=title)
            # An original without any same-titled sibling cannot form a clip.
            if not same_title.exclude(id=i.id).exists():
                continue
            clip = {}
            durations = []
            for e in same_title:
                if 'type' not in e.data:
                    print("ignoring invalid video %s (no type)" % e)
                    continue
                # Fetch the selected file once so path and duration are
                # guaranteed to come from the same row.
                selected = list(e.files.filter(selected=True)[:1])
                if not selected:
                    continue
                selected = selected[0]
                source = selected.data.path
                ext = os.path.splitext(source)[1]
                type_ = e.data['type'][0].lower()
                target = os.path.join(prefix, type_, title + ext)
                self._replace_symlink(source, target)
                clip[type_] = target
                durations.append(selected.duration)
            if not durations:
                # No usable file at all; min() below would raise ValueError.
                print("ignoring incomplete video", i)
                continue
            clip["duration"] = min(durations)
            if not clip["duration"]:
                print('!!', durations, clip)
                continue
            # Snap to the 24 fps frame grid.
            clip["duration"] = format_duration(clip["duration"], 24)
            clip['tags'] = i.data.get('tags', [])
            clip['editingtags'] = i.data.get('editingtags', [])
            if "original" not in clip:
                # The seqid is derived from the original's file name.
                print("ignoring incomplete video", i)
                continue
            clip['seqid'] = self._parse_seqid(os.path.basename(clip['original']))
            if ("foreground" in clip and "background" in clip) or "animation" in clip:
                clips.append(clip)
            else:
                print("ignoring incomplete video", i)
        return clips

    def _collect_voice_over(self, prefix, lang, tlang):
        """Symlink voice-over files and return ``{fragment_id: {batch: info}}``.

        ``lang`` filters the subtitle annotations; ``tlang`` is forwarded to
        ``get_srt`` as its ``lang`` argument.
        """
        voice_over = defaultdict(dict)
        for vo in item.models.Item.objects.filter(
            data__type__contains="Voice Over",
        ):
            fragment_id = int(vo.get('title').split('_')[0])
            selected = list(vo.files.filter(selected=True)[:1])
            if not selected:
                # Same policy as for clips: items without a selected file
                # are skipped instead of failing with IndexError.
                print("ignoring voice over %s (no selected file)" % vo)
                continue
            source = selected[0]
            batch = vo.get('batch')[0].replace('Text-', '')
            target = os.path.join(prefix, 'voice_over', batch, '%s.wav' % fragment_id)
            self._replace_symlink(source.data.path, target)
            annotations = vo.annotations.filter(
                layer="subtitles", languages=lang
            ).exclude(value="").order_by("start")
            subs = [get_srt(sub, lang=tlang) for sub in annotations]
            voice_over[fragment_id][batch] = {
                "src": target,
                "duration": format_duration(source.duration, 24),
                "subs": subs
            }
        return voice_over
generate clips 2023-10-08 11:06:24 +00:00			`import json`
fix generate_clips 2023-10-08 11:07:57 +00:00			`import os`
get all originals, also get those with only animation player 2023-10-28 09:57:44 +00:00			`import re`
add voice over, output 6 channels, add 5.1 mix 2023-10-16 22:26:09 +00:00			`from collections import defaultdict`
generate clips 2023-10-08 11:06:24 +00:00
			`from django.core.management.base import BaseCommand`
			`from django.conf import settings`

			`import item.models`
			`import itemlist.models`

get_srt 2023-11-16 08:12:53 +00:00			`from ...render import get_srt`

generate clips 2023-10-08 11:06:24 +00:00
fix V1/V2 naming, handle animation players, don't use blank, results in white 2023-10-28 13:03:35 +00:00			`def resolve_roman(s):`
			`extra = re.compile('^\d+(.*?)$').findall(s)`
			`if extra:`
			`extra = extra[0].lower()`
			`new = {`
			`'i': '1', 'ii': '2', 'iii': '3', 'iv': '4', 'v': '5',`
			`'vi': '6', 'vii': 7, 'viii': '8', 'ix': '9', 'x': '10'`
			`}.get(extra, extra)`
			`return s.replace(extra, new)`
			`return s`

make sure all tracks are exactly the same length 2024-12-04 09:16:24 +00:00			`def format_duration(duration, fps):`
			`return float('%0.5f' % (round(duration * fps) / fps))`

fix V1/V2 naming, handle animation players, don't use blank, results in white 2023-10-28 13:03:35 +00:00
generate clips 2023-10-08 11:06:24 +00:00			`class Command(BaseCommand):`
			`help = 'generate symlinks to clips and clips.json'`

			`def add_arguments(self, parser):`
import/export subtitles 2024-03-22 09:56:50 +00:00			`parser.add_argument('--lang', action='store', dest='lang', default=None, help='subtitle language')`
fix generate_clips 2023-10-08 11:07:57 +00:00			`parser.add_argument('--prefix', action='store', dest='prefix', default="/srv/t_for_time", help='prefix to build clips in')`
generate clips 2023-10-08 11:06:24 +00:00
			`def handle(self, **options):`
			`prefix = options['prefix']`
multiple languages 2024-03-22 10:33:39 +00:00			`lang = options["lang"]`
			`if lang:`
			`lang = lang.split(',')`
			`tlang = lang[1:]`
			`lang = lang[0]`
			`else:`
			`tlang = None`
			`if lang == "en":`
			`lang = None`
generate clips 2023-10-08 11:06:24 +00:00			`clips = []`
get all originals, also get those with only animation player 2023-10-28 09:57:44 +00:00			`for i in item.models.Item.objects.filter(sort__type='original'):`
generate clips 2023-10-08 11:06:24 +00:00			`qs = item.models.Item.objects.filter(data__title=i.data['title']).exclude(id=i.id)`
get all originals, also get those with only animation player 2023-10-28 09:57:44 +00:00			`if qs.count() >= 1:`
generate clips 2023-10-08 11:06:24 +00:00			`clip = {}`
			`durations = []`
			`for e in item.models.Item.objects.filter(data__title=i.data['title']):`
render fixes, encode videos in render command 2023-10-09 19:29:11 +00:00			`if 'type' not in e.data:`
ignore no type 2023-11-08 08:08:38 +00:00			`print("ignoring invalid video %s (no type)" % e)`
			`continue`
ignore empty items 2023-10-21 14:36:08 +00:00			`if not e.files.filter(selected=True).exists():`
			`continue`
only use selected files 2023-10-21 14:32:55 +00:00			`source = e.files.filter(selected=True)[0].data.path`
generate clips 2023-10-08 11:06:24 +00:00			`ext = os.path.splitext(source)[1]`
			`type_ = e.data['type'][0].lower()`
			`target = os.path.join(prefix, type_, i.data['title'] + ext)`
			`os.makedirs(os.path.dirname(target), exist_ok=True)`
fix symlink check 2023-10-28 13:12:45 +00:00			`if os.path.islink(target):`
generate clips 2023-10-08 11:06:24 +00:00			`os.unlink(target)`
			`os.symlink(source, target)`
			`clip[type_] = target`
only use selected files 2023-10-21 14:32:55 +00:00			`durations.append(e.files.filter(selected=True)[0].duration)`
generate clips 2023-10-08 11:06:24 +00:00			`clip["duration"] = min(durations)`
fail for 0 length clips 2023-10-29 18:57:39 +00:00			`if not clip["duration"]:`
			`print('!!', durations, clip)`
			`continue`
make sure all tracks are exactly the same length 2024-12-04 09:16:24 +00:00			`cd = format_duration(clip["duration"], 24)`
			`#if cd != clip["duration"]:`
			`# print(clip["duration"], '->', cd, durations, clip)`
			`clip["duration"] = cd`
generate clips 2023-10-08 11:06:24 +00:00			`clip['tags'] = i.data.get('tags', [])`
load editing tags 2023-10-19 14:52:35 +00:00			`clip['editingtags'] = i.data.get('editingtags', [])`
get all originals, also get those with only animation player 2023-10-28 09:57:44 +00:00			`name = os.path.basename(clip['original'])`

fix V1/V2 naming, handle animation players, don't use blank, results in white 2023-10-28 13:03:35 +00:00			`seqid = re.sub("Hotel Aporia_(\d+)", "S\\1_", name)`
			`seqid = re.sub("Night March_(\d+)", "S\\1_", seqid)`
			`seqid = re.sub("_(\d+)H_(\d+)", "_S\\1\\2_", seqid)`
			`seqid = seqid.split('_')[:2]`
get all originals, also get those with only animation player 2023-10-28 09:57:44 +00:00			`seqid = [b[1:] if b[0] in ('B', 'S') else '0' for b in seqid]`
fix V1/V2 naming, handle animation players, don't use blank, results in white 2023-10-28 13:03:35 +00:00			`seqid[1] = resolve_roman(seqid[1])`
get all originals, also get those with only animation player 2023-10-28 09:57:44 +00:00			`seqid[1] = ''.join([b for b in seqid[1] if b.isdigit()])`
			`if not seqid[1]:`
			`seqid[1] = '0'`
			`try:`
			`clip['seqid'] = int(''.join(['%06d' % int(b) for b in seqid]))`
			`except:`
			`print(name, seqid, 'failed')`
			`raise`
render fixes, encode videos in render command 2023-10-09 19:29:11 +00:00			`if "original" in clip and "foreground" in clip and "background" in clip:`
			`clips.append(clip)`
handle animation clips 2023-10-28 09:25:45 +00:00			`elif "original" in clip and "animation" in clip:`
			`clips.append(clip)`
render fixes, encode videos in render command 2023-10-09 19:29:11 +00:00			`else:`
			`print("ignoring incomplete video", i)`
generate clips 2023-10-08 11:06:24 +00:00
			`with open(os.path.join(prefix, 'clips.json'), 'w') as fd:`
			`json.dump(clips, fd, indent=2, ensure_ascii=False)`
add voice over, output 6 channels, add 5.1 mix 2023-10-16 22:26:09 +00:00
get all originals, also get those with only animation player 2023-10-28 09:57:44 +00:00			`print("using", len(clips), "clips")`

add voice over, output 6 channels, add 5.1 mix 2023-10-16 22:26:09 +00:00			`voice_over = defaultdict(dict)`
			`for vo in item.models.Item.objects.filter(`
			`data__type__contains="Voice Over",`
			`):`
			`fragment_id = int(vo.get('title').split('_')[0])`
only use selected files 2023-10-21 14:32:55 +00:00			`source = vo.files.filter(selected=True)[0]`
add voice over, output 6 channels, add 5.1 mix 2023-10-16 22:26:09 +00:00			`batch = vo.get('batch')[0].replace('Text-', '')`
			`src = source.data.path`
mixed output 2023-10-28 09:24:51 +00:00			`target = os.path.join(prefix, 'voice_over', batch, '%s.wav' % fragment_id)`
add voice over, output 6 channels, add 5.1 mix 2023-10-16 22:26:09 +00:00			`os.makedirs(os.path.dirname(target), exist_ok=True)`
islink not exists 2023-10-21 14:46:03 +00:00			`if os.path.islink(target):`
add voice over, output 6 channels, add 5.1 mix 2023-10-16 22:26:09 +00:00			`os.unlink(target)`
			`os.symlink(src, target)`
render subtitles 2023-11-14 16:48:55 +00:00			`subs = []`
multiple languages 2024-03-22 10:33:39 +00:00			`for sub in vo.annotations.filter(layer="subtitles", languages=lang).exclude(value="").order_by("start"):`
			`sdata = get_srt(sub, lang=tlang)`
subtitle tweaks 2023-11-14 18:52:12 +00:00			`subs.append(sdata)`
add voice over, output 6 channels, add 5.1 mix 2023-10-16 22:26:09 +00:00			`voice_over[fragment_id][batch] = {`
			`"src": target,`
make sure all tracks are exactly the same length 2024-12-04 09:16:24 +00:00			`"duration": format_duration(source.duration, 24),`
render subtitles 2023-11-14 16:48:55 +00:00			`"subs": subs`
add voice over, output 6 channels, add 5.1 mix 2023-10-16 22:26:09 +00:00			`}`
			`with open(os.path.join(prefix, 'voice_over.json'), 'w') as fd:`
			`json.dump(voice_over, fd, indent=2, ensure_ascii=False)`