File size: 1,779 Bytes
21e6506
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
import os
import tempfile
from pathlib import Path, PurePath

import ffmpeg


class DecodedInput:
    audio: PurePath
    images: tuple[PurePath, ...]

    def __init__(
        self,
        audio: PurePath,
        images: tuple[PurePath, ...],
        tmpdir: tempfile.TemporaryDirectory,
    ):
        self.audio = audio
        self.images = images
        self.tmpdir = tmpdir

    def __enter__(self):
        return self

    def __exit__(self, exc_type, exc_val, exc_tb) -> None:
        print("Cleaning up " + self.tmpdir.name)
        self.tmpdir.cleanup()


def decode_input(input_path: PurePath, fps: int = 2) -> DecodedInput:
    outdir = tempfile.TemporaryDirectory()
    audio = PurePath(outdir.name) / "audio.mp3"
    (
        ffmpeg.input(
            str(input_path),
        )
        .output(
            str(audio),
            loglevel="error",
            **{
                # Use 64k bitrate for smaller file
                "b:a": "64k",
                # Only output one channel, again for smaller file
                "ac": "1",
            },
        )
        .run()
    )
    (
        ffmpeg.input(str(input_path))
        .output(
            str(PurePath(outdir.name) / "frame-%04d.jpg"),
            loglevel="error",
            **{
                # Use fps as specified, scale image to fit within 512x512
                "vf": f"fps={fps},scale='if(gt(iw,ih),512,-1)':'if(gt(ih,iw),512,-1)'",
                "q:v": "20",
            },
        )
        .run()
    )
    images = list(Path(outdir.name).glob("*.jpg"))
    images.sort()
    return DecodedInput(audio, tuple(images), outdir)


if __name__ == "__main__":
    with decode_input(PurePath("data/question.mov")) as input:
        print(input.audio)
        print(input.images)