File size: 915 Bytes
cb71ef5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
import json
from datetime import date

import webvtt


def get_seconds(time_str):
    h, m, s_ms = time_str.split(':')
    s, ms = s_ms.split('.')
    return int(h) * 3600 + int(m) * 60 + int(s) + float('0.' + ms)

def get_transcript(path):
    with open(path) as f:
        transcript = f.read()
        transcript = transcript.replace('\n', ' ')
    return transcript

def get_captions_from_vtt(path):
    vtt = webvtt.read(path)
    return [{'start': get_seconds(caption.start), 'end': get_seconds(caption.end), 'text': caption.text} for caption in vtt]

def save_summary(summary, path, filename, config):
    path.mkdir(parents=True, exist_ok=True)
    with open(path / filename, "w+") as f:
        f.write(summary)
    with open(path / "config.txt", "w+") as f:
        config["date"] = str(date.today())
        json.dump(config, f, indent=4)
    print("Saved", path / filename)