Create run_gentle.py

TarrySingh · TarrySingh · commit 273ad1a2fbd5 · 2019-04-04T17:36:25.000+02:00
diff --git a/Projects/youtube-gesture-dataset/script/run_gentle.py b/Projects/youtube-gesture-dataset/script/run_gentle.py
@@ -0,0 +1,64 @@
+# ------------------------------------------------------------------------------
+# Copyright (c) ETRI. All rights reserved.
+# Licensed under the BSD 3-Clause License.
+# This file is part of Youtube-Gesture-Dataset, a sub-project of AIR(AI for Robots) project.
+# You can refer to details of AIR project at https://aiforrobots.github.io
+# Written by Youngwoo Yoon (youngwoo@etri.re.kr)
+# ------------------------------------------------------------------------------
+
+import glob
+import logging
+import multiprocessing
+import os
+import re
+import sys
+
+from tqdm import tqdm
+
+from config import *
+from make_ted_dataset import read_subtitle
+
+sys.path.insert(0, '../../../gentle')
+import gentle
+
+
+# prepare gentle: module-level settings shared by every run_gentle() call
+nthreads = max(1, multiprocessing.cpu_count() - 2)  # keep two cores free, but never ask for fewer than one thread
+logging.getLogger().setLevel("WARNING")  # raise the root logger threshold to WARNING
+disfluencies = {'uh', 'um'}  # handed to the aligner through its `disfluencies` argument
+resources = gentle.Resources()
+
+
+def run_gentle(video_path, vid, result_path):
+    """Align the subtitle text of `vid` against the media at `video_path` and write the JSON to `result_path`."""
+    # build one transcript string: every caption text followed by a space, newlines flattened to spaces
+    captions = read_subtitle(vid)
+    spoken_text = ''.join(caption.text + ' ' for caption in captions)
+    spoken_text = spoken_text.replace('\n', ' ')
+
+    # align (uses the module-level resources / nthreads / disfluencies)
+    with gentle.resampled(video_path) as audio:
+        forced_aligner = gentle.ForcedAligner(resources, spoken_text, nthreads=nthreads, disfluency=False,
+                                              conservative=False, disfluencies=disfluencies)
+        alignment = forced_aligner.transcribe(audio, logging=logging)
+
+    # write results as UTF-8 JSON, indented by two spaces
+    with open(result_path, 'w', encoding="utf-8") as out_file:
+        out_file.write(alignment.to_json(indent=2))
+
+
+def main():
+    """Align every *.mp4 in VIDEO_PATH, oldest mtime first, skipping videos with a non-empty result JSON."""
+    videos = sorted(glob.glob(VIDEO_PATH + "/*.mp4"), key=os.path.getmtime)
+    for i, file_path in tqdm(enumerate(videos), total=len(videos)):  # enumerate() has no len(); pass the total
+        vid = os.path.basename(file_path)[-15:-4]  # the 11 characters right before the '.mp4' extension
+        print('{}/{} - {}'.format(i + 1, len(videos), vid))
+        result_path = VIDEO_PATH + '/' + vid + '_align_results.json'
+        if os.path.exists(result_path) and os.path.getsize(result_path):  # existing and not empty
+            print('JSON file already exists ({})'.format(vid))
+        else:
+            run_gentle(file_path, vid, result_path)
+
+
+if __name__ == '__main__':  # run the batch alignment only when executed as a script, not on import
+    main()