join-partial-lines.py

2022-09-27 06:00:34 +00:00
parent 8dffb5633d
commit 9a71ef0ada
2 changed files with 118 additions and 1 deletions
--- a/scripts/join-partial-lines.py
+++ b/scripts/join-partial-lines.py
@@ -0,0 +1,110 @@
+#! /usr/bin/env python
+# pip install -r requirements.txt
+usage = 'python join-partial-lines.py <cut json> <?wav filename>'
+
+from imports import *
+import util
+from time import sleep
+import string
+from os.path import exists
+from os import system
+system('color')
+
+json_filename = util.arg(1, usage)
+default_wav_name = json_filename.replace('.json', '.wav')
+wav_filename = util.arg(2, usage, default_wav_name)
+
+cutter = util.AudioCutter(wav_filename, json_filename)
+
+def new_wav_filename():
+    suffix = "0"
+    new_wav = wav_filename.replace(".wav", f"-joined{suffix}.wav")
+    while exists(new_wav):
+        new_suffix = str(int(suffix) + 1)
+        new_wav = new_wav.replace(f"-joined{suffix}.wav", f"-joined{new_suffix}.wav")
+        suffix = new_suffix
+    return new_wav
+
+
+def save():
+    cutter.save_and_quit(new_wav_filename())
+
+joining_with_guess = ""
+joining_with = None
+delay_time = 0.5
+
+def process_chunk(audio_guess, timestamp):
+    global joining_with_guess
+    global joining_with
+    global delay_time
+    if joining_with != None:
+        print(f'Joining onto: \033[92m{joining_with_guess}\033[0m')
+    print('\033[31m' + audio_guess + '\033[0m')
+    usage = f'u/d/j/p/t/f/n/q/h' 
+    print(usage)
+    if 'alts' in timestamp:
+        print('join-partial-lines cannot join alts. skipping')
+        length = timestamp['end'] - timestamp['start']
+        adjusted = {'start': cutter.current_sec, 'end': cutter.current_sec + length, 'alts': []}
+        cutter.take_audio(audio_guess, adjusted, timestamp['start'], timestamp['end'])
+        for alt in timestamp['alts']:
+            length = alt['end'] - alt['start']
+            adjusted['alts'].append({'start': cutter.current_sec, 'end': cutter.current_sec + length})
+            cutter.take_audio(audio_guess, adjusted, alt['start'], alt['end'])
+        return
+
+    while True:
+        choice = getch()
+        if choice == 'u':
+            cutter.take_audio(audio_guess, timestamp, timestamp['start'], timestamp['end'])
+        elif choice == 'd':
+            break
+        elif choice == 'j':
+            if joining_with == None:
+                joining_with_guess = audio_guess
+                joining_with = timestamp
+            else:
+                # do the join
+                joined_guess = joining_with_guess + " " + audio_guess
+                full_timestamp = {
+                    'start': cutter.current_sec,
+                    'end': cutter.current_sec + (joining_with['end'] - joining_with['start']) + delay_time + (timestamp['end'] - timestamp['start'])
+                }
+                cutter.take_audio(joined_guess, full_timestamp, joining_with['start'], joining_with['end'])
+                cutter.add_silence(delay_time)
+                cutter.take_audio(joined_guess, full_timestamp, timestamp['start'], timestamp['end'])
+                # clear the joining part
+                joining_with_guess = ""
+                joining_with = None
+            break
+        elif choice == 'f':
+            cutter.search()
+            break
+        elif choice == 'n':
+            cutter.repeat_search()
+            break
+        elif choice == 'q':
+            save()
+        elif choice == 'p':
+            cutter.play_audio(joining_with['start'], joining_with['end'])
+            sleep(joining_with['end'] - joining_with['start'])
+            sleep(delay_time)
+            cutter.play_audio(timestamp['start'], timestamp['end'])
+        elif choice == 't':
+            delay_time = float(input("seconds to pause between parts? "))
+            print(usage)
+
+        elif choice == 'h':
+            print('u - use this line as-is')
+            if joining_with != None:
+                print(f'j - join this line with \033[92m{joining_with_guess}\033[0m')
+            else:
+                print('j - join this line with another line')
+            print(f't - set the delay time (currently {delay_time}')
+            print('p - play this line as if joined')
+            print('f - search ahead for a word or phrase')
+            print('n - repeat a search.')
+            print('d - discard this line')
+            print('q - save and quit')
+
+cutter.process_audio(process_chunk, new_wav_filename())
--- a/scripts/util.py
+++ b/scripts/util.py
@@ -1,4 +1,5 @@
 from imports import *
+import numpy as np

 def arg(num, usage, default=None):
    val = ''
@@ -30,7 +31,7 @@ class AudioCutter:
            self.wav = wave.open(f)

        self.nchannels, self.sampwidth, self.framerate, self.nframes, self.comptype, self.compname = self.wav.getparams()
-        _, self.data = wavfile.read(wav_file)
+        self.rate, self.data = wavfile.read(wav_file)
        
        # Accumulate new sound data cut from the original, along with new related json data
        self.new_data = self.data[0:1]
@@ -58,6 +59,12 @@ class AudioCutter:
        self.current_sec += length
        self.new_json_info[tag] = info

+    def add_silence(self, seconds):
+        nframes = int(seconds * self.rate)
+        shape = self.new_data.shape
+        shape = (nframes,) + shape[1:]
+        self.new_data = vstack((self.new_data, np.zeros(shape, self.new_data.dtype)))
+
    def play_audio(self, start, end):
        audio, _ = self.audio_and_length(start, end)
        play_buffer(audio, self.nchannels, self.sampwidth, self.framerate)