script for cutting voice tracks

2021-12-13 20:44:40 -07:00
parent 4138dbf353
commit 731d81b99f
1 changed files with 105 additions and 0 deletions
--- a/scripts/cut-voice-track.py
+++ b/scripts/cut-voice-track.py
@@ -0,0 +1,105 @@
+# pip install -r requirements.txt
+# Usage text; handed to util.arg() alongside each positional-argument index further down.
+usage = 'python cut-voice-track.py <?wav timestamp json> <?wav filename>'
+
+import util
+import json
+import sys
+from numpy import vstack
+from scipy.io import wavfile
+from simpleaudio import play_buffer
+import wave
+try:
+    from getch import getch
+except:
+    from msvcrt import getwch as getch
+from os.path import exists
+from os import system
+system('color')
+
+json_filename = util.arg(1, usage)
+default_wav_name = json_filename.replace('_4000.json', '')
+wav_filename = util.arg(2, usage, default_wav_name)
+
+timestamps = {}
+with open(json_filename, 'r') as f:
+    timestamps = json.load(f)
+
+wav = None
+with open(wav_filename, 'rb') as f:
+    wav = wave.open(f)
+
+nchannels, sampwidth, framerate, nframes, comptype, compname = wav.getparams()
+
+_, data = wavfile.read(wav_filename)
+
+new_data = data[0:1]
+new_json = {}
+
+current_sec = 0
+searching_for = None
+for (audio_guess, possible_sections) in timestamps.items():
+    if searching_for != None:
+        if searching_for in audio_guess:
+            searching_for = None
+        else:
+            continue
+
+    num_takes = len(possible_sections)
+    assert num_takes <= 10, "I didn't plan for this many takes of any line"
+    takes = '/'.join([str(num) for num in range(num_takes)])
+
+    def audio_and_length(choice):
+        take_num = int(choice)
+        take_info = possible_sections[take_num]
+        start = take_info['start']
+        end = take_info['end']
+        start_frame = int(start * framerate)
+        end_frame = int(end * framerate)
+        return data[start_frame:end_frame], end - start
+# Line: okay so what's the owner of what kind of oh know is this like oh no our table or it's it's a different oh no
+    
+    print('\033[31m' + audio_guess + '\033[0m')
+    print(f'{takes}/u({takes})/d/f/h/q')
+    while True:
+        choice = getch()
+        if choice == 'h':
+            print(f'{num_takes} takes. Type {takes} to play one. Type u + {takes} to use one of them. Type f to search ahead for a word or phrase. Type d to discard this snippet. Type q to quit')
+        elif choice == 'd':
+            break
+        elif choice != '/' and choice in takes:
+            audio, _ = audio_and_length(choice)
+            play_buffer(audio, nchannels, sampwidth, framerate)
+        elif choice == 'f':
+            phrase = input("phrase (lower-case) to search for?")
+            searching_for = phrase
+            break
+        elif choice == 'q':
+            suffix = "0"
+            new_wav = wav_filename.replace(".wav", f"-cut{suffix}.wav")
+            while exists(new_wav):
+                new_suffix = str(int(suffix) + 1)
+                new_wav = new_wav.replace(f"-cut{suffix}.wav", f"-cut{new_suffix}.wav")
+                suffix = new_suffix
+            wavfile.write(new_wav, framerate, new_data)
+            with open(new_wav.replace(".wav", ".json"), 'w') as f:
+                json.dump(new_json, f)
+            sys.exit(0)
+        elif choice == 'u':
+            choice = getch()
+            if choice != '/' and choice in takes:
+                audio, length = audio_and_length(choice)
+                new_json[audio_guess] = {
+                    'start': current_sec,
+                    'end': current_sec + length
+                }
+                new_data = vstack((new_data, audio))
+                current_sec += length
+                break
+            else:
+                print(f'{choice} is not a valid take to use')
+
+        else:
+            print(f'{choice} is not a valid option')
+
+if searching_for != None:
+    print(f"{searching_for} not found")