join-partial-lines.py

This commit is contained in:
2022-09-27 06:00:34 +00:00
parent 8dffb5633d
commit 9a71ef0ada
2 changed files with 118 additions and 1 deletions

View File

@@ -0,0 +1,110 @@
#! /usr/bin/env python
# pip install -r requirements.txt
usage = 'python join-partial-lines.py <cut json> <?wav filename>'
from imports import *
import util
from time import sleep
import string
from os.path import exists
from os import system
system('color')
json_filename = util.arg(1, usage)
default_wav_name = json_filename.replace('.json', '.wav')
wav_filename = util.arg(2, usage, default_wav_name)
cutter = util.AudioCutter(wav_filename, json_filename)
def new_wav_filename():
suffix = "0"
new_wav = wav_filename.replace(".wav", f"-joined{suffix}.wav")
while exists(new_wav):
new_suffix = str(int(suffix) + 1)
new_wav = new_wav.replace(f"-joined{suffix}.wav", f"-joined{new_suffix}.wav")
suffix = new_suffix
return new_wav
def save():
cutter.save_and_quit(new_wav_filename())
joining_with_guess = ""
joining_with = None
delay_time = 0.5
def process_chunk(audio_guess, timestamp):
global joining_with_guess
global joining_with
global delay_time
if joining_with != None:
print(f'Joining onto: \033[92m{joining_with_guess}\033[0m')
print('\033[31m' + audio_guess + '\033[0m')
usage = f'u/d/j/p/t/f/n/q/h'
print(usage)
if 'alts' in timestamp:
print('join-partial-lines cannot join alts. skipping')
length = timestamp['end'] - timestamp['start']
adjusted = {'start': cutter.current_sec, 'end': cutter.current_sec + length, 'alts': []}
cutter.take_audio(audio_guess, adjusted, timestamp['start'], timestamp['end'])
for alt in timestamp['alts']:
length = alt['end'] - alt['start']
adjusted['alts'].append({'start': cutter.current_sec, 'end': cutter.current_sec + length})
cutter.take_audio(audio_guess, adjusted, alt['start'], alt['end'])
return
while True:
choice = getch()
if choice == 'u':
cutter.take_audio(audio_guess, timestamp, timestamp['start'], timestamp['end'])
elif choice == 'd':
break
elif choice == 'j':
if joining_with == None:
joining_with_guess = audio_guess
joining_with = timestamp
else:
# do the join
joined_guess = joining_with_guess + " " + audio_guess
full_timestamp = {
'start': cutter.current_sec,
'end': cutter.current_sec + (joining_with['end'] - joining_with['start']) + delay_time + (timestamp['end'] - timestamp['start'])
}
cutter.take_audio(joined_guess, full_timestamp, joining_with['start'], joining_with['end'])
cutter.add_silence(delay_time)
cutter.take_audio(joined_guess, full_timestamp, timestamp['start'], timestamp['end'])
# clear the joining part
joining_with_guess = ""
joining_with = None
break
elif choice == 'f':
cutter.search()
break
elif choice == 'n':
cutter.repeat_search()
break
elif choice == 'q':
save()
elif choice == 'p':
cutter.play_audio(joining_with['start'], joining_with['end'])
sleep(joining_with['end'] - joining_with['start'])
sleep(delay_time)
cutter.play_audio(timestamp['start'], timestamp['end'])
elif choice == 't':
delay_time = float(input("seconds to pause between parts? "))
print(usage)
elif choice == 'h':
print('u - use this line as-is')
if joining_with != None:
print(f'j - join this line with \033[92m{joining_with_guess}\033[0m')
else:
print('j - join this line with another line')
print(f't - set the delay time (currently {delay_time}')
print('p - play this line as if joined')
print('f - search ahead for a word or phrase')
print('n - repeat a search.')
print('d - discard this line')
print('q - save and quit')
cutter.process_audio(process_chunk, new_wav_filename())

View File

@@ -1,4 +1,5 @@
from imports import *
import numpy as np
def arg(num, usage, default=None):
val = ''
@@ -30,7 +31,7 @@ class AudioCutter:
self.wav = wave.open(f)
self.nchannels, self.sampwidth, self.framerate, self.nframes, self.comptype, self.compname = self.wav.getparams()
_, self.data = wavfile.read(wav_file)
self.rate, self.data = wavfile.read(wav_file)
# Accumulate new sound data cut from the original, along with new related json data
self.new_data = self.data[0:1]
@@ -58,6 +59,12 @@ class AudioCutter:
self.current_sec += length
self.new_json_info[tag] = info
def add_silence(self, seconds):
nframes = int(seconds * self.rate)
shape = self.new_data.shape
shape = (nframes,) + shape[1:]
self.new_data = vstack((self.new_data, np.zeros(shape, self.new_data.dtype)))
def play_audio(self, start, end):
audio, _ = self.audio_and_length(start, end)
play_buffer(audio, self.nchannels, self.sampwidth, self.framerate)