import se_extractor as se

# Run the se_extractor helpers on the source clip. Both return values are
# bound to `_` and never read here, so these calls matter only for whatever
# side effects they have.
# NOTE(review): presumably this splits the clip into voice segments using
# voice-activity detection (vad=True) — confirm against se_extractor.
_ = se.generate_voice_segments('openai_source_output.mp3',vad=True)
# NOTE(review): the loaded model is discarded; presumably this call warms a
# cache or triggers a download inside se_extractor — confirm.
_ = se.load_model()

from resemble_enhance.enhancer.inference import denoise, enhance
import torchaudio


# Read the source clip from disk: `dwav` is the waveform tensor and `sr` the
# sample rate reported by torchaudio.
dwav, sr = torchaudio.load('openai_source_output.mp3')

# Average over the first dimension so the enhancer receives a tensor with one
# fewer dimension (presumably channels -> mono; confirm the clip's layout).
dwav = dwav.mean(0)

# Run the resemble-enhance enhancer with fixed settings. The third positional
# argument 'cpu' is presumably the device to run on. The call yields the
# processed waveform together with its (possibly different) sample rate.
wav1, new_sr = enhance(
    dwav,
    sr,
    'cpu',
    nfe=32,
    solver='midpoint',
    lambd=0.9,
    tau=0.5,
)