mirror of
https://github.com/QuentinFuxa/WhisperLiveKit.git
synced 2026-03-07 22:33:36 +00:00
Specify dtype in librosa.load instead of casting the result afterwards
This commit is contained in:
@@ -10,8 +10,8 @@ import math
|
||||
|
||||
@lru_cache
|
||||
def load_audio(fname):
|
||||
a, _ = librosa.load(fname, sr=16000)
|
||||
return a.astype('float32')
|
||||
a, _ = librosa.load(fname, sr=16000, dtype=np.float32)
|
||||
return a
|
||||
|
||||
def load_audio_chunk(fname, beg, end):
|
||||
audio = load_audio(fname)
|
||||
|
||||
@@ -4,6 +4,7 @@ from whisper_online import *
|
||||
import sys
|
||||
import argparse
|
||||
import os
|
||||
import numpy as np
|
||||
parser = argparse.ArgumentParser()
|
||||
|
||||
# server options
|
||||
@@ -137,8 +138,8 @@ class ServerProcessor:
|
||||
if not raw_bytes:
|
||||
break
|
||||
sf = soundfile.SoundFile(io.BytesIO(raw_bytes), channels=1,endian="LITTLE",samplerate=SAMPLING_RATE, subtype="PCM_16",format="RAW")
|
||||
audio, _ = librosa.load(sf,sr=SAMPLING_RATE)
|
||||
out.append(audio.astype('float32'))
|
||||
audio, _ = librosa.load(sf,sr=SAMPLING_RATE,dtype=np.float32)
|
||||
out.append(audio)
|
||||
if not out:
|
||||
return None
|
||||
return np.concatenate(out)
|
||||
|
||||
Reference in New Issue
Block a user