Specify dtype in librosa.load instead of casting the result

This commit is contained in:
koiking213
2024-02-20 23:29:25 +09:00
parent 24926c98e0
commit 4405c451ce
2 changed files with 5 additions and 4 deletions

View File

@@ -10,8 +10,8 @@ import math
@lru_cache
def load_audio(fname):
# NOTE(review): this is a diff hunk rendered without its +/- markers or indentation,
# so both versions of the function body appear back to back.
# The next two lines look like the pre-commit body: load at sr=16000, then cast the
# returned array with astype('float32').
a, _ = librosa.load(fname, sr=16000)
return a.astype('float32')
# The next two lines look like the post-commit body: float32 is requested directly via
# the dtype= argument of librosa.load, so the separate astype call is dropped.
a, _ = librosa.load(fname, sr=16000, dtype=np.float32)
return a
def load_audio_chunk(fname, beg, end):
audio = load_audio(fname)

View File

@@ -4,6 +4,7 @@ from whisper_online import *
import sys
import argparse
import os
import numpy as np
parser = argparse.ArgumentParser()
# server options
@@ -137,8 +138,8 @@ class ServerProcessor:
if not raw_bytes:
break
sf = soundfile.SoundFile(io.BytesIO(raw_bytes), channels=1,endian="LITTLE",samplerate=SAMPLING_RATE, subtype="PCM_16",format="RAW")
audio, _ = librosa.load(sf,sr=SAMPLING_RATE)
out.append(audio.astype('float32'))
audio, _ = librosa.load(sf,sr=SAMPLING_RATE,dtype=np.float32)
out.append(audio)
if not out:
return None
return np.concatenate(out)