mirror of
https://github.com/zhayujie/chatgpt-on-wechat.git
synced 2026-02-18 16:17:05 +08:00
fix: correct sample rate when convert to silk
This commit is contained in:
@@ -3,6 +3,22 @@ import wave
|
||||
import pysilk
|
||||
from pydub import AudioSegment
|
||||
|
||||
sil_supports=[8000, 12000, 16000, 24000, 32000, 44100, 48000] # slk转wav时,支持的采样率
|
||||
def find_closest_sil_supports(sample_rate):
|
||||
"""
|
||||
找到最接近的支持的采样率
|
||||
"""
|
||||
if sample_rate in sil_supports:
|
||||
return sample_rate
|
||||
closest = 0
|
||||
mindiff = 9999999
|
||||
for rate in sil_supports:
|
||||
diff = abs(rate - sample_rate)
|
||||
if diff < mindiff:
|
||||
closest = sample_rate
|
||||
mindiff = diff
|
||||
return closest
|
||||
|
||||
def get_pcm_from_wav(wav_path):
|
||||
"""
|
||||
从 wav 文件中读取 pcm
|
||||
@@ -53,7 +69,7 @@ def pcm_to_sil(pcm_path, silk_path):
|
||||
audio = AudioSegment.from_wav(pcm_path)
|
||||
wav_data = audio.raw_data
|
||||
silk_data = pysilk.encode(
|
||||
wav_data, data_rate=audio.frame_rate, sample_rate=audio.frame_rate)
|
||||
wav_data, data_rate=audio.frame_rate, sample_rate=find_closest_sil_supports(audio.frame_rate))
|
||||
with open(silk_path, "wb") as f:
|
||||
f.write(silk_data)
|
||||
return audio.duration_seconds * 1000
|
||||
@@ -66,8 +82,7 @@ def mp3_to_sil(mp3_path, silk_path):
|
||||
"""
|
||||
audio = AudioSegment.from_mp3(mp3_path)
|
||||
wav_data = audio.raw_data
|
||||
silk_data = pysilk.encode(
|
||||
wav_data, data_rate=audio.frame_rate, sample_rate=audio.frame_rate)
|
||||
silk_data = pysilk.encode(wav_data, data_rate=audio.frame_rate, sample_rate=find_closest_sil_supports(audio.frame_rate))
|
||||
# Save the silk file
|
||||
with open(silk_path, "wb") as f:
|
||||
f.write(silk_data)
|
||||
|
||||
Reference in New Issue
Block a user