mirror of
https://github.com/zhayujie/chatgpt-on-wechat.git
synced 2026-03-19 13:28:11 +08:00
feat(wechatcomapp): add support for splitting long audio files
This commit is contained in:
@@ -19,7 +19,7 @@ from common.log import logger
|
|||||||
from common.singleton import singleton
|
from common.singleton import singleton
|
||||||
from common.utils import compress_imgfile, fsize, split_string_by_utf8_length
|
from common.utils import compress_imgfile, fsize, split_string_by_utf8_length
|
||||||
from config import conf, subscribe_msg
|
from config import conf, subscribe_msg
|
||||||
from voice.audio_convert import any_to_amr
|
from voice.audio_convert import any_to_amr, split_audio
|
||||||
|
|
||||||
MAX_UTF8_LEN = 2048
|
MAX_UTF8_LEN = 2048
|
||||||
|
|
||||||
@@ -66,8 +66,12 @@ class WechatComAppChannel(ChatChannel):
|
|||||||
file_path = reply.content
|
file_path = reply.content
|
||||||
amr_file = os.path.splitext(file_path)[0] + ".amr"
|
amr_file = os.path.splitext(file_path)[0] + ".amr"
|
||||||
any_to_amr(file_path, amr_file)
|
any_to_amr(file_path, amr_file)
|
||||||
response = self.client.media.upload("voice", open(amr_file, "rb"))
|
files = split_audio(amr_file, 60000)
|
||||||
logger.debug("[wechatcom] upload voice response: {}".format(response))
|
if len(files) > 1:
|
||||||
|
logger.info("[wechatcom] voice too long, split into {} parts".format(len(files)))
|
||||||
|
for path in files:
|
||||||
|
response = self.client.media.upload("voice", open(path, "rb"))
|
||||||
|
logger.debug("[wechatcom] upload voice response: {}".format(response))
|
||||||
except WeChatClientException as e:
|
except WeChatClientException as e:
|
||||||
logger.error("[wechatcom] upload voice failed: {}".format(e))
|
logger.error("[wechatcom] upload voice failed: {}".format(e))
|
||||||
return
|
return
|
||||||
|
|||||||
@@ -92,6 +92,7 @@ def any_to_amr(any_path, amr_path):
|
|||||||
audio = AudioSegment.from_file(any_path)
|
audio = AudioSegment.from_file(any_path)
|
||||||
audio = audio.set_frame_rate(8000) # only support 8000
|
audio = audio.set_frame_rate(8000) # only support 8000
|
||||||
audio.export(amr_path, format="amr")
|
audio.export(amr_path, format="amr")
|
||||||
|
return audio.duration_seconds * 1000
|
||||||
|
|
||||||
|
|
||||||
def sil_to_wav(silk_path, wav_path, rate: int = 24000):
|
def sil_to_wav(silk_path, wav_path, rate: int = 24000):
|
||||||
@@ -101,3 +102,26 @@ def sil_to_wav(silk_path, wav_path, rate: int = 24000):
|
|||||||
wav_data = pysilk.decode_file(silk_path, to_wav=True, sample_rate=rate)
|
wav_data = pysilk.decode_file(silk_path, to_wav=True, sample_rate=rate)
|
||||||
with open(wav_path, "wb") as f:
|
with open(wav_path, "wb") as f:
|
||||||
f.write(wav_data)
|
f.write(wav_data)
|
||||||
|
|
||||||
|
|
||||||
|
def split_audio(file_path, max_segment_length_ms=60000):
|
||||||
|
"""
|
||||||
|
分割音频文件
|
||||||
|
"""
|
||||||
|
audio = AudioSegment.from_file(file_path)
|
||||||
|
audio_length_ms = len(audio)
|
||||||
|
if audio_length_ms <= max_segment_length_ms:
|
||||||
|
return [file_path]
|
||||||
|
segments = []
|
||||||
|
for start_ms in range(0, audio_length_ms, max_segment_length_ms):
|
||||||
|
end_ms = min(audio_length_ms, start_ms + max_segment_length_ms)
|
||||||
|
segment = audio[start_ms:end_ms]
|
||||||
|
segments.append(segment)
|
||||||
|
file_prefix = file_path[: file_path.rindex(".")]
|
||||||
|
format = file_path[file_path.rindex(".") + 1 :]
|
||||||
|
files = []
|
||||||
|
for i, segment in enumerate(segments):
|
||||||
|
path = f"{file_prefix}_{i+1}" + f".{format}"
|
||||||
|
segment.export(path, format=format)
|
||||||
|
files.append(path)
|
||||||
|
return files
|
||||||
|
|||||||
Reference in New Issue
Block a user