#!/usr/bin/env python3
# -*- coding: UTF-8 -*-
"""
@author : v_jiaohaicheng@baidu.com
@des : Audio processing helpers (read, cut, merge, export, resample, silence detection) built on pydub.
"""
from typing import Iterator, List, Tuple

from pydub import AudioSegment
from pydub.silence import detect_silence

from sdk.utils.util_file import FileProcess
class VoiceProcess:
    """
    Audio processing helpers built on top of pydub's ``AudioSegment``.

    Subclasses are expected to override :meth:`process` with their own
    pipeline. Several method names contain historical misspellings
    (``vioce``, ``video``); they are kept unchanged so existing callers
    keep working.
    """

    def __init__(self):
        # Helper used to derive the audio format from a file name.
        self.Pfile = FileProcess()

    def read_vioce(self, file: str) -> AudioSegment:
        """
        Load an audio file.

        :param file: path of the audio file to read
        :return: the decoded audio
        """
        # NOTE(review): get_file_tail presumably returns the file extension
        # (e.g. "wav"), which pydub uses as the container format -- confirm.
        return AudioSegment.from_file(
            file, format=self.Pfile.get_file_tail(file))

    def get_total_duration(self, audio) -> float:
        """
        Return the total duration of the audio.

        :param audio: object exposing ``duration_seconds``
        :return: duration in milliseconds (a float, since
            ``duration_seconds`` is multiplied by 1000 without rounding)
        """
        return audio.duration_seconds * 1000

    def cut_voice(self, audio: AudioSegment, begin: int,
                  end: int) -> AudioSegment:
        """
        Cut a slice out of the audio.

        :param audio: source audio
        :param begin: slice start, in milliseconds
        :param end: slice end, in milliseconds
        :return: the slice ``audio[begin:end]``
        """
        return audio[begin:end]

    def merge_videos(self, voice_lists: List[AudioSegment]) -> AudioSegment:
        """
        Concatenate audio segments in order.

        :param voice_lists: segments to join
        :return: the concatenated audio; an empty segment when
            ``voice_lists`` is empty
        """
        if not voice_lists:
            # sum([]) would return the int 0, which is not an AudioSegment.
            return AudioSegment.empty()
        return sum(voice_lists)

    def save_video(self, audio: AudioSegment, save_file: str):
        """
        Export the audio to a file.

        :param audio: audio to write
        :param save_file: destination path; the format is derived from it
            through ``FileProcess.get_file_tail``
        :return: None
        """
        exported = audio.export(
            save_file, format=self.Pfile.get_file_tail(save_file))
        # export() hands back the open output file; close it explicitly
        # instead of leaving that to garbage collection.
        exported.close()

    def adjust_vioce(self, audio: AudioSegment, num: int):
        """
        Adjust the volume.

        :param audio: source audio
        :param num: amount added to the audio (pydub treats a number added
            to a segment as a gain in dB; negative values lower the volume)
        :return: the result of ``audio + num``
        """
        return audio + num

    def get_sample_rate(self, audio: AudioSegment) -> int:
        """
        Return the sample rate of the audio.

        :param audio: source audio
        :return: ``audio.frame_rate``
        """
        return audio.frame_rate

    def resample_voice(self, audio: AudioSegment, rate: int) -> AudioSegment:
        """
        Resample the audio.

        :param audio: source audio
        :param rate: target sample rate
        :return: the resampled audio
        """
        return audio.set_frame_rate(rate)

    def get_blank_voice(self, audio: AudioSegment,
                        min_len: int = 3000,
                        db: int = -35) -> Iterator[Tuple[int, int]]:
        """
        Detect silent sections.

        This is a generator: detection runs when iteration starts.

        :param audio: audio to scan
        :param min_len: minimum length of a silent section, in milliseconds
        :param db: silence threshold in dBFS; anything quieter counts as
            silence
        :return: yields ``(start, end)`` for every silent section, in
            milliseconds
        """
        # Keyword arguments on purpose: detect_silence takes
        # (audio_segment, min_silence_len, silence_thresh, seek_step), so
        # passing (db, min_len) positionally swaps threshold and length.
        silence_ranges = detect_silence(
            audio,
            min_silence_len=min_len,
            silence_thresh=db,
            seek_step=1,
        )
        for start, end in silence_ranges:
            yield (start, end)

    def ms_timedelete(self, millis: int) -> str:
        """
        Convert milliseconds to an ``HH:MM:SS.mmm`` string.

        Hours are not wrapped at 24, so long durations keep their full
        value (e.g. 25 hours -> ``25:00:00.000``). Milliseconds are always
        zero-padded to three digits so that 5 ms reads ``.005`` and not
        ``.5``.

        :param millis: duration in milliseconds; fractional values are
            truncated, negative values get a leading ``-``
        :return: formatted time string
        """
        total = int(millis)
        sign = "-" if total < 0 else ""
        total_seconds, lay = divmod(abs(total), 1000)
        total_minutes, seconds = divmod(total_seconds, 60)
        hours, minutes = divmod(total_minutes, 60)
        return "{}{:02d}:{:02d}:{:02d}.{:03d}".format(
            sign, hours, minutes, seconds, lay)

    def voice_time_ms(self, time_voice: str) -> int:
        """
        Convert an ``HH:MM:SS.mmm`` string to milliseconds.

        The part after the dot is read as an integer number of
        milliseconds, matching the ``seconds.milliseconds`` format produced
        by :meth:`ms_timedelete`. The shorter forms ``MM:SS.mmm`` and
        ``SS.mmm`` are accepted as well, and the millisecond part may be
        omitted.

        :param time_voice: time string to parse
        :return: duration in milliseconds
        :raises ValueError: if the string has more than three
            colon-separated fields or a field is not an integer
        """
        text = time_voice.strip()
        negative = text.startswith("-")
        if negative:
            text = text[1:]

        clock, _, fraction = text.partition(".")
        fields = clock.split(":")
        if len(fields) > 3:
            raise ValueError(
                "invalid time string: {!r}".format(time_voice))

        # Fold hours/minutes/seconds into a single count of seconds.
        total_seconds = 0
        for field in fields:
            total_seconds = total_seconds * 60 + int(field)

        total = total_seconds * 1000 + (int(fraction) if fraction else 0)
        return -total if negative else total

    def process(self):
        """
        Hook for subclasses: override ``process`` to implement the actual
        audio handling. The base implementation does nothing.

        :return: None
        """
        pass
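# Copyright notice: this content was contributed by internet users, and the views expressed are the author's own. The hosting site only provides information storage, holds no ownership, and assumes no related legal liability. If you find content on the site that is suspected of infringement or of violating laws or regulations, report it by e-mail; once verified, it will be removed immediately.
# Article compiled by 极客之音; source link: https://www.bmabk.com/index.php/post/156855.html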