#!/usr/bin/env python3
# -*- coding: UTF-8 -*-
"""
@author : [email protected]
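@des : Audio-processing helpers built on pydub (load, cut, merge, export, silence detection, timestamp conversion).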
"""
from typing import Iterator, List, Tuple

from pydub import AudioSegment
from pydub.silence import detect_silence

from sdk.utils.util_file import FileProcess
class VoiceProcess:
    """Audio-processing helper built on pydub.

    Wraps common ``AudioSegment`` operations (load, slice, concatenate,
    export, gain, resample, silence detection) and converts between
    millisecond counts and ``HH:MM:SS.mmm`` timestamps. Positions and
    durations are expressed in milliseconds unless stated otherwise.

    NOTE: several method names carry historical misspellings
    (``read_vioce``, ``adjust_vioce``, ``merge_videos``, ``save_video``).
    They are kept unchanged because they are the public interface.
    """

    def __init__(self):
        # File helper; this class only calls its get_file_tail() method.
        self.Pfile = FileProcess()

    def read_vioce(self, file: str) -> "AudioSegment":
        """Load an audio file.

        The ``format`` handed to pydub is whatever
        ``self.Pfile.get_file_tail(file)`` returns -- presumably the file
        extension without the dot (TODO confirm against FileProcess).

        :param file: path of the audio file to read
        :return: the decoded audio
        """
        return AudioSegment.from_file(
            file, format=self.Pfile.get_file_tail(file))

    def get_total_duration(self, audio) -> int:
        """Return the length of ``audio`` in whole milliseconds.

        :param audio: object exposing ``duration_seconds``
        :return: duration in milliseconds, rounded to the nearest integer
        """
        # duration_seconds is fractional; round so the result really is the
        # int promised by the signature and usable as a slice position.
        return round(audio.duration_seconds * 1000)

    def cut_voice(self, audio: "AudioSegment", begin: int,
                  end: int) -> "AudioSegment":
        """Return the part of ``audio`` between two positions.

        :param audio: audio to slice
        :param begin: start position in milliseconds
        :param end: end position in milliseconds (exclusive)
        :return: the sliced audio
        """
        return audio[begin:end]

    def merge_videos(self, voice_lists: List["AudioSegment"]) -> "AudioSegment":
        """Concatenate audio segments in order.

        :param voice_lists: segments to join, in playback order
        :return: one segment containing all inputs back to back; an empty
            segment when ``voice_lists`` is empty
        """
        if not voice_lists:
            # sum([]) would return the int 0 rather than an AudioSegment.
            return AudioSegment.empty()
        # sum() starts from 0; this relies on the segments accepting
        # ``0 + segment`` (pydub implements __radd__ for this purpose).
        return sum(voice_lists)

    def save_video(self, audio: "AudioSegment", save_file: str):
        """Write ``audio`` to ``save_file``.

        The export format is whatever
        ``self.Pfile.get_file_tail(save_file)`` returns -- presumably the
        file extension (TODO confirm against FileProcess).

        :param audio: audio to export
        :param save_file: destination path
        :return: None
        """
        audio.export(save_file, format=self.Pfile.get_file_tail(save_file))

    def adjust_vioce(self, audio: "AudioSegment", num: int) -> "AudioSegment":
        """Adjust the volume of ``audio``.

        :param audio: audio to adjust
        :param num: amount added to the segment; pydub treats
            ``segment + number`` as a gain change in dB (negative lowers)
        :return: the adjusted audio
        """
        return audio + num

    def get_sample_rate(self, audio: "AudioSegment") -> int:
        """Return the sample rate of ``audio``.

        :param audio: audio to inspect
        :return: the segment's ``frame_rate``
        """
        return audio.frame_rate

    def resample_voice(self, audio: "AudioSegment", rate: int) -> "AudioSegment":
        """Resample ``audio`` to a new sample rate.

        :param audio: audio to resample
        :param rate: target sample rate
        :return: the resampled audio
        """
        return audio.set_frame_rate(rate)

    def get_blank_voice(self, audio: "AudioSegment",
                        min_len: int = 3000,
                        db: int = -35) -> Iterator[Tuple[int, int]]:
        """Yield the silent stretches found in ``audio``.

        This is a generator, so detection only runs once iteration starts.

        :param audio: audio to scan
        :param min_len: minimum length in milliseconds for a stretch to
            count as silence
        :param db: silence threshold passed to pydub as ``silence_thresh``
        :return: iterator of ``(start_ms, end_ms)`` tuples, one per silent
            stretch
        """
        # Keyword arguments on purpose: pydub's positional order is
        # (min_silence_len, silence_thresh), so passing (db, min_len)
        # positionally swaps the threshold and the minimum length.
        silence_ranges = detect_silence(
            audio, min_silence_len=min_len, silence_thresh=db, seek_step=1)
        for start, end in silence_ranges:
            yield (start, end)

    def ms_timedelete(self, millis: int) -> str:
        """Format a millisecond count as ``HH:MM:SS.mmm``.

        Hours are not wrapped at 24, so long durations stay unambiguous
        (90000000 ms becomes ``25:00:00.000``). Fractional milliseconds are
        truncated.

        :param millis: non-negative duration in milliseconds
        :return: zero-padded timestamp with a three-digit millisecond field
        :raises ValueError: if ``millis`` is negative
        """
        if millis < 0:
            raise ValueError(
                "millis must be non-negative, got {!r}".format(millis))
        total_seconds, msec = divmod(int(millis), 1000)
        total_minutes, seconds = divmod(total_seconds, 60)
        hours, minutes = divmod(total_minutes, 60)
        return "{:02d}:{:02d}:{:02d}.{:03d}".format(
            hours, minutes, seconds, msec)

    def voice_time_ms(self, time_voice: str) -> int:
        """Convert an ``HH:MM:SS[.mmm]`` timestamp to milliseconds.

        Inverse of :meth:`ms_timedelete`. The part after the dot is read as
        a decimal fraction of a second, so ``.5`` means 500 ms; digits
        beyond millisecond precision are dropped.

        :param time_voice: timestamp such as ``"01:02:03.004"``
        :return: the equivalent number of milliseconds
        :raises ValueError: if the text is not ``HH:MM:SS`` with an optional
            fractional part, or a field is not an integer
        """
        clock, _, fraction = time_voice.strip().partition(".")
        fields = clock.split(":")
        if len(fields) != 3:
            raise ValueError(
                "expected 'HH:MM:SS[.mmm]', got {!r}".format(time_voice))
        hours, minutes, seconds = (int(field) for field in fields)
        # Normalise the fraction to exactly three digits so ".5" -> 500 ms
        # and ".005" -> 5 ms.
        msec = int(fraction[:3].ljust(3, "0")) if fraction else 0
        return ((hours * 60 + minutes) * 60 + seconds) * 1000 + msec

    def process(self):
        """Hook for subclasses: override to implement the audio pipeline.

        The base implementation does nothing.

        :return: None
        """
        pass
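# Article title: Python audio processing utility library
# Reposted from blog.csdn.net/CXY00000/article/details/130711402
# (Web-page navigation residue followed here: "You may also like", "Today's picks", "Weekly ranking".)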