All checks were successful
ci/woodpecker/tag/woodpecker Pipeline was successful
- 新增 monoToStereoReader 将单声道 WAV 实时转换为立体声 - PlayWav 自动检测单声道并应用转换管线 - 添加完整的单元测试覆盖转换逻辑 - 整理 import 顺序(goimports) Co-authored-by: Qwen-Coder <qwen-coder@alibabacloud.com>
179 lines
4.1 KiB
Go
179 lines
4.1 KiB
Go
package audio
|
|
|
|
import (
|
|
"bytes"
|
|
"context"
|
|
"fmt"
|
|
"io"
|
|
"time"
|
|
|
|
"github.com/hajimehoshi/go-mp3"
|
|
"github.com/youpy/go-wav"
|
|
"go.uber.org/zap"
|
|
)
|
|
|
|
// monoToStereoReader 将单声道音频转换为立体声
|
|
type monoToStereoReader struct {
|
|
src io.Reader
|
|
buf []byte
|
|
}
|
|
|
|
func (m *monoToStereoReader) Read(p []byte) (int, error) {
|
|
maxSamples := len(p) / 4
|
|
if maxSamples == 0 {
|
|
return 0, nil
|
|
}
|
|
|
|
// 按需分配缓冲区
|
|
if cap(m.buf) < maxSamples*2 {
|
|
m.buf = make([]byte, maxSamples*2)
|
|
}
|
|
|
|
// 读取单声道数据
|
|
n, err := m.src.Read(m.buf[:maxSamples*2])
|
|
if n == 0 {
|
|
return 0, err
|
|
}
|
|
|
|
// 单声道→立体声:复制每个样本到左右声道
|
|
samples := n / 2
|
|
for i := range samples {
|
|
base := i * 4
|
|
mono := i * 2
|
|
p[base] = m.buf[mono] // 左声道低字节
|
|
p[base+1] = m.buf[mono+1] // 左声道高字节
|
|
p[base+2] = m.buf[mono] // 右声道低字节
|
|
p[base+3] = m.buf[mono+1] // 右声道高字节
|
|
}
|
|
|
|
if err == io.EOF {
|
|
return samples * 4, io.EOF
|
|
}
|
|
return samples * 4, nil
|
|
}
|
|
|
|
// PlayWav 播放 WAV 文件(阻塞),直到完成或 context 取消
|
|
func PlayWav(ctx context.Context, r io.ReadCloser) error {
|
|
// Read the entire file into memory since wav.NewReader needs ReadAt
|
|
data, err := io.ReadAll(r)
|
|
if err != nil {
|
|
r.Close()
|
|
return fmt.Errorf("读取 WAV 文件失败: %w", err)
|
|
}
|
|
r.Close()
|
|
|
|
// Create a reader from the buffered data
|
|
dec := wav.NewReader(bytes.NewReader(data))
|
|
|
|
// 获取音频格式信息
|
|
format, err := dec.Format()
|
|
if err != nil {
|
|
return fmt.Errorf("获取 WAV 格式失败: %w", err)
|
|
}
|
|
|
|
duration, _ := dec.Duration()
|
|
sourceRate := int(format.SampleRate)
|
|
channels := int(format.NumChannels)
|
|
|
|
zap.S().Infof("WAV 音频: %d ch, %d Hz, 时长: %v", channels, sourceRate, duration)
|
|
|
|
// 构建处理管线:单声道转换 → 重采样
|
|
reader := io.Reader(dec)
|
|
if channels == 1 {
|
|
zap.S().Infof("单声道转立体声: 1 ch → 2 ch")
|
|
reader = &monoToStereoReader{src: dec}
|
|
channels = DefaultChannelCount
|
|
}
|
|
|
|
if needsResampling(sourceRate) {
|
|
zap.S().Infof("Sinc 重采样: %d Hz → %d Hz, %d ch", sourceRate, UniversalSampleRate, channels)
|
|
reader = newSincResampler(reader, sourceRate, UniversalSampleRate, channels)
|
|
}
|
|
|
|
otoCtx, err := initContext()
|
|
if err != nil {
|
|
return fmt.Errorf("音频上下文初始化失败: %w", err)
|
|
}
|
|
|
|
player := otoCtx.NewPlayer(reader)
|
|
defer player.Close()
|
|
|
|
player.Play()
|
|
|
|
// 等待播放完成
|
|
done := make(chan struct{})
|
|
go func() {
|
|
for !player.IsPlaying() {
|
|
time.Sleep(10 * time.Millisecond)
|
|
}
|
|
for player.IsPlaying() {
|
|
time.Sleep(10 * time.Millisecond)
|
|
}
|
|
time.Sleep(200 * time.Millisecond)
|
|
close(done)
|
|
}()
|
|
|
|
select {
|
|
case <-done:
|
|
return nil
|
|
case <-ctx.Done():
|
|
return ctx.Err()
|
|
}
|
|
}
|
|
|
|
// PlayMP3 播放 MP3 文件(阻塞),直到完成或 context 取消
|
|
func PlayMP3(ctx context.Context, r io.ReadCloser) error {
|
|
dec, err := mp3.NewDecoder(r)
|
|
if err != nil {
|
|
r.Close()
|
|
return fmt.Errorf("MP3 解码失败: %w", err)
|
|
}
|
|
defer r.Close()
|
|
|
|
// MP3 解码器信息
|
|
sampleRate := int(dec.SampleRate())
|
|
sampleCount := dec.Length()
|
|
channels := 2 // MP3 通常是立体声
|
|
duration := time.Duration(float64(sampleCount)/float64(sampleRate)*1000) * time.Millisecond
|
|
|
|
zap.S().Infof("MP3 音频: %d Hz → %d Hz, 时长约: %v",
|
|
sampleRate, UniversalSampleRate, duration)
|
|
|
|
// 需要重采样(使用 Sinc 高质量重采样)
|
|
var reader io.Reader = dec
|
|
if needsResampling(sampleRate) {
|
|
zap.S().Infof("Sinc 重采样: %d Hz → %d Hz", sampleRate, UniversalSampleRate)
|
|
reader = newSincResampler(dec, sampleRate, UniversalSampleRate, channels)
|
|
}
|
|
|
|
otoCtx, err := initContext()
|
|
if err != nil {
|
|
return fmt.Errorf("音频上下文初始化失败: %w", err)
|
|
}
|
|
|
|
player := otoCtx.NewPlayer(reader)
|
|
defer player.Close()
|
|
|
|
player.Play()
|
|
|
|
// 等待播放完成
|
|
done := make(chan struct{})
|
|
go func() {
|
|
for !player.IsPlaying() {
|
|
time.Sleep(10 * time.Millisecond)
|
|
}
|
|
for player.IsPlaying() {
|
|
time.Sleep(10 * time.Millisecond)
|
|
}
|
|
time.Sleep(200 * time.Millisecond)
|
|
close(done)
|
|
}()
|
|
|
|
select {
|
|
case <-done:
|
|
return nil
|
|
case <-ctx.Done():
|
|
return ctx.Err()
|
|
}
|
|
}
|