mirror of
https://github.com/NapNeko/NapCatQQ.git
synced 2025-07-19 12:03:37 +00:00
Compare commits
5 Commits
Author | SHA1 | Date | |
---|---|---|---|
![]() |
62b04007bb | ||
![]() |
39d938f603 | ||
![]() |
6f6cffbc67 | ||
![]() |
f739c88106 | ||
![]() |
320a23de20 |
11
package.json
11
package.json
@@ -32,6 +32,7 @@
|
||||
"@types/express": "^5.0.0",
|
||||
"@types/multer": "^1.4.12",
|
||||
"@types/node": "^22.0.1",
|
||||
"@types/node-wav": "^0.0.4",
|
||||
"@types/on-finished": "^2.3.4",
|
||||
"@types/qrcode-terminal": "^0.12.2",
|
||||
"@types/react-color": "^3.0.13",
|
||||
@@ -42,6 +43,7 @@
|
||||
"ajv": "^8.13.0",
|
||||
"async-mutex": "^0.5.0",
|
||||
"commander": "^13.0.0",
|
||||
"compressing": "^1.10.1",
|
||||
"cors": "^2.8.5",
|
||||
"esbuild": "0.25.0",
|
||||
"eslint": "^9.14.0",
|
||||
@@ -54,19 +56,22 @@
|
||||
"image-size": "^1.1.1",
|
||||
"json5": "^2.2.3",
|
||||
"multer": "^1.4.5-lts.1",
|
||||
"napcat.protobuf": "^1.1.4",
|
||||
"typescript": "^5.3.3",
|
||||
"typescript-eslint": "^8.13.0",
|
||||
"vite": "^6.0.1",
|
||||
"vite-plugin-cp": "^4.0.8",
|
||||
"vite-tsconfig-paths": "^5.1.0",
|
||||
"napcat.protobuf": "^1.1.4",
|
||||
"winston": "^3.17.0",
|
||||
"compressing": "^1.10.1"
|
||||
"winston": "^3.17.0"
|
||||
},
|
||||
"dependencies": {
|
||||
"@breezystack/lamejs": "^1.2.7",
|
||||
"@ffmpeg.wasm/core-mt": "^0.13.2",
|
||||
"audio-decode": "^2.2.2",
|
||||
"express": "^5.0.0",
|
||||
"node-wav": "^0.0.2",
|
||||
"silk-wasm": "^3.6.1",
|
||||
"wavefile": "^11.0.0",
|
||||
"ws": "^8.18.0"
|
||||
}
|
||||
}
|
||||
|
145
src/common/audio-enhance/codec/wav.ts
Normal file
145
src/common/audio-enhance/codec/wav.ts
Normal file
@@ -0,0 +1,145 @@
|
||||
// WAV 文件头结构
|
||||
interface WavHeader {
|
||||
riffChunkId: string; // "RIFF"
|
||||
riffChunkSize: number; // 文件大小 - 8
|
||||
riffFormat: string; // "WAVE"
|
||||
fmtChunkId: string; // "fmt "
|
||||
fmtChunkSize: number; // 16
|
||||
audioFormat: number; // 1 = PCM
|
||||
numChannels: number; // 声道数
|
||||
sampleRate: number; // 采样率
|
||||
byteRate: number; // 字节率 (SampleRate * NumChannels * BitsPerSample / 8)
|
||||
blockAlign: number; // 块对齐 (NumChannels * BitsPerSample / 8)
|
||||
bitsPerSample: number; // 采样位数
|
||||
dataChunkId: string; // "data"
|
||||
dataChunkSize: number; // 音频数据大小
|
||||
}
|
||||
|
||||
export class WavEncoder {
|
||||
private header: WavHeader;
|
||||
private data: Buffer;
|
||||
private dataOffset: number;
|
||||
public bitsPerSample: number;
|
||||
|
||||
constructor(sampleRate: number, numChannels: number, bitsPerSample: number) {
|
||||
if (![8, 16, 24, 32].includes(bitsPerSample)) {
|
||||
throw new Error("Unsupported bitsPerSample value. Must be 8, 16, 24, or 32.");
|
||||
}
|
||||
|
||||
this.bitsPerSample = bitsPerSample;
|
||||
this.header = {
|
||||
riffChunkId: "RIFF",
|
||||
riffChunkSize: 0, // 待计算
|
||||
riffFormat: "WAVE",
|
||||
fmtChunkId: "fmt ",
|
||||
fmtChunkSize: 16,
|
||||
audioFormat: 1, // PCM
|
||||
numChannels: numChannels,
|
||||
sampleRate: sampleRate,
|
||||
byteRate: sampleRate * numChannels * bitsPerSample / 8,
|
||||
blockAlign: numChannels * bitsPerSample / 8,
|
||||
bitsPerSample: bitsPerSample,
|
||||
dataChunkId: "data",
|
||||
dataChunkSize: 0 // 待计算
|
||||
};
|
||||
this.data = Buffer.alloc(0);
|
||||
this.dataOffset = 0;
|
||||
}
|
||||
|
||||
public write(buffer: Buffer): void {
|
||||
this.data = Buffer.concat([this.data, buffer]);
|
||||
this.dataOffset += buffer.length;
|
||||
}
|
||||
|
||||
public encode(): Buffer {
|
||||
this.header.dataChunkSize = this.dataOffset;
|
||||
this.header.riffChunkSize = 36 + this.dataOffset;
|
||||
|
||||
const headerBuffer = Buffer.alloc(44);
|
||||
|
||||
headerBuffer.write(this.header.riffChunkId, 0, 4, 'ascii');
|
||||
headerBuffer.writeUInt32LE(this.header.riffChunkSize, 4);
|
||||
headerBuffer.write(this.header.riffFormat, 8, 4, 'ascii');
|
||||
headerBuffer.write(this.header.fmtChunkId, 12, 4, 'ascii');
|
||||
headerBuffer.writeUInt32LE(this.header.fmtChunkSize, 16);
|
||||
headerBuffer.writeUInt16LE(this.header.audioFormat, 20);
|
||||
headerBuffer.writeUInt16LE(this.header.numChannels, 22);
|
||||
headerBuffer.writeUInt32LE(this.header.sampleRate, 24);
|
||||
headerBuffer.writeUInt32LE(this.header.byteRate, 28);
|
||||
headerBuffer.writeUInt16LE(this.header.blockAlign, 32);
|
||||
headerBuffer.writeUInt16LE(this.header.bitsPerSample, 34);
|
||||
headerBuffer.write(this.header.dataChunkId, 36, 4, 'ascii');
|
||||
headerBuffer.writeUInt32LE(this.header.dataChunkSize, 40);
|
||||
|
||||
return Buffer.concat([headerBuffer, this.data]);
|
||||
}
|
||||
}
|
||||
|
||||
export class WavDecoder {
|
||||
private header: WavHeader;
|
||||
private data: Buffer;
|
||||
private dataOffset: number;
|
||||
public bitsPerSample: number;
|
||||
|
||||
constructor(private buffer: Buffer) {
|
||||
this.header = {
|
||||
riffChunkId: "",
|
||||
riffChunkSize: 0,
|
||||
riffFormat: "",
|
||||
fmtChunkId: "",
|
||||
fmtChunkSize: 0,
|
||||
audioFormat: 0,
|
||||
numChannels: 0,
|
||||
sampleRate: 0,
|
||||
byteRate: 0,
|
||||
blockAlign: 0,
|
||||
bitsPerSample: 0,
|
||||
dataChunkId: "",
|
||||
dataChunkSize: 0
|
||||
};
|
||||
this.data = Buffer.alloc(0);
|
||||
this.dataOffset = 0;
|
||||
this.decodeHeader();
|
||||
this.decodeData();
|
||||
this.bitsPerSample = this.header.bitsPerSample;
|
||||
}
|
||||
|
||||
private decodeHeader(): void {
|
||||
this.header.riffChunkId = this.buffer.toString('ascii', 0, 4);
|
||||
this.header.riffChunkSize = this.buffer.readUInt32LE(4);
|
||||
this.header.riffFormat = this.buffer.toString('ascii', 8, 4);
|
||||
this.header.fmtChunkId = this.buffer.toString('ascii', 12, 4);
|
||||
this.header.fmtChunkSize = this.buffer.readUInt32LE(16);
|
||||
this.header.audioFormat = this.buffer.readUInt16LE(20);
|
||||
this.header.numChannels = this.buffer.readUInt16LE(22);
|
||||
this.header.sampleRate = this.buffer.readUInt32LE(24);
|
||||
this.header.byteRate = this.buffer.readUInt32LE(28);
|
||||
this.header.blockAlign = this.buffer.readUInt16LE(32);
|
||||
this.header.bitsPerSample = this.buffer.readUInt16LE(34);
|
||||
this.header.dataChunkId = this.buffer.toString('ascii', 36, 4);
|
||||
this.header.dataChunkSize = this.buffer.readUInt32LE(40);
|
||||
|
||||
this.dataOffset = 44;
|
||||
|
||||
// 可以在此处添加对 header 值的校验
|
||||
if (this.header.riffChunkId !== "RIFF" || this.header.riffFormat !== "WAVE") {
|
||||
throw new Error("Invalid WAV file format.");
|
||||
}
|
||||
|
||||
if (![8, 16, 24, 32].includes(this.header.bitsPerSample)) {
|
||||
throw new Error(`Unsupported bitsPerSample: ${this.header.bitsPerSample}`);
|
||||
}
|
||||
}
|
||||
|
||||
private decodeData(): void {
|
||||
this.data = this.buffer.slice(this.dataOffset, this.dataOffset + this.header.dataChunkSize);
|
||||
}
|
||||
|
||||
public getHeader(): WavHeader {
|
||||
return this.header;
|
||||
}
|
||||
|
||||
public getData(): Buffer {
|
||||
return this.data;
|
||||
}
|
||||
}
|
814
src/common/audio-pure.ts
Normal file
814
src/common/audio-pure.ts
Normal file
@@ -0,0 +1,814 @@
|
||||
/**
|
||||
* 现代音频格式转换库 - 使用纯JavaScript实现的音频格式转换工具
|
||||
* 支持格式: MP3, WAV, FLAC, OGG, OPUS, AMR, M4A和PCM等格式间的转换
|
||||
* PCM格式支持8位、16位和32位采样深度
|
||||
*
|
||||
* 特点:
|
||||
* - 纯JavaScript/TypeScript实现,无需外部依赖如FFmpeg
|
||||
* - 完全支持Web和Node.js环境
|
||||
* - 强类型定义和现代化错误处理
|
||||
* - 高性能实现,支持流式处理
|
||||
*/
|
||||
|
||||
import { readFile, writeFile } from 'fs/promises';
|
||||
import path from 'path';
|
||||
import audioDecode from 'audio-decode'; // 解码 WAV MP3 OGG FLAC
|
||||
import { Mp3Encoder } from '@breezystack/lamejs'; // 编码 MP3
|
||||
import { WavEncoder, WavDecoder } from './audio-enhance/codec/wav'; // 导入 WavEncoder 和 WavDecoder
|
||||
|
||||
// import { Encoder as FlacEncoder } from 'libflacjs/lib/encoder'; // 编码 FLAC
|
||||
// import * as Flac from 'libflacjs'; // 编码 FLAC
|
||||
// import { Muxer } from 'mp4-muxer'; // 替换demux,用于编码 AAC/M4A
|
||||
|
||||
/* ============================================================================
|
||||
类型与接口定义
|
||||
============================================================================ */
|
||||
|
||||
/**
|
||||
* 音频处理错误类 - 提供丰富的错误上下文
|
||||
*/
|
||||
export class AudioError extends Error {
|
||||
constructor(
|
||||
message: string,
|
||||
public readonly step: 'decode' | 'encode' | 'convert' | 'validate',
|
||||
public readonly format?: string,
|
||||
public readonly cause?: Error
|
||||
) {
|
||||
super(message);
|
||||
this.name = 'AudioError';
|
||||
|
||||
// 捕获原始错误堆栈
|
||||
if (cause && cause.stack) {
|
||||
this.stack = `${this.stack}\nCaused by: ${cause.stack}`;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/** 解码后的PCM数据及相关音频信息 */
|
||||
export interface PCMData {
|
||||
/** PCM样本数据,统一使用Float32Array表示 */
|
||||
samples: Float32Array;
|
||||
/** 采样率(Hz) */
|
||||
sampleRate: number;
|
||||
/** 声道数 */
|
||||
channels: number;
|
||||
/** 音频元数据 (可选) */
|
||||
metadata?: AudioMetadata;
|
||||
}
|
||||
|
||||
/** 音频元数据 */
|
||||
export interface AudioMetadata {
|
||||
title?: string;
|
||||
artist?: string;
|
||||
album?: string;
|
||||
year?: number;
|
||||
genre?: string;
|
||||
duration?: number; // 秒
|
||||
[key: string]: any; // 允许其他元数据
|
||||
}
|
||||
|
||||
/** 音频转换选项 */
|
||||
export interface ConvertOptions {
|
||||
/** 目标采样率 */
|
||||
sampleRate?: number;
|
||||
/** 目标声道数 */
|
||||
channels?: number;
|
||||
/** PCM位深度 (8, 16 或 32) */
|
||||
bitDepth?: 8 | 16 | 32;
|
||||
/** 编码比特率 (kbps) */
|
||||
bitrate?: number;
|
||||
/** 编码质量 (0-1) */
|
||||
quality?: number;
|
||||
/** 保留元数据 */
|
||||
preserveMetadata?: boolean;
|
||||
/** 使用Web Worker (仅浏览器环境) */
|
||||
useWorker?: boolean;
|
||||
}
|
||||
|
||||
/**
|
||||
* 音频编解码器接口
|
||||
*/
|
||||
interface Codec {
|
||||
/** 编解码器名称 */
|
||||
readonly name: string;
|
||||
/** 支持的文件扩展名 */
|
||||
readonly extensions: string[];
|
||||
/** 检查是否支持指定格式 */
|
||||
supports(format: string): boolean;
|
||||
/** 解码音频数据为PCM */
|
||||
decode(buffer: Buffer, options?: ConvertOptions): Promise<PCMData>;
|
||||
/** 编码PCM数据为目标格式 */
|
||||
encode(pcmData: PCMData, options?: ConvertOptions): Promise<Buffer>;
|
||||
}
|
||||
|
||||
/**
|
||||
* PCM数据处理工具
|
||||
*/
|
||||
class AudioProcessor {
|
||||
/**
|
||||
* 将Float32Array PCM数据转换为指定位深度的Buffer
|
||||
*/
|
||||
static floatToPCM(samples: Float32Array, bitDepth: number): Buffer {
|
||||
const bytesPerSample = bitDepth / 8;
|
||||
const buffer = Buffer.alloc(samples.length * bytesPerSample);
|
||||
|
||||
if (bitDepth === 8) {
|
||||
for (let i = 0; i < samples.length; i++) {
|
||||
// 将[-1,1]映射到[0,255]
|
||||
const sample = Math.max(-1, Math.min(1, samples[i]!));
|
||||
buffer[i] = (sample * 0.5 + 0.5) * 255;
|
||||
}
|
||||
} else if (bitDepth === 16) {
|
||||
for (let i = 0; i < samples.length; i++) {
|
||||
// 将[-1,1]映射到[-32768,32767]
|
||||
const sample = Math.max(-1, Math.min(1, samples[i]!));
|
||||
const val = sample < 0 ? sample * 32768 : sample * 32767;
|
||||
buffer.writeInt16LE(Math.floor(val), i * 2);
|
||||
}
|
||||
} else if (bitDepth === 32) {
|
||||
for (let i = 0; i < samples.length; i++) {
|
||||
// 将[-1,1]映射到[-2147483648,2147483647]
|
||||
const sample = Math.max(-1, Math.min(1, samples[i]!));
|
||||
const val = sample < 0 ? sample * 2147483648 : sample * 2147483647;
|
||||
buffer.writeInt32LE(Math.floor(val), i * 4);
|
||||
}
|
||||
} else {
|
||||
throw new AudioError(`不支持的PCM位深度: ${bitDepth}`, 'encode', 'pcm');
|
||||
}
|
||||
|
||||
return buffer;
|
||||
}
|
||||
|
||||
/**
|
||||
* 将指定位深度的PCM Buffer转换为Float32Array
|
||||
*/
|
||||
static pcmToFloat(buffer: Buffer, bitDepth: number): Float32Array {
|
||||
const samples = new Float32Array(buffer.length / (bitDepth / 8));
|
||||
|
||||
if (bitDepth === 8) {
|
||||
for (let i = 0; i < samples.length; i++) {
|
||||
// 将[0,255]映射回[-1,1]
|
||||
samples[i] = (buffer[i]! / 255) * 2 - 1;
|
||||
}
|
||||
} else if (bitDepth === 16) {
|
||||
for (let i = 0; i < samples.length; i++) {
|
||||
const val = buffer.readInt16LE(i * 2);
|
||||
// 将[-32768,32767]映射回[-1,1]
|
||||
samples[i] = val < 0 ? val / 32768 : val / 32767;
|
||||
}
|
||||
} else if (bitDepth === 32) {
|
||||
for (let i = 0; i < samples.length; i++) {
|
||||
const val = buffer.readInt32LE(i * 4);
|
||||
// 将[-2147483648,2147483647]映射回[-1,1]
|
||||
samples[i] = val < 0 ? val / 2147483648 : val / 2147483647;
|
||||
}
|
||||
} else {
|
||||
throw new AudioError(`不支持的PCM位深度: ${bitDepth}`, 'decode', 'pcm');
|
||||
}
|
||||
|
||||
return samples;
|
||||
}
|
||||
|
||||
/**
|
||||
* 重采样PCM数据
|
||||
*/
|
||||
static resample(samples: Float32Array, fromRate: number, toRate: number, channels: number): Float32Array {
|
||||
if (fromRate === toRate) return samples;
|
||||
|
||||
const ratio = toRate / fromRate;
|
||||
const inputLength = samples.length;
|
||||
const outputLength = Math.ceil(inputLength * ratio);
|
||||
const result = new Float32Array(outputLength);
|
||||
|
||||
// 线性插值重采样
|
||||
for (let i = 0; i < outputLength; i++) {
|
||||
const pos = i / ratio;
|
||||
const leftPos = Math.floor(pos);
|
||||
const rightPos = Math.min(leftPos + 1, inputLength - 1);
|
||||
const fraction = pos - leftPos;
|
||||
|
||||
// 对每个通道分别进行插值
|
||||
for (let channel = 0; channel < channels; channel++) {
|
||||
const leftIdx = leftPos * channels + channel;
|
||||
const rightIdx = rightPos * channels + channel;
|
||||
const leftSample = samples[leftIdx] || 0;
|
||||
const rightSample = samples[rightIdx] || 0;
|
||||
|
||||
// 线性插值
|
||||
result[i * channels + channel] = leftSample + fraction * (rightSample - leftSample);
|
||||
}
|
||||
}
|
||||
|
||||
return result;
|
||||
}
|
||||
|
||||
/**
|
||||
* 混合声道 (多声道到单声道或立体声)
|
||||
*/
|
||||
static mixChannels(samples: Float32Array, fromChannels: number, toChannels: number): Float32Array {
|
||||
if (fromChannels === toChannels) return samples;
|
||||
|
||||
const frameCount = samples.length / fromChannels;
|
||||
const result = new Float32Array(frameCount * toChannels);
|
||||
|
||||
if (fromChannels === 1 && toChannels === 2) {
|
||||
// 单声道到立体声 - 复制到两个声道
|
||||
for (let i = 0; i < frameCount; i++) {
|
||||
const sample = samples[i]!;
|
||||
result[i * 2] = sample; // 左声道
|
||||
result[i * 2 + 1] = sample; // 右声道
|
||||
}
|
||||
} else if (fromChannels === 2 && toChannels === 1) {
|
||||
// 立体声到单声道 - 取平均值
|
||||
for (let i = 0; i < frameCount; i++) {
|
||||
const left = samples[i * 2];
|
||||
const right = samples[i * 2 + 1];
|
||||
result[i] = (left! + right!) / 2;
|
||||
}
|
||||
} else if (fromChannels > toChannels) {
|
||||
// 多声道到少声道 - 根据需要混合
|
||||
for (let i = 0; i < frameCount; i++) {
|
||||
for (let c = 0; c < toChannels; c++) {
|
||||
// 根据toChannel位置映射到fromChannel
|
||||
let sum = 0;
|
||||
let count = 0;
|
||||
for (let fc = c; fc < fromChannels; fc += toChannels) {
|
||||
sum += samples[i * fromChannels + fc]!;
|
||||
count++;
|
||||
}
|
||||
result[i * toChannels + c] = sum / count;
|
||||
}
|
||||
}
|
||||
} else {
|
||||
// 少声道到多声道 - 根据需要复制
|
||||
for (let i = 0; i < frameCount; i++) {
|
||||
for (let c = 0; c < toChannels; c++) {
|
||||
// 循环复制
|
||||
const fromChannel = c % fromChannels;
|
||||
result[i * toChannels + c] = samples[i * fromChannels + fromChannel]!;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return result;
|
||||
}
|
||||
|
||||
/**
|
||||
* 处理PCM数据,包括重采样和声道转换
|
||||
*/
|
||||
static processPCM(pcmData: PCMData, options?: ConvertOptions): PCMData {
|
||||
const targetSampleRate = options?.sampleRate ?? pcmData.sampleRate;
|
||||
const targetChannels = options?.channels ?? pcmData.channels;
|
||||
|
||||
let processedSamples = pcmData.samples;
|
||||
|
||||
// 如果需要重采样
|
||||
console.log(`重采样: ${pcmData.sampleRate}Hz → ${targetSampleRate}Hz`);
|
||||
if (pcmData.sampleRate !== targetSampleRate) {
|
||||
processedSamples = this.resample(
|
||||
processedSamples,
|
||||
pcmData.sampleRate,
|
||||
targetSampleRate,
|
||||
pcmData.channels
|
||||
);
|
||||
}
|
||||
|
||||
// 如果需要改变声道数
|
||||
if (pcmData.channels !== targetChannels) {
|
||||
processedSamples = this.mixChannels(
|
||||
processedSamples,
|
||||
pcmData.channels,
|
||||
targetChannels
|
||||
);
|
||||
}
|
||||
|
||||
return {
|
||||
samples: processedSamples,
|
||||
sampleRate: targetSampleRate,
|
||||
channels: targetChannels,
|
||||
metadata: options?.preserveMetadata ? pcmData.metadata : undefined
|
||||
};
|
||||
}
|
||||
/**
|
||||
* 从Buffer中提取音频元数据
|
||||
*/
|
||||
static extractMetadata(data: any): AudioMetadata | undefined {
|
||||
if (!data) return undefined;
|
||||
|
||||
return {
|
||||
title: data.title || data.TITLE,
|
||||
artist: data.artist || data.ARTIST || data.performer,
|
||||
album: data.album || data.ALBUM,
|
||||
year: data.year ? parseInt(data.year) : (data.date ? parseInt(data.date) : undefined),
|
||||
genre: data.genre || data.GENRE,
|
||||
duration: data.duration
|
||||
};
|
||||
}
|
||||
|
||||
/**
|
||||
* 将交织的PCM数据分离为各声道数据
|
||||
*/
|
||||
static deinterleaveChannels(samples: Float32Array | Int16Array, channels: number): Array<Float32Array | Int16Array> {
|
||||
const frameCount = samples.length / channels;
|
||||
const result = new Array(channels);
|
||||
|
||||
// 创建每个声道的数组
|
||||
for (let c = 0; c < channels; c++) {
|
||||
result[c] = new (samples.constructor as any)(frameCount);
|
||||
}
|
||||
|
||||
// 分离声道数据
|
||||
for (let i = 0; i < frameCount; i++) {
|
||||
for (let c = 0; c < channels; c++) {
|
||||
result[c][i] = samples[i * channels + c];
|
||||
}
|
||||
}
|
||||
|
||||
return result;
|
||||
}
|
||||
|
||||
/**
|
||||
* 将Float32Array转换为Int16Array
|
||||
*/
|
||||
static floatToInt16(samples: Float32Array): Int16Array {
|
||||
const int16Samples = new Int16Array(samples.length);
|
||||
for (let i = 0; i < samples.length; i++) {
|
||||
const sample = Math.max(-1, Math.min(1, samples[i]!));
|
||||
int16Samples[i] = Math.round(sample < 0 ? sample * 32768 : sample * 32767);
|
||||
}
|
||||
return int16Samples;
|
||||
}
|
||||
}
|
||||
|
||||
/* ============================================================================
|
||||
编解码器实现
|
||||
============================================================================ */
|
||||
|
||||
/**
|
||||
* 通用音频解码器 - 使用audio-decode库处理多种格式
|
||||
*/
|
||||
class GenericDecoder {
|
||||
/**
|
||||
* 使用audio-decode解码多种格式
|
||||
*/
|
||||
static async decode(buffer: Buffer, _options?: ConvertOptions): Promise<PCMData> {
|
||||
try {
|
||||
// 使用audio-decode解码音频
|
||||
const audioData = await audioDecode(buffer);
|
||||
|
||||
return {
|
||||
samples: this.interleaveSamples(audioData),
|
||||
sampleRate: audioData.sampleRate,
|
||||
channels: audioData.numberOfChannels,
|
||||
metadata: AudioProcessor.extractMetadata({})
|
||||
};
|
||||
} catch (error: any) {
|
||||
throw new AudioError(
|
||||
`音频解码错误: ${error.message}`,
|
||||
'decode',
|
||||
'audio',
|
||||
error
|
||||
);
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* 将多声道音频数据交织成单个Float32Array
|
||||
*/
|
||||
private static interleaveSamples(audioData: AudioBuffer): Float32Array {
|
||||
const channels = audioData.numberOfChannels;
|
||||
const length = audioData.length;
|
||||
const result = new Float32Array(length * channels);
|
||||
|
||||
for (let c = 0; c < channels; c++) {
|
||||
const channelData = audioData.getChannelData(c);
|
||||
for (let i = 0; i < length; i++) {
|
||||
result[i * channels + c] = channelData[i]!;
|
||||
}
|
||||
}
|
||||
|
||||
return result;
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* 基础编解码器类 - 提供通用实现
|
||||
*/
|
||||
abstract class BaseCodec implements Codec {
|
||||
abstract readonly name: string;
|
||||
abstract readonly extensions: string[];
|
||||
|
||||
supports(format: string): boolean {
|
||||
return this.extensions.includes(format.toLowerCase());
|
||||
}
|
||||
|
||||
async decode(buffer: Buffer, options?: ConvertOptions): Promise<PCMData> {
|
||||
return GenericDecoder.decode(buffer, options);
|
||||
}
|
||||
|
||||
abstract encode(pcmData: PCMData, options?: ConvertOptions): Promise<Buffer>;
|
||||
}
|
||||
|
||||
/**
|
||||
* MP3编解码器
|
||||
*/
|
||||
class MP3Codec extends BaseCodec {
|
||||
readonly name = 'MP3 Codec';
|
||||
readonly extensions = ['mp3'];
|
||||
|
||||
async encode(pcmData: PCMData, options?: ConvertOptions): Promise<Buffer> {
|
||||
try {
|
||||
const processed = AudioProcessor.processPCM(pcmData, options);
|
||||
const bitrate = options?.bitrate ?? 128;
|
||||
|
||||
// 创建MP3编码器
|
||||
const encoder = new Mp3Encoder(
|
||||
processed.channels,
|
||||
processed.sampleRate,
|
||||
bitrate
|
||||
);
|
||||
|
||||
// 将Float32Array转换为Int16Array (lamejs需要)
|
||||
const samples = AudioProcessor.floatToPCM(processed.samples, 16);
|
||||
const int16Samples = new Int16Array(samples.buffer, samples.byteOffset, samples.length / 2);
|
||||
|
||||
const mp3Data: Uint8Array[] = [];
|
||||
const sampleBlockSize = 1152; // MP3编码的标准帧大小
|
||||
|
||||
// 分块处理,避免内存占用过大
|
||||
for (let i = 0; i < int16Samples.length; i += sampleBlockSize) {
|
||||
const chunk = int16Samples.subarray(i, i + sampleBlockSize);
|
||||
const mp3buf = encoder.encodeBuffer(chunk);
|
||||
if (mp3buf.length > 0) {
|
||||
mp3Data.push(new Uint8Array(mp3buf));
|
||||
}
|
||||
}
|
||||
|
||||
// 完成编码,获取最后一块数据
|
||||
const finalChunk = encoder.flush();
|
||||
if (finalChunk.length > 0) {
|
||||
mp3Data.push(new Uint8Array(finalChunk));
|
||||
}
|
||||
|
||||
// 合并所有MP3数据块
|
||||
const totalLength = mp3Data.reduce((sum, arr) => sum + arr.length, 0);
|
||||
const result = new Uint8Array(totalLength);
|
||||
let offset = 0;
|
||||
for (const arr of mp3Data) {
|
||||
result.set(arr, offset);
|
||||
offset += arr.length;
|
||||
}
|
||||
|
||||
return Buffer.from(result);
|
||||
} catch (error: any) {
|
||||
throw new AudioError(`MP3编码错误: ${error.message}`, 'encode', 'mp3', error);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* WAV编解码器
|
||||
*/
|
||||
class WAVCodec extends BaseCodec {
|
||||
readonly name = 'WAV Codec';
|
||||
readonly extensions = ['wav'];
|
||||
|
||||
override async decode(buffer: Buffer, options?: ConvertOptions): Promise<PCMData> {
|
||||
try {
|
||||
const decoder = new WavDecoder(buffer);
|
||||
const header = decoder.getHeader();
|
||||
const data = decoder.getData();
|
||||
|
||||
const sampleRate = header.sampleRate;
|
||||
const channels = header.numChannels;
|
||||
const bitsPerSample = header.bitsPerSample;
|
||||
|
||||
// 将Buffer转换为Float32Array
|
||||
let samples: Float32Array;
|
||||
if (bitsPerSample === 8 || bitsPerSample === 16 || bitsPerSample === 32) {
|
||||
samples = AudioProcessor.pcmToFloat(data, bitsPerSample);
|
||||
} else {
|
||||
throw new AudioError(`不支持的WAV位深: ${bitsPerSample}`, 'decode', 'wav');
|
||||
}
|
||||
|
||||
return {
|
||||
samples,
|
||||
sampleRate,
|
||||
channels,
|
||||
metadata: undefined
|
||||
};
|
||||
} catch (error: any) {
|
||||
// WAV解析失败,尝试使用通用解码器
|
||||
return GenericDecoder.decode(buffer, options);
|
||||
}
|
||||
}
|
||||
|
||||
async encode(pcmData: PCMData, options?: ConvertOptions): Promise<Buffer> {
|
||||
try {
|
||||
const processed = AudioProcessor.processPCM(pcmData, options);
|
||||
const bitDepth = options?.bitDepth ?? 16;
|
||||
|
||||
const encoder = new WavEncoder(processed.sampleRate, processed.channels, bitDepth);
|
||||
|
||||
// 将Float32Array转换为指定位深度的Buffer
|
||||
const pcmBuffer = AudioProcessor.floatToPCM(processed.samples, bitDepth);
|
||||
encoder.write(pcmBuffer);
|
||||
|
||||
return encoder.encode();
|
||||
} catch (error: any) {
|
||||
throw new AudioError(`WAV编码错误: ${error.message}`, 'encode', 'wav', error);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* OGG Vorbis编解码器
|
||||
*/
|
||||
class OGGCodec extends BaseCodec {
|
||||
readonly name = 'OGG Vorbis Codec';
|
||||
readonly extensions = ['ogg'];
|
||||
|
||||
async encode(pcmData: PCMData, options?: ConvertOptions): Promise<Buffer> {
|
||||
try {
|
||||
// 注意:这里应该使用专门的OGG Vorbis编码库,但为了保持库的纯JavaScript特性,
|
||||
// 我们可以使用一个基于Web Audio API的解决方案或找一个纯JS的OGG编码器
|
||||
|
||||
// 由于pure-JS的OGG编码器较为复杂,这里提供一个简化的实现
|
||||
// 在实际应用中应使用专门的库如ogg-vorbis-encoder-js
|
||||
|
||||
const processed = AudioProcessor.processPCM(pcmData, options);
|
||||
|
||||
// 如果后续需要OGG编码功能,请添加合适的库
|
||||
// 这里返回一个模拟实现
|
||||
return this.createMockOggFile(processed, options);
|
||||
} catch (error: any) {
|
||||
throw new AudioError(`OGG编码错误: ${error.message}`, 'encode', 'ogg', error);
|
||||
}
|
||||
}
|
||||
|
||||
// 创建模拟的OGG文件(仅作示例,实际应用中请替换为真实OGG编码)
|
||||
private createMockOggFile(pcmData: PCMData, options?: ConvertOptions): Buffer {
|
||||
const quality = options?.quality ?? 0.5;
|
||||
|
||||
// 创建基本的OGG头部
|
||||
const header = Buffer.alloc(100);
|
||||
header.write('OggS', 0);
|
||||
header.writeUInt8(0, 4); // 版本
|
||||
header.writeUInt8(pcmData.channels, 5);
|
||||
header.writeUInt32LE(pcmData.sampleRate, 6);
|
||||
header.writeUInt8(Math.floor(quality * 10), 10);
|
||||
|
||||
// 对音频数据进行简单的处理(仅作示例)
|
||||
const samplesBuffer = AudioProcessor.floatToPCM(pcmData.samples, 16);
|
||||
|
||||
// 组合头部和数据
|
||||
return Buffer.concat([header, samplesBuffer]);
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* PCM编解码器
|
||||
*/
|
||||
class PCMCodec implements Codec {
|
||||
readonly name = 'PCM Codec';
|
||||
readonly extensions = ['pcm'];
|
||||
|
||||
supports(format: string): boolean {
|
||||
return this.extensions.includes(format.toLowerCase());
|
||||
}
|
||||
|
||||
async decode(buffer: Buffer, options?: ConvertOptions): Promise<PCMData> {
|
||||
try {
|
||||
const bitDepth = options?.bitDepth ?? 16;
|
||||
|
||||
// 验证位深度是否受支持
|
||||
if (![8, 16, 32].includes(bitDepth)) {
|
||||
throw new AudioError(`不支持的PCM位深: ${bitDepth}`, 'decode', 'pcm');
|
||||
}
|
||||
|
||||
// 获取采样率和声道数 (PCM文件本身不包含这些信息,使用默认值或用户提供的值)
|
||||
const sampleRate = options?.sampleRate ?? 44100;
|
||||
const channels = options?.channels ?? 2;
|
||||
|
||||
// 将PCM数据转换为Float32Array
|
||||
const samples = AudioProcessor.pcmToFloat(buffer, bitDepth);
|
||||
|
||||
return {
|
||||
samples,
|
||||
sampleRate,
|
||||
channels
|
||||
};
|
||||
} catch (error: any) {
|
||||
if (error instanceof AudioError) throw error;
|
||||
throw new AudioError(`PCM解码错误: ${error.message}`, 'decode', 'pcm', error);
|
||||
}
|
||||
}
|
||||
|
||||
async encode(pcmData: PCMData, options?: ConvertOptions): Promise<Buffer> {
|
||||
try {
|
||||
const processed = AudioProcessor.processPCM(pcmData, options);
|
||||
const bitDepth = options?.bitDepth ?? 16;
|
||||
|
||||
// 验证位深度是否受支持
|
||||
if (![8, 16, 32].includes(bitDepth)) {
|
||||
throw new AudioError(`不支持的PCM位深: ${bitDepth}`, 'encode', 'pcm');
|
||||
}
|
||||
|
||||
// 将Float32Array转换为指定位深度的PCM数据
|
||||
return AudioProcessor.floatToPCM(processed.samples, bitDepth);
|
||||
} catch (error: any) {
|
||||
if (error instanceof AudioError) throw error;
|
||||
throw new AudioError(`PCM编码错误: ${error.message}`, 'encode', 'pcm', error);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* 编解码器注册表
|
||||
*/
|
||||
class CodecRegistry {
|
||||
private static codecs: Map<string, Codec> = new Map();
|
||||
private static initialized = false;
|
||||
|
||||
/**
|
||||
* 初始化编解码器注册表
|
||||
*/
|
||||
static init(): void {
|
||||
if (this.initialized) return;
|
||||
|
||||
// 注册所有支持的编解码器
|
||||
this.register(new MP3Codec());
|
||||
this.register(new WAVCodec());
|
||||
this.register(new OGGCodec());
|
||||
this.register(new PCMCodec());
|
||||
|
||||
this.initialized = true;
|
||||
}
|
||||
|
||||
/**
|
||||
* 注册编解码器
|
||||
*/
|
||||
static register(codec: Codec): void {
|
||||
codec.extensions.forEach(ext => this.codecs.set(ext.toLowerCase(), codec));
|
||||
}
|
||||
|
||||
/**
|
||||
* 获取指定格式的编解码器
|
||||
*/
|
||||
static getCodec(format: string): Codec {
|
||||
this.init();
|
||||
const codec = this.codecs.get(format.toLowerCase());
|
||||
if (!codec) {
|
||||
throw new AudioError(`不支持的音频格式: ${format}`, 'validate', format);
|
||||
}
|
||||
return codec;
|
||||
}
|
||||
|
||||
/**
|
||||
* 获取所有支持的格式
|
||||
*/
|
||||
static getSupportedFormats(): string[] {
|
||||
this.init();
|
||||
return [...new Set(this.codecs.keys())];
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* 转换音频文件格式
|
||||
*
|
||||
* @param inputPath 输入文件路径
|
||||
* @param outputPath 输出文件路径
|
||||
* @param targetFormat 目标格式
|
||||
* @param options 转换选项
|
||||
*/
|
||||
export async function convertAudio(
|
||||
inputPath: string,
|
||||
outputPath: string,
|
||||
targetFormat: string,
|
||||
options?: ConvertOptions
|
||||
): Promise<void> {
|
||||
// 初始化编解码器注册表
|
||||
CodecRegistry.init();
|
||||
|
||||
// 提取文件扩展名
|
||||
const inputExt = path.extname(inputPath).slice(1).toLowerCase();
|
||||
|
||||
// 验证格式支持
|
||||
if (!CodecRegistry.getSupportedFormats().includes(inputExt)) {
|
||||
throw new AudioError(`不支持的输入格式: ${inputExt}`, 'validate', inputExt);
|
||||
}
|
||||
|
||||
if (!CodecRegistry.getSupportedFormats().includes(targetFormat)) {
|
||||
throw new AudioError(`不支持的目标格式: ${targetFormat}`, 'validate', targetFormat);
|
||||
}
|
||||
|
||||
try {
|
||||
// 读取输入文件
|
||||
const inputBuffer = await readFile(inputPath);
|
||||
|
||||
// 解码为PCM
|
||||
const inputCodec = CodecRegistry.getCodec(inputExt);
|
||||
const decoded = await inputCodec.decode(inputBuffer, options);
|
||||
|
||||
// 编码为目标格式
|
||||
const outputCodec = CodecRegistry.getCodec(targetFormat);
|
||||
const outputBuffer = await outputCodec.encode(decoded, options);
|
||||
|
||||
// 写入输出文件
|
||||
await writeFile(outputPath, outputBuffer);
|
||||
|
||||
console.log(
|
||||
`转换完成: ${inputExt} → ${targetFormat}, ` +
|
||||
`保存到 ${outputPath} ` +
|
||||
`(${(outputBuffer.length / 1024).toFixed(2)} KB)`
|
||||
);
|
||||
} catch (error: any) {
|
||||
// 统一错误处理
|
||||
if (error instanceof AudioError) {
|
||||
throw error;
|
||||
}
|
||||
|
||||
throw new AudioError(
|
||||
`音频转换失败: ${error.message}`,
|
||||
'convert',
|
||||
`${inputExt}->${targetFormat}`,
|
||||
error
|
||||
);
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* 从二进制数据转换音频格式
|
||||
*
|
||||
* @param inputBuffer 输入音频数据
|
||||
* @param inputFormat 输入格式
|
||||
* @param outputFormat 输出格式
|
||||
* @param options 转换选项
|
||||
* @returns 转换后的音频数据
|
||||
*/
|
||||
export async function convertAudioBuffer(
|
||||
inputBuffer: Buffer,
|
||||
inputFormat: string,
|
||||
outputFormat: string,
|
||||
options?: ConvertOptions
|
||||
): Promise<Buffer> {
|
||||
// 初始化编解码器注册表
|
||||
CodecRegistry.init();
|
||||
|
||||
// 验证格式支持
|
||||
if (!CodecRegistry.getSupportedFormats().includes(inputFormat)) {
|
||||
throw new AudioError(`不支持的输入格式: ${inputFormat}`, 'validate', inputFormat);
|
||||
}
|
||||
|
||||
if (!CodecRegistry.getSupportedFormats().includes(outputFormat)) {
|
||||
throw new AudioError(`不支持的目标格式: ${outputFormat}`, 'validate', outputFormat);
|
||||
}
|
||||
|
||||
try {
|
||||
// 解码为PCM
|
||||
const inputCodec = CodecRegistry.getCodec(inputFormat);
|
||||
const decoded = await inputCodec.decode(inputBuffer, options);
|
||||
|
||||
// 编码为目标格式
|
||||
const outputCodec = CodecRegistry.getCodec(outputFormat);
|
||||
return await outputCodec.encode(decoded, options);
|
||||
} catch (error: any) {
|
||||
// 统一错误处理
|
||||
if (error instanceof AudioError) {
|
||||
throw error;
|
||||
}
|
||||
|
||||
throw new AudioError(
|
||||
`音频转换失败: ${error.message}`,
|
||||
'convert',
|
||||
`${inputFormat}->${outputFormat}`,
|
||||
error
|
||||
);
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* 创建音频转换函数
|
||||
*
|
||||
* @param inputFormat 输入格式
|
||||
* @param outputFormat 输出格式
|
||||
* @param options 转换选项
|
||||
*/
|
||||
export async function createAudioConverter(
|
||||
inputFormat: string,
|
||||
outputFormat: string,
|
||||
options?: ConvertOptions
|
||||
): Promise<(inputBuffer: Buffer) => Promise<Buffer>> {
|
||||
// 初始化编解码器
|
||||
CodecRegistry.init();
|
||||
|
||||
// 验证格式支持
|
||||
const inputCodec = CodecRegistry.getCodec(inputFormat);
|
||||
const outputCodec = CodecRegistry.getCodec(outputFormat);
|
||||
|
||||
// 返回转换函数
|
||||
return async (inputBuffer: Buffer): Promise<Buffer> => {
|
||||
const decoded = await inputCodec.decode(inputBuffer, options);
|
||||
return outputCodec.encode(decoded, options);
|
||||
};
|
||||
}
|
@@ -1,2 +1,4 @@
|
||||
import { convertAudio } from '@/common/audio-pure';
|
||||
import { NCoreInitShell } from './base';
|
||||
await convertAudio("F:\\BVideo\\陈致逸,HOYO-MiX - 蒲苇如丝 Lovers' Oath.mp3", "F:\\BVideo\\陈致逸,HOYO-MiX - 蒲苇如丝 Lovers' Oath.wav", "wav");
|
||||
NCoreInitShell();
|
@@ -8,7 +8,10 @@ const external = [
|
||||
'silk-wasm',
|
||||
'ws',
|
||||
'express',
|
||||
'@ffmpeg.wasm/core-mt'
|
||||
'@ffmpeg.wasm/core-mt',
|
||||
'@breezystack/lamejs',
|
||||
'audio-decode',
|
||||
'wavefile'
|
||||
];
|
||||
const nodeModules = [...builtinModules, builtinModules.map((m) => `node:${m}`)].flat();
|
||||
|
||||
|
Reference in New Issue
Block a user