
HTML5 Audio Recording and Playback

Background

  • Internally we needed to build TTS and STT features on top of a third-party API, which meant recording and playing back audio in the browser, so I looked into the current audio APIs and put together a simple implementation.

Implementation

import { useEffect, useMemo, useState } from "react";

export type RecorderParam = {
  onEnd: (chunks: Blob[]) => void;
  onSpeakChange?: (rms: number) => void;
  onStreamChange?: (buffer: ArrayBuffer) => void; // pass this callback to consume streaming audio data; it receives the raw sample buffer
  mimeType?: string;
};

export class Recorder {
  chunks: Blob[];
  onEnd: (chunks: Blob[]) => void;
  onSpeakChange?: (rms: number) => void;
  onStreamChange?: (buffer: ArrayBuffer) => void;
  stream: MediaStream | null;
  mediaRecorder: MediaRecorder | null;
  audioContext: AudioContext | null;
  mediaStreamSource: MediaStreamAudioSourceNode | null;
  processor: ScriptProcessorNode | null;
  mimeType: string;
  isCancel: boolean; // whether the recording was cancelled
  constructor(param: RecorderParam) {
    const { onEnd, onSpeakChange, onStreamChange, mimeType } = param;
    this.chunks = [];
    this.onEnd = onEnd;
    this.onSpeakChange = onSpeakChange;
    this.onStreamChange = onStreamChange;
    this.stream = null;
    this.mediaRecorder = null;
    this.audioContext = null;
    this.mediaStreamSource = null;
    this.processor = null;
    this.isCancel = false;
    this.mimeType = mimeType || "audio/mp4"; // MediaRecorder on Safari currently only supports the MP4 container (see the isTypeSupported sketch below)
  }

  async start() {
    this.isCancel = false;
    this.stream = await navigator.mediaDevices.getUserMedia({ audio: true });
    this.audioContext = new AudioContext();
    this.mediaStreamSource = this.audioContext.createMediaStreamSource(
      this.stream
    );
    // ScriptProcessorNode is deprecated in favor of AudioWorklet, but AudioWorklet
    // needs to load a separate worklet module, which felt fragile on a slow network;
    // a sketch of that approach follows after the code.
    this.processor = this.audioContext.createScriptProcessor(2048, 1, 1);
    this.processor.onaudioprocess = (e) => {
      const buffer = e.inputBuffer.getChannelData(0);
      // use the peak sample of this block as a rough speaking-level indicator
      let rms = 0;
      for (let i = 0; i < buffer.length; i++) {
        rms = Math.max(rms, Math.abs(buffer[i]));
      }
      if (!this.isCancel) {
        this.onSpeakChange?.(rms);
        this.onStreamChange?.(buffer.slice().buffer as ArrayBuffer); // hand streaming consumers a copy of this block
      }
    };
    this.mediaStreamSource.connect(this.processor);
    this.processor.connect(this.audioContext.destination);

    this.mediaRecorder = new MediaRecorder(this.stream, {
      mimeType: this.mimeType,
    });
    this.mediaRecorder.ondataavailable = (event) => {
      this.chunks.push(event.data);
    };
    this.mediaRecorder.onstop = () => {
      if (!this.isCancel) {
        this.onEnd?.([...this.chunks]);
        this.onSpeakChange?.(0);
      }
      this.chunks = [];
    };
    this.mediaRecorder.start();
  }

  async stop() {
    if (this.mediaRecorder) {
      this.mediaRecorder.stop();
      this.mediaRecorder = null;
    }
    if (this.stream) {
      this.stream.getTracks().forEach((track) => track.stop());
      this.stream = null;
    }
    if (this.audioContext) {
      await this.audioContext.close();
      this.audioContext = null;
    }
    this.mediaStreamSource = null;
    this.processor = null;
  }

  // cancel the recording and discard the captured audio
  async cancel() {
    this.isCancel = true;
    await this.stop();
  }
}

export type GetRecorderFuncParam = {
  onEnd: (file: File) => void;
  onSpeakChange?: (rms: number) => void;
  mimeType?: string;
};

export const useRecordAudioFunc = (param: GetRecorderFuncParam) => {
  const { onEnd, onSpeakChange, mimeType = "audio/webm" } = param;

  const [recorder, setRecorder] = useState<Recorder>();

  useEffect(() => {
    setRecorder(
      new Recorder({
        mimeType, // forward the container choice to MediaRecorder
        onEnd: (chunks: Blob[]) => {
          const blob = new Blob(chunks, {
            type: mimeType,
          });
          const ext = mimeType.includes("mp4") ? "mp4" : "webm";
          const file = new File([blob], `record.${ext}`, {
            type: mimeType,
          });
          onEnd?.(file);
        },
        onSpeakChange: (rms: number) => {
          onSpeakChange?.(rms);
        },
      })
    );
  }, []);

  // no need to recreate these functions on every render
  return useMemo(
    () => ({
      start: () => recorder?.start(), // start recording
      stop: () => recorder?.stop(), // stop recording and emit the result
      cancel: () => recorder?.cancel(), // cancel recording and discard the result
    }),
    [recorder]
  );
};

export type AudioPlayerProps = {
  arrayBuffer: ArrayBuffer; // the encoded audio data to play
  rate: number; // playback rate
  onEnd: () => void; // called when playback ends
  onReady: () => void; // called once the audio has been decoded and can be played
};
export class AudioPlayer {
  audioBuffer: AudioBuffer | null;
  audioContext: AudioContext;
  source: AudioBufferSourceNode | null;
  startTime: number;
  offset: number;
  rate: number;
  isEndByStop: boolean;
  onEnd: () => void;
  onReady: () => void;
  constructor(props: AudioPlayerProps) {
    const { arrayBuffer, rate = 1, onEnd, onReady } = props;
    this.audioContext = new AudioContext();
    this.rate = rate;
    this.onEnd = onEnd;
    this.onReady = onReady;
    this.isEndByStop = false;
    this.startTime = 0;
    this.offset = 0;
    this.audioBuffer = null;
    this.source = null;
    this.audioContext.decodeAudioData(arrayBuffer).then((buffer) => {
      this.audioBuffer = buffer;
      this.onReady?.();
    });
  }

  start() {
    this.isEndByStop = false;
    this.source = this.audioContext.createBufferSource();
    this.source.buffer = this.audioBuffer;
    this.source.playbackRate.value = this.rate || 1;
    this.source.connect(this.audioContext.destination);
    this.source.onended = () => {
      if (!this.isEndByStop) {
        this.offset = 0; // playback finished naturally, reset the offset
      } else {
        // remember how far into the buffer we got; scale the elapsed
        // wall-clock time by the playback rate to get buffer time
        this.offset +=
          (this.audioContext.currentTime - this.startTime) * this.rate;
      }
      this.onEnd?.();
    };
    this.source.start(0, this.offset);
    this.startTime = this.audioContext.currentTime; // remember when playback started
  }

  stop() {
    if (this.source) {
      // playback was stopped manually
      this.isEndByStop = true;
      this.source.stop();
      this.source.disconnect(this.audioContext.destination);
      this.source = null;
    }
  }
}
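As mentioned in the comment on createScriptProcessor, ScriptProcessorNode is deprecated and AudioWorklet is the recommended replacement. Below is a minimal sketch of what that could look like; it is an assumption rather than part of the code above: the processor is inlined through a Blob URL so no extra worklet file has to be hosted, and the "level-meter" name and attachLevelMeter helper are made up for illustration.

const levelMeterSource = `
  class LevelMeterProcessor extends AudioWorkletProcessor {
    process(inputs) {
      const channel = inputs[0] && inputs[0][0];
      if (channel) {
        let sum = 0;
        for (let i = 0; i < channel.length; i++) sum += channel[i] * channel[i];
        // post the RMS of this block back to the main thread
        this.port.postMessage(Math.sqrt(sum / channel.length));
      }
      return true; // keep the processor alive
    }
  }
  registerProcessor("level-meter", LevelMeterProcessor);
`;

async function attachLevelMeter(
  audioContext: AudioContext,
  source: MediaStreamAudioSourceNode,
  onLevel: (rms: number) => void
): Promise<AudioWorkletNode> {
  // load the inlined processor as a worklet module via a Blob URL
  const url = URL.createObjectURL(
    new Blob([levelMeterSource], { type: "application/javascript" })
  );
  await audioContext.audioWorklet.addModule(url);
  const node = new AudioWorkletNode(audioContext, "level-meter");
  node.port.onmessage = (e) => onLevel(e.data as number);
  source.connect(node);
  return node;
}

In Recorder.start, a helper like this could replace the createScriptProcessor block, with onSpeakChange passed in as onLevel.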
Usage inside a component looks roughly like this (FETCH_URL, setSpeaking, setRecording and the outer onEnd come from the surrounding component):

  // recorder
  const { start, stop, cancel } = useRecordAudioFunc({
    onEnd: async (file: File) => {
      try {
        // call the api to do speech-to-text
        const resp = await fetch(FETCH_URL, {
          method: "POST",
          headers: {
            "Content-Type": "application/octet-stream",
          },
          body: file,
        });
        const data = await resp.json();
        onEnd?.(data?.transcription?.trim() || "");
      } catch (err) {
        onEnd?.("failed");
      } finally {
        setSpeaking(0);
        setRecording(false);
      }
    },
    onSpeakChange: (rms: number) => {
      setSpeaking(rms);
    },
  });
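The call above does not pass a mimeType, so the hook falls back to webm, which Safari's MediaRecorder does not support. One way to handle that, sketched here as an assumption rather than part of the original code, is to ask MediaRecorder which container it supports:

// pick the first container the current browser's MediaRecorder supports
function pickMimeType(candidates: string[] = ["audio/webm", "audio/mp4"]): string | undefined {
  if (typeof MediaRecorder === "undefined") return undefined;
  return candidates.find((type) => MediaRecorder.isTypeSupported(type));
}

// e.g. useRecordAudioFunc({ onEnd, onSpeakChange, mimeType: pickMimeType() })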
  // player
  const player = new AudioPlayer({
    arrayBuffer, // the fetched audio data
    rate, // playback rate
    onEnd: () => {
      // called when playback finishes
    },
    onReady: () => {
      // called once decoding is done, e.g. start playback here via player.start()
    },
  });
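On the playback side, the ArrayBuffer typically comes straight from the TTS response. A rough sketch, assuming a hypothetical TTS_URL endpoint that accepts JSON and returns raw audio bytes:

const TTS_URL = "/api/tts"; // hypothetical endpoint, adjust to your backend

async function playTts(text: string, rate = 1): Promise<void> {
  const resp = await fetch(TTS_URL, {
    method: "POST",
    headers: { "Content-Type": "application/json" },
    body: JSON.stringify({ text }),
  });
  const arrayBuffer = await resp.arrayBuffer(); // the encoded audio returned by the TTS api
  const player = new AudioPlayer({
    arrayBuffer,
    rate,
    onReady: () => player.start(), // start as soon as decodeAudioData resolves
    onEnd: () => {
      // e.g. reset a "speaking" UI flag here
    },
  });
}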