Skip to content

Latest commit

 

History

History
117 lines (93 loc) · 2.68 KB

README.md

File metadata and controls

117 lines (93 loc) · 2.68 KB

openai-speech-stream-player

It's a player for play SSE streaming chunk from OpenAI audio speech API.

Usage

import { SpeechPlayer } from 'openai-speech-stream-player';

async function main() {
  const audioEl = document.querySelector('audio');
  const player = new SpeechPlayer({
    audio: audioEl,
    onPlaying: () => {},
    onPause: () => {},
    onChunkEnd: () => {},
    mimeType: 'audio/mpeg',
  });
  await player.init();

  var myHeaders = new Headers();
  myHeaders.append("Cache-Control", "no-store");
  myHeaders.append("Content-Type", "application/json");
  myHeaders.append("Authorization", "Bearer yourKeyHere");

  var raw = JSON.stringify({
    "model": "tts-1",
    "input": "Hi, What's your name?",
    "voice": "shimmer",
    "response_format": "mp3",
    "speed": 1
  });

  var requestOptions = {
    method: 'POST',
    headers: myHeaders,
    body: raw,
    redirect: 'follow'
  };

  const response = await fetch("https://api.openai.com/v1/audio/speech", requestOptions);
  player.feedWithResponse(response);
}

main();

Or you can DIY with response DIY

async function* streamAsyncIterable(stream) {
  const reader = stream.getReader();

  try {
    while (true) {
      const { done, value } = await reader.read();
      if (done) {
        return;
      }
      yield value;
    }
  } finally {
    reader.releaseLock();
  }
}

async function main() {
  // ...
  const response = await fetch("https://api.openai.com/v1/audio/speech", requestOptions);

  for await (const chunk of streamAsyncIterable(response.body)) {
    player.feed(chunk);
  }
}

Others

  1. how to deal stream chunk in NodeJs form OpenAI text-to-speech API?

here is my solution(code with nestJs):

import { Injectable, Logger } from '@nestjs/common';
import type { SpeechParams } from 'src/service/audio/Audio';
import type { Response } from 'express';
import { GPTAudio } from '../service/audio/Audio';

@Injectable()
export class AudioService {
  private readonly logger = new Logger(AudioService.name);
  private readonly audio = new GPTAudio();

  async speech(parmas: SpeechParams, res: Response): Promise<void> {
    this.logger.log(`[AudioService speech]\n${JSON.stringify(parmas)}`);
    res.setHeader('Content-Type', 'audio/mpeg');
    const response = await this.audio.speech(parmas);
    const body: NodeJS.ReadableStream = response.body as any;

    if (!body.on || !body.read) {
      throw new Error('unsupported "fetch" implementation');
    }

    body.on('readable', () => {
      let chunk: string | Buffer;
      while (null !== (chunk = body.read())) {
        res.write(chunk);
      }
    });
    body.on('close', () => {
      res.end();
    });
  }
}