import { useEffect, useState } from "react"
import { notification } from "antd"
import {
  getElevenLabsApiKey,
  getElevenLabsModel,
  getElevenLabsVoiceId,
  getRemoveReasoningTagTTS,
  getTTSProvider,
  getVoice,
  isSSMLEnabled
} from "@/services/tts"
import { markdownToSSML } from "@/utils/markdown-to-ssml"
import { generateSpeech } from "@/services/elevenlabs"
import { splitMessageContent } from "@/utils/tts"
import { removeReasoning } from "@/libs/reasoning"
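/** Options accepted by the `speak` function returned from `useTTS`. */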
export interface VoiceOptions {
  utterance: string
}
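/**
 * Hook that plays text through the configured TTS provider (browser
 * speech synthesis or ElevenLabs) and tracks playback state.
 */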
export const useTTS = () => {
  const [isSpeaking, setIsSpeaking] = useState(false)
  const [audioElement, setAudioElement] = useState<HTMLAudioElement | null>(
    null
  )
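  // Synthesize and play `utterance`, optionally stripping reasoning tags
  // and converting markdown to SSML before synthesis.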
  const speak = async ({ utterance }: VoiceOptions) => {
    try {
      const voice = await getVoice()
      const provider = await getTTSProvider()
      const isRemoveReasoning = await getRemoveReasoningTagTTS()

      if (isRemoveReasoning) {
        utterance = removeReasoning(utterance)
      }

      if (provider === "browser") {
        const isSSML = await isSSMLEnabled()
        if (isSSML) {
          utterance = markdownToSSML(utterance)
        }
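        // Chromium-based builds can use the richer chrome.tts API; other
        // browsers fall back to the Web Speech API.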
        if (
          import.meta.env.BROWSER === "chrome" ||
          import.meta.env.BROWSER === "edge"
        ) {
          chrome.tts.speak(utterance, {
            voiceName: voice,
            onEvent(event) {
              if (event.type === "start") {
                setIsSpeaking(true)
              } else if (event.type === "end") {
                setIsSpeaking(false)
              }
            }
          })
        } else {
          // Speak right away with the default voice; if the voice list is
          // still loading, re-speak with the configured voice once it loads.
          window.speechSynthesis.speak(new SpeechSynthesisUtterance(utterance))
          window.speechSynthesis.onvoiceschanged = () => {
            const voices = window.speechSynthesis.getVoices()
            // Renamed from `voice`: the original shadowed the outer variable
            // and compared it against itself, which throws at runtime.
            const selectedVoice = voices.find((v) => v.name === voice)
            const utter = new SpeechSynthesisUtterance(utterance)
            utter.voice = selectedVoice ?? null
            // Stop the default-voice playback before re-speaking
            window.speechSynthesis.cancel()
            window.speechSynthesis.speak(utter)
          }
        }
      } else if (provider === "elevenlabs") {
        const apiKey = await getElevenLabsApiKey()
        const modelId = await getElevenLabsModel()
        const voiceId = await getElevenLabsVoiceId()
        const sentences = splitMessageContent(utterance)
        // Holds prefetched audio for the upcoming sentence, if ready
        let nextAudioData: ArrayBuffer | null = null

        if (!apiKey || !modelId || !voiceId) {
          throw new Error("Missing ElevenLabs configuration")
        }
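        // Play sentences sequentially, prefetching the next sentence's
        // audio while the current one plays to hide synthesis latency.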
        for (let i = 0; i < sentences.length; i++) {
          setIsSpeaking(true)

          // Use the prefetched audio if it is ready; otherwise synthesize now
          const currentAudioData =
            nextAudioData ||
            (await generateSpeech(apiKey, sentences[i], voiceId, modelId))
          // Clear the consumed prefetch before scheduling the next one so a
          // late-arriving result is never replayed for the wrong sentence
          nextAudioData = null

          if (i < sentences.length - 1) {
            generateSpeech(apiKey, sentences[i + 1], voiceId, modelId)
              .then((data) => {
                // The callback parameter was originally also named
                // `nextAudioData`, so the assignment was a self-assignment
                // and the prefetched audio was silently discarded
                nextAudioData = data
              })
              .catch(console.error)
          }

          const blob = new Blob([currentAudioData], { type: "audio/mpeg" })
          const url = URL.createObjectURL(blob)
          const audio = new Audio(url)
          setAudioElement(audio)

          // Wait for playback to finish before moving to the next sentence
          await new Promise((resolve) => {
            audio.onended = resolve
            audio.play()
          })

          URL.revokeObjectURL(url)
        }

        setIsSpeaking(false)
        setAudioElement(null)
      }
    } catch (error) {
      setIsSpeaking(false)
      setAudioElement(null)
      notification.error({
        message: "Error",
        description: "Something went wrong while trying to play the audio"
      })
    }
  }
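  // Stop whichever provider is currently speaking and reset playback state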
  const cancel = () => {
    // ElevenLabs playback goes through an <audio> element
    if (audioElement) {
      audioElement.pause()
      audioElement.currentTime = 0
      setAudioElement(null)
      setIsSpeaking(false)
      return
    }

    if (
      import.meta.env.BROWSER === "chrome" ||
      import.meta.env.BROWSER === "edge"
    ) {
      chrome.tts.stop()
    } else {
      window.speechSynthesis.cancel()
    }
    setIsSpeaking(false)
  }

  // Cancel any ongoing speech when the component unmounts. Note that this
  // cleanup closes over the first render's `cancel`, where `audioElement`
  // is still null, so only the browser TTS providers are reliably stopped.
  useEffect(() => {
    return () => {
      cancel()
    }
  }, [])

  return {
    speak,
    cancel,
    isSpeaking
  }
}
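
// Usage sketch (hypothetical component, not part of the original module):
// toggles playback of a piece of text with the hook's returned helpers.
//
//   const SpeakButton = ({ text }: { text: string }) => {
//     const { speak, cancel, isSpeaking } = useTTS()
//     return (
//       <button
//         onClick={() => (isSpeaking ? cancel() : speak({ utterance: text }))}>
//         {isSpeaking ? "Stop" : "Speak"}
//       </button>
//     )
//   }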