feat: refactor speech settings and introduce voice selector component

Shishir435 · Shishir435 · commit e75544828f79 · 2025-11-04T00:40:28.000+05:30
- Replace the inline Select-based voice picker in SpeechSettings with a new VoiceSelector component (a searchable combobox that groups voices by language) for improved usability.
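- Enhance voice loading logic to handle asynchronous updates and loading states: useVoices is now consumed as `{ voices, isLoading }`, and useSpeechSynthesis relies on that flag instead of tracking its own loading state.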
- Memoize the selected-voice lookup with useMemo so it is recomputed only when the voice list or the selected voiceURI changes.
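- Update the speech settings test button to work with the new voice selection approach: cancel any ongoing speech before speaking, and set the utterance voice only when a matching voice is found via speechSynthesis.getVoices().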
diff --git a/src/features/chat/components/speech-settings.tsx b/src/features/chat/components/speech-settings.tsx
@@ -1,4 +1,4 @@
-import { useEffect, useState } from "react"
+import { useEffect, useMemo, useState } from "react"
 
 import { Badge } from "@/components/ui/badge"
 import {
@@ -9,15 +9,9 @@ import {
   CardTitle
 } from "@/components/ui/card"
 import { Label } from "@/components/ui/label"
-import {
-  Select,
-  SelectContent,
-  SelectItem,
-  SelectTrigger,
-  SelectValue
-} from "@/components/ui/select"
 import { Slider } from "@/components/ui/slider"
 import { Textarea } from "@/components/ui/textarea"
+import { VoiceSelector } from "@/features/chat/components/voice-selector"
 import { useSpeechSettings } from "@/features/chat/hooks/use-speech-settings"
 import { useVoices } from "@/features/chat/hooks/use-voice"
 import { Mic, Settings, Volume2 } from "@/lib/lucide-icon"
@@ -39,30 +33,34 @@ const getPitchDescription = (pitch: number) => {
 }
 
 export const SpeechSettings = () => {
-  const voices = useVoices()
+  const { voices, isLoading: isLoadingVoices } = useVoices()
   const { rate, setRate, pitch, setPitch, voiceURI, setVoiceURI } =
     useSpeechSettings()
   const [testText, setTestText] = useState("")
 
+  const selectedVoice = useMemo(
+    () => voices.find((v) => v.voiceURI === voiceURI),
+    [voices, voiceURI]
+  )
+
   useEffect(() => {
-    if (!voiceURI && voices.length > 0) {
-      const defaultVoice = voices.find((v) => v.default) ?? voices[0]
-      if (defaultVoice) {
-        setVoiceURI(defaultVoice.voiceURI)
-      }
-    } else if (
-      voiceURI &&
-      voices.length > 0 &&
-      !voices.find((v) => v.voiceURI === voiceURI)
-    ) {
-      const defaultVoice = voices.find((v) => v.default) ?? voices[0]
-      if (defaultVoice) {
-        setVoiceURI(defaultVoice.voiceURI)
+    if (!isLoadingVoices && voices.length > 0) {
+      if (!voiceURI) {
+        const defaultVoice = voices.find((v) => v.default) ?? voices[0]
+        if (defaultVoice) {
+          setVoiceURI(defaultVoice.voiceURI)
+        }
+      } else {
+        const voiceExists = voices.some((v) => v.voiceURI === voiceURI)
+        if (!voiceExists) {
+          const defaultVoice = voices.find((v) => v.default) ?? voices[0]
+          if (defaultVoice) {
+            setVoiceURI(defaultVoice.voiceURI)
+          }
+        }
       }
     }
-  }, [voices, voiceURI, setVoiceURI])
-
-  const selectedVoice = voices.find((v) => v.voiceURI === voiceURI)
+  }, [voices, voiceURI, setVoiceURI, isLoadingVoices])
 
   return (
     <div className="mx-auto space-y-4">
@@ -93,33 +91,12 @@ export const SpeechSettings = () => {
                 </Badge>
               )}
             </div>
-            <Select
-              value={voiceURI}
-              onValueChange={setVoiceURI}
-              aria-label="Select speech synthesis voice">
-              <SelectTrigger className="h-9">
-                <SelectValue placeholder="Select a voice" />
-              </SelectTrigger>
-              <SelectContent>
-                {voices.map((voice) => (
-                  <SelectItem key={voice.voiceURI} value={voice.voiceURI}>
-                    <div className="flex w-full items-center justify-between">
-                      <span>{voice.name}</span>
-                      <div className="ml-3 flex items-center gap-2">
-                        <Badge variant="secondary" className="text-xs">
-                          {voice.lang}
-                        </Badge>
-                        {voice.default && (
-                          <Badge variant="outline" className="text-xs">
-                            default
-                          </Badge>
-                        )}
-                      </div>
-                    </div>
-                  </SelectItem>
-                ))}
-              </SelectContent>
-            </Select>
+            <VoiceSelector
+              voices={voices}
+              selectedVoiceURI={voiceURI || null}
+              onVoiceChange={setVoiceURI}
+              isLoading={isLoadingVoices}
+            />
           </div>
 
           {/* Rate Control */}
@@ -218,6 +195,9 @@ export const SpeechSettings = () => {
                   className="rounded-md bg-secondary px-3 py-1 text-xs transition-colors hover:bg-secondary/80"
                   onClick={() => {
                     if ("speechSynthesis" in window) {
+                      // Cancel any ongoing speech
+                      window.speechSynthesis.cancel()
+
                       const textToSpeak =
                         testText.trim() ||
                         "Hello, this is a test of your speech settings."
@@ -226,12 +206,19 @@ export const SpeechSettings = () => {
                       )
                       utterance.rate = rate
                       utterance.pitch = pitch
+
+                      // Use the selected voice if available
                       if (selectedVoice) {
-                        utterance.voice =
-                          window.speechSynthesis
-                            .getVoices()
-                            .find((v) => v.voiceURI === voiceURI) || null
+                        // Get fresh voice reference from speechSynthesis API
+                        // This ensures compatibility across browsers
+                        const freshVoice = window.speechSynthesis
+                          .getVoices()
+                          .find((v) => v.voiceURI === selectedVoice.voiceURI)
+                        if (freshVoice) {
+                          utterance.voice = freshVoice
+                        }
                       }
+
                       window.speechSynthesis.speak(utterance)
                     }
                   }}>
diff --git a/src/features/chat/components/voice-selector.tsx b/src/features/chat/components/voice-selector.tsx
@@ -0,0 +1,231 @@
+import { useMemo, useState } from "react"
+import { Badge } from "@/components/ui/badge"
+import { Button } from "@/components/ui/button"
+import {
+  Command,
+  CommandEmpty,
+  CommandGroup,
+  CommandInput,
+  CommandItem,
+  CommandList
+} from "@/components/ui/command"
+import {
+  Popover,
+  PopoverContent,
+  PopoverTrigger
+} from "@/components/ui/popover"
+import { Check, ChevronsUpDown, Loader2, Mic } from "@/lib/lucide-icon"
+import { cn } from "@/lib/utils"
+
+interface VoiceSelectorProps {
+  voices: SpeechSynthesisVoice[]
+  selectedVoiceURI: string | null
+  onVoiceChange: (voiceURI: string) => void
+  isLoading?: boolean
+}
+
+export const VoiceSelector = ({
+  voices,
+  selectedVoiceURI,
+  onVoiceChange,
+  isLoading = false
+}: VoiceSelectorProps) => {
+  const [open, setOpen] = useState(false)
+  const [searchQuery, setSearchQuery] = useState("")
+
+  const selectedVoice = useMemo(
+    () => voices.find((v) => v.voiceURI === selectedVoiceURI),
+    [voices, selectedVoiceURI]
+  )
+
+  // Group voices by language tag; voices with an empty lang are grouped under "Unknown"
+  const groupedVoices = useMemo(() => {
+    const grouped = voices.reduce(
+      (acc, voice) => {
+        const lang = voice.lang || "Unknown"
+        if (!acc[lang]) {
+          acc[lang] = []
+        }
+        acc[lang].push(voice)
+        return acc
+      },
+      {} as Record<string, SpeechSynthesisVoice[]>
+    )
+
+    // Sort languages alphabetically, and the voices within each language by name
+    return Object.keys(grouped)
+      .sort()
+      .map((lang) => ({
+        lang,
+        voices: grouped[lang].sort((a, b) => a.name.localeCompare(b.name))
+      }))
+  }, [voices])
+
+  // Filter voices by a case-insensitive match on name, lang, or voiceURI; drop groups left empty
+  const filteredGroups = useMemo(() => {
+    if (!searchQuery.trim()) {
+      return groupedVoices
+    }
+
+    const query = searchQuery.toLowerCase()
+    return groupedVoices
+      .map((group) => ({
+        ...group,
+        voices: group.voices.filter(
+          (voice) =>
+            voice.name.toLowerCase().includes(query) ||
+            voice.lang.toLowerCase().includes(query) ||
+            voice.voiceURI.toLowerCase().includes(query)
+        )
+      }))
+      .filter((group) => group.voices.length > 0)
+  }, [groupedVoices, searchQuery])
+
+  return (
+    <Popover open={open} onOpenChange={setOpen}>
+      <PopoverTrigger asChild>
+        <Button
+          variant="outline"
+          role="combobox"
+          aria-expanded={open}
+          aria-label="Select voice"
+          className={cn(
+            "h-10 w-full justify-between gap-2 border-input bg-background px-3 text-sm font-normal shadow-sm transition-colors",
+            "hover:bg-accent hover:text-accent-foreground",
+            "focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-ring",
+            "disabled:cursor-not-allowed disabled:opacity-50",
+            open && "ring-1 ring-ring"
+          )}
+          disabled={isLoading || voices.length === 0}>
+          <div className="flex items-center gap-2 min-w-0 flex-1">
+            {isLoading ? (
+              <>
+                <Loader2 className="h-4 w-4 animate-spin text-muted-foreground shrink-0" />
+                <span className="text-muted-foreground text-sm truncate">
+                  Loading voices...
+                </span>
+              </>
+            ) : selectedVoice ? (
+              <>
+                <span className="text-sm font-medium truncate">
+                  {selectedVoice.name}
+                </span>
+                <Badge
+                  variant="secondary"
+                  className="text-[10px] h-5 px-1.5 font-normal shrink-0">
+                  {selectedVoice.lang}
+                </Badge>
+              </>
+            ) : (
+              <span className="text-muted-foreground text-sm truncate">
+                Select a voice...
+              </span>
+            )}
+          </div>
+          <ChevronsUpDown className="h-4 w-4 shrink-0 opacity-50" />
+        </Button>
+      </PopoverTrigger>
+      <PopoverContent
+        className="w-[440px] p-0 shadow-lg"
+        align="center"
+        sideOffset={6}>
+        <Command className="rounded-lg border-0" shouldFilter={false}>
+          <div className="flex items-center border-b px-3">
+            <CommandInput
+              placeholder="Search by name, language, or URI..."
+              value={searchQuery}
+              onValueChange={setSearchQuery}
+              className="h-11 border-0 focus:outline-none focus:ring-0"
+            />
+          </div>
+          <CommandList className="max-h-[320px] overflow-y-auto">
+            <CommandEmpty className="py-8">
+              <div className="flex flex-col items-center gap-2 text-center">
+                <div className="rounded-full bg-muted p-3">
+                  <Mic className="h-5 w-5 text-muted-foreground" />
+                </div>
+                <div className="space-y-1">
+                  <p className="text-sm font-medium">No voices found</p>
+                  <p className="text-xs text-muted-foreground">
+                    {searchQuery
+                      ? "Try a different search term"
+                      : "No voices available on this device"}
+                  </p>
+                </div>
+              </div>
+            </CommandEmpty>
+            <div className="p-1">
+              {filteredGroups.map((group, groupIndex) => (
+                <CommandGroup
+                  key={group.lang}
+                  className={cn("px-0 py-0", groupIndex > 0 && "mt-2")}>
+                  <div className="flex items-center justify-between px-3 py-2 mb-1">
+                    <span className="text-xs font-semibold uppercase tracking-wider text-muted-foreground">
+                      {group.lang}
+                    </span>
+                    <Badge
+                      variant="secondary"
+                      className="text-[10px] h-4 px-1.5 font-normal">
+                      {group.voices.length}
+                    </Badge>
+                  </div>
+                  {group.voices.map((voice) => {
+                    const isSelected = selectedVoiceURI === voice.voiceURI
+                    return (
+                      <CommandItem
+                        key={voice.voiceURI}
+                        value={voice.voiceURI}
+                        onSelect={() => {
+                          onVoiceChange(voice.voiceURI)
+                          setOpen(false)
+                          setSearchQuery("")
+                        }}
+                        className={cn(
+                          "group mx-1 flex items-center gap-3 rounded-md px-3 py-2.5 cursor-pointer transition-all",
+                          "aria-selected:bg-accent/50",
+                          isSelected
+                            ? "bg-accent text-accent-foreground shadow-sm"
+                            : "hover:bg-accent/50"
+                        )}>
+                        <div className="flex flex-1 items-center justify-between gap-3 min-w-0">
+                          <div className="flex flex-col min-w-0">
+                            <span
+                              className={cn(
+                                "text-sm truncate leading-tight transition-colors",
+                                isSelected ? "font-semibold" : "font-medium"
+                              )}>
+                              {voice.name}
+                            </span>
+                            {voice.localService === false && (
+                              <span className="text-[10px] text-muted-foreground mt-0.5">
+                                Network voice
+                              </span>
+                            )}
+                          </div>
+                          <div className="flex items-center gap-2 shrink-0">
+                            {voice.default && (
+                              <Badge
+                                variant="outline"
+                                className="text-[10px] h-4 px-1.5 font-normal border-muted-foreground/30">
+                                default
+                              </Badge>
+                            )}
+                            {isSelected && (
+                              <div className="flex items-center justify-center">
+                                <Check className="h-4 w-4 text-primary" />
+                              </div>
+                            )}
+                          </div>
+                        </div>
+                      </CommandItem>
+                    )
+                  })}
+                </CommandGroup>
+              ))}
+            </div>
+          </CommandList>
+        </Command>
+      </PopoverContent>
+    </Popover>
+  )
+}
diff --git a/src/features/chat/hooks/use-speech-synthesis.ts b/src/features/chat/hooks/use-speech-synthesis.ts
@@ -5,14 +5,8 @@ import { markdownToSpeechText } from "@/lib/utils"
 
 export const useSpeechSynthesis = () => {
   const [speaking, setSpeaking] = useState(false)
-  const [isLoadingVoices, setIsLoadingVoices] = useState(true)
-  const voices = useVoices()
+  const { voices, isLoading: isLoadingVoices } = useVoices()
   const { rate, pitch, voiceURI } = useSpeechSettings()
-  useEffect(() => {
-    if (voices.length > 0 && isLoadingVoices) {
-      setIsLoadingVoices(false)
-    }
-  }, [voices, isLoadingVoices])
 
   useEffect(() => {
     const handleEnd = () => setSpeaking(false)
diff --git a/src/features/chat/hooks/use-voice.ts b/src/features/chat/hooks/use-voice.ts