Add wake word integration (#96380)

* Add wake component * Add wake support to Wyoming * Add helper function to assist_pipeline (not complete) * Rename wake to wake_word * Fix platform * Use send_event and clean up * Merge wake word into pipeline * Add wake option to async_pipeline_from_audio_stream * Add start/end stages to async_pipeline_from_audio_stream * Add wake timeout * Remove layer in wake_output * Use VAD for wake word timeout * Include audio metadata in wake-start * Remove unnecessary websocket command * wake -> wake_word * Incorporate feedback * Clean up wake_word tests * Add wyoming wake word tests * Add pipeline wake word test * Add last processed state * Fix tests * Add tests for wake word * More tests for the codebot
2025-07-26 14:47:38 +00:00 · 2023-08-07 21:22:16 -05:00 · 2023-08-07 21:22:16 -05:00 · 7ea2998b55
commit 7ea2998b55
parent 798fb3e31a
28 changed files with 1802 additions and 27 deletions
--- a/2
+++ b/2
@ -1373,6 +1373,8 @@ build.json @home-assistant/supervisor
 /tests/components/vulcan/ @Antoni-Czaplicki
 /homeassistant/components/wake_on_lan/ @ntilley905
 /tests/components/wake_on_lan/ @ntilley905
 /homeassistant/components/wake_word/ @home-assistant/core @synesthesiam
 /tests/components/wake_word/ @home-assistant/core @synesthesiam
 /homeassistant/components/wallbox/ @hesselonline
 /tests/components/wallbox/ @hesselonline
 /homeassistant/components/waqi/ @andrey-git
--- a/homeassistant/components/assist_pipeline/init.py
+++ b/homeassistant/components/assist_pipeline/init.py
@ -18,6 +18,7 @@ from .pipeline import (
    PipelineInput,
    PipelineRun,
    PipelineStage,
    WakeWordSettings,
    async_create_default_pipeline,
    async_get_pipeline,
    async_get_pipelines,
@ -35,6 +36,7 @@ __all__ = (
    "PipelineEvent",
    "PipelineEventType",
    "PipelineNotFound",
    "WakeWordSettings",
 )
 CONFIG_SCHEMA = cv.empty_config_schema(DOMAIN)
@ -57,7 +59,10 @@ async def async_pipeline_from_audio_stream(
    pipeline_id: str | None = None,
    conversation_id: str | None = None,
    tts_audio_output: str | None = None,
    wake_word_settings: WakeWordSettings | None = None,
    device_id: str | None = None,
    start_stage: PipelineStage = PipelineStage.STT,
    end_stage: PipelineStage = PipelineStage.TTS,
 ) -> None:
    """Create an audio pipeline from an audio stream.
@ -72,10 +77,11 @@ async def async_pipeline_from_audio_stream(
            hass,
            context=context,
            pipeline=async_get_pipeline(hass, pipeline_id=pipeline_id),
-            start_stage=PipelineStage.STT,
+            start_stage=start_stage,
-            end_stage=PipelineStage.TTS,
+            end_stage=end_stage,
            event_callback=event_callback,
            tts_audio_output=tts_audio_output,
            wake_word_settings=wake_word_settings,
        ),
    )
    await pipeline_input.validate()
--- a/homeassistant/components/assist_pipeline/error.py
+++ b/homeassistant/components/assist_pipeline/error.py
@ -18,6 +18,14 @@ class PipelineNotFound(PipelineError):
    """Unspecified pipeline picked."""
 class WakeWordDetectionError(PipelineError):
    """Error in wake-word-detection portion of pipeline."""
 class WakeWordTimeoutError(WakeWordDetectionError):
    """Timeout when wake word was not detected."""
 class SpeechToTextError(PipelineError):
    """Error in speech-to-text portion of pipeline."""
--- a/homeassistant/components/assist_pipeline/manifest.json
+++ b/homeassistant/components/assist_pipeline/manifest.json
@ -2,7 +2,7 @@
  "domain": "assist_pipeline",
  "name": "Assist pipeline",
  "codeowners": ["@balloob", "@synesthesiam"],
-  "dependencies": ["conversation", "stt", "tts"],
+  "dependencies": ["conversation", "stt", "tts", "wake_word"],
  "documentation": "https://www.home-assistant.io/integrations/assist_pipeline",
  "iot_class": "local_push",
  "quality_scale": "internal",
--- a/homeassistant/components/assist_pipeline/pipeline.py
+++ b/homeassistant/components/assist_pipeline/pipeline.py
@ -2,7 +2,7 @@
 from __future__ import annotations
 import asyncio
-from collections.abc import AsyncIterable, Callable, Iterable
+from collections.abc import AsyncGenerator, AsyncIterable, Callable, Iterable
 from dataclasses import asdict, dataclass, field
 from enum import StrEnum
 import logging
@ -10,7 +10,14 @@ from typing import Any, cast
 import voluptuous as vol
-from homeassistant.components import conversation, media_source, stt, tts, websocket_api
+from homeassistant.components import (
    conversation,
    media_source,
    stt,
    tts,
    wake_word,
    websocket_api,
 )
 from homeassistant.components.tts.media_source import (
    generate_media_source_id as tts_generate_media_source_id,
 )
@ -39,7 +46,10 @@ from .error import (
    PipelineNotFound,
    SpeechToTextError,
    TextToSpeechError,
    WakeWordDetectionError,
    WakeWordTimeoutError,
 )
 from .vad import VoiceActivityTimeout, VoiceCommandSegmenter
 _LOGGER = logging.getLogger(__name__)
@ -241,6 +251,8 @@ class PipelineEventType(StrEnum):
    RUN_START = "run-start"
    RUN_END = "run-end"
    WAKE_WORD_START = "wake_word-start"
    WAKE_WORD_END = "wake_word-end"
    STT_START = "stt-start"
    STT_END = "stt-end"
    INTENT_START = "intent-start"
@ -297,12 +309,14 @@ class Pipeline:
 class PipelineStage(StrEnum):
    """Stages of a pipeline."""
    WAKE_WORD = "wake_word"
    STT = "stt"
    INTENT = "intent"
    TTS = "tts"
 PIPELINE_STAGE_ORDER = [
    PipelineStage.WAKE_WORD,
    PipelineStage.STT,
    PipelineStage.INTENT,
    PipelineStage.TTS,
@ -327,6 +341,17 @@ class InvalidPipelineStagesError(PipelineRunValidationError):
        )
@dataclass(frozen=True)
 class WakeWordSettings:
    """Settings for wake word detection."""
    timeout: float | None = None
    """Seconds of silence before detection times out."""
    audio_seconds_to_buffer: float = 0
    """Seconds of audio to buffer before detection and forward to STT."""
@dataclass
 class PipelineRun:
    """Running context for a pipeline."""
@ -341,17 +366,20 @@ class PipelineRun:
    runner_data: Any | None = None
    intent_agent: str | None = None
    tts_audio_output: str | None = None
    wake_word_settings: WakeWordSettings | None = None
    id: str = field(default_factory=ulid_util.ulid)
    stt_provider: stt.SpeechToTextEntity | stt.Provider = field(init=False)
    tts_engine: str = field(init=False)
    tts_options: dict | None = field(init=False, default=None)
    wake_word_engine: str = field(init=False)
    wake_word_provider: wake_word.WakeWordDetectionEntity = field(init=False)
    def __post_init__(self) -> None:
        """Set language for pipeline."""
        self.language = self.pipeline.language or self.hass.config.language
-        # stt -> intent -> tts
+        # wake -> stt -> intent -> tts
        if PIPELINE_STAGE_ORDER.index(self.end_stage) < PIPELINE_STAGE_ORDER.index(
            self.start_stage
        ):
@ -393,6 +421,141 @@ class PipelineRun:
            )
        )
    async def prepare_wake_word_detection(self) -> None:
        """Prepare wake-word-detection."""
        # Need to add to pipeline store
        engine = wake_word.async_default_engine(self.hass)
        if engine is None:
            raise WakeWordDetectionError(
                code="wake-engine-missing",
                message="No wake word engine",
            )
        wake_word_provider = wake_word.async_get_wake_word_detection_entity(
            self.hass, engine
        )
        if wake_word_provider is None:
            raise WakeWordDetectionError(
                code="wake-provider-missing",
                message=f"No wake-word-detection provider for: {engine}",
            )
        self.wake_word_engine = engine
        self.wake_word_provider = wake_word_provider
    async def wake_word_detection(
        self,
        stream: AsyncIterable[bytes],
        audio_buffer: list[bytes],
    ) -> wake_word.DetectionResult | None:
        """Run wake-word-detection portion of pipeline. Returns detection result."""
        metadata_dict = asdict(
            stt.SpeechMetadata(
                language="",
                format=stt.AudioFormats.WAV,
                codec=stt.AudioCodecs.PCM,
                bit_rate=stt.AudioBitRates.BITRATE_16,
                sample_rate=stt.AudioSampleRates.SAMPLERATE_16000,
                channel=stt.AudioChannels.CHANNEL_MONO,
            )
        )
        # Remove language since it doesn't apply to wake words yet
        metadata_dict.pop("language", None)
        self.process_event(
            PipelineEvent(
                PipelineEventType.WAKE_WORD_START,
                {
                    "engine": self.wake_word_engine,
                    "metadata": metadata_dict,
                },
            )
        )
        wake_word_settings = self.wake_word_settings or WakeWordSettings()
        wake_word_vad: VoiceActivityTimeout | None = None
        if (wake_word_settings.timeout is not None) and (
            wake_word_settings.timeout > 0
        ):
            # Use VAD to determine timeout
            wake_word_vad = VoiceActivityTimeout(wake_word_settings.timeout)
        # Audio chunk buffer.
        audio_bytes_to_buffer = int(
            wake_word_settings.audio_seconds_to_buffer * 16000 * 2
        )
        audio_ring_buffer = b""
        async def timestamped_stream() -> AsyncIterable[tuple[bytes, int]]:
            """Yield audio with timestamps (milliseconds since start of stream)."""
            nonlocal audio_ring_buffer
            timestamp_ms = 0
            async for chunk in stream:
                yield chunk, timestamp_ms
                timestamp_ms += (len(chunk) // 2) // 16  # milliseconds @ 16Khz
                # Keeping audio right before wake word detection allows the
                # voice command to be spoken immediately after the wake word.
                if audio_bytes_to_buffer > 0:
                    audio_ring_buffer += chunk
                    if len(audio_ring_buffer) > audio_bytes_to_buffer:
                        # A proper ring buffer would be far more efficient
                        audio_ring_buffer = audio_ring_buffer[
                            len(audio_ring_buffer) - audio_bytes_to_buffer :
                        ]
                if (wake_word_vad is not None) and (not wake_word_vad.process(chunk)):
                    raise WakeWordTimeoutError(
                        code="wake-word-timeout", message="Wake word was not detected"
                    )
        try:
            # Detect wake word(s)
            result = await self.wake_word_provider.async_process_audio_stream(
                timestamped_stream()
            )
            if audio_ring_buffer:
                # All audio kept from right before the wake word was detected as
                # a single chunk.
                audio_buffer.append(audio_ring_buffer)
        except WakeWordTimeoutError:
            _LOGGER.debug("Timeout during wake word detection")
            raise
        except Exception as src_error:
            _LOGGER.exception("Unexpected error during wake-word-detection")
            raise WakeWordDetectionError(
                code="wake-stream-failed",
                message="Unexpected error during wake-word-detection",
            ) from src_error
        _LOGGER.debug("wake-word-detection result %s", result)
        if result is None:
            wake_word_output: dict[str, Any] = {}
        else:
            if result.queued_audio:
                # Add audio that was pending at detection
                for chunk_ts in result.queued_audio:
                    audio_buffer.append(chunk_ts[0])
            wake_word_output = asdict(result)
            # Remove non-JSON fields
            wake_word_output.pop("queued_audio", None)
        self.process_event(
            PipelineEvent(
                PipelineEventType.WAKE_WORD_END,
                {"wake_word_output": wake_word_output},
            )
        )
        return result
    async def prepare_speech_to_text(self, metadata: stt.SpeechMetadata) -> None:
        """Prepare speech-to-text."""
        # pipeline.stt_engine can't be None or this function is not called
@ -443,9 +606,21 @@ class PipelineRun:
        )
        try:
            segmenter = VoiceCommandSegmenter()
            async def segment_stream(
                stream: AsyncIterable[bytes],
            ) -> AsyncGenerator[bytes, None]:
                """Stop stream when voice command is finished."""
                async for chunk in stream:
                    if not segmenter.process(chunk):
                        break
                    yield chunk
            # Transcribe audio stream
            result = await self.stt_provider.async_process_audio_stream(
-                metadata, stream
+                metadata, segment_stream(stream)
            )
        except Exception as src_error:
            _LOGGER.exception("Unexpected error during speech-to-text")
@ -663,17 +838,45 @@ class PipelineInput:
    async def execute(self) -> None:
        """Run pipeline."""
        self.run.start()
-        current_stage = self.run.start_stage
+        current_stage: PipelineStage | None = self.run.start_stage
        audio_buffer: list[bytes] = []
        try:
            if current_stage == PipelineStage.WAKE_WORD:
                assert self.stt_stream is not None
                detect_result = await self.run.wake_word_detection(
                    self.stt_stream, audio_buffer
                )
                if detect_result is None:
                    # No wake word. Abort the rest of the pipeline.
                    self.run.end()
                    return
                current_stage = PipelineStage.STT
            # speech-to-text
            intent_input = self.intent_input
            if current_stage == PipelineStage.STT:
                assert self.stt_metadata is not None
                assert self.stt_stream is not None
                if audio_buffer:
                    async def buffered_stream() -> AsyncGenerator[bytes, None]:
                        for chunk in audio_buffer:
                            yield chunk
                        assert self.stt_stream is not None
                        async for chunk in self.stt_stream:
                            yield chunk
                    stt_stream = cast(AsyncIterable[bytes], buffered_stream())
                else:
                    stt_stream = self.stt_stream
                intent_input = await self.run.speech_to_text(
                    self.stt_metadata,
-                    self.stt_stream,
+                    stt_stream,
                )
                current_stage = PipelineStage.INTENT
@ -707,7 +910,7 @@ class PipelineInput:
    async def validate(self) -> None:
        """Validate pipeline input against start stage."""
-        if self.run.start_stage == PipelineStage.STT:
+        if self.run.start_stage in (PipelineStage.WAKE_WORD, PipelineStage.STT):
            if self.run.pipeline.stt_engine is None:
                raise PipelineRunValidationError(
                    "the pipeline does not support speech-to-text"
@ -741,6 +944,13 @@ class PipelineInput:
        prepare_tasks = []
        if (
            start_stage_index
            <= PIPELINE_STAGE_ORDER.index(PipelineStage.WAKE_WORD)
            <= end_stage_index
        ):
            prepare_tasks.append(self.run.prepare_wake_word_detection())
        if (
            start_stage_index
            <= PIPELINE_STAGE_ORDER.index(PipelineStage.STT)
--- a/homeassistant/components/assist_pipeline/vad.py
+++ b/homeassistant/components/assist_pipeline/vad.py
@ -88,7 +88,7 @@ class VoiceCommandSegmenter:
        self.in_command = False
    def process(self, samples: bytes) -> bool:
-        """Process a 16-bit 16Khz mono audio samples.
+        """Process 16-bit 16Khz mono audio samples.
        Returns False when command is done.
        """
@ -148,3 +148,94 @@ class VoiceCommandSegmenter:
                self._silence_seconds_left = self.silence_seconds
        return True
@dataclass
 class VoiceActivityTimeout:
    """Detects silence in audio until a timeout is reached."""
    silence_seconds: float
    """Seconds of silence before timeout."""
    reset_seconds: float = 0.5
    """Seconds of speech before resetting timeout."""
    vad_mode: int = 3
    """Aggressiveness in filtering out non-speech. 3 is the most aggressive."""
    vad_frames: int = 480  # 30 ms
    """Must be 10, 20, or 30 ms at 16Khz."""
    _silence_seconds_left: float = 0.0
    """Seconds left before considering voice command as stopped."""
    _reset_seconds_left: float = 0.0
    """Seconds left before resetting start/stop time counters."""
    _vad: webrtcvad.Vad = None
    _audio_buffer: bytes = field(default_factory=bytes)
    _bytes_per_chunk: int = 480 * 2  # 16-bit samples
    _seconds_per_chunk: float = 0.03  # 30 ms
    def __post_init__(self) -> None:
        """Initialize VAD."""
        self._vad = webrtcvad.Vad(self.vad_mode)
        self._bytes_per_chunk = self.vad_frames * 2
        self._seconds_per_chunk = self.vad_frames / _SAMPLE_RATE
        self.reset()
    def reset(self) -> None:
        """Reset all counters and state."""
        self._audio_buffer = b""
        self._silence_seconds_left = self.silence_seconds
        self._reset_seconds_left = self.reset_seconds
    def process(self, samples: bytes) -> bool:
        """Process 16-bit 16Khz mono audio samples.
        Returns False when timeout is reached.
        """
        self._audio_buffer += samples
        # Process in 10, 20, or 30 ms chunks.
        num_chunks = len(self._audio_buffer) // self._bytes_per_chunk
        for chunk_idx in range(num_chunks):
            chunk_offset = chunk_idx * self._bytes_per_chunk
            chunk = self._audio_buffer[
                chunk_offset : chunk_offset + self._bytes_per_chunk
            ]
            if not self._process_chunk(chunk):
                return False
        if num_chunks > 0:
            # Remove from buffer
            self._audio_buffer = self._audio_buffer[
                num_chunks * self._bytes_per_chunk :
            ]
        return True
    def _process_chunk(self, chunk: bytes) -> bool:
        """Process a single chunk of 16-bit 16Khz mono audio.
        Returns False when timeout is reached.
        """
        if self._vad.is_speech(chunk, _SAMPLE_RATE):
            # Speech
            self._reset_seconds_left -= self._seconds_per_chunk
            if self._reset_seconds_left <= 0:
                # Reset timeout
                self._silence_seconds_left = self.silence_seconds
        else:
            # Silence
            self._silence_seconds_left -= self._seconds_per_chunk
            if self._silence_seconds_left <= 0:
                # Timeout reached
                return False
            # Slowly build reset counter back up
            self._reset_seconds_left = min(
                self.reset_seconds, self._reset_seconds_left + self._seconds_per_chunk
            )
        return True
--- a/homeassistant/components/assist_pipeline/websocket_api.py
+++ b/homeassistant/components/assist_pipeline/websocket_api.py
@ -26,11 +26,12 @@ from .pipeline import (
    PipelineInput,
    PipelineRun,
    PipelineStage,
    WakeWordSettings,
    async_get_pipeline,
 )
 from .vad import VoiceCommandSegmenter
 DEFAULT_TIMEOUT = 30
 DEFAULT_WAKE_WORD_TIMEOUT = 3
 _LOGGER = logging.getLogger(__name__)
@ -63,6 +64,18 @@ def async_register_websocket_api(hass: HomeAssistant) -> None:
        cv.key_value_schemas(
            "start_stage",
            {
                PipelineStage.WAKE_WORD: vol.Schema(
                    {
                        vol.Required("input"): {
                            vol.Required("sample_rate"): int,
                            vol.Optional("timeout"): vol.Any(float, int),
                            vol.Optional("audio_seconds_to_buffer"): vol.Any(
                                float, int
                            ),
                        }
                    },
                    extra=vol.ALLOW_EXTRA,
                ),
                PipelineStage.STT: vol.Schema(
                    {vol.Required("input"): {vol.Required("sample_rate"): int}},
                    extra=vol.ALLOW_EXTRA,
@ -102,6 +115,7 @@ async def websocket_run(
    end_stage = PipelineStage(msg["end_stage"])
    handler_id: int | None = None
    unregister_handler: Callable[[], None] | None = None
    wake_word_settings: WakeWordSettings | None = None
    # Arguments to PipelineInput
    input_args: dict[str, Any] = {
@ -109,24 +123,26 @@ async def websocket_run(
        "device_id": msg.get("device_id"),
    }
-    if start_stage == PipelineStage.STT:
+    if start_stage in (PipelineStage.WAKE_WORD, PipelineStage.STT):
        # Audio pipeline that will receive audio as binary websocket messages
        audio_queue: asyncio.Queue[bytes] = asyncio.Queue()
        incoming_sample_rate = msg["input"]["sample_rate"]
        if start_stage == PipelineStage.WAKE_WORD:
            wake_word_settings = WakeWordSettings(
                timeout=msg["input"].get("timeout", DEFAULT_WAKE_WORD_TIMEOUT),
                audio_seconds_to_buffer=msg["input"].get("audio_seconds_to_buffer", 0),
            )
        async def stt_stream() -> AsyncGenerator[bytes, None]:
            state = None
            segmenter = VoiceCommandSegmenter()
            # Yield until we receive an empty chunk
            while chunk := await audio_queue.get():
-                chunk, state = audioop.ratecv(
+                if incoming_sample_rate != 16000:
-                    chunk, 2, 1, incoming_sample_rate, 16000, state
+                    chunk, state = audioop.ratecv(
-                )
+                        chunk, 2, 1, incoming_sample_rate, 16000, state
-                if not segmenter.process(chunk):
+                    )
                    # Voice command is finished
                    break
                yield chunk
        def handle_binary(
@ -169,6 +185,7 @@ async def websocket_run(
            "stt_binary_handler_id": handler_id,
            "timeout": timeout,
        },
        wake_word_settings=wake_word_settings,
    )
    pipeline_input = PipelineInput(**input_args)
--- a/homeassistant/components/wake_word/init.py
+++ b/homeassistant/components/wake_word/init.py
@ -0,0 +1,119 @@
 """Provide functionality to wake word."""
 from __future__ import annotations
 from abc import abstractmethod
 from collections.abc import AsyncIterable
 import logging
 from typing import final
 from homeassistant.config_entries import ConfigEntry
 from homeassistant.const import STATE_UNAVAILABLE, STATE_UNKNOWN
 from homeassistant.core import HomeAssistant, callback
 from homeassistant.helpers import config_validation as cv
 from homeassistant.helpers.entity_component import EntityComponent
 from homeassistant.helpers.restore_state import RestoreEntity
 from homeassistant.helpers.typing import ConfigType
 from homeassistant.util import dt as dt_util
 from .const import DOMAIN
 from .models import DetectionResult, WakeWord
 __all__ = [
    "async_default_engine",
    "async_get_wake_word_detection_entity",
    "DetectionResult",
    "DOMAIN",
    "WakeWord",
    "WakeWordDetectionEntity",
 ]
 _LOGGER = logging.getLogger(__name__)
 CONFIG_SCHEMA = cv.empty_config_schema(DOMAIN)
@callback
 def async_default_engine(hass: HomeAssistant) -> str | None:
    """Return the domain or entity id of the default engine."""
    return next(iter(hass.states.async_entity_ids(DOMAIN)), None)
@callback
 def async_get_wake_word_detection_entity(
    hass: HomeAssistant, entity_id: str
 ) -> WakeWordDetectionEntity | None:
    """Return wake word entity."""
    component: EntityComponent = hass.data[DOMAIN]
    return component.get_entity(entity_id)
 async def async_setup(hass: HomeAssistant, config: ConfigType) -> bool:
    """Set up STT."""
    component = hass.data[DOMAIN] = EntityComponent(_LOGGER, DOMAIN, hass)
    component.register_shutdown()
    return True
 async def async_setup_entry(hass: HomeAssistant, entry: ConfigEntry) -> bool:
    """Set up a config entry."""
    component: EntityComponent = hass.data[DOMAIN]
    return await component.async_setup_entry(entry)
 async def async_unload_entry(hass: HomeAssistant, entry: ConfigEntry) -> bool:
    """Unload a config entry."""
    component: EntityComponent = hass.data[DOMAIN]
    return await component.async_unload_entry(entry)
 class WakeWordDetectionEntity(RestoreEntity):
    """Represent a single wake word provider."""
    _attr_should_poll = False
    __last_processed: str | None = None
    @property
    @final
    def state(self) -> str | None:
        """Return the state of the entity."""
        if self.__last_processed is None:
            return None
        return self.__last_processed
    @property
    @abstractmethod
    def supported_wake_words(self) -> list[WakeWord]:
        """Return a list of supported wake words."""
    @abstractmethod
    async def _async_process_audio_stream(
        self, stream: AsyncIterable[tuple[bytes, int]]
    ) -> DetectionResult | None:
        """Try to detect wake word(s) in an audio stream with timestamps.
        Audio must be 16Khz sample rate with 16-bit mono PCM samples.
        """
    async def async_process_audio_stream(
        self, stream: AsyncIterable[tuple[bytes, int]]
    ) -> DetectionResult | None:
        """Try to detect wake word(s) in an audio stream with timestamps.
        Audio must be 16Khz sample rate with 16-bit mono PCM samples.
        """
        self.__last_processed = dt_util.utcnow().isoformat()
        self.async_write_ha_state()
        return await self._async_process_audio_stream(stream)
    async def async_internal_added_to_hass(self) -> None:
        """Call when the entity is added to hass."""
        await super().async_internal_added_to_hass()
        state = await self.async_get_last_state()
        if (
            state is not None
            and state.state is not None
            and state.state not in (STATE_UNAVAILABLE, STATE_UNKNOWN)
        ):
            self.__last_processed = state.state
--- a/homeassistant/components/wake_word/const.py
+++ b/homeassistant/components/wake_word/const.py
@ -0,0 +1,2 @@
 """Wake word constants."""
 DOMAIN = "wake_word"
--- a/homeassistant/components/wake_word/manifest.json
+++ b/homeassistant/components/wake_word/manifest.json
@ -0,0 +1,8 @@
 {
  "domain": "wake_word",
  "name": "Wake-word detection",
  "codeowners": ["@home-assistant/core", "@synesthesiam"],
  "documentation": "https://www.home-assistant.io/integrations/wake_word",
  "integration_type": "entity",
  "quality_scale": "internal"
 }
--- a/homeassistant/components/wake_word/models.py
+++ b/homeassistant/components/wake_word/models.py
@ -0,0 +1,24 @@
 """Wake word models."""
 from dataclasses import dataclass
@dataclass(frozen=True)
 class WakeWord:
    """Wake word model."""
    ww_id: str
    name: str
@dataclass
 class DetectionResult:
    """Result of wake word detection."""
    ww_id: str
    """Id of detected wake word"""
    timestamp: int | None
    """Timestamp of audio chunk with detected wake word"""
    queued_audio: list[tuple[bytes, int]] | None = None
    """Audio chunks that were queued when wake word was detected."""
--- a/homeassistant/components/wyoming/config_flow.py
+++ b/homeassistant/components/wyoming/config_flow.py
@ -50,14 +50,21 @@ class ConfigFlow(config_entries.ConfigFlow, domain=DOMAIN):
                errors={"base": "cannot_connect"},
            )
-        # ASR = automated speech recognition (STT)
+        # ASR = automated speech recognition (speech-to-text)
        asr_installed = [asr for asr in service.info.asr if asr.installed]
        # TTS = text-to-speech
        tts_installed = [tts for tts in service.info.tts if tts.installed]
        # wake-word-detection
        wake_installed = [wake for wake in service.info.wake if wake.installed]
        if asr_installed:
            name = asr_installed[0].name
        elif tts_installed:
            name = tts_installed[0].name
        elif wake_installed:
            name = wake_installed[0].name
        else:
            return self.async_abort(reason="no_services")
--- a/homeassistant/components/wyoming/data.py
+++ b/homeassistant/components/wyoming/data.py
@ -29,6 +29,8 @@ class WyomingService:
            platforms.append(Platform.STT)
        if any(tts.installed for tts in info.tts):
            platforms.append(Platform.TTS)
        if any(wake.installed for wake in info.wake):
            platforms.append(Platform.WAKE_WORD)
        self.platforms = platforms
    @classmethod
--- a/homeassistant/components/wyoming/wake_word.py
+++ b/homeassistant/components/wyoming/wake_word.py
@ -0,0 +1,157 @@
 """Support for Wyoming wake-word-detection services."""
 import asyncio
 from collections.abc import AsyncIterable
 import logging
 from wyoming.audio import AudioChunk, AudioStart
 from wyoming.client import AsyncTcpClient
 from wyoming.wake import Detection
 from homeassistant.components import wake_word
 from homeassistant.config_entries import ConfigEntry
 from homeassistant.core import HomeAssistant
 from homeassistant.helpers.entity_platform import AddEntitiesCallback
 from .const import DOMAIN
 from .data import WyomingService
 from .error import WyomingError
 _LOGGER = logging.getLogger(__name__)
 async def async_setup_entry(
    hass: HomeAssistant,
    config_entry: ConfigEntry,
    async_add_entities: AddEntitiesCallback,
 ) -> None:
    """Set up Wyoming wake-word-detection."""
    service: WyomingService = hass.data[DOMAIN][config_entry.entry_id]
    async_add_entities(
        [
            WyomingWakeWordProvider(config_entry, service),
        ]
    )
 class WyomingWakeWordProvider(wake_word.WakeWordDetectionEntity):
    """Wyoming wake-word-detection provider."""
    def __init__(
        self,
        config_entry: ConfigEntry,
        service: WyomingService,
    ) -> None:
        """Set up provider."""
        self.service = service
        wake_service = service.info.wake[0]
        self._supported_wake_words = [
            wake_word.WakeWord(ww_id=ww.name, name=ww.name)
            for ww in wake_service.models
        ]
        self._attr_name = wake_service.name
        self._attr_unique_id = f"{config_entry.entry_id}-wake_word"
    @property
    def supported_wake_words(self) -> list[wake_word.WakeWord]:
        """Return a list of supported wake words."""
        return self._supported_wake_words
    async def _async_process_audio_stream(
        self, stream: AsyncIterable[tuple[bytes, int]]
    ) -> wake_word.DetectionResult | None:
        """Try to detect one or more wake words in an audio stream.
        Audio must be 16Khz sample rate with 16-bit mono PCM samples.
        """
        async def next_chunk():
            """Get the next chunk from audio stream."""
            async for chunk_bytes in stream:
                return chunk_bytes
        try:
            async with AsyncTcpClient(self.service.host, self.service.port) as client:
                await client.write_event(
                    AudioStart(
                        rate=16000,
                        width=2,
                        channels=1,
                    ).event(),
                )
                # Read audio and wake events in "parallel"
                audio_task = asyncio.create_task(next_chunk())
                wake_task = asyncio.create_task(client.read_event())
                pending = {audio_task, wake_task}
                try:
                    while True:
                        done, pending = await asyncio.wait(
                            pending, return_when=asyncio.FIRST_COMPLETED
                        )
                        if wake_task in done:
                            event = wake_task.result()
                            if event is None:
                                _LOGGER.debug("Connection lost")
                                break
                            if Detection.is_type(event.type):
                                # Successful detection
                                detection = Detection.from_event(event)
                                _LOGGER.info(detection)
                                # Retrieve queued audio
                                queued_audio: list[tuple[bytes, int]] | None = None
                                if audio_task in pending:
                                    # Save queued audio
                                    await audio_task
                                    pending.remove(audio_task)
                                    queued_audio = [audio_task.result()]
                                return wake_word.DetectionResult(
                                    ww_id=detection.name,
                                    timestamp=detection.timestamp,
                                    queued_audio=queued_audio,
                                )
                            # Next event
                            wake_task = asyncio.create_task(client.read_event())
                            pending.add(wake_task)
                        if audio_task in done:
                            # Forward audio to wake service
                            chunk_info = audio_task.result()
                            if chunk_info is None:
                                break
                            chunk_bytes, chunk_timestamp = chunk_info
                            chunk = AudioChunk(
                                rate=16000,
                                width=2,
                                channels=1,
                                audio=chunk_bytes,
                                timestamp=chunk_timestamp,
                            )
                            await client.write_event(chunk.event())
                            # Next chunk
                            audio_task = asyncio.create_task(next_chunk())
                            pending.add(audio_task)
                finally:
                    # Clean up
                    if audio_task in pending:
                        # It's critical that we don't cancel the audio task or
                        # leave it hanging. This would mess up the pipeline STT
                        # by stopping the audio stream.
                        await audio_task
                        pending.remove(audio_task)
                    for task in pending:
                        task.cancel()
        except (OSError, WyomingError) as err:
            _LOGGER.exception("Error processing audio stream: %s", err)
        return None
--- a/homeassistant/const.py
+++ b/homeassistant/const.py
@ -57,6 +57,7 @@ class Platform(StrEnum):
    TTS = "tts"
    VACUUM = "vacuum"
    UPDATE = "update"
    WAKE_WORD = "wake_word"
    WATER_HEATER = "water_heater"
    WEATHER = "weather"
--- a/tests/components/assist_pipeline/conftest.py
+++ b/tests/components/assist_pipeline/conftest.py
@ -7,7 +7,7 @@ from unittest.mock import AsyncMock
 import pytest
-from homeassistant.components import stt, tts
+from homeassistant.components import stt, tts, wake_word
 from homeassistant.components.assist_pipeline import DOMAIN
 from homeassistant.components.assist_pipeline.pipeline import (
    PipelineData,
@ -174,6 +174,40 @@ class MockSttPlatform(MockPlatform):
        self.async_get_engine = async_get_engine
 class MockWakeWordEntity(wake_word.WakeWordDetectionEntity):
    """Mock wake word entity."""
    fail_process_audio = False
    url_path = "wake_word.test"
    _attr_name = "test"
    @property
    def supported_wake_words(self) -> list[wake_word.WakeWord]:
        """Return a list of supported wake words."""
        return [wake_word.WakeWord(ww_id="test_ww", name="Test Wake Word")]
    async def _async_process_audio_stream(
        self, stream: AsyncIterable[tuple[bytes, int]]
    ) -> wake_word.DetectionResult | None:
        """Try to detect wake word(s) in an audio stream with timestamps."""
        async for chunk, timestamp in stream:
            if chunk == b"wake word":
                return wake_word.DetectionResult(
                    ww_id=self.supported_wake_words[0].ww_id,
                    timestamp=timestamp,
                    queued_audio=[(b"queued audio", 0)],
                )
        # Not detected
        return None
@pytest.fixture
 async def mock_wake_word_provider_entity(hass) -> MockWakeWordEntity:
    """Mock wake word provider."""
    return MockWakeWordEntity()
 class MockFlow(ConfigFlow):
    """Test flow."""
@ -193,6 +227,7 @@ async def init_supporting_components(
    mock_stt_provider: MockSttProvider,
    mock_stt_provider_entity: MockSttProviderEntity,
    mock_tts_provider: MockTTSProvider,
    mock_wake_word_provider_entity: MockWakeWordEntity,
    config_flow_fixture,
 ):
    """Initialize relevant components with empty configs."""
@ -201,14 +236,18 @@ async def init_supporting_components(
        hass: HomeAssistant, config_entry: ConfigEntry
    ) -> bool:
        """Set up test config entry."""
-        await hass.config_entries.async_forward_entry_setup(config_entry, stt.DOMAIN)
+        await hass.config_entries.async_forward_entry_setups(
            config_entry, [stt.DOMAIN, wake_word.DOMAIN]
        )
        return True
    async def async_unload_entry_init(
        hass: HomeAssistant, config_entry: ConfigEntry
    ) -> bool:
        """Unload up test config entry."""
-        await hass.config_entries.async_forward_entry_unload(config_entry, stt.DOMAIN)
+        await hass.config_entries.async_unload_platforms(
            config_entry, [stt.DOMAIN, wake_word.DOMAIN]
        )
        return True
    async def async_setup_entry_stt_platform(
@ -219,6 +258,14 @@ async def init_supporting_components(
        """Set up test stt platform via config entry."""
        async_add_entities([mock_stt_provider_entity])
    async def async_setup_entry_wake_word_platform(
        hass: HomeAssistant,
        config_entry: ConfigEntry,
        async_add_entities: AddEntitiesCallback,
    ) -> None:
        """Set up test wake word platform via config entry."""
        async_add_entities([mock_wake_word_provider_entity])
    mock_integration(
        hass,
        MockModule(
@ -242,11 +289,19 @@ async def init_supporting_components(
            async_setup_entry=async_setup_entry_stt_platform,
        ),
    )
    mock_platform(
        hass,
        "test.wake_word",
        MockPlatform(
            async_setup_entry=async_setup_entry_wake_word_platform,
        ),
    )
    mock_platform(hass, "test.config_flow")
    assert await async_setup_component(hass, "homeassistant", {})
    assert await async_setup_component(hass, tts.DOMAIN, {"tts": {"platform": "test"}})
    assert await async_setup_component(hass, stt.DOMAIN, {"stt": {"platform": "test"}})
    # assert await async_setup_component(hass, wake_word.DOMAIN, {"wake_word": {}})
    assert await async_setup_component(hass, "media_source", {})
    config_entry = MockConfigEntry(domain="test")
--- a/tests/components/assist_pipeline/snapshots/test_init.ambr
+++ b/tests/components/assist_pipeline/snapshots/test_init.ambr
@ -266,3 +266,114 @@
    }),
  ])
 # ---
 # name: test_pipeline_from_audio_stream_wake_word
  list([
    dict({
      'data': dict({
        'language': 'en',
        'pipeline': <ANY>,
      }),
      'type': <PipelineEventType.RUN_START: 'run-start'>,
    }),
    dict({
      'data': dict({
        'engine': 'wake_word.test',
        'metadata': dict({
          'bit_rate': <AudioBitRates.BITRATE_16: 16>,
          'channel': <AudioChannels.CHANNEL_MONO: 1>,
          'codec': <AudioCodecs.PCM: 'pcm'>,
          'format': <AudioFormats.WAV: 'wav'>,
          'sample_rate': <AudioSampleRates.SAMPLERATE_16000: 16000>,
        }),
      }),
      'type': <PipelineEventType.WAKE_WORD_START: 'wake_word-start'>,
    }),
    dict({
      'data': dict({
        'wake_word_output': dict({
          'timestamp': 2000,
          'ww_id': 'test_ww',
        }),
      }),
      'type': <PipelineEventType.WAKE_WORD_END: 'wake_word-end'>,
    }),
    dict({
      'data': dict({
        'engine': 'test',
        'metadata': dict({
          'bit_rate': <AudioBitRates.BITRATE_16: 16>,
          'channel': <AudioChannels.CHANNEL_MONO: 1>,
          'codec': <AudioCodecs.PCM: 'pcm'>,
          'format': <AudioFormats.WAV: 'wav'>,
          'language': 'en-US',
          'sample_rate': <AudioSampleRates.SAMPLERATE_16000: 16000>,
        }),
      }),
      'type': <PipelineEventType.STT_START: 'stt-start'>,
    }),
    dict({
      'data': dict({
        'stt_output': dict({
          'text': 'test transcript',
        }),
      }),
      'type': <PipelineEventType.STT_END: 'stt-end'>,
    }),
    dict({
      'data': dict({
        'conversation_id': None,
        'device_id': None,
        'engine': 'homeassistant',
        'intent_input': 'test transcript',
        'language': 'en',
      }),
      'type': <PipelineEventType.INTENT_START: 'intent-start'>,
    }),
    dict({
      'data': dict({
        'intent_output': dict({
          'conversation_id': None,
          'response': dict({
            'card': dict({
            }),
            'data': dict({
              'code': 'no_intent_match',
            }),
            'language': 'en',
            'response_type': 'error',
            'speech': dict({
              'plain': dict({
                'extra_data': None,
                'speech': "Sorry, I couldn't understand that",
              }),
            }),
          }),
        }),
      }),
      'type': <PipelineEventType.INTENT_END: 'intent-end'>,
    }),
    dict({
      'data': dict({
        'engine': 'test',
        'language': 'en-US',
        'tts_input': "Sorry, I couldn't understand that",
        'voice': 'james_earl_jones',
      }),
      'type': <PipelineEventType.TTS_START: 'tts-start'>,
    }),
    dict({
      'data': dict({
        'tts_output': dict({
          'media_id': "media-source://tts/test?message=Sorry,+I+couldn't+understand+that&language=en-US&voice=james_earl_jones",
          'mime_type': 'audio/mpeg',
          'url': '/api/tts_proxy/dae2cdcb27a1d1c3b07ba2c7db91480f9d4bfd8f_en-us_031e2ec052_test.mp3',
        }),
      }),
      'type': <PipelineEventType.TTS_END: 'tts-end'>,
    }),
    dict({
      'data': None,
      'type': <PipelineEventType.RUN_END: 'run-end'>,
    }),
  ])
 # ---
--- a/tests/components/assist_pipeline/snapshots/test_websocket.ambr
+++ b/tests/components/assist_pipeline/snapshots/test_websocket.ambr
@ -155,6 +155,243 @@
    }),
  })
 # ---
 # name: test_audio_pipeline_no_wake_word_engine
  dict({
    'code': 'wake-engine-missing',
    'message': 'No wake word engine',
  })
 # ---
 # name: test_audio_pipeline_no_wake_word_entity
  dict({
    'code': 'wake-provider-missing',
    'message': 'No wake-word-detection provider for: wake_word.bad-entity-id',
  })
 # ---
 # name: test_audio_pipeline_with_wake_word
  dict({
    'language': 'en',
    'pipeline': <ANY>,
    'runner_data': dict({
      'stt_binary_handler_id': 1,
      'timeout': 30,
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word.1
  dict({
    'engine': 'wake_word.test',
    'metadata': dict({
      'bit_rate': 16,
      'channel': 1,
      'codec': 'pcm',
      'format': 'wav',
      'sample_rate': 16000,
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word.2
  dict({
    'wake_word_output': dict({
      'queued_audio': None,
      'timestamp': 1000,
      'ww_id': 'test_ww',
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word.3
  dict({
    'engine': 'test',
    'metadata': dict({
      'bit_rate': 16,
      'channel': 1,
      'codec': 'pcm',
      'format': 'wav',
      'language': 'en-US',
      'sample_rate': 16000,
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word.4
  dict({
    'stt_output': dict({
      'text': 'test transcript',
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word.5
  dict({
    'conversation_id': None,
    'device_id': None,
    'engine': 'homeassistant',
    'intent_input': 'test transcript',
    'language': 'en',
  })
 # ---
 # name: test_audio_pipeline_with_wake_word.6
  dict({
    'intent_output': dict({
      'conversation_id': None,
      'response': dict({
        'card': dict({
        }),
        'data': dict({
          'code': 'no_intent_match',
        }),
        'language': 'en',
        'response_type': 'error',
        'speech': dict({
          'plain': dict({
            'extra_data': None,
            'speech': "Sorry, I couldn't understand that",
          }),
        }),
      }),
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word.7
  dict({
    'engine': 'test',
    'language': 'en-US',
    'tts_input': "Sorry, I couldn't understand that",
    'voice': 'james_earl_jones',
  })
 # ---
 # name: test_audio_pipeline_with_wake_word.8
  dict({
    'tts_output': dict({
      'media_id': "media-source://tts/test?message=Sorry,+I+couldn't+understand+that&language=en-US&voice=james_earl_jones",
      'mime_type': 'audio/mpeg',
      'url': '/api/tts_proxy/dae2cdcb27a1d1c3b07ba2c7db91480f9d4bfd8f_en-us_031e2ec052_test.mp3',
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_no_timeout
  dict({
    'language': 'en',
    'pipeline': <ANY>,
    'runner_data': dict({
      'stt_binary_handler_id': 1,
      'timeout': 30,
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_no_timeout.1
  dict({
    'engine': 'wake_word.test',
    'metadata': dict({
      'bit_rate': 16,
      'channel': 1,
      'codec': 'pcm',
      'format': 'wav',
      'sample_rate': 16000,
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_no_timeout.2
  dict({
    'wake_word_output': dict({
      'timestamp': 0,
      'ww_id': 'test_ww',
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_no_timeout.3
  dict({
    'engine': 'test',
    'metadata': dict({
      'bit_rate': 16,
      'channel': 1,
      'codec': 'pcm',
      'format': 'wav',
      'language': 'en-US',
      'sample_rate': 16000,
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_no_timeout.4
  dict({
    'stt_output': dict({
      'text': 'test transcript',
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_no_timeout.5
  dict({
    'conversation_id': None,
    'device_id': None,
    'engine': 'homeassistant',
    'intent_input': 'test transcript',
    'language': 'en',
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_no_timeout.6
  dict({
    'intent_output': dict({
      'conversation_id': None,
      'response': dict({
        'card': dict({
        }),
        'data': dict({
          'code': 'no_intent_match',
        }),
        'language': 'en',
        'response_type': 'error',
        'speech': dict({
          'plain': dict({
            'extra_data': None,
            'speech': "Sorry, I couldn't understand that",
          }),
        }),
      }),
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_no_timeout.7
  dict({
    'engine': 'test',
    'language': 'en-US',
    'tts_input': "Sorry, I couldn't understand that",
    'voice': 'james_earl_jones',
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_no_timeout.8
  dict({
    'tts_output': dict({
      'media_id': "media-source://tts/test?message=Sorry,+I+couldn't+understand+that&language=en-US&voice=james_earl_jones",
      'mime_type': 'audio/mpeg',
      'url': '/api/tts_proxy/dae2cdcb27a1d1c3b07ba2c7db91480f9d4bfd8f_en-us_031e2ec052_test.mp3',
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_timeout
  dict({
    'language': 'en',
    'pipeline': <ANY>,
    'runner_data': dict({
      'stt_binary_handler_id': 1,
      'timeout': 30,
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_timeout.1
  dict({
    'engine': 'wake_word.test',
    'metadata': dict({
      'bit_rate': 16,
      'channel': 1,
      'codec': 'pcm',
      'format': 'wav',
      'sample_rate': 16000,
    }),
  })
 # ---
 # name: test_audio_pipeline_with_wake_word_timeout.2
  dict({
    'code': 'wake-word-timeout',
    'message': 'Wake word was not detected',
  })
 # ---
 # name: test_intent_failed
  dict({
    'language': 'en',
--- a/tests/components/assist_pipeline/test_init.py
+++ b/tests/components/assist_pipeline/test_init.py
@ -1,5 +1,6 @@
 """Test Voice Assistant init."""
 from dataclasses import asdict
 import itertools as it
 from unittest.mock import ANY
 import pytest
@ -8,10 +9,12 @@ from syrupy.assertion import SnapshotAssertion
 from homeassistant.components import assist_pipeline, stt
 from homeassistant.core import Context, HomeAssistant
-from .conftest import MockSttProvider, MockSttProviderEntity
+from .conftest import MockSttProvider, MockSttProviderEntity, MockWakeWordEntity
 from tests.typing import WebSocketGenerator
 BYTES_ONE_SECOND = 16000 * 2
 def process_events(events: list[assist_pipeline.PipelineEvent]) -> list[dict]:
    """Process events to remove dynamic values."""
@ -280,3 +283,61 @@ async def test_pipeline_from_audio_stream_unknown_pipeline(
        )
    assert not events
 async def test_pipeline_from_audio_stream_wake_word(
    hass: HomeAssistant,
    mock_stt_provider: MockSttProvider,
    mock_wake_word_provider_entity: MockWakeWordEntity,
    init_components,
    snapshot: SnapshotAssertion,
 ) -> None:
    """Test creating a pipeline from an audio stream with wake word."""
    events = []
    # [0, 1, ...]
    wake_chunk_1 = bytes(it.islice(it.cycle(range(256)), BYTES_ONE_SECOND))
    # [0, 2, ...]
    wake_chunk_2 = bytes(it.islice(it.cycle(range(0, 256, 2)), BYTES_ONE_SECOND))
    async def audio_data():
        yield wake_chunk_1  # 1 second
        yield wake_chunk_2  # 1 second
        yield b"wake word"
        yield b"part1"
        yield b"part2"
        yield b""
    await assist_pipeline.async_pipeline_from_audio_stream(
        hass,
        Context(),
        events.append,
        stt.SpeechMetadata(
            language="",
            format=stt.AudioFormats.WAV,
            codec=stt.AudioCodecs.PCM,
            bit_rate=stt.AudioBitRates.BITRATE_16,
            sample_rate=stt.AudioSampleRates.SAMPLERATE_16000,
            channel=stt.AudioChannels.CHANNEL_MONO,
        ),
        audio_data(),
        start_stage=assist_pipeline.PipelineStage.WAKE_WORD,
        wake_word_settings=assist_pipeline.WakeWordSettings(
            audio_seconds_to_buffer=1.5
        ),
    )
    assert process_events(events) == snapshot
    # 1. Half of wake_chunk_1 + all wake_chunk_2
    # 2. queued audio (from mock wake word entity)
    # 3. part1
    # 4. part2
    assert len(mock_stt_provider.received) == 4
    first_chunk = mock_stt_provider.received[0]
    assert first_chunk == wake_chunk_1[len(wake_chunk_1) // 2 :] + wake_chunk_2
    assert mock_stt_provider.received[1:] == [b"queued audio", b"part1", b"part2"]
--- a/tests/components/assist_pipeline/test_websocket.py
+++ b/tests/components/assist_pipeline/test_websocket.py
@ -167,6 +167,224 @@ async def test_audio_pipeline(
    assert msg["result"] == {"events": events}
 async def test_audio_pipeline_with_wake_word_timeout(
    hass: HomeAssistant,
    hass_ws_client: WebSocketGenerator,
    init_components,
    snapshot: SnapshotAssertion,
 ) -> None:
    """Test timeout from a pipeline run with audio input/output + wake word."""
    events = []
    client = await hass_ws_client(hass)
    await client.send_json_auto_id(
        {
            "type": "assist_pipeline/run",
            "start_stage": "wake_word",
            "end_stage": "tts",
            "input": {
                "sample_rate": 16000,
                "timeout": 1,
            },
        }
    )
    # result
    msg = await client.receive_json()
    assert msg["success"], msg
    # run start
    msg = await client.receive_json()
    assert msg["event"]["type"] == "run-start"
    msg["event"]["data"]["pipeline"] = ANY
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    # wake_word
    msg = await client.receive_json()
    assert msg["event"]["type"] == "wake_word-start"
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    # 2 seconds of silence
    await client.send_bytes(bytes([1]) + bytes(16000 * 2 * 2))
    # Time out error
    msg = await client.receive_json()
    assert msg["event"]["type"] == "error"
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
 async def test_audio_pipeline_with_wake_word_no_timeout(
    hass: HomeAssistant,
    hass_ws_client: WebSocketGenerator,
    init_components,
    snapshot: SnapshotAssertion,
 ) -> None:
    """Test events from a pipeline run with audio input/output + wake word with no timeout."""
    events = []
    client = await hass_ws_client(hass)
    await client.send_json_auto_id(
        {
            "type": "assist_pipeline/run",
            "start_stage": "wake_word",
            "end_stage": "tts",
            "input": {
                "sample_rate": 16000,
                "timeout": 0,
            },
        }
    )
    # result
    msg = await client.receive_json()
    assert msg["success"], msg
    # run start
    msg = await client.receive_json()
    assert msg["event"]["type"] == "run-start"
    msg["event"]["data"]["pipeline"] = ANY
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    # wake_word
    msg = await client.receive_json()
    assert msg["event"]["type"] == "wake_word-start"
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    # "audio"
    await client.send_bytes(bytes([1]) + b"wake word")
    msg = await client.receive_json()
    assert msg["event"]["type"] == "wake_word-end"
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    # stt
    msg = await client.receive_json()
    assert msg["event"]["type"] == "stt-start"
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    # End of audio stream (handler id + empty payload)
    await client.send_bytes(bytes([1]))
    msg = await client.receive_json()
    assert msg["event"]["type"] == "stt-end"
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    # intent
    msg = await client.receive_json()
    assert msg["event"]["type"] == "intent-start"
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    msg = await client.receive_json()
    assert msg["event"]["type"] == "intent-end"
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    # text-to-speech
    msg = await client.receive_json()
    assert msg["event"]["type"] == "tts-start"
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    msg = await client.receive_json()
    assert msg["event"]["type"] == "tts-end"
    assert msg["event"]["data"] == snapshot
    events.append(msg["event"])
    # run end
    msg = await client.receive_json()
    assert msg["event"]["type"] == "run-end"
    assert msg["event"]["data"] is None
    events.append(msg["event"])
    pipeline_data: PipelineData = hass.data[DOMAIN]
    pipeline_id = list(pipeline_data.pipeline_runs)[0]
    pipeline_run_id = list(pipeline_data.pipeline_runs[pipeline_id])[0]
    await client.send_json_auto_id(
        {
            "type": "assist_pipeline/pipeline_debug/get",
            "pipeline_id": pipeline_id,
            "pipeline_run_id": pipeline_run_id,
        }
    )
    msg = await client.receive_json()
    assert msg["success"]
    assert msg["result"] == {"events": events}
 async def test_audio_pipeline_no_wake_word_engine(
    hass: HomeAssistant,
    hass_ws_client: WebSocketGenerator,
    init_components,
    snapshot: SnapshotAssertion,
 ) -> None:
    """Test timeout from a pipeline run with audio input/output + wake word."""
    client = await hass_ws_client(hass)
    with patch(
        "homeassistant.components.wake_word.async_default_engine", return_value=None
    ):
        await client.send_json_auto_id(
            {
                "type": "assist_pipeline/run",
                "start_stage": "wake_word",
                "end_stage": "tts",
                "input": {
                    "sample_rate": 16000,
                },
            }
        )
        # error
        msg = await client.receive_json()
        assert not msg["success"]
        assert "error" in msg
        assert msg["error"] == snapshot
 async def test_audio_pipeline_no_wake_word_entity(
    hass: HomeAssistant,
    hass_ws_client: WebSocketGenerator,
    init_components,
    snapshot: SnapshotAssertion,
 ) -> None:
    """Test timeout from a pipeline run with audio input/output + wake word."""
    client = await hass_ws_client(hass)
    with patch(
        "homeassistant.components.wake_word.async_default_engine",
        return_value="wake_word.bad-entity-id",
    ), patch(
        "homeassistant.components.wake_word.async_get_wake_word_detection_entity",
        return_value=None,
    ):
        await client.send_json_auto_id(
            {
                "type": "assist_pipeline/run",
                "start_stage": "wake_word",
                "end_stage": "tts",
                "input": {
                    "sample_rate": 16000,
                },
            }
        )
        # error
        msg = await client.receive_json()
        assert not msg["success"]
        assert "error" in msg
        assert msg["error"] == snapshot
 async def test_intent_timeout(
    hass: HomeAssistant,
    hass_ws_client: WebSocketGenerator,
--- a/tests/components/wake_word/init.py
+++ b/tests/components/wake_word/init.py
@ -0,0 +1 @@
 """Wake-word-detection tests."""
--- a/tests/components/wake_word/common.py
+++ b/tests/components/wake_word/common.py
@ -0,0 +1,29 @@
 """Provide common test tools for wake-word-detection."""
 from __future__ import annotations
 from collections.abc import Callable, Coroutine
 from pathlib import Path
 from typing import Any
 from homeassistant.components import wake_word
 from homeassistant.config_entries import ConfigEntry
 from homeassistant.core import HomeAssistant
 from homeassistant.helpers.entity_platform import AddEntitiesCallback
 from tests.common import MockPlatform, mock_platform
 def mock_wake_word_entity_platform(
    hass: HomeAssistant,
    tmp_path: Path,
    integration: str,
    async_setup_entry: Callable[
        [HomeAssistant, ConfigEntry, AddEntitiesCallback],
        Coroutine[Any, Any, None],
    ]
    | None = None,
 ) -> MockPlatform:
    """Specialize the mock platform for stt."""
    loaded_platform = MockPlatform(async_setup_entry=async_setup_entry)
    mock_platform(hass, f"{integration}.{wake_word.DOMAIN}", loaded_platform)
    return loaded_platform
--- a/tests/components/wake_word/snapshots/test_init.ambr
+++ b/tests/components/wake_word/snapshots/test_init.ambr
@ -0,0 +1,11 @@
 # serializer version: 1
 # name: test_ws_detect
  dict({
    'event': dict({
      'timestamp': 2048.0,
      'ww_id': 'test_ww',
    }),
    'id': 1,
    'type': 'event',
  })
 # ---
--- a/tests/components/wake_word/test_init.py
+++ b/tests/components/wake_word/test_init.py
@ -0,0 +1,226 @@
 """Test wake_word component setup."""
 from collections.abc import AsyncIterable, Generator
 from pathlib import Path
 import pytest
 from homeassistant.components import wake_word
 from homeassistant.config_entries import ConfigEntry, ConfigEntryState, ConfigFlow
 from homeassistant.core import HomeAssistant, State
 from homeassistant.helpers.entity_platform import AddEntitiesCallback
 from homeassistant.setup import async_setup_component
 from .common import mock_wake_word_entity_platform
 from tests.common import (
    MockConfigEntry,
    MockModule,
    mock_config_flow,
    mock_integration,
    mock_platform,
    mock_restore_cache,
 )
 TEST_DOMAIN = "test"
 _SAMPLES_PER_CHUNK = 1024
 _BYTES_PER_CHUNK = _SAMPLES_PER_CHUNK * 2  # 16-bit
 _MS_PER_CHUNK = (_BYTES_PER_CHUNK // 2) // 16  # 16Khz
 class MockProviderEntity(wake_word.WakeWordDetectionEntity):
    """Mock provider entity."""
    url_path = "wake_word.test"
    _attr_name = "test"
    @property
    def supported_wake_words(self) -> list[wake_word.WakeWord]:
        """Return a list of supported wake words."""
        return [wake_word.WakeWord(ww_id="test_ww", name="Test Wake Word")]
    async def _async_process_audio_stream(
        self, stream: AsyncIterable[tuple[bytes, int]]
    ) -> wake_word.DetectionResult | None:
        """Try to detect wake word(s) in an audio stream with timestamps."""
        async for _chunk, timestamp in stream:
            if timestamp >= 2000:
                return wake_word.DetectionResult(
                    ww_id=self.supported_wake_words[0].ww_id, timestamp=timestamp
                )
        # Not detected
        return None
@pytest.fixture
 def mock_provider_entity() -> MockProviderEntity:
    """Test provider entity fixture."""
    return MockProviderEntity()
 class WakeWordFlow(ConfigFlow):
    """Test flow."""
@pytest.fixture(autouse=True)
 def config_flow_fixture(hass: HomeAssistant) -> Generator[None, None, None]:
    """Mock config flow."""
    mock_platform(hass, f"{TEST_DOMAIN}.config_flow")
    with mock_config_flow(TEST_DOMAIN, WakeWordFlow):
        yield
@pytest.fixture(name="setup")
 async def setup_fixture(
    hass: HomeAssistant,
    tmp_path: Path,
 ) -> MockProviderEntity:
    """Set up the test environment."""
    provider = MockProviderEntity()
    await mock_config_entry_setup(hass, tmp_path, provider)
    return provider
 async def mock_config_entry_setup(
    hass: HomeAssistant, tmp_path: Path, mock_provider_entity: MockProviderEntity
 ) -> MockConfigEntry:
    """Set up a test provider via config entry."""
    async def async_setup_entry_init(
        hass: HomeAssistant, config_entry: ConfigEntry
    ) -> bool:
        """Set up test config entry."""
        await hass.config_entries.async_forward_entry_setup(
            config_entry, wake_word.DOMAIN
        )
        return True
    async def async_unload_entry_init(
        hass: HomeAssistant, config_entry: ConfigEntry
    ) -> bool:
        """Unload up test config entry."""
        await hass.config_entries.async_forward_entry_unload(
            config_entry, wake_word.DOMAIN
        )
        return True
    mock_integration(
        hass,
        MockModule(
            TEST_DOMAIN,
            async_setup_entry=async_setup_entry_init,
            async_unload_entry=async_unload_entry_init,
        ),
    )
    async def async_setup_entry_platform(
        hass: HomeAssistant,
        config_entry: ConfigEntry,
        async_add_entities: AddEntitiesCallback,
    ) -> None:
        """Set up test stt platform via config entry."""
        async_add_entities([mock_provider_entity])
    mock_wake_word_entity_platform(
        hass, tmp_path, TEST_DOMAIN, async_setup_entry_platform
    )
    config_entry = MockConfigEntry(domain=TEST_DOMAIN)
    config_entry.add_to_hass(hass)
    assert await hass.config_entries.async_setup(config_entry.entry_id)
    await hass.async_block_till_done()
    return config_entry
 async def test_config_entry_unload(
    hass: HomeAssistant, tmp_path: Path, mock_provider_entity: MockProviderEntity
 ) -> None:
    """Test we can unload config entry."""
    config_entry = await mock_config_entry_setup(hass, tmp_path, mock_provider_entity)
    assert config_entry.state == ConfigEntryState.LOADED
    await hass.config_entries.async_unload(config_entry.entry_id)
    assert config_entry.state == ConfigEntryState.NOT_LOADED
 async def test_detected_entity(
    hass: HomeAssistant, tmp_path: Path, setup: MockProviderEntity
 ) -> None:
    """Test successful detection through entity."""
    async def three_second_stream():
        timestamp = 0
        while timestamp < 3000:
            yield bytes(_BYTES_PER_CHUNK), timestamp
            timestamp += _MS_PER_CHUNK
    # Need 2 seconds to trigger
    result = await setup.async_process_audio_stream(three_second_stream())
    assert result == wake_word.DetectionResult("test_ww", 2048)
 async def test_not_detected_entity(
    hass: HomeAssistant, setup: MockProviderEntity
 ) -> None:
    """Test unsuccessful detection through entity."""
    async def one_second_stream():
        timestamp = 0
        while timestamp < 1000:
            yield bytes(_BYTES_PER_CHUNK), timestamp
            timestamp += _MS_PER_CHUNK
    # Need 2 seconds to trigger
    result = await setup.async_process_audio_stream(one_second_stream())
    assert result is None
 async def test_default_engine_none(hass: HomeAssistant, tmp_path: Path) -> None:
    """Test async_default_engine."""
    assert await async_setup_component(hass, wake_word.DOMAIN, {wake_word.DOMAIN: {}})
    await hass.async_block_till_done()
    assert wake_word.async_default_engine(hass) is None
 async def test_default_engine_entity(
    hass: HomeAssistant, tmp_path: Path, mock_provider_entity: MockProviderEntity
 ) -> None:
    """Test async_default_engine."""
    await mock_config_entry_setup(hass, tmp_path, mock_provider_entity)
    assert wake_word.async_default_engine(hass) == f"{wake_word.DOMAIN}.{TEST_DOMAIN}"
 async def test_get_engine_entity(
    hass: HomeAssistant, tmp_path: Path, mock_provider_entity: MockProviderEntity
 ) -> None:
    """Test async_get_speech_to_text_engine."""
    await mock_config_entry_setup(hass, tmp_path, mock_provider_entity)
    assert (
        wake_word.async_get_wake_word_detection_entity(hass, f"{wake_word.DOMAIN}.test")
        is mock_provider_entity
    )
 async def test_restore_state(
    hass: HomeAssistant,
    tmp_path: Path,
    mock_provider_entity: MockProviderEntity,
 ) -> None:
    """Test we restore state in the integration."""
    entity_id = f"{wake_word.DOMAIN}.{TEST_DOMAIN}"
    timestamp = "2023-01-01T23:59:59+00:00"
    mock_restore_cache(hass, (State(entity_id, timestamp),))
    config_entry = await mock_config_entry_setup(hass, tmp_path, mock_provider_entity)
    await hass.async_block_till_done()
    assert config_entry.state == ConfigEntryState.LOADED
    state = hass.states.get(entity_id)
    assert state
    assert state.state == timestamp
--- a/tests/components/wyoming/init.py
+++ b/tests/components/wyoming/init.py
@ -1,4 +1,6 @@
 """Tests for the Wyoming integration."""
 import asyncio
 from wyoming.info import (
    AsrModel,
    AsrProgram,
@ -7,6 +9,8 @@ from wyoming.info import (
    TtsProgram,
    TtsVoice,
    TtsVoiceSpeaker,
    WakeModel,
    WakeProgram,
 )
 TEST_ATTR = Attribution(name="Test", url="http://www.test.com")
@ -49,6 +53,25 @@ TTS_INFO = Info(
        )
    ]
 )
 WAKE_WORD_INFO = Info(
    wake=[
        WakeProgram(
            name="Test Wake Word",
            description="Test Wake Word",
            installed=True,
            attribution=TEST_ATTR,
            models=[
                WakeModel(
                    name="Test Model",
                    description="Test Model",
                    installed=True,
                    attribution=TEST_ATTR,
                    languages=["en-US"],
                )
            ],
        )
    ]
 )
 EMPTY_INFO = Info()
@ -68,6 +91,7 @@ class MockAsyncTcpClient:
    async def read_event(self):
        """Receive."""
        await asyncio.sleep(0)  # force context switch
        return self.responses.pop(0)
    async def __aenter__(self):
--- a/tests/components/wyoming/conftest.py
+++ b/tests/components/wyoming/conftest.py
@ -8,7 +8,7 @@ from homeassistant.components import stt
 from homeassistant.config_entries import ConfigEntry
 from homeassistant.core import HomeAssistant
-from . import STT_INFO, TTS_INFO
+from . import STT_INFO, TTS_INFO, WAKE_WORD_INFO
 from tests.common import MockConfigEntry
@ -52,6 +52,21 @@ def tts_config_entry(hass: HomeAssistant) -> ConfigEntry:
    return entry
@pytest.fixture
 def wake_word_config_entry(hass: HomeAssistant) -> ConfigEntry:
    """Create a config entry."""
    entry = MockConfigEntry(
        domain="wyoming",
        data={
            "host": "1.2.3.4",
            "port": 1234,
        },
        title="Test Wake Word",
    )
    entry.add_to_hass(hass)
    return entry
@pytest.fixture
 async def init_wyoming_stt(hass: HomeAssistant, stt_config_entry: ConfigEntry):
    """Initialize Wyoming STT."""
@ -72,6 +87,18 @@ async def init_wyoming_tts(hass: HomeAssistant, tts_config_entry: ConfigEntry):
        await hass.config_entries.async_setup(tts_config_entry.entry_id)
@pytest.fixture
 async def init_wyoming_wake_word(
    hass: HomeAssistant, wake_word_config_entry: ConfigEntry
 ):
    """Initialize Wyoming Wake Word."""
    with patch(
        "homeassistant.components.wyoming.data.load_wyoming_info",
        return_value=WAKE_WORD_INFO,
    ):
        await hass.config_entries.async_setup(wake_word_config_entry.entry_id)
@pytest.fixture
 def metadata(hass: HomeAssistant) -> stt.SpeechMetadata:
    """Get default STT metadata."""
--- a/tests/components/wyoming/snapshots/test_wake_word.ambr
+++ b/tests/components/wyoming/snapshots/test_wake_word.ambr
@ -0,0 +1,13 @@
 # serializer version: 1
 # name: test_streaming_audio
  dict({
    'queued_audio': list([
      tuple(
        b'chunk',
        1,
      ),
    ]),
    'timestamp': 0,
    'ww_id': 'Test Model',
  })
 # ---
--- a/tests/components/wyoming/test_wake_word.py
+++ b/tests/components/wyoming/test_wake_word.py
@ -0,0 +1,108 @@
 """Test stt."""
 from __future__ import annotations
 import asyncio
 from unittest.mock import patch
 from syrupy.assertion import SnapshotAssertion
 from wyoming.asr import Transcript
 from wyoming.wake import Detection
 from homeassistant.components import wake_word
 from homeassistant.core import HomeAssistant
 from . import MockAsyncTcpClient
 async def test_support(hass: HomeAssistant, init_wyoming_wake_word) -> None:
    """Test supported properties."""
    state = hass.states.get("wake_word.test_wake_word")
    assert state is not None
    entity = wake_word.async_get_wake_word_detection_entity(
        hass, "wake_word.test_wake_word"
    )
    assert entity is not None
    assert entity.supported_wake_words == [
        wake_word.WakeWord(ww_id="Test Model", name="Test Model")
    ]
 async def test_streaming_audio(
    hass: HomeAssistant, init_wyoming_wake_word, snapshot: SnapshotAssertion
 ) -> None:
    """Test streaming audio."""
    entity = wake_word.async_get_wake_word_detection_entity(
        hass, "wake_word.test_wake_word"
    )
    assert entity is not None
    async def audio_stream():
        yield b"chunk", 0
        # Delay to force a pending audio chunk
        await asyncio.sleep(0.05)
        yield b"chunk", 1
    client_events = [
        Transcript("not a wake word event").event(),
        Detection(name="Test Model", timestamp=0).event(),
    ]
    with patch(
        "homeassistant.components.wyoming.wake_word.AsyncTcpClient",
        MockAsyncTcpClient(client_events),
    ):
        result = await entity.async_process_audio_stream(audio_stream())
    assert result is not None
    assert result == snapshot
 async def test_streaming_audio_connection_lost(
    hass: HomeAssistant, init_wyoming_wake_word
 ) -> None:
    """Test streaming audio and losing connection."""
    entity = wake_word.async_get_wake_word_detection_entity(
        hass, "wake_word.test_wake_word"
    )
    assert entity is not None
    async def audio_stream():
        # Delay to force a pending audio chunk
        await asyncio.sleep(0.05)
        yield b"chunk", 1
    with patch(
        "homeassistant.components.wyoming.wake_word.AsyncTcpClient",
        MockAsyncTcpClient([None]),
    ):
        result = await entity.async_process_audio_stream(audio_stream())
    assert result is None
 async def test_streaming_audio_oserror(
    hass: HomeAssistant, init_wyoming_wake_word
 ) -> None:
    """Test streaming audio and error raising."""
    entity = wake_word.async_get_wake_word_detection_entity(
        hass, "wake_word.test_wake_word"
    )
    assert entity is not None
    async def audio_stream():
        yield b"chunk1", 1000
    mock_client = MockAsyncTcpClient(
        [Detection(name="Test Model", timestamp=1000).event()]
    )
    with patch(
        "homeassistant.components.wyoming.wake_word.AsyncTcpClient",
        mock_client,
    ), patch.object(mock_client, "read_event", side_effect=OSError("Boom!")):
        result = await entity.async_process_audio_stream(audio_stream())
    assert result is None
		`@ -0,0 +1,2 @@`
							`"""Wake word constants."""`
							`DOMAIN = "wake_word"`