ESPHome: esphome/components/voice_assistant/voice_assistant.h Source File

#pragma once


#include "esphome/core/defines.h"


#ifdef USE_VOICE_ASSISTANT


#include "esphome/core/automation.h"

#include "esphome/core/component.h"

#include "esphome/core/helpers.h"

#include "esphome/core/ring_buffer.h"


#include "esphome/components/api/api_connection.h"

#include "esphome/components/api/api_pb2.h"

#include "esphome/components/microphone/microphone_source.h"

#ifdef USE_MEDIA_PLAYER

#include "esphome/components/media_player/media_player.h"

#endif

#ifdef USE_MICRO_WAKE_WORD

#include "esphome/components/micro_wake_word/micro_wake_word.h"

#endif

#ifdef USE_SPEAKER

#include "esphome/components/speaker/speaker.h"

#endif

#include "esphome/components/socket/socket.h"


#include <span>

#include <vector>


namespace esphome {

namespace voice_assistant {


// Legacy version numbers, as returned by VoiceAssistant::get_legacy_version():
//   1 - Initial version
//   2 - Adds raw speaker support
static constexpr uint32_t LEGACY_INITIAL_VERSION{1};
static constexpr uint32_t LEGACY_SPEAKER_SUPPORT{2};


/// Bit flags that are OR-ed together into a single uint32_t feature mask
/// (see VoiceAssistant::get_feature_flags()). Each enumerator occupies one bit.
enum VoiceAssistantFeature : uint32_t {
  FEATURE_VOICE_ASSISTANT = 1U << 0,     ///< bit 0 - always set in the feature mask
  FEATURE_SPEAKER = 1U << 1,             ///< bit 1 - set when a speaker is attached
  FEATURE_API_AUDIO = 1U << 2,           ///< bit 2 - always set in the feature mask
  FEATURE_TIMERS = 1U << 3,              ///< bit 3 - set when timers are enabled
  FEATURE_ANNOUNCE = 1U << 4,            ///< bit 4 - set when a media player is attached
  FEATURE_START_CONVERSATION = 1U << 5,  ///< bit 5 - set when a media player is attached
};


/// States used by VoiceAssistant for its `state_` and `desired_state_` members.
/// IDLE is the initial value of both members, and VoiceAssistant::is_running()
/// reports true for every state other than IDLE.
/// NOTE(review): the transitions between states are implemented outside this
/// header; the enumerator names suggest request/in-progress pairs
/// (e.g. START_* followed by STARTING_*) - confirm against the implementation.
enum class State {

  IDLE,

  START_MICROPHONE,

  STARTING_MICROPHONE,

  WAIT_FOR_VAD,

  WAITING_FOR_VAD,

  START_PIPELINE,

  STARTING_PIPELINE,

  STREAMING_MICROPHONE,

  STOP_MICROPHONE,

  STOPPING_MICROPHONE,

  AWAITING_RESPONSE,

  STREAMING_RESPONSE,

  RESPONSE_FINISHED,

};


/// Audio mode stored in VoiceAssistant::audio_mode_, which defaults to AUDIO_MODE_UDP.
/// NOTE(review): presumably selects whether audio travels over the UDP socket or
/// over the API connection - confirm against the implementation.
enum AudioMode : uint8_t {

  AUDIO_MODE_UDP,

  AUDIO_MODE_API,

};


/// Value type describing one timer; it is the payload of the timer triggers
/// exposed by VoiceAssistant and the element type of VoiceAssistant::get_timers().
///
/// The scalar members carry default initializers so that a default-constructed
/// Timer is fully defined and can be formatted safely with to_str().
struct Timer {
  std::string id;
  std::string name;
  uint32_t total_seconds{0};
  uint32_t seconds_left{0};
  bool is_active{false};

  /// Size, in bytes, of the buffer that to_str() formats into.
  static constexpr size_t TO_STR_BUFFER_SIZE = 128;

  /// Format a human-readable description of this timer into @p buffer.
  ///
  /// Formatting goes through snprintf() bounded by the buffer size, so output
  /// longer than the buffer is truncated and remains NUL-terminated.
  ///
  /// @param buffer Caller-provided storage of exactly TO_STR_BUFFER_SIZE chars.
  /// @return Pointer to the start of @p buffer.
  const char *to_str(std::span<char, TO_STR_BUFFER_SIZE> buffer) const {
    snprintf(buffer.data(), buffer.size(),
             "Timer(id=%s, name=%s, total_seconds=%" PRIu32 ", seconds_left=%" PRIu32 ", is_active=%s)",
             this->id.c_str(), this->name.c_str(), this->total_seconds, this->seconds_left, YESNO(this->is_active));
    return buffer.data();
  }

  // Remove before 2026.8.0
  /// Deprecated convenience wrapper: formats via to_str() into a stack buffer
  /// and returns the result as a std::string copy.
  ESPDEPRECATED("Use to_str() instead. Removed in 2026.8.0", "2026.2.0")
  std::string to_string() const {  // NOLINT
    char buffer[TO_STR_BUFFER_SIZE];
    return this->to_str(buffer);
  }
};


/// Description of one wake word; element type of Configuration::available_wake_words.
/// NOTE(review): field meanings are inferred from their names only - `id` is
/// presumably a unique identifier, `wake_word` the phrase itself and
/// `trained_languages` a list of language codes; confirm against the producer.
struct WakeWord {

  std::string id;

  std::string wake_word;

  std::vector<std::string> trained_languages;

};


/// Wake-word configuration held by VoiceAssistant (member `config_`) and
/// returned by VoiceAssistant::get_configuration().
struct Configuration {
  /// Wake words that can be chosen from.
  std::vector<WakeWord> available_wake_words;
  /// Entries for the currently active wake words.
  /// NOTE(review): presumably WakeWord::id values - confirm against the implementation.
  std::vector<std::string> active_wake_words;
  /// Zero-initialized so that a default-constructed Configuration never exposes
  /// an indeterminate value.
  uint32_t max_active_wake_words{0};
};


#ifdef USE_MEDIA_PLAYER


/// Value type of VoiceAssistant::media_player_response_state_, which starts as IDLE.
/// Only compiled when USE_MEDIA_PLAYER is defined.
/// NOTE(review): the names suggest a progression IDLE -> URL_SENT -> PLAYING ->
/// FINISHED while a response is played through the media player; the
/// transitions are implemented outside this header - confirm there.
enum class MediaPlayerResponseState {

  IDLE,

  URL_SENT,

  PLAYING,

  FINISHED,

};


#endif


class VoiceAssistant : public Component {

 public:

  VoiceAssistant();


  void loop() override;

  void setup() override;

  float get_setup_priority() const override;

  void start_streaming();

  void start_streaming(struct sockaddr_storage *addr, uint16_t port);

  void failed_to_start();


  void set_microphone_source(microphone::MicrophoneSource *mic_source) { this->mic_source_ = mic_source; }

#ifdef USE_MICRO_WAKE_WORD

  void set_micro_wake_word(micro_wake_word::MicroWakeWord *mww) { this->micro_wake_word_ = mww; }

#endif

#ifdef USE_SPEAKER


  void set_speaker(speaker::Speaker *speaker) {

    this->speaker_ = speaker;

    this->local_output_ = true;

  }


#endif

#ifdef USE_MEDIA_PLAYER


  void set_media_player(media_player::MediaPlayer *media_player) {

    this->media_player_ = media_player;

    this->local_output_ = true;

  }


#endif


  uint32_t get_legacy_version() const {

#ifdef USE_SPEAKER

    if (this->speaker_ != nullptr) {

      return LEGACY_SPEAKER_SUPPORT;

    }

#endif

    return LEGACY_INITIAL_VERSION;

  }


  uint32_t get_feature_flags() const {

    uint32_t flags = 0;

    flags |= VoiceAssistantFeature::FEATURE_VOICE_ASSISTANT;

    flags |= VoiceAssistantFeature::FEATURE_API_AUDIO;

#ifdef USE_SPEAKER

    if (this->speaker_ != nullptr) {

      flags |= VoiceAssistantFeature::FEATURE_SPEAKER;

    }

#endif


    if (this->has_timers_) {

      flags |= VoiceAssistantFeature::FEATURE_TIMERS;

    }


#ifdef USE_MEDIA_PLAYER

    if (this->media_player_ != nullptr) {

      flags |= VoiceAssistantFeature::FEATURE_ANNOUNCE;

      flags |= VoiceAssistantFeature::FEATURE_START_CONVERSATION;

    }

#endif


    return flags;

  }


  void request_start(bool continuous, bool silence_detection);

  void request_stop();


  void on_event(const api::VoiceAssistantEventResponse &msg);

  void on_audio(const api::VoiceAssistantAudio &msg);

  void on_timer_event(const api::VoiceAssistantTimerEventResponse &msg);

  void on_announce(const api::VoiceAssistantAnnounceRequest &msg);

  void on_set_configuration(const std::vector<std::string> &active_wake_words);

  const Configuration &get_configuration();


  bool is_running() const { return this->state_ != State::IDLE; }

  void set_continuous(bool continuous) { this->continuous_ = continuous; }

  bool is_continuous() const { return this->continuous_; }


  void set_use_wake_word(bool use_wake_word) { this->use_wake_word_ = use_wake_word; }


  void set_noise_suppression_level(uint8_t noise_suppression_level) {

    this->noise_suppression_level_ = noise_suppression_level;

  }


  void set_auto_gain(uint8_t auto_gain) { this->auto_gain_ = auto_gain; }

  void set_volume_multiplier(float volume_multiplier) { this->volume_multiplier_ = volume_multiplier; }

  void set_conversation_timeout(uint32_t conversation_timeout) { this->conversation_timeout_ = conversation_timeout; }

  void reset_conversation_id();


  Trigger<> *get_intent_end_trigger() { return &this->intent_end_trigger_; }

  Trigger<> *get_intent_start_trigger() { return &this->intent_start_trigger_; }

  Trigger<std::string> *get_intent_progress_trigger() { return &this->intent_progress_trigger_; }

  Trigger<> *get_listening_trigger() { return &this->listening_trigger_; }

  Trigger<> *get_end_trigger() { return &this->end_trigger_; }

  Trigger<> *get_start_trigger() { return &this->start_trigger_; }

  Trigger<> *get_stt_vad_end_trigger() { return &this->stt_vad_end_trigger_; }

  Trigger<> *get_stt_vad_start_trigger() { return &this->stt_vad_start_trigger_; }

#ifdef USE_SPEAKER

  Trigger<> *get_tts_stream_start_trigger() { return &this->tts_stream_start_trigger_; }

  Trigger<> *get_tts_stream_end_trigger() { return &this->tts_stream_end_trigger_; }

#endif

  Trigger<> *get_wake_word_detected_trigger() { return &this->wake_word_detected_trigger_; }

  Trigger<std::string> *get_stt_end_trigger() { return &this->stt_end_trigger_; }

  Trigger<std::string> *get_tts_end_trigger() { return &this->tts_end_trigger_; }

  Trigger<std::string> *get_tts_start_trigger() { return &this->tts_start_trigger_; }

  Trigger<std::string, std::string> *get_error_trigger() { return &this->error_trigger_; }

  Trigger<> *get_idle_trigger() { return &this->idle_trigger_; }


  Trigger<> *get_client_connected_trigger() { return &this->client_connected_trigger_; }

  Trigger<> *get_client_disconnected_trigger() { return &this->client_disconnected_trigger_; }


  void client_subscription(api::APIConnection *client, bool subscribe);

  api::APIConnection *get_api_connection() const { return this->api_client_; }


  void set_wake_word(const std::string &wake_word) { this->wake_word_ = wake_word; }


  Trigger<Timer> *get_timer_started_trigger() { return &this->timer_started_trigger_; }

  Trigger<Timer> *get_timer_updated_trigger() { return &this->timer_updated_trigger_; }

  Trigger<Timer> *get_timer_cancelled_trigger() { return &this->timer_cancelled_trigger_; }

  Trigger<Timer> *get_timer_finished_trigger() { return &this->timer_finished_trigger_; }

  Trigger<const std::vector<Timer> &> *get_timer_tick_trigger() { return &this->timer_tick_trigger_; }

  void set_has_timers(bool has_timers) { this->has_timers_ = has_timers; }

  const std::vector<Timer> &get_timers() const { return this->timers_; }


 protected:

  bool allocate_buffers_();

  void clear_buffers_();

  void deallocate_buffers_();


  void set_state_(State state);

  void set_state_(State state, State desired_state);

  void signal_stop_();

  void start_playback_timeout_();


  std::unique_ptr<socket::Socket> socket_ = nullptr;

  struct sockaddr_storage dest_addr_;


  Trigger<> intent_end_trigger_;

  Trigger<> intent_start_trigger_;

  Trigger<> listening_trigger_;

  Trigger<> end_trigger_;

  Trigger<> start_trigger_;

  Trigger<> stt_vad_start_trigger_;

  Trigger<> stt_vad_end_trigger_;

#ifdef USE_SPEAKER

  Trigger<> tts_stream_start_trigger_;

  Trigger<> tts_stream_end_trigger_;

#endif

  Trigger<std::string> intent_progress_trigger_;

  Trigger<> wake_word_detected_trigger_;

  Trigger<std::string> stt_end_trigger_;

  Trigger<std::string> tts_end_trigger_;

  Trigger<std::string> tts_start_trigger_;

  Trigger<std::string, std::string> error_trigger_;

  Trigger<> idle_trigger_;


  Trigger<> client_connected_trigger_;

  Trigger<> client_disconnected_trigger_;


  api::APIConnection *api_client_{nullptr};


  std::vector<Timer> timers_;

  void timer_tick_();

  Trigger<Timer> timer_started_trigger_;

  Trigger<Timer> timer_finished_trigger_;

  Trigger<Timer> timer_updated_trigger_;

  Trigger<Timer> timer_cancelled_trigger_;

  Trigger<const std::vector<Timer> &> timer_tick_trigger_;

  bool has_timers_{false};

  bool timer_tick_running_{false};


  microphone::MicrophoneSource *mic_source_{nullptr};

#ifdef USE_SPEAKER

  void write_speaker_();

  speaker::Speaker *speaker_{nullptr};

  uint8_t *speaker_buffer_{nullptr};

  size_t speaker_buffer_index_{0};

  size_t speaker_buffer_size_{0};

  size_t speaker_bytes_received_{0};

  bool wait_for_stream_end_{false};

  bool stream_ended_{false};

#endif

#ifdef USE_MEDIA_PLAYER

  media_player::MediaPlayer *media_player_{nullptr};

  std::string tts_response_url_{""};

  bool started_streaming_tts_{false};


  MediaPlayerResponseState media_player_response_state_{MediaPlayerResponseState::IDLE};

#endif


  bool local_output_{false};


  std::string conversation_id_{""};


  std::string wake_word_{""};


  std::shared_ptr<RingBuffer> ring_buffer_;


  bool use_wake_word_;

  uint8_t noise_suppression_level_;

  uint8_t auto_gain_;

  float volume_multiplier_;

  uint32_t conversation_timeout_;


  uint8_t *send_buffer_{nullptr};


  bool continuous_{false};

  bool silence_detection_;


  bool continue_conversation_{false};


  State state_{State::IDLE};

  State desired_state_{State::IDLE};


  AudioMode audio_mode_{AUDIO_MODE_UDP};

  bool udp_socket_running_{false};

  bool start_udp_socket_();


  Configuration config_{};


#ifdef USE_MICRO_WAKE_WORD

  micro_wake_word::MicroWakeWord *micro_wake_word_{nullptr};

#endif

};


/// Automation action that starts a single (non-continuous) voice assistant run.
///
/// play() first forwards the templatable `wake_word` value to the parent
/// VoiceAssistant and then calls request_start(false, silence_detection_).
template<typename... Ts> class StartAction : public Action<Ts...>, public Parented<VoiceAssistant> {
  TEMPLATABLE_VALUE(std::string, wake_word);

 public:
  /// Evaluate the wake word for the given arguments and request a start.
  void play(const Ts &...x) override {
    this->parent_->set_wake_word(this->wake_word_.value(x...));
    this->parent_->request_start(false, this->silence_detection_);
  }

  void set_silence_detection(bool silence_detection) { this->silence_detection_ = silence_detection; }

 protected:
  // Initialized so play() never reads an indeterminate bool when
  // set_silence_detection() was not called. `true` mirrors the value that
  // StartContinuousAction passes to request_start().
  bool silence_detection_{true};
};


/// Automation action that asks the parent VoiceAssistant to start in continuous
/// mode; both arguments of request_start() are passed as true.
template<typename... Ts> class StartContinuousAction : public Action<Ts...>, public Parented<VoiceAssistant> {
 public:
  void play(const Ts &...x) override {
    constexpr bool continuous = true;
    constexpr bool silence_detection = true;
    this->parent_->request_start(continuous, silence_detection);
  }
};


/// Automation action that calls request_stop() on the parent VoiceAssistant.
template<typename... Ts> class StopAction : public Action<Ts...>, public Parented<VoiceAssistant> {
 public:
  void play(const Ts &...x) override {
    VoiceAssistant *const assistant = this->parent_;
    assistant->request_stop();
  }
};


/// Automation condition that holds when the parent VoiceAssistant is running
/// or has continuous mode enabled.
template<typename... Ts> class IsRunningCondition : public Condition<Ts...>, public Parented<VoiceAssistant> {
 public:
  bool check(const Ts &...x) override {
    // Same short-circuit order as a logical OR: is_continuous() is only
    // consulted when the assistant is not running.
    if (this->parent_->is_running()) {
      return true;
    }
    return this->parent_->is_continuous();
  }
};


/// Automation condition that holds when the parent VoiceAssistant currently has
/// a non-null API connection pointer.
template<typename... Ts> class ConnectedCondition : public Condition<Ts...>, public Parented<VoiceAssistant> {
 public:
  bool check(const Ts &...x) override {
    const api::APIConnection *const connection = this->parent_->get_api_connection();
    return connection != nullptr;
  }
};


// Declaration of the global VoiceAssistant pointer; its definition (and any
// assignment to it) lives outside this header.
extern VoiceAssistant *global_voice_assistant;  // NOLINT(cppcoreguidelines-avoid-non-const-global-variables)


}  // namespace voice_assistant

}  // namespace esphome


#endif  // USE_VOICE_ASSISTANT

api_connection.h

api_pb2.h

esphome::Action
Definition automation.h:351

esphome::Component
Definition component.h:87

esphome::Condition
Base class for all automation conditions.
Definition automation.h:304

esphome::Parented
Helper class to easily give an object a parent of type T.
Definition helpers.h:1618

esphome::Parented< VoiceAssistant >::parent_
VoiceAssistant * parent_
Definition helpers.h:1629

esphome::Trigger<>

esphome::api::APIConnection
Definition api_connection.h:35

esphome::api::VoiceAssistantAnnounceRequest
Definition api_pb2.h:2429

esphome::api::VoiceAssistantAudio
Definition api_pb2.h:2388

esphome::api::VoiceAssistantEventResponse
Definition api_pb2.h:2371

esphome::api::VoiceAssistantTimerEventResponse
Definition api_pb2.h:2408

esphome::media_player::MediaPlayer
Definition media_player.h:149

esphome::micro_wake_word::MicroWakeWord
Definition micro_wake_word.h:39

esphome::microphone::MicrophoneSource
Definition microphone_source.h:18

esphome::speaker::Speaker
Definition speaker.h:29

esphome::voice_assistant::ConnectedCondition
Definition voice_assistant.h:363

esphome::voice_assistant::ConnectedCondition::check
bool check(const Ts &...x) override
Definition voice_assistant.h:365

esphome::voice_assistant::IsRunningCondition
Definition voice_assistant.h:358

esphome::voice_assistant::IsRunningCondition::check
bool check(const Ts &...x) override
Definition voice_assistant.h:360

esphome::voice_assistant::StartAction
Definition voice_assistant.h:333

esphome::voice_assistant::StartAction::play
void play(const Ts &...x) override
Definition voice_assistant.h:337

esphome::voice_assistant::StartAction::set_silence_detection
void set_silence_detection(bool silence_detection)
Definition voice_assistant.h:342

esphome::voice_assistant::StartAction::silence_detection_
bool silence_detection_
Definition voice_assistant.h:345

esphome::voice_assistant::StartContinuousAction
Definition voice_assistant.h:348

esphome::voice_assistant::StartContinuousAction::play
void play(const Ts &...x) override
Definition voice_assistant.h:350

esphome::voice_assistant::StopAction
Definition voice_assistant.h:353

esphome::voice_assistant::StopAction::play
void play(const Ts &...x) override
Definition voice_assistant.h:355

esphome::voice_assistant::VoiceAssistant
Definition voice_assistant.h:112

esphome::voice_assistant::VoiceAssistant::intent_end_trigger_
Trigger intent_end_trigger_
Definition voice_assistant.h:245

esphome::voice_assistant::VoiceAssistant::socket_
std::unique_ptr< socket::Socket > socket_
Definition voice_assistant.h:242

esphome::voice_assistant::VoiceAssistant::get_timer_started_trigger
Trigger< Timer > * get_timer_started_trigger()
Definition voice_assistant.h:224

esphome::voice_assistant::VoiceAssistant::VoiceAssistant
VoiceAssistant()
Definition voice_assistant.cpp:30

esphome::voice_assistant::VoiceAssistant::get_configuration
const Configuration & get_configuration()
Definition voice_assistant.cpp:975

esphome::voice_assistant::VoiceAssistant::local_output_
bool local_output_
Definition voice_assistant.h:298

esphome::voice_assistant::VoiceAssistant::set_conversation_timeout
void set_conversation_timeout(uint32_t conversation_timeout)
Definition voice_assistant.h:194

esphome::voice_assistant::VoiceAssistant::speaker_buffer_size_
size_t speaker_buffer_size_
Definition voice_assistant.h:285

esphome::voice_assistant::VoiceAssistant::started_streaming_tts_
bool started_streaming_tts_
Definition voice_assistant.h:293

esphome::voice_assistant::VoiceAssistant::tts_response_url_
std::string tts_response_url_
Definition voice_assistant.h:292

esphome::voice_assistant::VoiceAssistant::start_udp_socket_
bool start_udp_socket_()
Definition voice_assistant.cpp:64

esphome::voice_assistant::VoiceAssistant::wait_for_stream_end_
bool wait_for_stream_end_
Definition voice_assistant.h:287

esphome::voice_assistant::VoiceAssistant::get_stt_end_trigger
Trigger< std::string > * get_stt_end_trigger()
Definition voice_assistant.h:210

esphome::voice_assistant::VoiceAssistant::speaker_buffer_index_
size_t speaker_buffer_index_
Definition voice_assistant.h:284

esphome::voice_assistant::VoiceAssistant::udp_socket_running_
bool udp_socket_running_
Definition voice_assistant.h:323

esphome::voice_assistant::VoiceAssistant::get_legacy_version
uint32_t get_legacy_version() const
Definition voice_assistant.h:140

esphome::voice_assistant::VoiceAssistant::intent_start_trigger_
Trigger intent_start_trigger_
Definition voice_assistant.h:246

esphome::voice_assistant::VoiceAssistant::wake_word_
std::string wake_word_
Definition voice_assistant.h:302

esphome::voice_assistant::VoiceAssistant::get_intent_progress_trigger
Trigger< std::string > * get_intent_progress_trigger()
Definition voice_assistant.h:199

esphome::voice_assistant::VoiceAssistant::on_timer_event
void on_timer_event(const api::VoiceAssistantTimerEventResponse &msg)
Definition voice_assistant.cpp:863

esphome::voice_assistant::VoiceAssistant::start_streaming
void start_streaming()
Definition voice_assistant.cpp:500

esphome::voice_assistant::VoiceAssistant::get_wake_word_detected_trigger
Trigger * get_wake_word_detected_trigger()
Definition voice_assistant.h:209

esphome::voice_assistant::VoiceAssistant::get_stt_vad_end_trigger
Trigger * get_stt_vad_end_trigger()
Definition voice_assistant.h:203

esphome::voice_assistant::VoiceAssistant::signal_stop_
void signal_stop_()
Definition voice_assistant.cpp:607

esphome::voice_assistant::VoiceAssistant::tts_stream_start_trigger_
Trigger tts_stream_start_trigger_
Definition voice_assistant.h:253

esphome::voice_assistant::VoiceAssistant::client_connected_trigger_
Trigger client_connected_trigger_
Definition voice_assistant.h:264

esphome::voice_assistant::VoiceAssistant::start_trigger_
Trigger start_trigger_
Definition voice_assistant.h:249

esphome::voice_assistant::VoiceAssistant::timer_cancelled_trigger_
Trigger< Timer > timer_cancelled_trigger_
Definition voice_assistant.h:274

esphome::voice_assistant::VoiceAssistant::timers_
std::vector< Timer > timers_
Definition voice_assistant.h:269

esphome::voice_assistant::VoiceAssistant::state_
State state_
Definition voice_assistant.h:319

esphome::voice_assistant::VoiceAssistant::on_audio
void on_audio(const api::VoiceAssistantAudio &msg)
Definition voice_assistant.cpp:847

esphome::voice_assistant::VoiceAssistant::get_client_disconnected_trigger
Trigger * get_client_disconnected_trigger()
Definition voice_assistant.h:217

esphome::voice_assistant::VoiceAssistant::get_tts_end_trigger
Trigger< std::string > * get_tts_end_trigger()
Definition voice_assistant.h:211

esphome::voice_assistant::VoiceAssistant::loop
void loop() override
Definition voice_assistant.cpp:184

esphome::voice_assistant::VoiceAssistant::get_timer_updated_trigger
Trigger< Timer > * get_timer_updated_trigger()
Definition voice_assistant.h:225

esphome::voice_assistant::VoiceAssistant::get_timers
const std::vector< Timer > & get_timers() const
Definition voice_assistant.h:230

esphome::voice_assistant::VoiceAssistant::volume_multiplier_
float volume_multiplier_
Definition voice_assistant.h:309

esphome::voice_assistant::VoiceAssistant::get_end_trigger
Trigger * get_end_trigger()
Definition voice_assistant.h:201

esphome::voice_assistant::VoiceAssistant::media_player_
media_player::MediaPlayer * media_player_
Definition voice_assistant.h:291

esphome::voice_assistant::VoiceAssistant::use_wake_word_
bool use_wake_word_
Definition voice_assistant.h:306

esphome::voice_assistant::VoiceAssistant::get_setup_priority
float get_setup_priority() const override
Definition voice_assistant.cpp:62

esphome::voice_assistant::VoiceAssistant::audio_mode_
AudioMode audio_mode_
Definition voice_assistant.h:322

esphome::voice_assistant::VoiceAssistant::wake_word_detected_trigger_
Trigger wake_word_detected_trigger_
Definition voice_assistant.h:257

esphome::voice_assistant::VoiceAssistant::set_state_
void set_state_(State state)
Definition voice_assistant.cpp:481

esphome::voice_assistant::VoiceAssistant::speaker_buffer_
uint8_t * speaker_buffer_
Definition voice_assistant.h:283

esphome::voice_assistant::VoiceAssistant::stt_vad_end_trigger_
Trigger stt_vad_end_trigger_
Definition voice_assistant.h:251

esphome::voice_assistant::VoiceAssistant::set_media_player
void set_media_player(media_player::MediaPlayer *media_player)
Definition voice_assistant.h:134

esphome::voice_assistant::VoiceAssistant::client_subscription
void client_subscription(api::APIConnection *client, bool subscribe)
Definition voice_assistant.cpp:421

esphome::voice_assistant::VoiceAssistant::timer_started_trigger_
Trigger< Timer > timer_started_trigger_
Definition voice_assistant.h:271

esphome::voice_assistant::VoiceAssistant::get_client_connected_trigger
Trigger * get_client_connected_trigger()
Definition voice_assistant.h:216

esphome::voice_assistant::VoiceAssistant::get_timer_cancelled_trigger
Trigger< Timer > * get_timer_cancelled_trigger()
Definition voice_assistant.h:226

esphome::voice_assistant::VoiceAssistant::media_player_response_state_
MediaPlayerResponseState media_player_response_state_
Definition voice_assistant.h:295

esphome::voice_assistant::VoiceAssistant::deallocate_buffers_
void deallocate_buffers_()
Definition voice_assistant.cpp:159

esphome::voice_assistant::VoiceAssistant::silence_detection_
bool silence_detection_
Definition voice_assistant.h:315

esphome::voice_assistant::VoiceAssistant::is_continuous
bool is_continuous() const
Definition voice_assistant.h:185

esphome::voice_assistant::VoiceAssistant::listening_trigger_
Trigger listening_trigger_
Definition voice_assistant.h:247

esphome::voice_assistant::VoiceAssistant::clear_buffers_
void clear_buffers_()
Definition voice_assistant.cpp:139

esphome::voice_assistant::VoiceAssistant::setup
void setup() override
Definition voice_assistant.cpp:32

esphome::voice_assistant::VoiceAssistant::allocate_buffers_
bool allocate_buffers_()
Definition voice_assistant.cpp:107

esphome::voice_assistant::VoiceAssistant::ring_buffer_
std::shared_ptr< RingBuffer > ring_buffer_
Definition voice_assistant.h:304

esphome::voice_assistant::VoiceAssistant::get_stt_vad_start_trigger
Trigger * get_stt_vad_start_trigger()
Definition voice_assistant.h:204

esphome::voice_assistant::VoiceAssistant::get_tts_stream_end_trigger
Trigger * get_tts_stream_end_trigger()
Definition voice_assistant.h:207

esphome::voice_assistant::VoiceAssistant::set_continuous
void set_continuous(bool continuous)
Definition voice_assistant.h:184

esphome::voice_assistant::VoiceAssistant::noise_suppression_level_
uint8_t noise_suppression_level_
Definition voice_assistant.h:307

esphome::voice_assistant::VoiceAssistant::on_event
void on_event(const api::VoiceAssistantEventResponse &msg)
Definition voice_assistant.cpp:629

esphome::voice_assistant::VoiceAssistant::error_trigger_
Trigger< std::string, std::string > error_trigger_
Definition voice_assistant.h:261

esphome::voice_assistant::VoiceAssistant::get_intent_end_trigger
Trigger * get_intent_end_trigger()
Definition voice_assistant.h:197

esphome::voice_assistant::VoiceAssistant::stt_end_trigger_
Trigger< std::string > stt_end_trigger_
Definition voice_assistant.h:258

esphome::voice_assistant::VoiceAssistant::conversation_timeout_
uint32_t conversation_timeout_
Definition voice_assistant.h:310

esphome::voice_assistant::VoiceAssistant::get_timer_finished_trigger
Trigger< Timer > * get_timer_finished_trigger()
Definition voice_assistant.h:227

esphome::voice_assistant::VoiceAssistant::timer_tick_trigger_
Trigger< const std::vector< Timer > & > timer_tick_trigger_
Definition voice_assistant.h:275

esphome::voice_assistant::VoiceAssistant::write_speaker_
void write_speaker_()
Definition voice_assistant.cpp:403

esphome::voice_assistant::VoiceAssistant::intent_progress_trigger_
Trigger< std::string > intent_progress_trigger_
Definition voice_assistant.h:256

esphome::voice_assistant::VoiceAssistant::set_auto_gain
void set_auto_gain(uint8_t auto_gain)
Definition voice_assistant.h:192

esphome::voice_assistant::VoiceAssistant::on_announce
void on_announce(const api::VoiceAssistantAnnounceRequest &msg)
Definition voice_assistant.cpp:922

esphome::voice_assistant::VoiceAssistant::request_start
void request_start(bool continuous, bool silence_detection)
Definition voice_assistant.cpp:546

esphome::voice_assistant::VoiceAssistant::tts_start_trigger_
Trigger< std::string > tts_start_trigger_
Definition voice_assistant.h:260

esphome::voice_assistant::VoiceAssistant::auto_gain_
uint8_t auto_gain_
Definition voice_assistant.h:308

esphome::voice_assistant::VoiceAssistant::has_timers_
bool has_timers_
Definition voice_assistant.h:276

esphome::voice_assistant::VoiceAssistant::set_speaker
void set_speaker(speaker::Speaker *speaker)
Definition voice_assistant.h:128

esphome::voice_assistant::VoiceAssistant::api_client_
api::APIConnection * api_client_
Definition voice_assistant.h:267

esphome::voice_assistant::VoiceAssistant::get_tts_start_trigger
Trigger< std::string > * get_tts_start_trigger()
Definition voice_assistant.h:212

esphome::voice_assistant::VoiceAssistant::get_api_connection
api::APIConnection * get_api_connection() const
Definition voice_assistant.h:220

esphome::voice_assistant::VoiceAssistant::request_stop
void request_stop()
Definition voice_assistant.cpp:561

esphome::voice_assistant::VoiceAssistant::config_
Configuration config_
Definition voice_assistant.h:326

esphome::voice_assistant::VoiceAssistant::is_running
bool is_running() const
Definition voice_assistant.h:183

esphome::voice_assistant::VoiceAssistant::tts_end_trigger_
Trigger< std::string > tts_end_trigger_
Definition voice_assistant.h:259

esphome::voice_assistant::VoiceAssistant::set_has_timers
void set_has_timers(bool has_timers)
Definition voice_assistant.h:229

esphome::voice_assistant::VoiceAssistant::set_microphone_source
void set_microphone_source(microphone::MicrophoneSource *mic_source)
Definition voice_assistant.h:123

esphome::voice_assistant::VoiceAssistant::dest_addr_
struct sockaddr_storage dest_addr_
Definition voice_assistant.h:243

esphome::voice_assistant::VoiceAssistant::continuous_
bool continuous_
Definition voice_assistant.h:314

esphome::voice_assistant::VoiceAssistant::get_feature_flags
uint32_t get_feature_flags() const
Definition voice_assistant.h:149

esphome::voice_assistant::VoiceAssistant::timer_tick_
void timer_tick_()
Definition voice_assistant.cpp:913

esphome::voice_assistant::VoiceAssistant::get_listening_trigger
Trigger * get_listening_trigger()
Definition voice_assistant.h:200

esphome::voice_assistant::VoiceAssistant::speaker_
speaker::Speaker * speaker_
Definition voice_assistant.h:282

esphome::voice_assistant::VoiceAssistant::timer_updated_trigger_
Trigger< Timer > timer_updated_trigger_
Definition voice_assistant.h:273

esphome::voice_assistant::VoiceAssistant::stream_ended_
bool stream_ended_
Definition voice_assistant.h:288

esphome::voice_assistant::VoiceAssistant::get_idle_trigger
Trigger * get_idle_trigger()
Definition voice_assistant.h:214

esphome::voice_assistant::VoiceAssistant::set_wake_word
void set_wake_word(const std::string &wake_word)
Definition voice_assistant.h:222

esphome::voice_assistant::VoiceAssistant::send_buffer_
uint8_t * send_buffer_
Definition voice_assistant.h:312

esphome::voice_assistant::VoiceAssistant::set_micro_wake_word
void set_micro_wake_word(micro_wake_word::MicroWakeWord *mww)
Definition voice_assistant.h:125

esphome::voice_assistant::VoiceAssistant::get_start_trigger
Trigger * get_start_trigger()
Definition voice_assistant.h:202

esphome::voice_assistant::VoiceAssistant::end_trigger_
Trigger end_trigger_
Definition voice_assistant.h:248

esphome::voice_assistant::VoiceAssistant::tts_stream_end_trigger_
Trigger tts_stream_end_trigger_
Definition voice_assistant.h:254

esphome::voice_assistant::VoiceAssistant::get_intent_start_trigger
Trigger * get_intent_start_trigger()
Definition voice_assistant.h:198

esphome::voice_assistant::VoiceAssistant::set_volume_multiplier
void set_volume_multiplier(float volume_multiplier)
Definition voice_assistant.h:193

esphome::voice_assistant::VoiceAssistant::stt_vad_start_trigger_
Trigger stt_vad_start_trigger_
Definition voice_assistant.h:250

esphome::voice_assistant::VoiceAssistant::start_playback_timeout_
void start_playback_timeout_()
Definition voice_assistant.cpp:618

esphome::voice_assistant::VoiceAssistant::reset_conversation_id
void reset_conversation_id()
Definition voice_assistant.cpp:179

esphome::voice_assistant::VoiceAssistant::conversation_id_
std::string conversation_id_
Definition voice_assistant.h:300

esphome::voice_assistant::VoiceAssistant::mic_source_
microphone::MicrophoneSource * mic_source_
Definition voice_assistant.h:279

esphome::voice_assistant::VoiceAssistant::micro_wake_word_
micro_wake_word::MicroWakeWord * micro_wake_word_
Definition voice_assistant.h:329

esphome::voice_assistant::VoiceAssistant::get_error_trigger
Trigger< std::string, std::string > * get_error_trigger()
Definition voice_assistant.h:213

esphome::voice_assistant::VoiceAssistant::set_noise_suppression_level
void set_noise_suppression_level(uint8_t noise_suppression_level)
Definition voice_assistant.h:189

esphome::voice_assistant::VoiceAssistant::set_use_wake_word
void set_use_wake_word(bool use_wake_word)
Definition voice_assistant.h:187

esphome::voice_assistant::VoiceAssistant::speaker_bytes_received_
size_t speaker_bytes_received_
Definition voice_assistant.h:286

esphome::voice_assistant::VoiceAssistant::continue_conversation_
bool continue_conversation_
Definition voice_assistant.h:317

esphome::voice_assistant::VoiceAssistant::failed_to_start
void failed_to_start()
Definition voice_assistant.cpp:494

esphome::voice_assistant::VoiceAssistant::on_set_configuration
void on_set_configuration(const std::vector< std::string > &active_wake_words)
Definition voice_assistant.cpp:954

esphome::voice_assistant::VoiceAssistant::get_timer_tick_trigger
Trigger< const std::vector< Timer > & > * get_timer_tick_trigger()
Definition voice_assistant.h:228

esphome::voice_assistant::VoiceAssistant::timer_finished_trigger_
Trigger< Timer > timer_finished_trigger_
Definition voice_assistant.h:272

esphome::voice_assistant::VoiceAssistant::idle_trigger_
Trigger idle_trigger_
Definition voice_assistant.h:262

esphome::voice_assistant::VoiceAssistant::timer_tick_running_
bool timer_tick_running_
Definition voice_assistant.h:277

esphome::voice_assistant::VoiceAssistant::client_disconnected_trigger_
Trigger client_disconnected_trigger_
Definition voice_assistant.h:265

esphome::voice_assistant::VoiceAssistant::get_tts_stream_start_trigger
Trigger * get_tts_stream_start_trigger()
Definition voice_assistant.h:206

esphome::voice_assistant::VoiceAssistant::desired_state_
State desired_state_
Definition voice_assistant.h:320

component.h

automation.h

defines.h

flags
uint16_t flags
Definition dns_server_esp32_idf.cpp:1

state
bool state
Definition fan.h:2

helpers.h

media_player.h

micro_wake_word.h

microphone_source.h

esphome::light::uint32_t
uint32_t
Definition light_call.cpp:601

esphome::voice_assistant::VoiceAssistantFeature
VoiceAssistantFeature
Definition voice_assistant.h:37

esphome::voice_assistant::FEATURE_TIMERS
@ FEATURE_TIMERS
Definition voice_assistant.h:41

esphome::voice_assistant::FEATURE_SPEAKER
@ FEATURE_SPEAKER
Definition voice_assistant.h:39

esphome::voice_assistant::FEATURE_START_CONVERSATION
@ FEATURE_START_CONVERSATION
Definition voice_assistant.h:43

esphome::voice_assistant::FEATURE_API_AUDIO
@ FEATURE_API_AUDIO
Definition voice_assistant.h:40

esphome::voice_assistant::FEATURE_ANNOUNCE
@ FEATURE_ANNOUNCE
Definition voice_assistant.h:42

esphome::voice_assistant::FEATURE_VOICE_ASSISTANT
@ FEATURE_VOICE_ASSISTANT
Definition voice_assistant.h:38

esphome::voice_assistant::MediaPlayerResponseState
MediaPlayerResponseState
Definition voice_assistant.h:104

esphome::voice_assistant::MediaPlayerResponseState::FINISHED
@ FINISHED

esphome::voice_assistant::MediaPlayerResponseState::PLAYING
@ PLAYING

esphome::voice_assistant::MediaPlayerResponseState::IDLE
@ IDLE

esphome::voice_assistant::MediaPlayerResponseState::URL_SENT
@ URL_SENT

esphome::voice_assistant::AudioMode
AudioMode
Definition voice_assistant.h:62

esphome::voice_assistant::AUDIO_MODE_UDP
@ AUDIO_MODE_UDP
Definition voice_assistant.h:63

esphome::voice_assistant::AUDIO_MODE_API
@ AUDIO_MODE_API
Definition voice_assistant.h:64

esphome::voice_assistant::State
State
Definition voice_assistant.h:46

esphome::voice_assistant::State::STREAMING_RESPONSE
@ STREAMING_RESPONSE

esphome::voice_assistant::State::STOPPING_MICROPHONE
@ STOPPING_MICROPHONE

esphome::voice_assistant::State::STOP_MICROPHONE
@ STOP_MICROPHONE

esphome::voice_assistant::State::WAIT_FOR_VAD
@ WAIT_FOR_VAD

esphome::voice_assistant::State::WAITING_FOR_VAD
@ WAITING_FOR_VAD

esphome::voice_assistant::State::STARTING_PIPELINE
@ STARTING_PIPELINE

esphome::voice_assistant::State::IDLE
@ IDLE

esphome::voice_assistant::State::STREAMING_MICROPHONE
@ STREAMING_MICROPHONE

esphome::voice_assistant::State::AWAITING_RESPONSE
@ AWAITING_RESPONSE

esphome::voice_assistant::State::STARTING_MICROPHONE
@ STARTING_MICROPHONE

esphome::voice_assistant::State::START_PIPELINE
@ START_PIPELINE

esphome::voice_assistant::State::RESPONSE_FINISHED
@ RESPONSE_FINISHED

esphome::voice_assistant::State::START_MICROPHONE
@ START_MICROPHONE

esphome::voice_assistant::global_voice_assistant
VoiceAssistant * global_voice_assistant
Definition voice_assistant.cpp:1007

esphome
Providing packet encoding functions for exchanging data with a remote host.
Definition a01nyub.cpp:7

esphome::ESPDEPRECATED
struct ESPDEPRECATED("Use std::index_sequence instead. Removed in 2026.6.0", "2025.12.0") seq
Definition automation.h:26

ring_buffer.h

socket.h

speaker.h

esphome::voice_assistant::Configuration
Definition voice_assistant.h:97

esphome::voice_assistant::Configuration::available_wake_words
std::vector< WakeWord > available_wake_words
Definition voice_assistant.h:98

esphome::voice_assistant::Configuration::active_wake_words
std::vector< std::string > active_wake_words
Definition voice_assistant.h:99

esphome::voice_assistant::Configuration::max_active_wake_words
uint32_t max_active_wake_words
Definition voice_assistant.h:100

esphome::voice_assistant::Timer
Definition voice_assistant.h:67

esphome::voice_assistant::Timer::total_seconds
uint32_t total_seconds
Definition voice_assistant.h:70

esphome::voice_assistant::Timer::name
std::string name
Definition voice_assistant.h:69

esphome::voice_assistant::Timer::TO_STR_BUFFER_SIZE
static constexpr size_t TO_STR_BUFFER_SIZE
Buffer size for to_str() - sufficient for typical timer names.
Definition voice_assistant.h:75

esphome::voice_assistant::Timer::is_active
bool is_active
Definition voice_assistant.h:72

esphome::voice_assistant::Timer::to_str
const char * to_str(std::span< char, TO_STR_BUFFER_SIZE > buffer) const
Format to buffer, returns pointer to buffer (may truncate long names)
Definition voice_assistant.h:77

esphome::voice_assistant::Timer::id
std::string id
Definition voice_assistant.h:68

esphome::voice_assistant::Timer::seconds_left
uint32_t seconds_left
Definition voice_assistant.h:71

esphome::voice_assistant::WakeWord
Definition voice_assistant.h:91

esphome::voice_assistant::WakeWord::wake_word
std::string wake_word
Definition voice_assistant.h:93

esphome::voice_assistant::WakeWord::trained_languages
std::vector< std::string > trained_languages
Definition voice_assistant.h:94

esphome::voice_assistant::WakeWord::id
std::string id
Definition voice_assistant.h:92

sockaddr_storage
Definition headers.h:90

x
uint16_t x
Definition tt21100.cpp:5