ESPHome 2025.5.0
Loading...
Searching...
No Matches
streaming_model.h
Go to the documentation of this file.
1#pragma once
2
3#ifdef USE_ESP_IDF
4
6
8
9#include <tensorflow/lite/core/c/common.h>
10#include <tensorflow/lite/micro/micro_interpreter.h>
11#include <tensorflow/lite/micro/micro_mutable_op_resolver.h>
12
13namespace esphome {
14namespace micro_wake_word {
15
// Number of new feature slices that must be processed before detections are reported;
// used as the (negated) initial value of StreamingModel::ignore_windows_.
16static const uint8_t MIN_SLICES_BEFORE_DETECTION = 100;
// Arena size for the TFLite Micro resource-variable allocator (var_arena_).
// NOTE(review): presumably bytes — confirm against the load_model_() implementation.
17static const uint32_t STREAMING_MODEL_VARIABLE_ARENA_SIZE = 1024;
18
// NOTE(review): Doxygen-extraction fragment — the opening `struct DetectionEvent {`
// line and at least one member (a `detected` flag and the max/average probability
// fields implied by the tooltips further down) were dropped by the scrape; verify
// against the upstream header before relying on this fragment.
// Describes the outcome of one streaming-inference window.
20 std::string *wake_word;  // Raw pointer to the model's wake word — presumably non-owning; confirm lifetime.
22 bool partially_detection; // Set if the most recent probability exceeds the threshold, but the sliding window
23 // average hasn't yet
26 bool blocked_by_vad = false;  // NOTE(review): presumably set when a VADModel reports no voice activity — confirm.
27};
28
// NOTE(review): Doxygen-extraction fragment — the `class StreamingModel {` header line
// and several declarations were dropped by the scrape (the tooltips below show a pure
// virtual `determine_detected()`, a `reset_probabilities()`, and sliding-window /
// arena-size members at the gaps in the numbering). Verify against the upstream header.
// Abstract base for a TFLite Micro streaming wake-word/VAD model.
 30 public:
 // Logs this model's configuration (implemented by each concrete model).
 31 virtual void log_model_config() = 0;
 33
 34 // Performs inference on the given features.
 35 // - If the model is enabled but not loaded, it will load it
 36 // - If the model is disabled but loaded, it will unload it
 37 // Returns true if successful or false if there is an error
 38 bool perform_streaming_inference(const int8_t features[PREPROCESSOR_FEATURE_SIZE]);
 39
 42
 // Destroys the TFLite interpreter and frees the tensor and variable arenas.
 44 void unload_model();
 45
 // Enable the model. The next perform_streaming_inference call will load it.
 47 virtual void enable() { this->enabled_ = true; }
 48
 // Disable the model. The next perform_streaming_inference call will unload it.
 50 virtual void disable() { this->enabled_ = false; }
 51
 // Return true if the model is enabled.
 53 bool is_enabled() const { return this->enabled_; }
 54
 56
 57 // Quantized probability cutoffs mapping 0.0 - 1.0 to 0 - 255
 59 uint8_t get_probability_cutoff() const { return this->probability_cutoff_; }
 60 void set_probability_cutoff(uint8_t probability_cutoff) { this->probability_cutoff_ = probability_cutoff; }
 61
 62 protected:
 // Allocates tensor and variable arenas and sets up the model interpreter.
 65 bool load_model_();
 // Registers the TensorFlow operations the streaming model needs; true on success.
 67 bool register_streaming_ops_(tflite::MicroMutableOpResolver<20> &op_resolver);
 68
 69 tflite::MicroMutableOpResolver<20> streaming_op_resolver_;
 70
 71 bool loaded_{false};   // True while the interpreter/arenas are allocated.
 72 bool enabled_{true};   // Toggled by enable()/disable(); drives lazy load/unload.
 // Counts up from -MIN_SLICES_BEFORE_DETECTION; detections are presumably ignored
 // until it reaches 0 — confirm in perform_streaming_inference's implementation.
 75 int16_t ignore_windows_{-MIN_SLICES_BEFORE_DETECTION};
 76
 80
 // Ring-buffer write index into recent_streaming_probabilities_.
 81 size_t last_n_index_{0};
 // Sliding window of recent quantized (0-255) output probabilities.
 83 std::vector<uint8_t> recent_streaming_probabilities_;
 84
 85 const uint8_t *model_start_;          // Start of the flatbuffer model data (non-owning).
 86 uint8_t *tensor_arena_{nullptr};      // Heap arena for tensors; freed by unload_model().
 87 uint8_t *var_arena_{nullptr};         // Heap arena for resource variables; freed by unload_model().
 88 std::unique_ptr<tflite::MicroInterpreter> interpreter_;
 89 tflite::MicroResourceVariables *mrv_{nullptr};  // Streaming-state resource variables.
 90 tflite::MicroAllocator *ma_{nullptr};           // Allocator backing var_arena_.
 91};
92
// A streaming model that detects a specific wake word.
// NOTE(review): Doxygen-extraction fragment — the declarations at the numbering gaps
// (the `determine_detected()` override per the tooltips, and protected members such as
// `internal_only_`, which is used below but never declared in the visible text) were
// dropped by the scrape; verify against the upstream header.
93class WakeWordModel final : public StreamingModel {
 94 public:
 // Constructs a wake word model object (per the tooltip documentation further down).
105 WakeWordModel(const std::string &id, const uint8_t *model_start, uint8_t default_probability_cutoff,
106 size_t sliding_window_average_size, const std::string &wake_word, size_t tensor_arena_size,
107 bool default_enabled, bool internal_only);
108
109 void log_model_config() override;
110
115
116 const std::string &get_id() const { return this->id_; }
117 const std::string &get_wake_word() const { return this->wake_word_; }
118
119 void add_trained_language(const std::string &language) { this->trained_languages_.push_back(language); }
120 const std::vector<std::string> &get_trained_languages() const { return this->trained_languages_; }
121
 // Enable the model and save to flash. The next perform_streaming_inference call will load it.
123 void enable() override;
124
 // Disable the model and save to flash. The next perform_streaming_inference call will unload it.
126 void disable() override;
127
128 bool get_internal_only() { return this->internal_only_; }
129
130 protected:
131 std::string id_;          // Identifier used when persisting the enabled state.
132 std::string wake_word_;   // Human-readable wake word this model detects.
133 std::vector<std::string> trained_languages_;
134
136
138};
139
// A streaming model that detects voice activity (used to gate wake-word detections).
// NOTE(review): Doxygen-extraction fragment — the `determine_detected()` override
// (documented in the tooltips below as comparing the max probability in the sliding
// window against the cutoff) was dropped by the scrape; verify against upstream.
140class VADModel final : public StreamingModel {
141 public:
142 VADModel(const uint8_t *model_start, uint8_t default_probability_cutoff, size_t sliding_window_size,
143 size_t tensor_arena_size);
144
145 void log_model_config() override;
146
151};
152
153} // namespace micro_wake_word
154} // namespace esphome
155
156#endif
virtual void disable()
Disable the model. The next perform_streaming_inference call will unload it.
virtual DetectionEvent determine_detected()=0
bool load_model_()
Allocates tensor and variable arenas and sets up the model interpreter.
virtual void enable()
Enable the model. The next perform_streaming_inference call will load it.
std::unique_ptr< tflite::MicroInterpreter > interpreter_
tflite::MicroMutableOpResolver< 20 > streaming_op_resolver_
bool register_streaming_ops_(tflite::MicroMutableOpResolver< 20 > &op_resolver)
Returns true if successfully registered the streaming model's TensorFlow operations.
void reset_probabilities()
Sets all recent_streaming_probabilities to 0 and resets the ignore window count.
std::vector< uint8_t > recent_streaming_probabilities_
tflite::MicroResourceVariables * mrv_
bool perform_streaming_inference(const int8_t features[PREPROCESSOR_FEATURE_SIZE])
void unload_model()
Destroys the TFLite interpreter and frees the tensor and variable arenas' memory.
void set_probability_cutoff(uint8_t probability_cutoff)
bool is_enabled() const
Return true if the model is enabled.
DetectionEvent determine_detected() override
Checks for voice activity by comparing the max probability in the sliding window with the probability...
VADModel(const uint8_t *model_start, uint8_t default_probability_cutoff, size_t sliding_window_size, size_t tensor_arena_size)
void enable() override
Enable the model and save to flash. The next perform_streaming_inference call will load it.
const std::string & get_wake_word() const
DetectionEvent determine_detected() override
Checks for the wake word by comparing the mean probability in the sliding window with the probability...
const std::vector< std::string > & get_trained_languages() const
WakeWordModel(const std::string &id, const uint8_t *model_start, uint8_t default_probability_cutoff, size_t sliding_window_average_size, const std::string &wake_word, size_t tensor_arena_size, bool default_enabled, bool internal_only)
Constructs a wake word model object.
void add_trained_language(const std::string &language)
void disable() override
Disable the model and save to flash. The next perform_streaming_inference call will unload it.
std::vector< std::string > trained_languages_
Providing packet encoding functions for exchanging data with a remote host.
Definition a01nyub.cpp:7