ESPHome: esphome/components/sound_level/sound_level.cpp Source File

#include "sound_level.h"


#ifdef USE_ESP32


#include "esphome/core/log.h"


#include <cmath>

#include <cstdint>


namespace esphome {


namespace sound_level {


/// Log tag used by every log statement in this component.
static const char *const TAG = "sound_level";

/// Duration of audio, in milliseconds, that sizes the transfer buffer allocated in ``start_()``.
static constexpr uint32_t AUDIO_BUFFER_DURATION_MS = 30;
/// Duration of audio, in milliseconds, that sizes the ring buffer allocated in ``start_()``.
static constexpr uint32_t RING_BUFFER_DURATION_MS = 120;

/// Full-scale reference for the dB computations: the largest possible squared int16 sample.
/// INT16_MIN is squared (rather than INT16_MAX) because INT16_MIN^2 > INT16_MAX^2.
static constexpr double MAX_SAMPLE_SQUARED_DENOMINATOR =
    static_cast<double>(INT16_MIN) * static_cast<double>(INT16_MIN);


/// Logs the component configuration: the measurement window duration followed by the peak and RMS sensors.
void SoundLevelComponent::dump_config() {
  ESP_LOGCONFIG(TAG, "Sound Level Component:");
  ESP_LOGCONFIG(TAG, "  Measurement Duration: %" PRIu32 " ms", this->measurement_duration_ms_);

  // One entry per sensor, peak first and then RMS
  LOG_SENSOR("  ", "Peak:", this->peak_sensor_);
  LOG_SENSOR("  ", "RMS:", this->rms_sensor_);
}


/// Registers the audio data callback on the microphone source and, unless the source is passive, starts the
/// microphone.
void SoundLevelComponent::setup() {
  // Invoked by the microphone source with each new chunk of audio bytes
  auto on_audio_data = [this](const std::vector<uint8_t> &data) {
    // Take a strong reference so the ring buffer cannot be freed while it is being written to
    const std::shared_ptr<RingBuffer> locked_ring_buffer = this->ring_buffer_.lock();

    if (this->ring_buffer_.use_count() != 2) {
      // Exactly two owners are expected: the transfer buffer that was handed the ring buffer in ``start_()``
      // and ``locked_ring_buffer``. With any other count, the data is dropped.
      return;
    }

    locked_ring_buffer->write(static_cast<void *>(const_cast<uint8_t *>(data.data())), data.size());
  };
  this->microphone_source_->add_data_callback(on_audio_data);

  // A passive source is never started by this component; otherwise start capturing right away
  const bool passive = this->microphone_source_->is_passive();
  if (!passive) {
    this->microphone_source_->start();
  }
}


/// Periodic processing step of the sound level component.
///
/// Does nothing when neither sensor is configured. While the microphone source is running and no error is flagged,
/// it makes sure the buffers are allocated, pulls newly captured audio out of the ring buffer without blocking and
/// accumulates the squared peak and the sum of squared samples. Once a full measurement window has been
/// accumulated, the peak and/or RMS level is published in dB relative to full scale
/// (``MAX_SAMPLE_SQUARED_DENOMINATOR``) and the accumulators are reset.
///
/// When the microphone is not running (or an error is flagged), a warning is set once, the buffers are released,
/// NAN is published to the configured sensors and the accumulators are cleared.
void SoundLevelComponent::loop() {
  if ((this->peak_sensor_ == nullptr) && (this->rms_sensor_ == nullptr)) {
    // No sensors configured, nothing to do
    return;
  }

  if (this->microphone_source_->is_running() && !this->status_has_error()) {
    // Allocate buffers
    if (this->start_()) {
      this->status_clear_warning();
    }
  } else {
    // The warning flag doubles as a "already cleaned up" marker so this only runs once per outage
    if (!this->status_has_warning()) {
      this->status_set_warning("Microphone isn't running, can't compute statistics");

      // Deallocate buffers, if necessary
      this->stop_();

      // Reset sensor outputs
      if (this->peak_sensor_ != nullptr) {
        this->peak_sensor_->publish_state(NAN);
      }
      if (this->rms_sensor_ != nullptr) {
        this->rms_sensor_->publish_state(NAN);
      }

      // Reset accumulators
      this->squared_peak_ = 0;
      this->squared_samples_sum_ = 0;
      this->sample_count_ = 0;
    }

    return;
  }

  // ``start_()`` may have just failed; never touch ``audio_buffer_`` unless it was really allocated
  if (this->status_has_error() || (this->audio_buffer_ == nullptr)) {
    return;
  }

  // Copy data from ring buffer into the transfer buffer - don't block to avoid slowing the main loop
  this->audio_buffer_->transfer_data_from_source(0);

  if (this->audio_buffer_->available() == 0) {
    // No new audio available for processing
    return;
  }

  // ``get_audio_stream_info()`` returns by value, so fetch it once and reuse it for every conversion below
  const auto stream_info = this->microphone_source_->get_audio_stream_info();

  const uint32_t samples_in_window = stream_info.ms_to_samples(this->measurement_duration_ms_);
  const uint32_t samples_available_to_process = stream_info.bytes_to_samples(this->audio_buffer_->available());

  // Saturating subtraction: if the accumulated count ever exceeds the window (e.g. the window was shortened
  // mid-measurement), a plain unsigned subtraction would wrap around to a huge value
  const uint32_t samples_remaining_in_window =
      (this->sample_count_ < samples_in_window) ? (samples_in_window - this->sample_count_) : 0;
  const uint32_t samples_to_process = std::min(samples_remaining_in_window, samples_available_to_process);

  // MicrophoneSource always provides int16 samples due to Python codegen settings
  const int16_t *audio_data = reinterpret_cast<const int16_t *>(this->audio_buffer_->get_buffer_start());

  // Process all the new audio samples
  for (uint32_t i = 0; i < samples_to_process; ++i) {
    // Squaring int16 samples won't overflow an int32
    const int32_t sample = static_cast<int32_t>(audio_data[i]);
    const int32_t squared_sample = sample * sample;

    if (this->peak_sensor_ != nullptr) {
      this->squared_peak_ = std::max(this->squared_peak_, squared_sample);
    }

    if (this->rms_sensor_ != nullptr) {
      // Squared sum is an uint64 type - at max levels, an uint32 type would overflow after ~8 samples
      this->squared_samples_sum_ += squared_sample;
    }

    ++this->sample_count_;
  }

  // Remove the processed samples from ``audio_buffer_``
  this->audio_buffer_->decrease_buffer_length(stream_info.samples_to_bytes(samples_to_process));

  // ``>=`` rather than ``==`` so that a window is still closed if the count has overshot it
  if (this->sample_count_ >= samples_in_window) {
    // Processed enough samples for the measurement window, compute and publish the sensor values
    if (this->peak_sensor_ != nullptr) {
      const float peak_db =
          10.0f * std::log10(static_cast<float>(this->squared_peak_) / MAX_SAMPLE_SQUARED_DENOMINATOR);
      this->peak_sensor_->publish_state(peak_db);

      this->squared_peak_ = 0;  // reset accumulator
    }

    if (this->rms_sensor_ != nullptr) {
      // Calculations are done with doubles instead of floats - floats lose precision for even modest window durations.
      // The mean is taken over the samples actually accumulated, which equals the window size in the normal case.
      const double rms_db = 10.0 * std::log10((this->squared_samples_sum_ / MAX_SAMPLE_SQUARED_DENOMINATOR) /
                                              static_cast<double>(this->sample_count_));
      this->rms_sensor_->publish_state(rms_db);

      this->squared_samples_sum_ = 0;  // reset accumulator
    }

    this->sample_count_ = 0;  // reset counter
  }
}


/// Starts the microphone source. In passive mode the request is refused and only a warning is logged.
void SoundLevelComponent::start() {
  const bool passive = this->microphone_source_->is_passive();
  if (!passive) {
    this->microphone_source_->start();
    return;
  }

  // Passive mode: this component does not start the microphone
  ESP_LOGW(TAG, "Can't start the microphone in passive mode");
}


/// Stops the microphone source. In passive mode the request is refused and only a warning is logged.
void SoundLevelComponent::stop() {
  const bool passive = this->microphone_source_->is_passive();
  if (!passive) {
    this->microphone_source_->stop();
    return;
  }

  // Passive mode: this component does not stop the microphone
  ESP_LOGW(TAG, "Can't stop microphone in passive mode");
}


bool SoundLevelComponent::start_() {

  if (this->audio_buffer_ != nullptr) {

    return true;

  }


  // Allocate a transfer buffer

  this->audio_buffer_ = audio::AudioSourceTransferBuffer::create(

      this->microphone_source_->get_audio_stream_info().ms_to_bytes(AUDIO_BUFFER_DURATION_MS));

  if (this->audio_buffer_ == nullptr) {

    this->status_momentary_error("Failed to allocate transfer buffer", 15000);

    return false;

  }


  // Allocates a new ring buffer, adds it as a source for the transfer buffer, and points ring_buffer_ to it

  this->ring_buffer_.reset();  // Reset pointer to any previous ring buffer allocation

  std::shared_ptr<RingBuffer> temp_ring_buffer =

      RingBuffer::create(this->microphone_source_->get_audio_stream_info().ms_to_bytes(RING_BUFFER_DURATION_MS));

  if (temp_ring_buffer.use_count() == 0) {

    this->status_momentary_error("Failed to allocate ring buffer", 15000);

    this->stop_();

    return false;

  } else {

    this->ring_buffer_ = temp_ring_buffer;

    this->audio_buffer_->set_source(temp_ring_buffer);

  }


  this->status_clear_error();

  return true;

}


/// Internal stop command: releases the transfer buffer held in ``audio_buffer_``.
void SoundLevelComponent::stop_() {
  this->audio_buffer_ = nullptr;
}


}  // namespace sound_level


}  // namespace esphome


#endif

esphome::Component::status_clear_error
void status_clear_error()
Definition component.cpp:184

esphome::Component::status_momentary_error
void status_momentary_error(const std::string &name, uint32_t length=5000)
Definition component.cpp:194

esphome::Component::status_has_warning
bool status_has_warning() const
Definition component.cpp:159

esphome::Component::status_has_error
bool status_has_error() const
Definition component.cpp:160

esphome::Component::status_set_warning
void status_set_warning(const char *message="unspecified")
Definition component.cpp:161

esphome::Component::status_clear_warning
void status_clear_warning()
Definition component.cpp:178

esphome::RingBuffer::create
static std::unique_ptr< RingBuffer > create(size_t len)
Definition ring_buffer.cpp:22

esphome::audio::AudioSourceTransferBuffer::create
static std::unique_ptr< AudioSourceTransferBuffer > create(size_t buffer_size)
Creates a new source transfer buffer.
Definition audio_transfer_buffer.cpp:22

esphome::audio::AudioStreamInfo::ms_to_bytes
size_t ms_to_bytes(uint32_t ms) const
Converts duration to bytes.
Definition audio.h:73

esphome::audio::AudioStreamInfo::ms_to_samples
uint32_t ms_to_samples(uint32_t ms) const
Converts duration to samples.
Definition audio.h:68

esphome::audio::AudioStreamInfo::samples_to_bytes
size_t samples_to_bytes(uint32_t samples) const
Converts samples to bytes.
Definition audio.h:58

esphome::audio::AudioStreamInfo::bytes_to_samples
uint32_t bytes_to_samples(size_t bytes) const
Convert bytes to samples.
Definition audio.h:48

esphome::microphone::MicrophoneSource::is_running
bool is_running() const
Definition microphone_source.h:63

esphome::microphone::MicrophoneSource::stop
void stop()
Definition microphone_source.cpp:39

esphome::microphone::MicrophoneSource::start
void start()
Definition microphone_source.cpp:32

esphome::microphone::MicrophoneSource::is_passive
bool is_passive() const
Definition microphone_source.h:62

esphome::microphone::MicrophoneSource::add_data_callback
void add_data_callback(std::function< void(const std::vector< uint8_t > &)> &&data_callback)
Definition microphone_source.cpp:9

esphome::microphone::MicrophoneSource::get_audio_stream_info
audio::AudioStreamInfo get_audio_stream_info()
Gets the AudioStreamInfo of the data after processing.
Definition microphone_source.cpp:27

esphome::sensor::Sensor::publish_state
void publish_state(float state)
Publish a new state to the front-end.
Definition sensor.cpp:39

esphome::sound_level::SoundLevelComponent::dump_config
void dump_config() override
Definition sound_level.cpp:21

esphome::sound_level::SoundLevelComponent::rms_sensor_
sensor::Sensor * rms_sensor_
Definition sound_level.h:49

esphome::sound_level::SoundLevelComponent::start
void start()
Starts the MicrophoneSource to start measuring sound levels.
Definition sound_level.cpp:143

esphome::sound_level::SoundLevelComponent::audio_buffer_
std::unique_ptr< audio::AudioSourceTransferBuffer > audio_buffer_
Definition sound_level.h:51

esphome::sound_level::SoundLevelComponent::measurement_duration_ms_
uint32_t measurement_duration_ms_
Definition sound_level.h:58

esphome::sound_level::SoundLevelComponent::setup
void setup() override
Definition sound_level.cpp:29

esphome::sound_level::SoundLevelComponent::microphone_source_
microphone::MicrophoneSource * microphone_source_
Definition sound_level.h:46

esphome::sound_level::SoundLevelComponent::stop
void stop()
Stops the MicrophoneSource.
Definition sound_level.cpp:151

esphome::sound_level::SoundLevelComponent::squared_peak_
int32_t squared_peak_
Definition sound_level.h:54

esphome::sound_level::SoundLevelComponent::ring_buffer_
std::weak_ptr< RingBuffer > ring_buffer_
Definition sound_level.h:52

esphome::sound_level::SoundLevelComponent::peak_sensor_
sensor::Sensor * peak_sensor_
Definition sound_level.h:48

esphome::sound_level::SoundLevelComponent::loop
void loop() override
Definition sound_level.cpp:44

esphome::sound_level::SoundLevelComponent::stop_
void stop_()
Internal stop command that deallocates audio_buffer_.
Definition sound_level.cpp:189

esphome::sound_level::SoundLevelComponent::sample_count_
uint32_t sample_count_
Definition sound_level.h:56

esphome::sound_level::SoundLevelComponent::squared_samples_sum_
uint64_t squared_samples_sum_
Definition sound_level.h:55

log.h

esphome
Providing packet encoding functions for exchanging data with a remote host.
Definition a01nyub.cpp:7

sound_level.h