ESPHome: esphome/components/i2s_audio/speaker/i2s_audio_speaker_standard.cpp Source File

#include "i2s_audio_speaker_standard.h"


#ifdef USE_ESP32


#include <driver/i2s_std.h>

#include <hal/dma_types.h>


#include "esphome/components/audio/audio.h"

#include "esphome/components/audio/audio_transfer_buffer.h"


#include "esphome/core/hal.h"

#include "esphome/core/log.h"


#include "esp_timer.h"


namespace esphome::i2s_audio {


static const char *const TAG = "i2s_audio.speaker.std";


static constexpr uint32_t DMA_BUFFER_DURATION_MS = 10;

static constexpr size_t DMA_BUFFERS_COUNT = 5;

// ESP-IDF clamps each DMA descriptor to this many bytes when allocating the channel (see i2s_get_buf_size in

// the I2S driver). Mirror its target-dependent selection so the requested dma_frame_num stays in range; the

// speaker task reads the size actually allocated back from the driver rather than relying on this value.

#if SOC_CACHE_INTERNAL_MEM_VIA_L1CACHE

static constexpr size_t I2S_DMA_BUFFER_MAX_SIZE = DMA_DESCRIPTOR_BUFFER_MAX_SIZE_64B_ALIGNED;

#else

static constexpr size_t I2S_DMA_BUFFER_MAX_SIZE = DMA_DESCRIPTOR_BUFFER_MAX_SIZE_4B_ALIGNED;

#endif

// Sized to comfortably absorb scheduling jitter: at most DMA_BUFFERS_COUNT events can be in flight,

// doubled so that a transient backlog never overruns the queue (which would desync the lockstep

// invariant between i2s_event_queue_ and write_records_queue_).

static constexpr size_t I2S_EVENT_QUEUE_COUNT = DMA_BUFFERS_COUNT * 2;

// Generous timeout for ``i2s_channel_write`` blocking. A buffer frees roughly every

// DMA_BUFFER_DURATION_MS, so a multiple of that gives plenty of slack against scheduling jitter

// without masking real failures.

static constexpr TickType_t WRITE_TIMEOUT_TICKS = pdMS_TO_TICKS(DMA_BUFFER_DURATION_MS * (DMA_BUFFERS_COUNT + 1));


// Requested frames per DMA buffer for the given stream, clamped so the byte size stays within the ESP-IDF

// maximum DMA descriptor size. This is only the value handed to the channel config: ESP-IDF may still adjust

// it (e.g. cache-line rounding on some targets), so the speaker task reads the size actually allocated back

// from the driver instead of assuming this value. Clamping here keeps the request in range and avoids a

// noisy ESP-IDF "dma frame num is out of dma buffer size" warning at high sample rates or bit depths.

static uint32_t dma_buffer_frames(const audio::AudioStreamInfo &stream_info) {

  const uint32_t frames_from_duration = stream_info.ms_to_frames(DMA_BUFFER_DURATION_MS);

  const uint32_t max_frames = I2S_DMA_BUFFER_MAX_SIZE / stream_info.frames_to_bytes(1);

  return std::min(frames_from_duration, max_frames);

}


void I2SAudioSpeaker::dump_config() {

  I2SAudioSpeakerBase::dump_config();

  const char *fmt_str;

  switch (this->i2s_comm_fmt_) {

    case I2SCommFmt::PCM:

      fmt_str = "pcm";

      break;

    case I2SCommFmt::MSB:

      fmt_str = "msb";

      break;

    default:

      fmt_str = "std";

      break;

  }

  ESP_LOGCONFIG(TAG, "  Communication format: %s", fmt_str);

}


void I2SAudioSpeaker::run_speaker_task() {

  xEventGroupSetBits(this->event_group_, SpeakerEventGroupBits::TASK_STARTING);


  const uint32_t dma_buffers_duration_ms = DMA_BUFFER_DURATION_MS * DMA_BUFFERS_COUNT;

  // Ensure ring buffer duration is at least the duration of all DMA buffers

  const uint32_t ring_buffer_duration = std::max(dma_buffers_duration_ms, this->buffer_duration_ms_);


  // The DMA buffers may have more bits per sample, so calculate buffer sizes based on the input audio stream info

  const size_t bytes_per_frame = this->current_stream_info_.frames_to_bytes(1);

  // Round the ring buffer size down to a multiple of bytes_per_frame so the wrap boundary stays frame-aligned and

  // avoids unnecessary single-frame splices.

  const size_t ring_buffer_size =

      (this->current_stream_info_.ms_to_bytes(ring_buffer_duration) / bytes_per_frame) * bytes_per_frame;

  // ESP-IDF may allocate smaller (or cache-line-rounded) DMA buffers than dma_buffer_frames() requested: it

  // clamps each descriptor to the max DMA descriptor size and, on targets that route internal memory through

  // the L1 cache (e.g. ESP32-P4), rounds the buffer to the cache line. Read the size the driver actually

  // allocated so preload, silence padding, and the write/event lockstep all match it exactly. The channel is

  // in the READY state here because start_i2s_driver() initialized it before this task was created.

  size_t dma_buffer_bytes;

  i2s_chan_info_t chan_info;

  if (i2s_channel_get_info(this->tx_handle_, &chan_info) == ESP_OK && chan_info.total_dma_buf_size > 0) {

    // total_dma_buf_size spans all DMA_BUFFERS_COUNT descriptors and is an exact multiple of the count.

    dma_buffer_bytes = chan_info.total_dma_buf_size / DMA_BUFFERS_COUNT;

  } else {

    // Should not happen for a READY channel; fall back to the requested size.

    dma_buffer_bytes = this->current_stream_info_.frames_to_bytes(dma_buffer_frames(this->current_stream_info_));

  }

  const uint32_t frames_per_dma_buffer = this->current_stream_info_.bytes_to_frames(dma_buffer_bytes);


  bool successful_setup = false;


  std::unique_ptr<audio::RingBufferAudioSource> audio_source;


  // Pre-zeroed buffer used to silence-pad each DMA descriptor whenever real audio doesn't fully fill it.

  RAMAllocator<uint8_t> silence_allocator;

  uint8_t *silence_buffer = silence_allocator.allocate(dma_buffer_bytes);


  if (silence_buffer != nullptr) {

    memset(silence_buffer, 0, dma_buffer_bytes);


    std::shared_ptr<ring_buffer::RingBuffer> temp_ring_buffer = ring_buffer::RingBuffer::create(ring_buffer_size);

    audio_source =

        audio::RingBufferAudioSource::create(temp_ring_buffer, dma_buffer_bytes, static_cast<uint8_t>(bytes_per_frame));


    if (audio_source != nullptr) {

      // audio_source is nullptr if the ring buffer fails to allocate

      this->audio_ring_buffer_ = temp_ring_buffer;

      successful_setup = true;

    }

  }


  if (successful_setup) {

    // Preload every DMA descriptor with silence and push a matching zero-real-frames record per buffer.

    // This guarantees that every on_sent event has a corresponding write record from the start, so

    // ``i2s_event_queue_`` and ``write_records_queue_`` stay in lockstep for the entire task lifetime.

    for (size_t i = 0; i < DMA_BUFFERS_COUNT; i++) {

      size_t bytes_loaded = 0;

      esp_err_t err = i2s_channel_preload_data(this->tx_handle_, silence_buffer, dma_buffer_bytes, &bytes_loaded);

      if (err != ESP_OK || bytes_loaded != dma_buffer_bytes) {

        ESP_LOGV(TAG, "Failed to preload silence into DMA buffer %u (err=%d, loaded=%u)", (unsigned) i, (int) err,

                 (unsigned) bytes_loaded);

        successful_setup = false;

        break;

      }

      uint32_t zero_real_frames = 0;

      if (xQueueSend(this->write_records_queue_, &zero_real_frames, 0) != pdTRUE) {

        // Should never happen: the queue was just reset and is sized for DMA_BUFFERS_COUNT * 2 entries.

        ESP_LOGV(TAG, "Failed to push preload write record");

        successful_setup = false;

        break;

      }

    }

  }


  if (successful_setup) {

    // Register the on_sent callback BEFORE enabling the channel so the very first transmitted buffer

    // generates a queued event that pairs with the first preloaded silence record.

    const i2s_event_callbacks_t callbacks = {.on_sent = i2s_on_sent_cb};

    i2s_channel_register_event_callback(this->tx_handle_, &callbacks, this);


    if (i2s_channel_enable(this->tx_handle_) != ESP_OK) {

      ESP_LOGV(TAG, "Failed to enable I2S channel");

      successful_setup = false;

    }

  }


  if (!successful_setup) {

    xEventGroupSetBits(this->event_group_, SpeakerEventGroupBits::ERR_ESP_NO_MEM);

  } else {

    bool stop_gracefully = false;

    // Number of records currently in ``write_records_queue_`` that carry real audio. Used by graceful

    // stop to wait until every real-audio buffer has been confirmed played by an ISR event.

    uint32_t pending_real_buffers = 0;

    uint32_t last_data_received_time = millis();


    xEventGroupSetBits(this->event_group_, SpeakerEventGroupBits::TASK_RUNNING);


    // Main speaker task loop. Continues while:

    // - Paused, OR

    // - No timeout configured, OR

    // - Timeout hasn't elapsed since last data

    //

    // Always-fill model: every iteration writes exactly one DMA buffer's worth, mixing real audio

    // and silence padding as needed. The blocking ``i2s_channel_write`` paces the loop at the DMA

    // consumption rate, and every buffer write is matched 1:1 with a record on ``write_records_queue_``.

    //

    // While paused, the real-audio fill is skipped and the entire DMA buffer is filled with silence;

    // the same blocking ``i2s_channel_write`` provides natural pacing (one buffer per ~DMA_BUFFER_DURATION_MS),

    // so the lockstep invariant is preserved without burning CPU.

    while (this->pause_state_ || !this->timeout_.has_value() ||

           (millis() - last_data_received_time) <= this->timeout_.value()) {

      uint32_t event_group_bits = xEventGroupGetBits(this->event_group_);


      if (event_group_bits & SpeakerEventGroupBits::COMMAND_STOP) {

        // COMMAND_STOP is set both by user-initiated stop() and by the ISR when it drops a completion

        // event (paired with ERR_DROPPED_EVENT so loop() can distinguish the two cases).

        xEventGroupClearBits(this->event_group_, SpeakerEventGroupBits::COMMAND_STOP);

        ESP_LOGV(TAG, "Exiting: COMMAND_STOP received");

        break;

      }

      if (event_group_bits & SpeakerEventGroupBits::COMMAND_STOP_GRACEFULLY) {

        xEventGroupClearBits(this->event_group_, SpeakerEventGroupBits::COMMAND_STOP_GRACEFULLY);

        stop_gracefully = true;

      }


      if (this->audio_stream_info_ != this->current_stream_info_) {

        // Audio stream info changed, stop the speaker task so it will restart with the proper settings.

        ESP_LOGV(TAG, "Exiting: stream info changed");

        break;

      }


      // Drain ISR-stamped completion events. Each event corresponds 1:1 with a write_records_queue_

      // entry by construction (preloaded records at startup, plus exactly one record pushed per

      // iteration alongside exactly one DMA-buffer-sized write).

      int64_t write_timestamp;

      bool lockstep_broken = false;

      while (xQueueReceive(this->i2s_event_queue_, &write_timestamp, 0)) {

        uint32_t real_frames = 0;

        if (xQueueReceive(this->write_records_queue_, &real_frames, 0) != pdTRUE) {

          // Should never happen: would indicate the lockstep invariant is broken.

          ESP_LOGV(TAG, "Event without matching write record");

          xEventGroupSetBits(this->event_group_, SpeakerEventGroupBits::ERR_LOCKSTEP_DESYNC);

          lockstep_broken = true;

          break;

        }

        if (real_frames > 0) {

          pending_real_buffers--;

          // Real audio is packed at the start of each DMA buffer with any silence padding on the

          // tail, so the real audio finished playing earlier than the buffer-completion timestamp

          // by the duration of the trailing zeros.

          const uint32_t silence_frames = frames_per_dma_buffer - real_frames;

          const int64_t adjusted_ts =

              write_timestamp - this->current_stream_info_.frames_to_microseconds(silence_frames);

          this->audio_output_callback_(real_frames, adjusted_ts);

        }

      }

      if (lockstep_broken) {

        break;

      }


      // Graceful stop: exit only after the source's exposed chunk is drained, the underlying ring

      // buffer has nothing left to hand over, and every real-audio buffer we submitted has been

      // confirmed played. ``has_buffered_data()`` returns bytes still sitting in the ring buffer

      // awaiting fill().

      if (stop_gracefully && audio_source->available() == 0 && !this->has_buffered_data() &&

          pending_real_buffers == 0) {

        ESP_LOGV(TAG, "Exiting: graceful stop complete");

        break;

      }


      // Compose exactly one DMA buffer's worth: drain as much real audio as the source currently

      // exposes (may take multiple fill() calls when crossing a ring buffer wrap), then pad any

      // remainder with silence. All writes pack into the next free DMA descriptor in order, so the

      // descriptor ends up holding [real audio][silence padding].

      size_t bytes_written_total = 0;

      size_t real_bytes_total = 0;

      bool partial_write_failure = false;


      if (!this->pause_state_) {

        while (bytes_written_total < dma_buffer_bytes) {

          size_t bytes_read = audio_source->fill(pdMS_TO_TICKS(DMA_BUFFER_DURATION_MS) / 2, false);

          if (bytes_read > 0) {

            uint8_t *new_data = audio_source->mutable_data() + audio_source->available() - bytes_read;

            this->apply_software_volume_(new_data, bytes_read);

            this->swap_esp32_mono_samples_(new_data, bytes_read);

          }


          const size_t to_write = std::min(audio_source->available(), dma_buffer_bytes - bytes_written_total);

          if (to_write == 0) {

            // Ring buffer has nothing more to hand over right now; pad the rest of this DMA buffer

            // with silence so the lockstep invariant (one write per iteration) is preserved.

            break;

          }


          size_t bw = 0;

          i2s_channel_write(this->tx_handle_, audio_source->data(), to_write, &bw, WRITE_TIMEOUT_TICKS);

          if (bw != to_write) {

            // A short real-audio write breaks DMA descriptor alignment for every subsequent event;

            // the only safe recovery is to restart the task.

            ESP_LOGV(TAG, "Partial real audio write: %u of %u bytes", (unsigned) bw, (unsigned) to_write);

            xEventGroupSetBits(this->event_group_, SpeakerEventGroupBits::ERR_PARTIAL_WRITE);

            partial_write_failure = true;

            break;

          }

          audio_source->consume(bw);

          bytes_written_total += bw;

          real_bytes_total += bw;

        }

        if (real_bytes_total > 0) {

          last_data_received_time = millis();

        }

      }


      if (partial_write_failure) {

        break;

      }


      const size_t silence_bytes = dma_buffer_bytes - bytes_written_total;

      if (silence_bytes > 0) {

        size_t bw = 0;

        i2s_channel_write(this->tx_handle_, silence_buffer, silence_bytes, &bw, WRITE_TIMEOUT_TICKS);

        if (bw != silence_bytes) {

          // Same descriptor-alignment hazard as a partial real-audio write.

          ESP_LOGV(TAG, "Partial silence write: %u of %u bytes", (unsigned) bw, (unsigned) silence_bytes);

          xEventGroupSetBits(this->event_group_, SpeakerEventGroupBits::ERR_PARTIAL_WRITE);

          break;

        }

      }


      const uint32_t real_frames_in_buffer = this->current_stream_info_.bytes_to_frames(real_bytes_total);

      // Push the matching write record. Capacity headroom in I2S_EVENT_QUEUE_COUNT guarantees this

      // succeeds even with a transient backlog of unprocessed events; if it ever fails the lockstep

      // invariant is broken and every subsequent timestamp would be silently wrong, so bail.

      if (xQueueSend(this->write_records_queue_, &real_frames_in_buffer, 0) != pdTRUE) {

        ESP_LOGV(TAG, "Exiting: write records queue full");

        xEventGroupSetBits(this->event_group_, SpeakerEventGroupBits::ERR_LOCKSTEP_DESYNC);

        break;

      }

      if (real_frames_in_buffer > 0) {

        pending_real_buffers++;

      }

    }

  }


  xEventGroupSetBits(this->event_group_, SpeakerEventGroupBits::TASK_STOPPING);


  audio_source.reset();


  if (silence_buffer != nullptr) {

    silence_allocator.deallocate(silence_buffer, dma_buffer_bytes);

    silence_buffer = nullptr;

  }


  xEventGroupSetBits(this->event_group_, SpeakerEventGroupBits::TASK_STOPPED);


  while (true) {

    // Continuously delay until the loop method deletes the task

    vTaskDelay(pdMS_TO_TICKS(10));

  }

}


esp_err_t I2SAudioSpeaker::start_i2s_driver(audio::AudioStreamInfo &audio_stream_info) {

  this->current_stream_info_ = audio_stream_info;


  if ((this->i2s_role_ & I2S_ROLE_SLAVE) && (this->sample_rate_ != audio_stream_info.get_sample_rate())) {  // NOLINT

    // Can't reconfigure I2S bus, so the sample rate must match the configured value

    ESP_LOGE(TAG, "Incompatible stream settings");

    return ESP_ERR_NOT_SUPPORTED;

  }


  if (this->slot_bit_width_ != I2S_SLOT_BIT_WIDTH_AUTO &&

      (i2s_slot_bit_width_t) audio_stream_info.get_bits_per_sample() > this->slot_bit_width_) {

    // Currently can't handle the case when the incoming audio has more bits per sample than the configured value

    ESP_LOGE(TAG, "Stream bits per sample must be less than or equal to the speaker's configuration");

    return ESP_ERR_NOT_SUPPORTED;

  }


#ifdef USE_ESP32_VARIANT_ESP32

  // The original ESP32 I2S peripheral stores each sample in a whole number of 16-bit words (a 24-bit sample

  // occupies 4 bytes in the DMA buffer, an 8-bit sample 2 bytes), but ESPHome's audio pipeline packs samples

  // tightly (3 bytes for 24-bit, 1 for 8-bit). The two layouts only line up when the bit depth is a multiple

  // of 16, so reject anything else rather than emit corrupted audio.

  if (audio_stream_info.get_bits_per_sample() % 16 != 0) {

    ESP_LOGE(TAG, "ESP32 supports only 16- or 32-bit audio, got %u-bit",

             (unsigned) audio_stream_info.get_bits_per_sample());

    return ESP_ERR_NOT_SUPPORTED;

  }

#endif  // USE_ESP32_VARIANT_ESP32


  if (!this->parent_->try_lock()) {

    ESP_LOGE(TAG, "Parent bus is busy");

    return ESP_ERR_INVALID_STATE;

  }


  uint32_t dma_buffer_length = dma_buffer_frames(audio_stream_info);


  i2s_role_t i2s_role = this->i2s_role_;

  i2s_clock_src_t clk_src = I2S_CLK_SRC_DEFAULT;


#if SOC_CLK_APLL_SUPPORTED

  if (this->use_apll_) {

    clk_src = i2s_clock_src_t::I2S_CLK_SRC_APLL;

  }

#endif  // SOC_CLK_APLL_SUPPORTED


  // Log DMA configuration for debugging

  ESP_LOGV(TAG, "I2S DMA config: %zu buffers x %lu frames", (size_t) DMA_BUFFERS_COUNT,

           (unsigned long) dma_buffer_length);


  i2s_chan_config_t chan_cfg = {

      .id = this->parent_->get_port(),

      .role = i2s_role,

      .dma_desc_num = DMA_BUFFERS_COUNT,

      .dma_frame_num = dma_buffer_length,

      .auto_clear = true,

      .intr_priority = 3,

  };


  // Build standard I2S clock/slot/gpio configuration

  i2s_std_clk_config_t clk_cfg = {

      .sample_rate_hz = audio_stream_info.get_sample_rate(),

      .clk_src = clk_src,

      .mclk_multiple = this->mclk_multiple_,

  };


  i2s_slot_mode_t slot_mode = this->slot_mode_;

  i2s_std_slot_mask_t slot_mask = this->std_slot_mask_;

  if (audio_stream_info.get_channels() == 1) {

    slot_mode = I2S_SLOT_MODE_MONO;

  } else if (audio_stream_info.get_channels() == 2) {

    slot_mode = I2S_SLOT_MODE_STEREO;

    slot_mask = I2S_STD_SLOT_BOTH;

  }


  i2s_std_slot_config_t slot_cfg;

  switch (this->i2s_comm_fmt_) {

    case I2SCommFmt::PCM:

      slot_cfg =

          I2S_STD_PCM_SLOT_DEFAULT_CONFIG((i2s_data_bit_width_t) audio_stream_info.get_bits_per_sample(), slot_mode);

      break;

    case I2SCommFmt::MSB:

      slot_cfg =

          I2S_STD_MSB_SLOT_DEFAULT_CONFIG((i2s_data_bit_width_t) audio_stream_info.get_bits_per_sample(), slot_mode);

      break;

    default:

      slot_cfg = I2S_STD_PHILIPS_SLOT_DEFAULT_CONFIG((i2s_data_bit_width_t) audio_stream_info.get_bits_per_sample(),

                                                     slot_mode);

      break;

  }


#ifdef USE_ESP32_VARIANT_ESP32

  // There seems to be a bug on the ESP32 (non-variant) platform where setting the slot bit width higher than the

  // bits per sample causes the audio to play too fast. Setting the ws_width to the configured slot bit width seems

  // to make it play at the correct speed while sending more bits per slot.

  if (this->slot_bit_width_ != I2S_SLOT_BIT_WIDTH_AUTO) {

    uint32_t configured_bit_width = static_cast<uint32_t>(this->slot_bit_width_);

    slot_cfg.ws_width = configured_bit_width;

    if (configured_bit_width > 16) {

      slot_cfg.msb_right = false;

    }

  }

#else

  slot_cfg.slot_bit_width = this->slot_bit_width_;

  if (this->slot_bit_width_ != I2S_SLOT_BIT_WIDTH_AUTO) {

    slot_cfg.ws_width = static_cast<uint32_t>(this->slot_bit_width_);

  }

#endif  // USE_ESP32_VARIANT_ESP32

  slot_cfg.slot_mask = slot_mask;


  i2s_std_gpio_config_t gpio_cfg = this->parent_->get_pin_config();

  gpio_cfg.dout = this->dout_pin_;


  i2s_std_config_t std_cfg = {

      .clk_cfg = clk_cfg,

      .slot_cfg = slot_cfg,

      .gpio_cfg = gpio_cfg,

  };


  esp_err_t err = this->init_i2s_channel_(chan_cfg, std_cfg, I2S_EVENT_QUEUE_COUNT);

  if (err != ESP_OK) {

    return err;

  }


  // The speaker task will enable the channel after preloading.


  return ESP_OK;

}


}  // namespace esphome::i2s_audio


#endif  // USE_ESP32

audio.h

audio_transfer_buffer.h

esphome::Parented< I2SAudioComponent >::parent_
I2SAudioComponent * parent_
Definition helpers.h:1872

esphome::RAMAllocator
An STL allocator that uses SPI or internal RAM.
Definition helpers.h:2053

esphome::RAMAllocator::deallocate
void deallocate(T *p, size_t n)
Definition helpers.h:2110

esphome::RAMAllocator::allocate
T * allocate(size_t n)
Definition helpers.h:2080

esphome::audio::AudioStreamInfo
Definition audio.h:11

esphome::audio::AudioStreamInfo::ms_to_bytes
size_t ms_to_bytes(uint32_t ms) const
Converts duration to bytes.
Definition audio.h:73

esphome::audio::AudioStreamInfo::frames_to_bytes
size_t frames_to_bytes(uint32_t frames) const
Converts frames to bytes.
Definition audio.h:53

esphome::audio::AudioStreamInfo::get_bits_per_sample
uint8_t get_bits_per_sample() const
Definition audio.h:28

esphome::audio::AudioStreamInfo::frames_to_microseconds
uint32_t frames_to_microseconds(uint32_t frames) const
Computes the duration, in microseconds, the given amount of frames represents.
Definition audio.cpp:25

esphome::audio::AudioStreamInfo::bytes_to_frames
uint32_t bytes_to_frames(size_t bytes) const
Convert bytes to frames.
Definition audio.h:43

esphome::audio::AudioStreamInfo::get_channels
uint8_t get_channels() const
Definition audio.h:29

esphome::audio::AudioStreamInfo::get_sample_rate
uint32_t get_sample_rate() const
Definition audio.h:30

esphome::audio::RingBufferAudioSource::create
static std::unique_ptr< RingBufferAudioSource > create(std::shared_ptr< ring_buffer::RingBuffer > ring_buffer, size_t max_fill_bytes, uint8_t alignment_bytes=1)
Creates a new ring-buffer-backed audio source after validating its parameters.
Definition audio_transfer_buffer.cpp:210

esphome::i2s_audio::I2SAudioBase::std_slot_mask_
i2s_std_slot_mask_t std_slot_mask_
Definition i2s_audio.h:28

esphome::i2s_audio::I2SAudioBase::slot_bit_width_
i2s_slot_bit_width_t slot_bit_width_
Definition i2s_audio.h:29

esphome::i2s_audio::I2SAudioBase::i2s_role_
i2s_role_t i2s_role_
Definition i2s_audio.h:26

esphome::i2s_audio::I2SAudioBase::slot_mode_
i2s_slot_mode_t slot_mode_
Definition i2s_audio.h:27

esphome::i2s_audio::I2SAudioBase::sample_rate_
uint32_t sample_rate_
Definition i2s_audio.h:30

esphome::i2s_audio::I2SAudioBase::mclk_multiple_
i2s_mclk_multiple_t mclk_multiple_
Definition i2s_audio.h:32

esphome::i2s_audio::I2SAudioBase::use_apll_
bool use_apll_
Definition i2s_audio.h:31

esphome::i2s_audio::I2SAudioSpeakerBase::buffer_duration_ms_
uint32_t buffer_duration_ms_
Definition i2s_audio_speaker.h:151

esphome::i2s_audio::I2SAudioSpeakerBase::i2s_on_sent_cb
static bool i2s_on_sent_cb(i2s_chan_handle_t handle, i2s_event_data_t *event, void *user_ctx)
Callback function used to send playback timestamps to the speaker task.
Definition i2s_audio_speaker.cpp:316

esphome::i2s_audio::I2SAudioSpeakerBase::tx_handle_
i2s_chan_handle_t tx_handle_
Definition i2s_audio_speaker.h:162

esphome::i2s_audio::I2SAudioSpeakerBase::pause_state_
bool pause_state_
Definition i2s_audio_speaker.h:155

esphome::i2s_audio::I2SAudioSpeakerBase::apply_software_volume_
void apply_software_volume_(uint8_t *data, size_t bytes_read)
Apply software volume control using Q15 fixed-point scaling.
Definition i2s_audio_speaker.cpp:343

esphome::i2s_audio::I2SAudioSpeakerBase::audio_ring_buffer_
std::weak_ptr< ring_buffer::RingBuffer > audio_ring_buffer_
Definition i2s_audio_speaker.h:149

esphome::i2s_audio::I2SAudioSpeakerBase::swap_esp32_mono_samples_
void swap_esp32_mono_samples_(uint8_t *data, size_t bytes_read)
Swap adjacent 16-bit mono samples for ESP32 (non-variant) hardware quirk.
Definition i2s_audio_speaker.cpp:354

esphome::i2s_audio::I2SAudioSpeakerBase::current_stream_info_
audio::AudioStreamInfo current_stream_info_
Definition i2s_audio_speaker.h:159

esphome::i2s_audio::I2SAudioSpeakerBase::dump_config
void dump_config() override
Definition i2s_audio_speaker.cpp:42

esphome::i2s_audio::I2SAudioSpeakerBase::timeout_
optional< uint32_t > timeout_
Definition i2s_audio_speaker.h:153

esphome::i2s_audio::I2SAudioSpeakerBase::write_records_queue_
QueueHandle_t write_records_queue_
Definition i2s_audio_speaker.h:147

esphome::i2s_audio::I2SAudioSpeakerBase::i2s_event_queue_
QueueHandle_t i2s_event_queue_
Definition i2s_audio_speaker.h:146

esphome::i2s_audio::I2SAudioSpeakerBase::event_group_
EventGroupHandle_t event_group_
Definition i2s_audio_speaker.h:143

esphome::i2s_audio::I2SAudioSpeakerBase::init_i2s_channel_
esp_err_t init_i2s_channel_(const i2s_chan_config_t &chan_cfg, const i2s_std_config_t &std_cfg, size_t event_queue_size)
Shared I2S channel allocation, initialization, and event queue setup.
Definition i2s_audio_speaker.cpp:254

esphome::i2s_audio::I2SAudioSpeakerBase::dout_pin_
gpio_num_t dout_pin_
Definition i2s_audio_speaker.h:161

esphome::i2s_audio::I2SAudioSpeaker::i2s_comm_fmt_
I2SCommFmt i2s_comm_fmt_
Definition i2s_audio_speaker_standard.h:27

esphome::i2s_audio::I2SAudioSpeaker::dump_config
void dump_config() override
Definition i2s_audio_speaker_standard.cpp:50

esphome::i2s_audio::I2SAudioSpeaker::start_i2s_driver
esp_err_t start_i2s_driver(audio::AudioStreamInfo &audio_stream_info) override
Definition i2s_audio_speaker_standard.cpp:328

esphome::i2s_audio::I2SAudioSpeaker::run_speaker_task
void run_speaker_task() override
Definition i2s_audio_speaker_standard.cpp:67

esphome::ring_buffer::RingBuffer::create
static std::unique_ptr< RingBuffer > create(size_t len, MemoryPreference preference=MemoryPreference::EXTERNAL_FIRST)
Definition ring_buffer.cpp:20

esphome::speaker::Speaker::audio_output_callback_
CallbackManager< void(uint32_t, int64_t)> audio_output_callback_
Definition speaker.h:122

esphome::speaker::Speaker::audio_stream_info_
audio::AudioStreamInfo audio_stream_info_
Definition speaker.h:114

hal.h

i2s_audio_speaker_standard.h

log.h

esphome::i2s_audio
Definition i2s_audio.h:11

esphome::i2s_audio::TASK_RUNNING
@ TASK_RUNNING
Definition i2s_audio_microphone.cpp:28

esphome::i2s_audio::COMMAND_STOP_GRACEFULLY
@ COMMAND_STOP_GRACEFULLY
Definition i2s_audio_speaker.h:28

esphome::i2s_audio::TASK_STOPPING
@ TASK_STOPPING
Definition i2s_audio_speaker.h:32

esphome::i2s_audio::ERR_LOCKSTEP_DESYNC
@ ERR_LOCKSTEP_DESYNC
Definition i2s_audio_speaker.h:39

esphome::i2s_audio::TASK_STOPPED
@ TASK_STOPPED
Definition i2s_audio_microphone.cpp:29

esphome::i2s_audio::COMMAND_STOP
@ COMMAND_STOP
Definition i2s_audio_microphone.cpp:25

esphome::i2s_audio::TASK_STARTING
@ TASK_STARTING
Definition i2s_audio_microphone.cpp:27

esphome::i2s_audio::ERR_ESP_NO_MEM
@ ERR_ESP_NO_MEM
Definition i2s_audio_speaker.h:35

esphome::i2s_audio::ERR_PARTIAL_WRITE
@ ERR_PARTIAL_WRITE
Definition i2s_audio_speaker.h:38

esphome::i2s_audio::I2SCommFmt::PCM
@ PCM

esphome::i2s_audio::I2SCommFmt::MSB
@ MSB

esphome::new_data
auto * new_data
Definition helpers.cpp:29

esphome::millis
uint32_t IRAM_ATTR HOT millis()
Definition hal.cpp:28

uint32_t
static void uint32_t
Definition crash_handler.cpp:141