16static const UBaseType_t MIXER_TASK_PRIORITY = 10;
18static const uint32_t STOPPING_TIMEOUT_MS = 5000;
19static const uint32_t TRANSFER_BUFFER_DURATION_MS = 50;
20static const uint32_t TASK_DELAY_MS = 25;
21static const uint32_t MIXER_AUTO_STOP_DEBOUNCE_MS = 200;
23static const size_t TASK_STACK_SIZE = 4096;
25static const int16_t MAX_AUDIO_SAMPLE_VALUE = INT16_MAX;
26static const int16_t MIN_AUDIO_SAMPLE_VALUE = INT16_MIN;
28static const char *
const TAG =
"speaker_mixer";
33static const std::array<int16_t, 51> DECIBEL_REDUCTION_TABLE = {
34 32767, 29201, 26022, 23189, 20665, 18415, 16410, 14624, 13032, 11613, 10349, 9222, 8218, 7324, 6527, 5816, 5183,
35 4619, 4116, 3668, 3269, 2913, 2596, 2313, 2061, 1837, 1637, 1459, 1300, 1158, 1032, 920, 820, 731,
36 651, 580, 517, 461, 411, 366, 326, 291, 259, 231, 206, 183, 163, 146, 130, 116, 103};
57static inline uint32_t atomic_subtract_clamped(std::atomic<uint32_t> &var,
uint32_t amount) {
58 uint32_t current = var.load(std::memory_order_acquire);
63 subtracted = std::min(amount, current);
64 new_value = current - subtracted;
65 }
while (!var.compare_exchange_weak(current, new_value, std::memory_order_release, std::memory_order_acquire));
70static bool create_event_group(EventGroupHandle_t &event_group, Component *
component) {
71 event_group = xEventGroupCreate();
72 if (event_group ==
nullptr) {
73 ESP_LOGE(TAG,
"Failed to create event group");
82 "Mixer Source Speaker\n"
83 " Buffer Duration: %" PRIu32
" ms",
86 ESP_LOGCONFIG(TAG,
" Timeout: %" PRIu32
" ms", this->
timeout_ms_.value());
88 ESP_LOGCONFIG(TAG,
" Timeout: never");
103 uint32_t remaining_frames = new_frames - delay_to_drain;
106 if (remaining_frames > 0) {
108 if (speakers_playback_frames > 0) {
132 xEventGroupClearBits(this->
event_group_, SOURCE_SPEAKER_COMMAND_FINISH);
136 xEventGroupClearBits(this->
event_group_, SOURCE_SPEAKER_COMMAND_FINISH);
141 xEventGroupClearBits(this->
event_group_, SOURCE_SPEAKER_COMMAND_START);
145 xEventGroupClearBits(this->
event_group_, SOURCE_SPEAKER_COMMAND_START);
152 esp_err_t err = this->
start_();
166 case ESP_ERR_NOT_SUPPORTED:
169 case ESP_ERR_INVALID_ARG:
172 case ESP_ERR_INVALID_STATE:
186 (this->pending_playback_frames_.load(std::memory_order_acquire) == 0)) {
189 this->stop_gracefully_) {
203 (this->pending_playback_frames_.load(std::memory_order_acquire) == 0)) {
228 size_t bytes_written = 0;
229 std::shared_ptr<ring_buffer::RingBuffer> temp_ring_buffer = this->
ring_buffer_.lock();
230 if (temp_ring_buffer.use_count() > 0) {
232 bytes_written = temp_ring_buffer->write_without_replacement(data,
length, ticks_to_wait);
233 if (bytes_written > 0) {
238 vTaskDelay(ticks_to_wait);
240 return bytes_written;
246 if (!(event_bits & command_bit)) {
260 const size_t ring_buffer_size =
263 std::shared_ptr<ring_buffer::RingBuffer> temp_ring_buffer = this->
ring_buffer_.lock();
264 if (!temp_ring_buffer) {
269 if (!temp_ring_buffer) {
270 return ESP_ERR_NO_MEM;
275 static_cast<uint8_t
>(bytes_per_frame));
276 if (source ==
nullptr) {
277 return ESP_ERR_NO_MEM;
290 return ((this->
audio_source_.use_count() > 0) && this->audio_source_->has_buffered_data());
308 TickType_t ticks_to_wait) {
309 if (audio_source->available() > 0) {
314 size_t bytes_read = audio_source->fill(ticks_to_wait,
false);
317 if (samples_to_duck > 0) {
318 int16_t *current_buffer =
reinterpret_cast<int16_t *
>(audio_source->mutable_data());
337 uint8_t total_ducking_steps = 0;
347 if ((duration > 0) && (total_ducking_steps > 0)) {
363 int8_t *current_ducking_db_reduction,
uint32_t *ducking_transition_samples_remaining,
364 uint32_t samples_per_ducking_step, int8_t db_change_per_ducking_step) {
365 if (*ducking_transition_samples_remaining > 0) {
370 input_samples_to_duck / samples_per_ducking_step + (input_samples_to_duck % samples_per_ducking_step != 0);
372 for (
uint32_t i = 0; i < ducking_steps_in_batch; ++i) {
373 uint32_t samples_left_in_step = *ducking_transition_samples_remaining % samples_per_ducking_step;
375 if (samples_left_in_step == 0) {
376 samples_left_in_step = samples_per_ducking_step;
379 uint32_t samples_to_duck = std::min(input_samples_to_duck, samples_left_in_step);
380 samples_to_duck = std::min(samples_to_duck, *ducking_transition_samples_remaining);
383 uint8_t safe_db_reduction_index =
384 clamp<uint8_t>(*current_ducking_db_reduction, 0, DECIBEL_REDUCTION_TABLE.size() - 1);
385 int16_t q15_scale_factor = DECIBEL_REDUCTION_TABLE[safe_db_reduction_index];
389 if (samples_left_in_step - samples_to_duck == 0) {
391 *current_ducking_db_reduction += db_change_per_ducking_step;
394 input_buffer += samples_to_duck;
395 *ducking_transition_samples_remaining -= samples_to_duck;
396 input_samples_to_duck -= samples_to_duck;
400 if ((*current_ducking_db_reduction > 0) && (input_samples_to_duck > 0)) {
403 uint8_t safe_db_reduction_index =
404 clamp<uint8_t>(*current_ducking_db_reduction, 0, DECIBEL_REDUCTION_TABLE.size() - 1);
405 int16_t q15_scale_factor = DECIBEL_REDUCTION_TABLE[safe_db_reduction_index];
420 " Number of output channels: %u",
446 this->task_stack_in_psram_)) {
447 xEventGroupClearBits(this->
event_group_, MIXER_TASK_COMMAND_START);
449 ESP_LOGE(TAG,
"Failed to start; retrying in 1 second");
457 ESP_LOGD(TAG,
"Starting");
458 xEventGroupClearBits(this->
event_group_, MIXER_TASK_STATE_STARTING);
462 xEventGroupClearBits(this->
event_group_, MIXER_TASK_ERR_ESP_NO_MEM);
465 ESP_LOGV(TAG,
"Started");
467 xEventGroupClearBits(this->
event_group_, MIXER_TASK_STATE_RUNNING);
470 ESP_LOGV(TAG,
"Stopping");
471 xEventGroupClearBits(this->
event_group_, MIXER_TASK_STATE_STOPPING);
475 ESP_LOGD(TAG,
"Stopped");
483 bool all_stopped =
true;
486 all_stopped &= speaker->is_stopped();
500 xEventGroupClearBits(this->
event_group_, MIXER_TASK_COMMAND_STOP);
505 event_group_bits = xEventGroupGetBits(this->
event_group_);
506 if (event_group_bits == 0) {
517 return ESP_ERR_NOT_SUPPORTED;
526 return ESP_ERR_INVALID_ARG;
538 xEventGroupSetBits(this->
event_group_, MIXER_TASK_COMMAND_START);
548 uint8_t input_channels = input_stream_info.
get_channels();
549 uint8_t output_channels = output_stream_info.
get_channels();
550 const uint8_t max_input_channel_index = input_channels - 1;
552 if (input_channels == output_channels) {
553 size_t bytes_to_copy = input_stream_info.
frames_to_bytes(frames_to_transfer);
554 memcpy(output_buffer, input_buffer, bytes_to_copy);
559 for (
uint32_t frame_index = 0; frame_index < frames_to_transfer; ++frame_index) {
560 for (uint8_t output_channel_index = 0; output_channel_index < output_channels; ++output_channel_index) {
561 uint8_t input_channel_index = std::min(output_channel_index, max_input_channel_index);
562 output_buffer[output_channels * frame_index + output_channel_index] =
563 input_buffer[input_channels * frame_index + input_channel_index];
572 const uint8_t primary_channels = primary_stream_info.
get_channels();
573 const uint8_t secondary_channels = secondary_stream_info.
get_channels();
574 const uint8_t output_channels = output_stream_info.
get_channels();
576 const uint8_t max_primary_channel_index = primary_channels - 1;
577 const uint8_t max_secondary_channel_index = secondary_channels - 1;
579 for (
uint32_t frames_index = 0; frames_index < frames_to_mix; ++frames_index) {
580 for (uint8_t output_channel_index = 0; output_channel_index < output_channels; ++output_channel_index) {
581 const uint32_t secondary_channel_index = std::min(output_channel_index, max_secondary_channel_index);
582 const int32_t secondary_sample = secondary_buffer[frames_index * secondary_channels + secondary_channel_index];
584 const uint32_t primary_channel_index = std::min(output_channel_index, max_primary_channel_index);
585 const int32_t primary_sample =
586 static_cast<int32_t
>(primary_buffer[frames_index * primary_channels + primary_channel_index]);
588 const int32_t added_sample = secondary_sample + primary_sample;
590 output_buffer[frames_index * output_channels + output_channel_index] =
591 static_cast<int16_t
>(clamp<int32_t>(added_sample, MIN_AUDIO_SAMPLE_VALUE, MAX_AUDIO_SAMPLE_VALUE));
606 if (output_transfer_buffer ==
nullptr) {
609 vTaskSuspend(
nullptr);
616 bool sent_finished =
false;
631 output_transfer_buffer->transfer_data_to_sink(pdMS_TO_TICKS(TASK_DELAY_MS),
false);
634 this_mixer->
audio_stream_info_.value().bytes_to_frames(output_transfer_buffer->free());
636 speakers_with_data.
clear();
637 audio_sources_with_data.
clear();
640 if (speaker->is_running() && !speaker->get_pause_state()) {
642 std::shared_ptr<audio::RingBufferAudioSource> audio_source = speaker->get_audio_source().lock();
643 if (audio_source.use_count() == 0) {
647 speaker->process_data_from_source(audio_source, 0);
649 if (audio_source->available() > 0) {
651 audio_sources_with_data.
push_back(audio_source);
657 if (audio_sources_with_data.
empty()) {
659 delay(TASK_DELAY_MS);
663 uint32_t frames_to_mix = output_frames_free;
665 if ((audio_sources_with_data.
size() == 1) || this_mixer->
queue_mode_) {
674 const uint32_t frames_available_in_buffer =
675 active_stream_info.
bytes_to_frames(audio_sources_with_data[0]->available());
676 frames_to_mix = std::min(frames_to_mix, frames_available_in_buffer);
677 copy_frames(
reinterpret_cast<const int16_t *
>(audio_sources_with_data[0]->data()), active_stream_info,
678 reinterpret_cast<int16_t *
>(output_transfer_buffer->get_buffer_end()),
682 if (!speakers_with_data[0]->has_contributed_.load(std::memory_order_acquire)) {
683 speakers_with_data[0]->playback_delay_frames_.store(
684 this_mixer->
frames_in_pipeline_.load(std::memory_order_acquire), std::memory_order_release);
685 speakers_with_data[0]->has_contributed_.store(
true, std::memory_order_release);
689 speakers_with_data[0]->pending_playback_frames_.fetch_add(frames_to_mix, std::memory_order_release);
690 audio_sources_with_data[0]->consume(active_stream_info.
frames_to_bytes(frames_to_mix));
693 output_transfer_buffer->increase_buffer_length(
699 if (!sent_finished) {
701 sent_finished =
true;
712 sent_finished =
false;
717 for (
size_t i = 0; i < audio_sources_with_data.
size(); ++i) {
718 const uint32_t frames_available_in_buffer =
719 speakers_with_data[i]->get_audio_stream_info().bytes_to_frames(audio_sources_with_data[i]->available());
720 frames_to_mix = std::min(frames_to_mix, frames_available_in_buffer);
722 const int16_t *primary_buffer =
reinterpret_cast<const int16_t *
>(audio_sources_with_data[0]->data());
726 for (
size_t i = 1; i < audio_sources_with_data.
size(); ++i) {
728 reinterpret_cast<const int16_t *
>(audio_sources_with_data[i]->data()),
729 speakers_with_data[i]->get_audio_stream_info(),
730 reinterpret_cast<int16_t *
>(output_transfer_buffer->get_buffer_end()),
733 if (i != audio_sources_with_data.
size() - 1) {
735 primary_buffer =
reinterpret_cast<const int16_t *
>(output_transfer_buffer->get_buffer_end());
744 for (
size_t i = 0; i < audio_sources_with_data.
size(); ++i) {
746 if (!speakers_with_data[i]->has_contributed_.load(std::memory_order_acquire)) {
747 speakers_with_data[i]->playback_delay_frames_.store(current_pipeline_frames, std::memory_order_release);
748 speakers_with_data[i]->has_contributed_.store(
true, std::memory_order_release);
751 speakers_with_data[i]->pending_playback_frames_.fetch_add(frames_to_mix, std::memory_order_release);
752 audio_sources_with_data[i]->consume(
753 speakers_with_data[i]->get_audio_stream_info().frames_to_bytes(frames_to_mix));
757 output_transfer_buffer->increase_buffer_length(
771 vTaskSuspend(
nullptr);
void wake_loop_threadsafe()
Wake the main event loop from another thread or callback.
void status_momentary_error(const char *name, uint32_t length=5000)
Set error status flag and automatically clear it after a timeout.
void status_clear_error()
void enable_loop_soon_any_context()
Thread and ISR-safe version of enable_loop() that can be called from any context.
bool status_has_error() const
void disable_loop()
Disable this component's loop.
Fixed-capacity vector - allocates once at runtime, never reallocates This avoids std::vector template...
void push_back(const T &value)
Add element without bounds checking Caller must ensure sufficient capacity was allocated via init() S...
bool create(TaskFunction_t fn, const char *name, uint32_t stack_size, void *param, UBaseType_t priority, bool use_psram)
Allocate stack and create task.
bool is_created() const
Check if the task has been created and not yet destroyed.
void deallocate()
Delete the task (if running) and free the stack buffer.
static std::unique_ptr< AudioSinkTransferBuffer > create(size_t buffer_size)
Creates a new sink transfer buffer.
size_t ms_to_bytes(uint32_t ms) const
Converts duration to bytes.
size_t frames_to_bytes(uint32_t frames) const
Converts frames to bytes.
uint8_t get_bits_per_sample() const
uint32_t ms_to_samples(uint32_t ms) const
Converts duration to samples.
uint32_t bytes_to_frames(size_t bytes) const
Convert bytes to frames.
uint8_t get_channels() const
uint32_t get_sample_rate() const
uint32_t bytes_to_samples(size_t bytes) const
Convert bytes to samples.
static std::unique_ptr< RingBufferAudioSource > create(std::shared_ptr< ring_buffer::RingBuffer > ring_buffer, size_t max_fill_bytes, uint8_t alignment_bytes=1)
Creates a new ring-buffer-backed audio source after validating its parameters.
uint32_t all_stopped_since_ms_
void dump_config() override
esp_err_t start(audio::AudioStreamInfo &stream_info)
Starts the mixer task.
FixedVector< SourceSpeaker * > source_speakers_
speaker::Speaker * get_output_speaker() const
static void mix_audio_samples(const int16_t *primary_buffer, audio::AudioStreamInfo primary_stream_info, const int16_t *secondary_buffer, audio::AudioStreamInfo secondary_stream_info, int16_t *output_buffer, audio::AudioStreamInfo output_stream_info, uint32_t frames_to_mix)
Mixes the primary and secondary streams taking into account the number of channels in each stream.
static void copy_frames(const int16_t *input_buffer, audio::AudioStreamInfo input_stream_info, int16_t *output_buffer, audio::AudioStreamInfo output_stream_info, uint32_t frames_to_transfer)
Copies audio frames from the input buffer to the output buffer taking into account the number of chan...
std::atomic< uint32_t > frames_in_pipeline_
static void audio_mixer_task(void *params)
EventGroupHandle_t event_group_
speaker::Speaker * output_speaker_
optional< audio::AudioStreamInfo > audio_stream_info_
uint32_t buffer_duration_ms_
optional< uint32_t > timeout_ms_
float get_volume() override
void set_mute_state(bool mute_state) override
Mute state changes are passed to the parent's output speaker.
int8_t current_ducking_db_reduction_
static void duck_samples(int16_t *input_buffer, uint32_t input_samples_to_duck, int8_t *current_ducking_db_reduction, uint32_t *ducking_transition_samples_remaining, uint32_t samples_per_ducking_step, int8_t db_change_per_ducking_step)
Ducks audio samples by a specified amount.
void send_command_(uint32_t command_bit, bool wake_loop=false)
bool get_mute_state() override
uint32_t samples_per_ducking_step_
std::shared_ptr< audio::RingBufferAudioSource > audio_source_
std::atomic< uint32_t > playback_delay_frames_
std::weak_ptr< ring_buffer::RingBuffer > ring_buffer_
uint32_t stopping_start_ms_
void apply_ducking(uint8_t decibel_reduction, uint32_t duration)
Sets the ducking level for the source speaker.
int8_t target_ducking_db_reduction_
size_t play(const uint8_t *data, size_t length, TickType_t ticks_to_wait) override
size_t process_data_from_source(std::shared_ptr< audio::RingBufferAudioSource > &audio_source, TickType_t ticks_to_wait)
Exposes the next ring buffer chunk (zero-copy) and ducks the freshly exposed bytes in place.
uint32_t ducking_transition_samples_remaining_
std::atomic< bool > has_contributed_
void dump_config() override
void enter_stopping_state_()
int8_t db_change_per_ducking_step_
void set_volume(float volume) override
Volume state changes are passed to the parent's output speaker.
bool has_buffered_data() const override
uint32_t last_seen_data_ms_
EventGroupHandle_t event_group_
std::atomic< uint32_t > pending_playback_frames_
static std::unique_ptr< RingBuffer > create(size_t len, MemoryPreference preference=MemoryPreference::EXTERNAL_FIRST)
virtual void set_volume(float volume)
virtual float get_volume()
virtual bool get_pause_state() const
CallbackManager< void(uint32_t, int64_t)> audio_output_callback_
void set_audio_stream_info(const audio::AudioStreamInfo &audio_stream_info)
audio::AudioStreamInfo & get_audio_stream_info()
void add_audio_output_callback(F &&callback)
Callback function for sending the duration of the audio written to the speaker since the last callbac...
virtual bool get_mute_state()
virtual void set_mute_state(bool mute_state)
audio::AudioStreamInfo audio_stream_info_
const Component * component
void scale_audio_samples(const int16_t *audio_samples, int16_t *output_buffer, int16_t scale_factor, size_t samples_to_scale)
Scales Q15 fixed point audio samples.
@ MIXER_TASK_STATE_STOPPED
@ MIXER_TASK_STATE_RUNNING
@ MIXER_TASK_COMMAND_STOP
@ MIXER_TASK_STATE_STARTING
@ MIXER_TASK_STATE_STOPPING
@ MIXER_TASK_ERR_ESP_NO_MEM
@ MIXER_TASK_COMMAND_START
@ SOURCE_SPEAKER_COMMAND_STOP
@ SOURCE_SPEAKER_COMMAND_FINISH
@ SOURCE_SPEAKER_COMMAND_START
void HOT delay(uint32_t ms)
uint32_t IRAM_ATTR HOT millis()
Application App
Global storage of Application pointer - only one Application can exist.