espressif
diff --git a/Diff for: ‎libraries/TFLiteMicro/examples/micro_speech/README.md
+22 b/Diff for: ‎libraries/TFLiteMicro/examples/micro_speech/README.md
+22
diff --git a/Diff for: ‎libraries/TFLiteMicro/examples/micro_speech/audio_provider.cpp
+198 b/Diff for: ‎libraries/TFLiteMicro/examples/micro_speech/audio_provider.cpp
+198
diff --git a/Diff for: ‎libraries/TFLiteMicro/examples/micro_speech/audio_provider.h
+44 b/Diff for: ‎libraries/TFLiteMicro/examples/micro_speech/audio_provider.h
+44
diff --git a/Diff for: ‎libraries/TFLiteMicro/examples/micro_speech/command_responder.cpp
+27 b/Diff for: ‎libraries/TFLiteMicro/examples/micro_speech/command_responder.cpp
+27
diff --git a/Diff for: ‎libraries/TFLiteMicro/examples/micro_speech/command_responder.h
+30 b/Diff for: ‎libraries/TFLiteMicro/examples/micro_speech/command_responder.h
+30
@@ -0,0 +1,22 @@
+# Micro Speech Example
+
+This example shows how to run a 20 kB model that can recognize 2 keywords,
+"yes" and "no", from speech data.
+
+The application listens to its surroundings with a microphone and indicates
+when it has detected a word by displaying data on a screen.
+
+## Deploy to ESP32
+
+The sample has been tested on ESP-IDF version `release/v4.2` and `release/v4.4` with the following devices:
+- [ESP32-DevKitC](http://esp-idf.readthedocs.io/en/latest/get-started/get-started-devkitc.html)
+- [ESP32-S3-DevKitC](https://docs.espressif.com/projects/esp-idf/en/latest/esp32s3/hw-reference/esp32s3/user-guide-devkitc-1.html)
+- [ESP-EYE](https://github.com/espressif/esp-who/blob/master/docs/en/get-started/ESP-EYE_Getting_Started_Guide.md)
+
+### Sample output
+
+  * When a keyword is detected, you will see output like the following on the log screen:
+
+```
+Heard yes (<score>) @<time>ms
+```
@@ -0,0 +1,198 @@
+/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include "audio_provider.h"
+
+#include <cstdlib>
+#include <cstring>
+
+// FreeRTOS.h must be included before some of the following dependencies.
+// Solves b/150260343.
+// clang-format off
+#include "freertos/FreeRTOS.h"
+// clang-format on
+
+#include "driver/i2s.h"
+#include "esp_log.h"
+#include "esp_spi_flash.h"
+#include "esp_system.h"
+#include "esp_timer.h"
+#include "freertos/task.h"
+#include "ringbuf.h"
+#include "micro_model_settings.h"
+
+using namespace std;
+
+// Non-zero on targets this example treats as having no usable I2S support:
+// ESP32-C2 always, and ESP32-C3 when building against ESP-IDF older than
+// 4.4.0. The whole expansion is parenthesized so the macro stays a single
+// operand when combined with other operators (e.g. `!NO_I2S_SUPPORT`).
+#define NO_I2S_SUPPORT (CONFIG_IDF_TARGET_ESP32C2 || \
+                        (CONFIG_IDF_TARGET_ESP32C3 \
+                         && (ESP_IDF_VERSION < ESP_IDF_VERSION_VAL(4, 4, 0))))
+
+/* Tag passed to the ESP_LOGx macros in this file. */
+static const char* TAG = "TF_LITE_AUDIO_PROVIDER";
+/* Ring buffer holding the incoming audio data. It is created in
+ * InitAudioRecording(), written by the CaptureSamples task and read by
+ * GetAudioSamples(). */
+ringbuf_t* g_audio_capture_buffer;
+/* Running timestamp in milliseconds. CaptureSamples advances it after writing
+ * to the ring buffer; InitAudioRecording() polls it until it becomes non-zero
+ * and LatestAudioTimestamp() returns it. */
+volatile int32_t g_latest_audio_timestamp = 0;
+/* Number of samples carried over from one GetAudioSamples() call to the next:
+ * the part of a feature slice that overlaps the previous one, i.e.
+ * (slice duration - slice stride) in ms times samples per ms. The original
+ * note gives this as 10 ms * 16 samples/ms; the actual values come from
+ * micro_model_settings.h, which is not visible here. */
+constexpr int32_t history_samples_to_keep =
+    ((kFeatureSliceDurationMs - kFeatureSliceStrideMs) *
+     (kAudioSampleFrequency / 1000));
+/* Number of new samples fetched from the ring buffer on each
+ * GetAudioSamples() call: one slice stride worth of audio. The original note
+ * gives this as 20 ms * 16 samples/ms. */
+constexpr int32_t new_samples_to_get =
+    (kFeatureSliceStrideMs * (kAudioSampleFrequency / 1000));
+
+namespace {
+/* Buffer handed back to the caller of GetAudioSamples(): history samples
+ * first, followed by the newly read samples. */
+int16_t g_audio_output_buffer[kMaxAudioSampleSize];
+/* Set once InitAudioRecording() has succeeded from GetAudioSamples(). */
+bool g_is_audio_initialized = false;
+/* Tail of the previous output buffer, re-used as the head of the next one. */
+int16_t g_history_buffer[history_samples_to_keep];
+}  // namespace
+
+/* Size passed to rb_init() for the capture ring buffer. */
+const int32_t kAudioCaptureBufferSize = 80000;
+/* Bytes requested per i2s_read() call. With the 16-bit, single-channel,
+ * 16 kHz configuration in i2s_init() this is 1600 samples, i.e. 100 ms. */
+const int32_t i2s_bytes_to_read = 3200;
+
+#if NO_I2S_SUPPORT
+  // nothing to be done here
+#else
+/* Installs and configures the I2S driver on port 1 for 16 kHz, 16-bit,
+ * left-channel-only capture, then clears the DMA buffers. A step that fails
+ * is reported through ESP_LOGE; the remaining steps are still attempted. */
+static void i2s_init(void) {
+  const i2s_port_t capture_port = (i2s_port_t)1;
+
+  // Driver settings: MONO @ 16KHz, master mode.
+  i2s_config_t driver_cfg = {
+      .mode = (i2s_mode_t)(I2S_MODE_MASTER | I2S_MODE_RX | I2S_MODE_TX),
+      .sample_rate = 16000,
+      .bits_per_sample = (i2s_bits_per_sample_t)16,
+      .channel_format = I2S_CHANNEL_FMT_ONLY_LEFT,
+      .communication_format = I2S_COMM_FORMAT_I2S,
+      .intr_alloc_flags = 0,
+      .dma_buf_count = 3,
+      .dma_buf_len = 300,
+      .use_apll = false,
+      .tx_desc_auto_clear = false,
+      .fixed_mclk = -1,
+  };
+
+  // GPIO routing; -1 leaves the data-out line unconnected.
+  i2s_pin_config_t pins = {
+      .bck_io_num = 26,    // IIS_SCLK
+      .ws_io_num = 32,     // IIS_LCLK
+      .data_out_num = -1,  // IIS_DSIN
+      .data_in_num = 33,   // IIS_DOUT
+  };
+
+  if (i2s_driver_install(capture_port, &driver_cfg, 0, NULL) != ESP_OK) {
+    ESP_LOGE(TAG, "Error in i2s_driver_install");
+  }
+
+  if (i2s_set_pin(capture_port, &pins) != ESP_OK) {
+    ESP_LOGE(TAG, "Error in i2s_set_pin");
+  }
+
+  if (i2s_zero_dma_buffer(capture_port) != ESP_OK) {
+    ESP_LOGE(TAG, "Error in initializing dma buffer with 0");
+  }
+}
+#endif
+
+/* FreeRTOS task body: repeatedly reads audio from I2S port 1 and pushes it
+ * into g_audio_capture_buffer, advancing g_latest_audio_timestamp by the
+ * duration (in ms) of the data that was actually queued.
+ *
+ * arg is unused. A FreeRTOS task function must not return to its caller, so
+ * the only way out of this function is through vTaskDelete(NULL). */
+static void CaptureSamples(void* arg) {
+  (void)arg;
+#if NO_I2S_SUPPORT
+  /* Fall through to vTaskDelete() below instead of returning from the task. */
+  ESP_LOGE(TAG, "i2s support not available on C3 chip for IDF < 4.4.0");
+#else
+  uint8_t i2s_read_buffer[i2s_bytes_to_read] = {};
+  i2s_init();
+  while (1) {
+    /* read 100ms data at once from i2s */
+    size_t bytes_read = 0;
+    esp_err_t read_status =
+        i2s_read((i2s_port_t)1, (void*)i2s_read_buffer, i2s_bytes_to_read,
+                 &bytes_read, pdMS_TO_TICKS(100));
+    if (read_status != ESP_OK || bytes_read == 0) {
+      ESP_LOGE(TAG, "Error in I2S read : %d", (int)bytes_read);
+      if (read_status != ESP_OK) {
+        /* A failing driver call returns immediately; back off so this task
+         * does not spin while retrying. */
+        vTaskDelay(pdMS_TO_TICKS(100));
+      }
+      continue;
+    }
+    if (bytes_read < (size_t)i2s_bytes_to_read) {
+      ESP_LOGW(TAG, "Partial I2S read");
+    }
+
+    /* write bytes read by i2s into ring buffer */
+    int bytes_written = rb_write(g_audio_capture_buffer,
+                                 (uint8_t*)i2s_read_buffer, bytes_read,
+                                 pdMS_TO_TICKS(100));
+    if (bytes_written <= 0) {
+      /* Nothing was queued: leave the timestamp alone so it never moves
+       * backwards on an error return. */
+      ESP_LOGE(TAG, "Could Not Write in Ring Buffer: %d ", bytes_written);
+      continue;
+    }
+    if ((size_t)bytes_written < bytes_read) {
+      ESP_LOGW(TAG, "Partial Write");
+    }
+
+    /* update the timestamp (in ms) to let the model know that new data has
+     * arrived; two bytes per 16-bit sample */
+    g_latest_audio_timestamp = g_latest_audio_timestamp +
+        ((1000 * (bytes_written / 2)) / kAudioSampleFrequency);
+  }
+#endif
+  vTaskDelete(NULL);
+}
+
+/* Creates the capture ring buffer, starts the CaptureSamples task and then
+ * blocks until that task has published a non-zero timestamp.
+ *
+ * Returns kTfLiteOk once the first audio has been queued, or kTfLiteError if
+ * the ring buffer or the task could not be created. The wait for the first
+ * timestamp has no timeout. */
+TfLiteStatus InitAudioRecording() {
+  /* Reuse a buffer left over from an earlier failed attempt rather than
+   * allocating another one and losing track of the first. */
+  if (!g_audio_capture_buffer) {
+    g_audio_capture_buffer = rb_init("tf_ringbuffer", kAudioCaptureBufferSize);
+  }
+  if (!g_audio_capture_buffer) {
+    ESP_LOGE(TAG, "Error creating ring buffer");
+    return kTfLiteError;
+  }
+  /* create CaptureSamples Task which will get the i2s_data from mic and fill it
+   * in the ring buffer */
+  if (xTaskCreate(CaptureSamples, "CaptureSamples", 1024 * 32, NULL, 10,
+                  NULL) != pdPASS) {
+    /* Without the task the timestamp would never change and the loop below
+     * would spin forever. */
+    ESP_LOGE(TAG, "Error creating CaptureSamples task");
+    return kTfLiteError;
+  }
+  while (!g_latest_audio_timestamp) {
+    vTaskDelay(1); // one tick delay to avoid watchdog
+  }
+  ESP_LOGI(TAG, "Audio Recording started");
+  return kTfLiteOk;
+}
+
+/* Assembles the next block of audio for the caller.
+ *
+ * The output buffer is filled with the samples kept from the previous call
+ * followed by up to new_samples_to_get fresh samples taken from the capture
+ * ring buffer; the tail of the result is then saved as history for the next
+ * call. Recording is started lazily on the first call.
+ *
+ * start_ms and duration_ms are not used by this implementation.
+ * On return *audio_samples_size is kMaxAudioSampleSize and *audio_samples
+ * points at a buffer that is overwritten by the next call.
+ *
+ * Returns the status of InitAudioRecording() if starting the recording fails,
+ * otherwise kTfLiteOk (a short or failed ring buffer read is only logged). */
+TfLiteStatus GetAudioSamples(int start_ms, int duration_ms,
+                             int* audio_samples_size, int16_t** audio_samples) {
+  const size_t history_bytes = history_samples_to_keep * sizeof(int16_t);
+  const size_t fresh_bytes = new_samples_to_get * sizeof(int16_t);
+
+  if (!g_is_audio_initialized) {
+    const TfLiteStatus started = InitAudioRecording();
+    if (started != kTfLiteOk) {
+      return started;
+    }
+    g_is_audio_initialized = true;
+  }
+
+  /* The head of the output is the history saved by the previous call. */
+  memcpy(g_audio_output_buffer, g_history_buffer, history_bytes);
+
+  /* Fresh samples land directly behind the history region. */
+  int16_t* const fresh_region = g_audio_output_buffer + history_samples_to_keep;
+  const int got = rb_read(g_audio_capture_buffer, (uint8_t*)fresh_region,
+                          fresh_bytes, pdMS_TO_TICKS(100));
+  if (got < 0) {
+    ESP_LOGE(TAG, " Model Could not read data from Ring Buffer");
+  } else if ((size_t)got < fresh_bytes) {
+    ESP_LOGD(TAG, "RB FILLED RIGHT NOW IS %d",
+             rb_filled(g_audio_capture_buffer));
+    ESP_LOGD(TAG, " Partial Read of Data by Model ");
+    ESP_LOGV(TAG, " Could only read %d bytes when required %d bytes ",
+             got, (int)fresh_bytes);
+  }
+
+  /* Keep the tail of this buffer as the history for the next call. */
+  memcpy(g_history_buffer, g_audio_output_buffer + new_samples_to_get,
+         history_bytes);
+
+  *audio_samples_size = kMaxAudioSampleSize;
+  *audio_samples = g_audio_output_buffer;
+  return kTfLiteOk;
+}
+
+/* Returns the current value of g_latest_audio_timestamp, the millisecond
+ * counter that the capture task advances as it queues audio. */
+int32_t LatestAudioTimestamp() {
+  const int32_t latest_ms = g_latest_audio_timestamp;
+  return latest_ms;
+}
@@ -0,0 +1,44 @@
+/* Copyright 2018 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#ifndef TENSORFLOW_LITE_MICRO_EXAMPLES_MICRO_SPEECH_AUDIO_PROVIDER_H_
+#define TENSORFLOW_LITE_MICRO_EXAMPLES_MICRO_SPEECH_AUDIO_PROVIDER_H_
+
+#include "tensorflow/lite/c/common.h"
+
+// This is an abstraction around an audio source like a microphone, and is
+// expected to return 16-bit PCM sample data for a given point in time. The
+// sample data itself should be used as quickly as possible by the caller, since
+// to allow memory optimizations there are no guarantees that the samples won't
+// be overwritten by new data in the future. In practice, implementations should
+// ensure that there's a reasonable time allowed for clients to access the data
+// before any reuse.
+// The reference implementation can have no platform-specific dependencies, so
+// it just returns an array filled with zeros. For real applications, you should
+// ensure there's a specialized implementation that accesses hardware APIs.
+//
+// Notes on the implementation in audio_provider.cpp next to this header:
+//   - start_ms and duration_ms are accepted but not read.
+//   - *audio_samples_size is set to kMaxAudioSampleSize and *audio_samples to
+//     an internal buffer that is overwritten by the next call.
+//   - The first call starts audio recording; if that fails its error status is
+//     returned and the output parameters are left untouched. Otherwise
+//     kTfLiteOk is returned.
+TfLiteStatus GetAudioSamples(int start_ms, int duration_ms,
+                             int* audio_samples_size, int16_t** audio_samples);
+
+// Returns the time that audio data was last captured in milliseconds. There's
+// no contract about what time zero represents, the accuracy, or the granularity
+// of the result. Subsequent calls will generally not return a lower value, but
+// even that's not guaranteed if there's an overflow wraparound.
+// The reference implementation of this function just returns a constantly
+// incrementing value for each call, since it would need a non-portable platform
+// call to access time information. For real applications, you'll need to write
+// your own platform-specific implementation.
+//
+// In audio_provider.cpp next to this header, the returned value is a counter
+// that the audio capture task advances by the duration of the audio it has
+// written to its ring buffer; it is zero until the first write.
+int32_t LatestAudioTimestamp();
+
+#endif  // TENSORFLOW_LITE_MICRO_EXAMPLES_MICRO_SPEECH_AUDIO_PROVIDER_H_
@@ -0,0 +1,27 @@
+/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include "command_responder.h"
+#include "tensorflow/lite/micro/micro_log.h"
+
+// Default responder: reports a newly recognized command, together with its
+// score and timestamp, through MicroPrintf and ignores everything else.
+// Real applications will want to take some custom action instead, and should
+// implement their own versions of this function.
+void RespondToCommand(int32_t current_time, const char* found_command,
+                      uint8_t score, bool is_new_command) {
+  // Nothing to report unless the command is new.
+  if (!is_new_command) {
+    return;
+  }
+  MicroPrintf("Heard %s (%d) @%dms", found_command, score, current_time);
+}
@@ -0,0 +1,30 @@
+/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+// Provides an interface to take an action based on an audio command.
+
+#ifndef TENSORFLOW_LITE_MICRO_EXAMPLES_MICRO_SPEECH_COMMAND_RESPONDER_H_
+#define TENSORFLOW_LITE_MICRO_EXAMPLES_MICRO_SPEECH_COMMAND_RESPONDER_H_
+
+#include "tensorflow/lite/c/common.h"
+
+// Called every time the results of an audio recognition run are available. The
+// human-readable name of any recognized command is in the `found_command`
+// argument, `score` has the numerical confidence, and `is_new_command` is set
+// if the previous command was different to this one.
+// `current_time` is the timestamp associated with the result; the
+// implementation in command_responder.cpp prints it with an "ms" suffix.
+void RespondToCommand(int32_t current_time, const char* found_command,
+                      uint8_t score, bool is_new_command);
+
+#endif  // TENSORFLOW_LITE_MICRO_EXAMPLES_MICRO_SPEECH_COMMAND_RESPONDER_H_