diff --git a/CHANGELOG.md b/CHANGELOG.md index 8694918..7497327 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -4,6 +4,9 @@ - Available storage is less than the remaining flash space on IDF v5.0. If you can not map model partition successfully, please check the left free storage by `spi_flash_mmap_get_free_pages(ESP_PARTITION_MMAP_DATA)` or update IDF to v5.1 or later. +## 1.7.1 +- Add 喵喵同学, Hi,Joy, and Hi,Lily/Hi,莉莉 wakenet models + ## 1.7.0 - Add first Noise Suppression model: nsnet2 - Add more wake word model trained by TTS sample diff --git a/CMakeLists.txt b/CMakeLists.txt index 688a7a7..8275dd4 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -72,6 +72,7 @@ elseif(${IDF_TARGET} STREQUAL "esp32s3") target_link_libraries(${COMPONENT_TARGET} "-L ${CMAKE_CURRENT_SOURCE_DIR}/lib/esp32s3") target_link_libraries(${COMPONENT_TARGET} "-L ${CMAKE_CURRENT_SOURCE_DIR}/esp-tts/esp_tts_chinese/esp32s3") + add_prebuilt_library(flite_g2p "${CMAKE_CURRENT_SOURCE_DIR}/lib/esp32s3/libflite_g2p.a" PRIV_REQUIRES ${COMPONENT_NAME}) add_prebuilt_library(esp_audio_processor "${CMAKE_CURRENT_SOURCE_DIR}/lib/esp32s3/libesp_audio_processor.a" PRIV_REQUIRES ${COMPONENT_NAME}) add_prebuilt_library(wakenet "${CMAKE_CURRENT_SOURCE_DIR}/lib/esp32s3/libwakenet.a" PRIV_REQUIRES ${COMPONENT_NAME}) add_prebuilt_library(multinet "${CMAKE_CURRENT_SOURCE_DIR}/lib/esp32s3/libmultinet.a" PRIV_REQUIRES ${COMPONENT_NAME}) diff --git a/Kconfig.projbuild b/Kconfig.projbuild index c109183..3f9e2cc 100644 --- a/Kconfig.projbuild +++ b/Kconfig.projbuild @@ -158,6 +158,10 @@ choice SR_WN_MODEL_LOAD bool "Hi,Joy (wn9_hijoy_tts)" depends on IDF_TARGET_ESP32S3 + config SR_WN_WN9_HILILI_TTS + bool "Hi,Lily/Hi,莉莉 (wn9_hilili_tts)" + depends on IDF_TARGET_ESP32S3 + config SR_WN_WN9_CUSTOMWORD bool "customized word (wn9_customword)" depends on IDF_TARGET_ESP32S3 @@ -231,6 +235,10 @@ menu "Load Multiple Wake Words" bool "Hi,Joy (wn9_hijoy_tts)" depends on IDF_TARGET_ESP32S3 + config SR_WN_WN9_HILILI_TTS_MULTI + 
bool "Hi,Lily/Hi,莉莉 (wn9_hilili_tts)" + depends on IDF_TARGET_ESP32S3 + endmenu config USE_MULTINET diff --git a/README.md b/README.md index b169cfe..a7982f2 100644 --- a/README.md +++ b/README.md @@ -25,7 +25,8 @@ The new algorithms will no longer support ESP32 chips. Espressif wake word engine **WakeNet** is specially designed to provide a high performance and low memory footprint wake word detection algorithm for users, which enables devices always listen to wake words, such as “Alexa”, “Hi,lexin” and “Hi,ESP”. -Espressif has not only provided an official wake word "Hi,Lexin","Hi,ESP" to the public for free, but also allows customized wake words. For details on how to customize your own wake words, please see [Espressif Speech Wake Words Customization Process](https://docs.espressif.com/projects/esp-sr/en/latest/esp32s3/wake_word_engine/ESP_Wake_Words_Customization.html) or [Training Wake Words by TTS sample](https://github.com/espressif/esp-sr/issues/88). +Espressif offers two ways to customize the wake word. Please refer to the following documents to choose the one that meets your needs: +[Espressif Speech Wake Words Customization Process](https://docs.espressif.com/projects/esp-sr/en/latest/esp32s3/wake_word_engine/ESP_Wake_Words_Customization.html) or [Training Wake Words by TTS sample](https://github.com/espressif/esp-sr/issues/88). The following wake words are supported in esp-sr: @@ -49,8 +50,9 @@ The following wake words are supported in esp-sr: |Hi,小星 | | wn9_hixiaoxing_tts | |小龙小龙 | | wn9_xiaolongxiaolong_tts | |喵喵同学 | | wn9_miaomiaotongxue_tts | +|Hi,Lily/Hi,莉莉 | | wn9_hilili_tts | -*NOTE:* `_tts` suffix means this WakeNet model is trained by TTS samples. +*NOTE:* `_tts` suffix means this WakeNet model is trained by TTS samples. 
## Speech Command Recognition diff --git a/idf_component.yml b/idf_component.yml index c7daf08..ec51140 100644 --- a/idf_component.yml +++ b/idf_component.yml @@ -1,4 +1,4 @@ -version: "1.7.0" +version: "1.7.1" description: esp_sr provides basic algorithms for Speech Recognition applications url: https://github.com/espressif/esp-sr dependencies: diff --git a/model/wakenet_model/wn9_hilili_tts/_MODEL_INFO_ b/model/wakenet_model/wn9_hilili_tts/_MODEL_INFO_ new file mode 100644 index 0000000..53f380e --- /dev/null +++ b/model/wakenet_model/wn9_hilili_tts/_MODEL_INFO_ @@ -0,0 +1,2 @@ +# (neural network type)_(model data version)_(label1_detection window length_threshold for 90%_threshold for 95%)_(label2 ...)_... +wakenet9l_tts1h8_Hilily_3_0.633_0.639 \ No newline at end of file diff --git a/model/wakenet_model/wn9_hilili_tts/wn9_data b/model/wakenet_model/wn9_hilili_tts/wn9_data new file mode 100644 index 0000000..e32961d Binary files /dev/null and b/model/wakenet_model/wn9_hilili_tts/wn9_data differ diff --git a/model/wakenet_model/wn9_hilili_tts/wn9_index b/model/wakenet_model/wn9_hilili_tts/wn9_index new file mode 100644 index 0000000..5e7c881 Binary files /dev/null and b/model/wakenet_model/wn9_hilili_tts/wn9_index differ