| /* |
| * Copyright (c) 2019-2021, The Linux Foundation. All rights reserved. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions are |
| * met: |
| * * Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * * Redistributions in binary form must reproduce the above |
| * copyright notice, this list of conditions and the following |
| * disclaimer in the documentation and/or other materials provided |
| * with the distribution. |
| * * Neither the name of The Linux Foundation nor the names of its |
| * contributors may be used to endorse or promote products derived |
| * from this software without specific prior written permission. |
| * |
| * THIS SOFTWARE IS PROVIDED "AS IS" AND ANY EXPRESS OR IMPLIED |
| * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF |
| * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT |
| * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS |
| * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR |
| * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF |
| * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR |
| * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, |
| * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE |
| * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN |
| * IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| * |
| * Changes from Qualcomm Innovation Center are provided under the following license |
| * |
| * Copyright (c) 2022 Qualcomm Innovation Center, Inc. All rights reserved. |
| * SPDX-License-Identifier: BSD-3-Clause-Clear |
| */ |
| |
| |
| #ifndef SOUNDTRIGGERENGINE_H |
| #define SOUNDTRIGGERENGINE_H |
| |
| #include <condition_variable> |
| #include <thread> |
| #include <mutex> |
| #include <vector> |
| #include <chrono> |
| |
| #include "PalDefs.h" |
| #include "PalCommon.h" |
| #include "PalRingBuffer.h" |
| #include "Device.h" |
| #include "SoundTriggerUtils.h" |
| #include "VoiceUIPlatformInfo.h" |
| #include "VoiceUIInterface.h" |
| |
/*
 * Capacity of detection_event_info_pdk::detected_model_stats.
 * Kept as a macro (not constexpr) so the preprocessor-visible interface of
 * this header stays unchanged.
 */
#define MAX_MODELS_SUPPORTED 8

/* Unit-conversion constants. */
#define BITS_PER_BYTE 8
#define US_PER_SEC 1000000  /* microseconds per second */
#define MS_PER_SEC 1000     /* milliseconds per second */


/* A point in time measured on std::chrono::steady_clock. */
using ChronoSteadyClock_t = std::chrono::time_point<std::chrono::steady_clock>;

/*
 * Forward declarations of types that the declarations in this header refer
 * to through pointers or std::shared_ptr.
 */
class Stream;
class VoiceUIInterface;
| |
/*
 * Detection statistics for a single model.
 *
 * detection_event_info_pdk holds an array of these, one slot per model.
 * The struct consists of ten consecutive 32-bit fields.
 *
 * NOTE(review): each *_lsw / *_msw pair presumably carries the least- and
 * most-significant 32-bit halves of one 64-bit timestamp -- confirm against
 * the producer of this payload.
 */
struct model_stats
{
    uint32_t detected_model_id;
    uint32_t detected_keyword_id;
    uint32_t best_channel_idx;
    uint32_t best_confidence_level;
    /* Keyword start timestamp. */
    uint32_t kw_start_timestamp_lsw;
    uint32_t kw_start_timestamp_msw;
    /* Keyword end timestamp. */
    uint32_t kw_end_timestamp_lsw;
    uint32_t kw_end_timestamp_msw;
    /* Detection timestamp. */
    uint32_t detection_timestamp_lsw;
    uint32_t detection_timestamp_msw;
};
| |
| struct detection_event_info_pdk |
| { |
| uint32_t num_detected_models; |
| struct model_stats detected_model_stats[MAX_MODELS_SUPPORTED]; |
| uint32_t ftrt_data_length_in_us; |
| }; |
| |
/*
 * Detection event carrying a flat list of confidence levels.
 *
 * confidence_levels is a fixed 20-byte array.
 *
 * NOTE(review): num_confidence_levels presumably gives the number of valid
 * entries in confidence_levels, and each *_lsw / *_msw pair presumably holds
 * the low and high 32-bit halves of one 64-bit timestamp -- confirm against
 * the producer of this payload.
 */
struct detection_event_info
{
    uint16_t status;
    uint16_t num_confidence_levels;
    uint8_t confidence_levels[20];
    /* Keyword start timestamp. */
    uint32_t kw_start_timestamp_lsw;
    uint32_t kw_start_timestamp_msw;
    /* Keyword end timestamp. */
    uint32_t kw_end_timestamp_lsw;
    uint32_t kw_end_timestamp_msw;
    /* Detection timestamp. */
    uint32_t detection_timestamp_lsw;
    uint32_t detection_timestamp_msw;
    /* A data length expressed in microseconds (per the _in_us suffix). */
    uint32_t ftrt_data_length_in_us;
};
| |
| class SoundTriggerEngine |
| { |
| public: |
| static std::shared_ptr<SoundTriggerEngine> Create(Stream *s, |
| listen_model_indicator_enum type, st_module_type_t module_type, |
| std::shared_ptr<VUIStreamConfig> sm_cfg); |
| |
| virtual ~SoundTriggerEngine() {} |
| |
| virtual int32_t LoadSoundModel(Stream *s, uint8_t *data, |
| uint32_t data_size) = 0; |
| virtual int32_t UnloadSoundModel(Stream *s) = 0; |
| virtual int32_t StartRecognition(Stream *s) = 0; |
| virtual int32_t RestartRecognition(Stream *s) = 0; |
| virtual int32_t StopRecognition(Stream *s) = 0; |
| virtual int32_t UpdateConfLevels( |
| Stream *s, |
| struct pal_st_recognition_config *config, |
| uint8_t *conf_levels, |
| uint32_t num_conf_levels) = 0; |
| virtual int32_t UpdateBufConfig(Stream *s, uint32_t hist_buffer_duration, |
| uint32_t pre_roll_duration) = 0; |
| virtual void GetUpdatedBufConfig(uint32_t *hist_buffer_duration, |
| uint32_t *pre_roll_duration) = 0; |
| virtual void SetDetected(bool detected) = 0; |
| virtual int32_t GetParameters(uint32_t param_id, void **payload) = 0; |
| virtual int32_t ConnectSessionDevice( |
| Stream* stream_handle, |
| pal_stream_type_t stream_type, |
| std::shared_ptr<Device> device_to_connect) = 0; |
| virtual int32_t DisconnectSessionDevice( |
| Stream* stream_handle, |
| pal_stream_type_t stream_type, |
| std::shared_ptr<Device> device_to_disconnect) = 0; |
| virtual int32_t SetupSessionDevice( |
| Stream* streamHandle, |
| pal_stream_type_t streamType, |
| std::shared_ptr<Device> deviceToConnect) = 0; |
| virtual void DetachStream(Stream *s, bool erase_engine) {} |
| virtual void SetCaptureRequested(bool is_requested) = 0; |
| virtual void UpdateStateToActive() {}; |
| virtual int32_t ReconfigureDetectionGraph(Stream *s) { return 0; } |
| virtual int32_t setECRef( |
| Stream *s, |
| std::shared_ptr<Device> dev, |
| bool is_enable, |
| bool setEcForFirstTime) = 0; |
| virtual ChronoSteadyClock_t GetDetectedTime() = 0; |
| |
| int32_t CreateBuffer(uint32_t buffer_size, uint32_t engine_size, |
| std::vector<PalRingBufferReader *> &reader_list); |
| int32_t SetBufferReader(PalRingBufferReader *reader); |
| int32_t ResetBufferReaders(std::vector<PalRingBufferReader *> &reader_list); |
| uint32_t UsToBytes(uint64_t input_us); |
| uint32_t FrameToBytes(uint32_t frames); |
| uint32_t BytesToFrames(uint32_t bytes); |
| |
| std::shared_ptr<VoiceUIInterface> GetVoiceUIInterface() { return vui_intf_; } |
| void SetVoiceUIInterface(std::shared_ptr<VoiceUIInterface> intf) { |
| vui_intf_ = intf; |
| } |
| |
| protected: |
| listen_model_indicator_enum engine_type_; |
| std::shared_ptr<VoiceUIPlatformInfo> vui_ptfm_info_; |
| std::shared_ptr<VUIStreamConfig> sm_cfg_; |
| std::shared_ptr<VoiceUIInterface> vui_intf_; |
| uint8_t *sm_data_; |
| uint32_t sm_data_size_; |
| bool capture_requested_; |
| Stream *stream_handle_; |
| PalRingBuffer *buffer_; |
| PalRingBufferReader *reader_; |
| uint32_t sample_rate_; |
| uint32_t bit_width_; |
| uint32_t channels_; |
| |
| std::thread buffer_thread_handler_; |
| std::mutex mutex_; |
| std::condition_variable cv_; |
| bool exit_thread_; |
| bool exit_buffering_; |
| }; |
| |
| #endif // SOUNDTRIGGERENGINE_H |