hal: Extract source track meta data - Source track meta data is extracted with STT algo running in Android Audio record path. Change-Id: Id1a4e0811df0f9a11ed32e44e18e962243b09e91

commit: cf29fe9000e706022f53fbe69e1fa64a4363440c [log] [tgz]
author: Hari Krishna Chowdary Yennana <quic_hyennnan@quicinc.com> Mon Jun 26 16:44:23 2023 +0530
committer: Hari Krishna Chowdary Yennana <quic_hyennnan@quicinc.com> Thu Aug 17 16:51:05 2023 +0530
tree: b024ba23f52707ff0c613911cd9b154960eb8968
parent: 0859aa48ee398832b6deec3633e248cb25ecf223 [diff]
diff --git a/Android.mk b/Android.mk
index 34effe0..bd1bae2 100644
--- a/Android.mk
+++ b/Android.mk

@@ -19,6 +19,9 @@
 include $(MY_LOCAL_PATH)/post_proc/Android.mk
 include $(MY_LOCAL_PATH)/qahw/Android.mk
 include $(MY_LOCAL_PATH)/qahw_api/Android.mk
+ifeq ($(AUDIO_FEATURE_ENABLED_STT_SUPPORT),true)
+include $(MY_LOCAL_PATH)/stt_meta/Android.mk
+endif
 endif
 
 ifeq ($(USE_LEGACY_AUDIO_DAEMON), true)

diff --git a/stt_meta/Android.mk b/stt_meta/Android.mk
new file mode 100644
index 0000000..8ebd0a5
--- /dev/null
+++ b/stt_meta/Android.mk

@@ -0,0 +1,21 @@
+LOCAL_PATH := $(call my-dir)
+
+# stt_meta_extract
+# ==============================================================================
+include $(CLEAR_VARS)
+LOCAL_SRC_FILES := stt_meta_extract.c
+LOCAL_MODULE := stt_meta_extract
+LOCAL_CFLAGS += -Wall -Werror -Wno-sign-compare
+LOCAL_SHARED_LIBRARIES := \
+    libtinyalsa \
+    libcutils \
+    liblog
+
+LOCAL_C_INCLUDES += \
+    external/tinyalsa/include
+
+LOCAL_32_BIT_ONLY := true
+
+LOCAL_VENDOR_MODULE := true
+
+include $(BUILD_EXECUTABLE)

diff --git a/stt_meta/stt_meta_extract.c b/stt_meta/stt_meta_extract.c
new file mode 100644
index 0000000..49932bc
--- /dev/null
+++ b/stt_meta/stt_meta_extract.c

@@ -0,0 +1,531 @@
+/*
+* Copyright (c) 2015-2019, The Linux Foundation. All rights reserved.
+* Copyright (c) 2021,2023 Qualcomm Innovation Center, Inc. All rights reserved.
+*
+* Redistribution and use in source and binary forms, with or without
+* modification, are permitted provided that the following conditions are
+* met:
+*    * Redistributions of source code must retain the above copyright
+*      notice, this list of conditions and the following disclaimer.
+*    * Redistributions in binary form must reproduce the above
+*      copyright notice, this list of conditions and the following
+*      disclaimer in the documentation and/or other materials provided
+*      with the distribution.
+*    * Neither the name of The Linux Foundation nor the names of its
+*      contributors may be used to endorse or promote products derived
+*      from this software without specific prior written permission.
+*
+* THIS SOFTWARE IS PROVIDED "AS IS" AND ANY EXPRESS OR IMPLIED
+* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT
+* ARE DISCLAIMED.  IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS
+* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+* WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+* OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+* IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+*/
+
+/* Test app to capture STT data using ctls from kernel */
+
+#include <tinyalsa/asoundlib.h>
+#include <errno.h>
+#include <math.h>
+#include "stt_meta_extract.h"
+#include <log/log.h>
+#include <cutils/str_parms.h>
+#include <cutils/properties.h>
+#undef LOG_TAG
+#define LOG_TAG "stt_meta"
+#undef LOG_NDEBUG
+/*#define LOG_NDDEBUG 0*/
+/*#define LOG_NDEBUG 0*/
+
+#define nullptr NULL
+
+static int get_sourcetrack_metadata(void *payload, unsigned int meta_size,
+                                                  struct mixer_ctl *ctl) {
+
+    int ret = 0;
+    unsigned int count;
+
+    if (!ctl || !payload) {
+        ALOGE("%s: Invalid params, ctl / source track payload is NULL", __func__);
+        return -EINVAL;
+    }
+
+    ALOGD("%s from mixer", __func__);
+    mixer_ctl_update(ctl);
+
+    count = mixer_ctl_get_num_values(ctl);
+
+    if (count != meta_size) {
+        ALOGE("%s: mixer_ctl_get_num_values() invalid source tracking data size %d",
+                                                                    __func__, count);
+        ret = -EINVAL;
+        goto done;
+    }
+
+    ret = mixer_ctl_get_array(ctl, payload, count);
+
+    if (ret != 0) {
+        ALOGE("%s: mixer_ctl_get_array() failed to get Source Tracking Params", __func__);
+        ret = -EINVAL;
+        goto done;
+    }
+
+done:
+    ALOGD("%s exit with %d", __func__, ret);
+    return ret;
+}
+
+static int get_soundfocus_metadata(struct sound_focus_meta *sound_focus_meta,
+                                                     struct mixer_ctl *ctl) {
+    int ret = 0, count;
+    struct timespec ts;
+
+    if (!ctl) {
+        ALOGE("%s: not a valid ctrl", __func__);
+        return -EINVAL;
+    } else {
+        ALOGD("%s: from mixer", __func__);
+        mixer_ctl_update(ctl);
+        count = mixer_ctl_get_num_values(ctl);
+
+        if (count != (sizeof(struct sound_focus_meta) - sizeof(ts))) {
+            ALOGE("%s: mixer_ctl_get_num_values() invalid sound focus data size %d",
+                                                                           __func__, count);
+            ret = -EINVAL;
+            goto done;
+        }
+
+        ret = mixer_ctl_get_array(ctl, (void *)sound_focus_meta, count);
+        if (ret != 0) {
+            ALOGE("%s: mixer_ctl_get_array() failed to get Sound Focus Params", __func__);
+            ret = -EINVAL;
+            goto done;
+        }
+
+        clock_gettime(CLOCK_MONOTONIC, &ts);
+        sound_focus_meta->ts = ts;
+    }
+
+done:
+    ALOGD("%s exit with %d", __func__, ret);
+    return ret;
+}
+
+static int set_soundfocus_metadata(struct sound_focus_meta *sound_focus_meta,
+                                                     struct mixer_ctl *ctl) {
+    int ret = 0, count;
+    struct timespec ts;
+
+    if (!ctl) {
+        ALOGE("%s: not a valid ctrl", __func__);
+        return -EINVAL;
+    } else {
+        ALOGD("%s: Setting Sound Focus Params func", __func__);
+        mixer_ctl_update(ctl);
+        count = mixer_ctl_get_num_values(ctl);
+
+        if (count != (sizeof(struct sound_focus_meta) - sizeof(ts))) {
+            ALOGE("%s: mixer_ctl_get_num_values() invalid sound focus data size %d",
+                                                                           __func__, count);
+            ret = -EINVAL;
+            goto done;
+        }
+
+        ret = mixer_ctl_set_array(ctl, (void *)sound_focus_meta, count);
+        if (ret != 0) {
+            ALOGE("%s: mixer_ctl_set_array() failed to set Sound Focus Params", __func__);
+            ret = -EINVAL;
+            goto done;
+        }
+    }
+
+done:
+    ALOGD("%s exit with %d", __func__, ret);
+    return ret;
+}
+
+static void updatestt_data(char* str, struct sound_focus_meta *sound_focus_meta) {
+    int str_len = strlen(str);
+    int j = 0, i;
+    int *arr=(int*)malloc(str_len*sizeof(int));
+
+    for (i = 0; str[i] != '\0'; i++) {
+        if (str[i] == ',')
+            j++;
+        else
+            arr[j] = arr[j] * DECI + (str[i] - ASCI_NUM);
+    }
+    j=0;
+    for (i = 0; i < NUM_SECTORS; i++) {
+        sound_focus_meta->start_angle[i] = arr[j++];
+    }
+    for (i = 0; i < NUM_SECTORS; i++) {
+        sound_focus_meta->enable[i] = arr[j++];
+    }
+    sound_focus_meta->gain_step = arr[j];
+}
+
+static void usage() {
+    printf(" \n Command \n");
+    printf(" \n stt_meta_extract <options>\n");
+    printf(" \n Options\n");
+    printf(" -t  --source_track_data         - get source tracking params data with recording\n");
+    printf(" -f  --sound_focus_data          - get sound focus params data with recording\n");
+    printf(" -s  --sound focus set           - set sound focus params data with recording\n\n");
+    printf(" -g  --meta-time-gap             - time between successive get data in msec\n\n");
+    printf(" -n  --get-data-iterations       - get iterations cnt, (-ve) for cont get data\n\n");
+    printf(" -h  --help                      - Show this help\n\n");
+    printf(" \n Examples \n");
+    printf(" stt_meta_extract      -> Get source track meta data while record in progress\n\n");
+    printf(" stt_meta_extract -t 1 -> Get source track meta data while record in progress\n\n");
+    printf(" stt_meta_extract -f 1 -> Get sound focus meta data while record in progress\n\n");
+    printf(" stt_meta_extract -s 45,110,235,310,1,0,0,1,50 -> Set sound focus param data\n");
+    printf("                                    secort_startangles[4],secotr_enable[4],gain \n\n");
+    printf(" stt_meta_extract -g 200 -n 5 ->    Get stt meta data 5 times for every 200msec\n\n");
+    printf(" stt_meta_extract -b TX_CDC_DMA_TX_3 -> Get stt meta with be TX_CDC_DMA_TX_3 \n\n");
+}
+
+static int derive_mixer_ctl_stt(struct mixer **stt_mixer, struct mixer_ctl **ctl_st, struct mixer_ctl **ctl_sf,
+                                 struct mixer_ctl **ctl_st_fnn, char* be_intf, enum fluence_version fversion) {
+
+    char sound_focus_mixer_ctl_name[MIXER_PATH_MAX_LENGTH] = "Sound Focus Audio Tx ";
+    char source_tracking_mixer_ctl_name[MIXER_PATH_MAX_LENGTH] = "Source Tracking Audio Tx ";
+    char st_fnn_mixer_ctl_name[MIXER_PATH_MAX_LENGTH] = "FNN STM Audio Tx ";
+    struct mixer *mixer = NULL;
+    int ret = 0, retry_num = 0;
+    struct mixer_ctl *ctl = NULL;
+
+    if (!stt_mixer) {
+        ALOGE("%s: invalid mixer", __func__);
+        return -EINVAL;
+    }
+
+    if (!ctl_st) {
+        ALOGE("%s: invalid Source tracking mixer ctl", __func__);
+        return -EINVAL;
+    }
+
+    if (!ctl_sf) {
+        ALOGE("%s: invalid Sound focus mixer ctl", __func__);
+        return -EINVAL;
+    }
+
+    if (!ctl_st_fnn) {
+        ALOGE("%s: invalid Sound tracking mixer ctl for fnn", __func__);
+        return -EINVAL;
+    }
+
+    strlcat(sound_focus_mixer_ctl_name, be_intf, MIXER_PATH_MAX_LENGTH);
+    strlcat(source_tracking_mixer_ctl_name, be_intf, MIXER_PATH_MAX_LENGTH);
+    strlcat(st_fnn_mixer_ctl_name, be_intf, MIXER_PATH_MAX_LENGTH);
+
+    mixer = mixer_open(SOUND_CARD);
+
+    while (!mixer && retry_num < MIXER_OPEN_MAX_NUM_RETRY) {
+        usleep(RETRY_US);
+        mixer = mixer_open(SOUND_CARD);
+        retry_num++;
+    }
+
+    if (!mixer) {
+        ALOGE("%s: ERROR. Unable to open the mixer, aborting", __func__);
+        ret = -EINVAL;
+        goto clean;
+    } else {
+        *stt_mixer = mixer;
+    }
+
+    switch (fversion) {
+        case FV_11:
+        {
+            ctl = mixer_get_ctl_by_name(mixer, source_tracking_mixer_ctl_name);
+
+            if (!ctl) {
+                ALOGE("%s: Could not get ctl for mixer cmd - %s",
+                        __func__, source_tracking_mixer_ctl_name);
+                ret = -EINVAL;
+                goto clean;
+            } else {
+                *ctl_st = ctl;
+            }
+
+            ctl = mixer_get_ctl_by_name(mixer, sound_focus_mixer_ctl_name);
+            if (!ctl) {
+                ALOGE("%s: Could not get ctl for mixer cmd - %s",
+                        __func__, source_tracking_mixer_ctl_name);
+                ret = -EINVAL;
+                goto clean;
+            } else {
+                *ctl_sf = ctl;
+            }
+            break;
+        }
+        case FV_13:
+        {
+            ctl = mixer_get_ctl_by_name(mixer, st_fnn_mixer_ctl_name);
+            if (!ctl) {
+                ALOGE("%s: Could not get ctl for mixer cmd - %s",
+                        __func__, st_fnn_mixer_ctl_name);
+                ret = -EINVAL;
+                goto clean;
+            } else {
+                *ctl_st_fnn = ctl;
+            }
+            break;
+        }
+        default:
+            ALOGE("%s: invalid fluence type", __func__);
+            break;
+    }
+
+    return ret;
+
+clean:
+    if (mixer)
+        mixer_close(mixer);
+
+    return ret;
+}
+
+int main(int argc, char* argv[]) {
+    int get_data_iter = 1, get_data_time_gap = RETRY_US, idx, count, sect, ret = 0;
+    bool is_source_track_get = true, is_sound_focus_get = false, is_sound_focus_set = false;
+    char *be_intf = "TX_CDC_DMA_TX_3";
+    FILE * log_file = NULL;
+    const char *log_filename = NULL;
+    char fluence_property[PROPERTY_VALUE_MAX];
+    enum fluence_version fv;
+    struct timespec ts;
+
+    struct sound_focus_meta sound_focus_metadataset;
+    struct source_track_meta source_track_metadata;
+    struct sound_focus_meta sound_focus_metadata;
+    struct source_track_meta_fnn source_track_metadata_fnn;
+    /* Open mixer for snd card 0 */
+    struct mixer *stt_mixer = NULL;
+    struct mixer_ctl *ctl_st = NULL, *ctl_sf = NULL, *ctl_st_fnn = NULL;
+
+    struct option long_options[] = {
+        {"meta-time-gap",       required_argument,    0, 'g'},    // time-gap between two meta data
+        {"get-data-iterations", required_argument,    0, 'n'},    // number of meta data events
+        {"source_track_data",   required_argument,    0, 't'},    // Extract Source track meta data
+        {"sound_focus_data",    required_argument,    0, 'f'},    // Extract Sound focus meta data
+        {"sound focus set",     required_argument,    0, 's'},   // Set Sound focus meta data
+        {"audio be interface",  required_argument,    0, 'b'},   // update audio back end interface
+        {"log file_name",       required_argument,    0, 'l'},   // update log file name
+        {"help",                no_argument,          0, 'h'}
+    };
+
+    int opt = 0;
+    int option_index = 0;
+    char *str;
+    log_file = stdout;
+
+    memset(&sound_focus_metadataset, 0x0, sizeof(struct sound_focus_meta));
+    memset(&source_track_metadata_fnn, 0xFF, sizeof(struct source_track_meta_fnn));
+    memset(&source_track_metadata, 0xFF, sizeof(struct source_track_meta));
+    memset(&sound_focus_metadata, 0x0, sizeof(struct sound_focus_meta));
+
+    while ((opt = getopt_long(argc,
+                              argv,
+                              "-g:n:t:f:s:b:l:h:",
+                              long_options,
+                              &option_index)) != -1) {
+        printf("for argument %c, value is %s\n", opt, optarg);
+
+        switch (opt) {
+        case 'g':
+            get_data_time_gap = NSEC_MSEC_CONVERT * atoi(optarg);
+            break;
+        case 'n':
+            get_data_iter = atoi(optarg);     /* -ve value for cont get data, +ve for iterations */
+            break;
+        case 't':
+            is_source_track_get = atoi(optarg);
+            break;
+        case 'f':
+            is_sound_focus_get = atoi(optarg);
+            break;
+        case 's':
+            str = optarg;
+            updatestt_data(str, &sound_focus_metadataset);
+            is_sound_focus_set = true;
+            break;
+        case 'b':
+            be_intf = optarg;
+            break;
+        case 'l':
+            log_filename = optarg;
+            if (strcasecmp(log_filename, "stdout") &&
+                strcasecmp(log_filename, "1") &&
+                (log_file = fopen(log_filename,"wb")) == NULL) {
+                fprintf(log_file, "Cannot open log file %s\n", log_filename);
+                fprintf(stderr, "Cannot open log file %s\n", log_filename);
+                /* continue to log to std out. */
+                log_file = stdout;
+            }
+            break;
+        case 'h':
+            usage();
+            return 0;
+            break;
+        default:
+            usage();
+            return 0;
+        }
+    }
+
+    printf("STT GET META \n");
+
+    property_get("ro.vendor.audio.sdk.fluencetype", fluence_property, NULL);
+
+    if (property_get_bool("ro.vendor.audio.sdk.fluence.nn.enabled",false)) {
+        if((!strncmp("fluencenn", fluence_property, sizeof("fluencenn"))) ||
+                       (!strncmp("none", fluence_property, sizeof("none"))))
+            fv = FV_13;
+        else
+            fv = FV_11;
+    }
+    else {
+        fv = FV_11;
+    }
+
+    ret = derive_mixer_ctl_stt(&stt_mixer, &ctl_st, &ctl_sf, &ctl_st_fnn, be_intf, fv);
+
+    if (ret != 0) {
+        printf("failed to derive mixer controls %d", ret);
+        goto done;
+    }
+
+    fprintf(log_file, "get_source_track meta data with gap of %d us \n", get_data_time_gap);
+
+    if (is_sound_focus_set) {
+        if (fv != FV_11) {
+            printf("sound_focus set is not supported for fluence version %d ", fv);
+            ret = -1;
+            goto done;
+        }
+
+        ret = set_soundfocus_metadata(&sound_focus_metadataset, ctl_sf);
+
+        if (ret != 0) {
+            printf("failed to set soundfocus metadata %d", ret);
+            goto done;
+        }
+
+        ret = get_soundfocus_metadata(&sound_focus_metadata, ctl_sf);
+
+        if (ret != 0) {
+            printf("failed to get soundfocus metadata %d", ret);
+            goto done;
+        }
+
+    }
+
+    while (get_data_iter != 0) {
+        switch (fv) {
+            case FV_13:
+            {
+                if (is_source_track_get) {
+                    ret = get_sourcetrack_metadata((void *)&source_track_metadata_fnn,
+                          sizeof(struct source_track_meta_fnn), ctl_st_fnn);
+                    if (ret != 0) {
+                        printf("failed to get source track meta data %d", ret);
+                        goto done;
+                    }
+
+                }
+
+                /* Print meta data */
+                fprintf(log_file, "time stamp session_time_lsw %u session_time_msw %u \n",
+                source_track_metadata_fnn.session_time_lsw,source_track_metadata_fnn.session_time_msw);
+
+                for (idx = 0; idx < TOTAL_SPEAKERS; idx++)
+                    printf("speakers[%d]=%d ",idx, source_track_metadata_fnn.speakers[idx]);
+
+                fprintf(log_file, "\nreserved=%d\n",source_track_metadata_fnn.reserved);
+
+                for (idx = 0; idx < TOTAL_DEGREES; idx++)
+                    printf("polarActivity[%d]=%d ",idx, source_track_metadata_fnn.polarActivity[idx]);
+
+                break;
+            }
+            case FV_11:
+            {
+                if (is_sound_focus_get) {
+                    ret = get_soundfocus_metadata(&sound_focus_metadata, ctl_sf);
+                    if (ret != 0) {
+                        printf("failed to get soundfocus metadata %d", ret);
+                        goto done;
+                    }
+                }
+
+                if (is_source_track_get) {
+                    ret = get_sourcetrack_metadata((void *)&source_track_metadata, sizeof(struct source_track_meta) - sizeof(struct timespec), ctl_st);
+                    if (ret != 0) {
+                        printf("failed to get source track meta data %d", ret);
+                        goto done;
+                    }
+                    clock_gettime(CLOCK_MONOTONIC, &ts);
+                    source_track_metadata.ts = ts;
+                }
+
+                /* Print meta data */
+                fprintf(log_file, "time stamp sec %ld msec %ld \n", (source_track_metadata.ts).tv_sec,
+                                              (source_track_metadata.ts).tv_nsec / NSEC_MSEC_CONVERT);
+                for (idx = 0; idx < NUM_SECTORS; idx++){
+                    printf("vad[%d]=%d ",idx, source_track_metadata.vad[idx]);
+                    if (idx < (NUM_SECTORS-1))
+                        printf("doa_noise[%d]=%d \n",
+                                idx, source_track_metadata.doa_noise[idx]);
+                }
+
+                fprintf(log_file, "doa_speech=%d\n",source_track_metadata.doa_speech);
+                if (is_sound_focus_get || is_sound_focus_set) {
+                    fprintf(log_file, "polar_activity:");
+                    for (sect = 0; sect < NUM_SECTORS; sect++ ){
+                        fprintf(log_file, "Sector No-%d:",sect + 1);
+                        idx = sound_focus_metadata.start_angle[sect];
+                        fprintf(log_file, "idx %d:",idx);
+                        count = sound_focus_metadata.start_angle[(sect + 1)%NUM_SECTORS] -
+                                    sound_focus_metadata.start_angle[sect];
+                        fprintf(log_file, "count %d:",count);
+                        if (count < 0)
+                            count = count + TOTAL_DEGREES;
+                        do {
+                            fprintf(log_file, "%d ",
+                                source_track_metadata.polar_activity[idx%TOTAL_DEGREES]);
+                            count--;
+                            idx++;
+                        } while (count);
+                    }
+                }
+                break;
+            }
+            default:
+                printf("fluence version is not supported");
+                break;
+        }
+
+        usleep(get_data_time_gap);
+        if (get_data_iter > 0)
+            get_data_iter--;
+    }
+
+done:
+    mixer_close(stt_mixer);
+    stt_mixer = NULL;
+
+    if ((log_file != stdout) && (log_file != nullptr))
+        fclose(log_file);
+
+    fprintf(log_file, "\nADL: BYE BYE\n");
+
+    return ret;
+}

diff --git a/stt_meta/stt_meta_extract.h b/stt_meta/stt_meta_extract.h
new file mode 100644
index 0000000..46df64e
--- /dev/null
+++ b/stt_meta/stt_meta_extract.h

@@ -0,0 +1,113 @@
+/*
+* Copyright (c) 2021,2023 Qualcomm Innovation Center, Inc. All rights reserved.
+*
+* Redistribution and use in source and binary forms, with or without
+* modification, are permitted provided that the following conditions are
+* met:
+*    * Redistributions of source code must retain the above copyright
+*      notice, this list of conditions and the following disclaimer.
+*    * Redistributions in binary form must reproduce the above
+*      copyright notice, this list of conditions and the following
+*      disclaimer in the documentation and/or other materials provided
+*      with the distribution.
+*    * Neither the name of The Linux Foundation nor the names of its
+*      contributors may be used to endorse or promote products derived
+*      from this software without specific prior written permission.
+*
+* THIS SOFTWARE IS PROVIDED "AS IS" AND ANY EXPRESS OR IMPLIED
+* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT
+* ARE DISCLAIMED.  IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS
+* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+* WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+* OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+* IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+*/
+
+
+
+#ifndef STT_META_EXTRACT_H
+#define STT_META_EXTRACT_H
+#include <getopt.h>
+#include <time.h>
+#include <dlfcn.h>
+#include <unistd.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#define SOUND_CARD 0
+#define MIXER_OPEN_MAX_NUM_RETRY 10
+#define RETRY_US 500000
+#define MAX_SECTORS 8
+#define NUM_SECTORS 4
+#define TOTAL_DEGREES 360
+#define TOTAL_SPEAKERS 5
+#define NSEC_MSEC_CONVERT 1000
+#define ASCI_NUM 48
+#define DECI 10
+#define MIXER_PATH_MAX_LENGTH 100
+
+enum fluence_version {
+    FV_11,
+    FV_13
+};
+
+struct sound_focus_param {
+    uint16_t  start_angle[MAX_SECTORS];
+    uint8_t   enable[MAX_SECTORS];
+    uint16_t  gain_step;
+} __attribute__((packed));
+
+struct sound_focus_meta {
+    uint16_t  start_angle[MAX_SECTORS];
+    uint8_t   enable[MAX_SECTORS];
+    uint16_t  gain_step;
+    struct   timespec ts;
+} __attribute__((packed));
+
+struct source_tracking_param_fnn {
+    int32_t  speech_probablity_q20;
+    int16_t  speakers[TOTAL_SPEAKERS];
+    int16_t  reserved;
+    uint8_t  polarActivity[TOTAL_DEGREES];
+    uint32_t  session_time_lsw;
+    uint32_t  session_time_msw;
+} __attribute__((packed));
+
+struct source_track_meta_fnn {
+    int32_t  speech_probablity_q20;
+    int16_t  speakers[TOTAL_SPEAKERS];
+    int16_t  reserved;
+    uint8_t  polarActivity[TOTAL_DEGREES];
+    uint32_t  session_time_lsw;
+    uint32_t  session_time_msw;
+} __attribute__((packed));
+
+struct source_tracking_param {
+    uint8_t   vad[MAX_SECTORS];
+    uint16_t  doa_speech;
+    uint16_t  doa_noise[NUM_SECTORS-1];
+    uint8_t   polar_activity[TOTAL_DEGREES];
+} __attribute__((packed));
+
+struct source_track_meta {
+    uint8_t   vad[MAX_SECTORS];
+    uint16_t  doa_speech;
+    uint16_t  doa_noise[NUM_SECTORS-1];
+    uint8_t   polar_activity[TOTAL_DEGREES];
+    struct   timespec ts;
+} __attribute__((packed));
+
+static int get_sourcetrack_metadata(void *source_track_meta, unsigned int meta_size,
+                                                             struct mixer_ctl *ctl);
+
+static int get_soundfocus_metadata(struct sound_focus_meta *sound_focus_meta,
+                                                      struct mixer_ctl *ctl);
+
+static int set_soundfocus_metadata(struct sound_focus_meta *sound_focus_meta,
+                                                      struct mixer_ctl *ctl);
+
+#endif
commit	cf29fe9000e706022f53fbe69e1fa64a4363440c	[log] [tgz]
author	Hari Krishna Chowdary Yennana <quic_hyennnan@quicinc.com>	Mon Jun 26 16:44:23 2023 +0530
committer	Hari Krishna Chowdary Yennana <quic_hyennnan@quicinc.com>	Thu Aug 17 16:51:05 2023 +0530
tree	b024ba23f52707ff0c613911cd9b154960eb8968
parent	0859aa48ee398832b6deec3633e248cb25ecf223 [diff]