/* * Copyright 2019 The Chromium OS Authors. All rights reserved. * Use of this source code is governed by a BSD-style license that can be * found in the LICENSE file. */ #include "audio_codec.h" #include "console.h" #include "host_command.h" #include "hotword_dsp_api.h" #include "sha256.h" #include "system.h" #include "task.h" #include "util.h" #define CPRINTS(format, args...) cprints(CC_AUDIO_CODEC, format, ## args) /* * To shorten the variable names, or the following code is likely to greater * than 80 columns. */ #define AUDIO_BUF_LEN CONFIG_AUDIO_CODEC_WOV_AUDIO_BUF_LEN #define LANG_BUF_LEN CONFIG_AUDIO_CODEC_WOV_LANG_BUF_LEN static uint8_t lang_hash[SHA256_DIGEST_SIZE]; static uint32_t lang_len; /* * The variables below are shared between host command and WoV task. This lock * is designed to protect them. */ static struct mutex lock; /* * wov_enabled is shared. * * host command task: * - is the only writer * - no need to lock if read */ static uint8_t wov_enabled; /* * hotword_detected is shared. */ static uint8_t hotword_detected; /* * audio_buf_rp and audio_buf_wp are shared. * * Note that: sample width is 16-bit. * * Typical ring-buffer implementation: * If audio_buf_rp == audio_buf_wp, empty. * If (audio_buf_wp + 2) % buf_len == audio_buf_rp, full. */ static uint32_t audio_buf_rp, audio_buf_wp; static int is_buf_full(void) { return ((audio_buf_wp + 2) % AUDIO_BUF_LEN) == audio_buf_rp; } /* only used by host command */ static uint8_t speech_lib_loaded; static int check_lang_buf(uint8_t *data, uint32_t len, const uint8_t *hash) { /* * Note: sizeof(struct sha256_ctx) = 200 bytes * should put into .bss, or stack is likely to overflow (~640 bytes) */ static struct sha256_ctx ctx; uint8_t *digest; int i; uint8_t *p = (uint8_t *)audio_codec_wov_lang_buf_addr; SHA256_init(&ctx); SHA256_update(&ctx, data, len); digest = SHA256_final(&ctx); #ifdef DEBUG_AUDIO_CODEC CPRINTS("data=%08x len=%d", data, len); hexdump(digest, SHA256_DIGEST_SIZE); #endif if (memcmp(digest, hash, SHA256_DIGEST_SIZE) != 0) return EC_ERROR_UNKNOWN; for (i = len; i < LANG_BUF_LEN; ++i) if (p[i]) return EC_ERROR_UNKNOWN; return EC_SUCCESS; } #ifdef CONFIG_AUDIO_CODEC_CAP_WOV_LANG_SHM static enum ec_status wov_set_lang_shm(struct host_cmd_handler_args *args) { const struct ec_param_ec_codec_wov *p = args->params; const struct ec_param_ec_codec_wov_set_lang_shm *pp = &p->set_lang_shm_param; if (pp->total_len > LANG_BUF_LEN) return EC_RES_INVALID_PARAM; if (wov_enabled) return EC_RES_BUSY; if (check_lang_buf((uint8_t *)audio_codec_wov_lang_buf_addr, pp->total_len, pp->hash) != EC_SUCCESS) return EC_RES_ERROR; memcpy(lang_hash, pp->hash, sizeof(lang_hash)); lang_len = pp->total_len; speech_lib_loaded = 0; args->response_size = 0; return EC_RES_SUCCESS; } #else static enum ec_status wov_set_lang(struct host_cmd_handler_args *args) { const struct ec_param_ec_codec_wov *p = args->params; const struct ec_param_ec_codec_wov_set_lang *pp = &p->set_lang_param; if (pp->total_len > LANG_BUF_LEN) return EC_RES_INVALID_PARAM; if (pp->offset >= LANG_BUF_LEN) return EC_RES_INVALID_PARAM; if (pp->len > ARRAY_SIZE(pp->buf)) return EC_RES_INVALID_PARAM; if (pp->offset + pp->len > pp->total_len) return EC_RES_INVALID_PARAM; if (wov_enabled) return EC_RES_BUSY; if (!pp->offset) memset((uint8_t *)audio_codec_wov_lang_buf_addr, 0, LANG_BUF_LEN); memcpy((uint8_t *)audio_codec_wov_lang_buf_addr + pp->offset, pp->buf, pp->len); if (pp->offset + pp->len == pp->total_len) { if (check_lang_buf((uint8_t *)audio_codec_wov_lang_buf_addr, pp->total_len, pp->hash) != EC_SUCCESS) return EC_RES_ERROR; memcpy(lang_hash, pp->hash, sizeof(lang_hash)); lang_len = pp->total_len; speech_lib_loaded = 0; } args->response_size = 0; return EC_RES_SUCCESS; } #endif /* CONFIG_AUDIO_CODEC_CAP_WOV_LANG_SHM */ static enum ec_status wov_get_lang(struct host_cmd_handler_args *args) { struct ec_response_ec_codec_wov_get_lang *r = args->response; memcpy(r->hash, lang_hash, sizeof(r->hash)); args->response_size = sizeof(*r); return EC_RES_SUCCESS; } static enum ec_status wov_enable(struct host_cmd_handler_args *args) { if (wov_enabled) return EC_RES_BUSY; if (audio_codec_wov_enable() != EC_SUCCESS) return EC_RES_ERROR; if (!speech_lib_loaded) { if (!GoogleHotwordDspInit( (void *)audio_codec_wov_lang_buf_addr)) return EC_RES_ERROR; speech_lib_loaded = 1; } else { GoogleHotwordDspReset(); } mutex_lock(&lock); wov_enabled = 1; hotword_detected = 0; audio_buf_rp = audio_buf_wp = 0; mutex_unlock(&lock); #ifdef HAS_TASK_WOV task_wake(TASK_ID_WOV); #endif args->response_size = 0; return EC_RES_SUCCESS; } static enum ec_status wov_disable(struct host_cmd_handler_args *args) { if (!wov_enabled) return EC_RES_BUSY; if (audio_codec_wov_disable() != EC_SUCCESS) return EC_RES_ERROR; mutex_lock(&lock); wov_enabled = 0; hotword_detected = 0; audio_buf_rp = audio_buf_wp = 0; mutex_unlock(&lock); args->response_size = 0; return EC_RES_SUCCESS; } #ifdef CONFIG_AUDIO_CODEC_CAP_WOV_AUDIO_SHM static enum ec_status wov_read_audio_shm(struct host_cmd_handler_args *args) { struct ec_response_ec_codec_wov_read_audio_shm *r = args->response; if (!wov_enabled) return EC_RES_ACCESS_DENIED; mutex_lock(&lock); if (!hotword_detected) { mutex_unlock(&lock); return EC_RES_ACCESS_DENIED; } r->offset = audio_buf_rp; if (audio_buf_rp <= audio_buf_wp) r->len = audio_buf_wp - audio_buf_rp; else r->len = AUDIO_BUF_LEN - audio_buf_rp; audio_buf_rp += r->len; if (audio_buf_rp == AUDIO_BUF_LEN) audio_buf_rp = 0; mutex_unlock(&lock); #ifdef DEBUG_AUDIO_CODEC if (!r->len) CPRINTS("underrun detected"); #endif args->response_size = sizeof(*r); return EC_RES_SUCCESS; } #else static enum ec_status wov_read_audio(struct host_cmd_handler_args *args) { struct ec_response_ec_codec_wov_read_audio *r = args->response; uint8_t *p; if (!wov_enabled) return EC_RES_ACCESS_DENIED; mutex_lock(&lock); if (!hotword_detected) { mutex_unlock(&lock); return EC_RES_ACCESS_DENIED; } if (audio_buf_rp <= audio_buf_wp) r->len = audio_buf_wp - audio_buf_rp; else r->len = AUDIO_BUF_LEN - audio_buf_rp; r->len = MIN(sizeof(r->buf), r->len); p = (uint8_t *)audio_codec_wov_audio_buf_addr + audio_buf_rp; audio_buf_rp += r->len; if (audio_buf_rp == AUDIO_BUF_LEN) audio_buf_rp = 0; mutex_unlock(&lock); #ifdef DEBUG_AUDIO_CODEC if (!r->len) CPRINTS("underrun detected"); #endif /* * Note: it is possible to copy corrupted audio data if overrun * happened at the point. To keep it simple and align to SHM mode, * we ignore the case if overrun happened. */ memcpy(r->buf, p, r->len); args->response_size = sizeof(*r); return EC_RES_SUCCESS; } #endif /* CONFIG_AUDIO_CODEC_CAP_WOV_AUDIO_SHM */ static int (*sub_cmds[])(struct host_cmd_handler_args *) = { #ifdef CONFIG_AUDIO_CODEC_CAP_WOV_LANG_SHM [EC_CODEC_WOV_SET_LANG_SHM] = wov_set_lang_shm, #else [EC_CODEC_WOV_SET_LANG] = wov_set_lang, #endif [EC_CODEC_WOV_GET_LANG] = wov_get_lang, [EC_CODEC_WOV_ENABLE] = wov_enable, [EC_CODEC_WOV_DISABLE] = wov_disable, #ifdef CONFIG_AUDIO_CODEC_CAP_WOV_AUDIO_SHM [EC_CODEC_WOV_READ_AUDIO_SHM] = wov_read_audio_shm, #else [EC_CODEC_WOV_READ_AUDIO] = wov_read_audio, #endif }; #ifdef DEBUG_AUDIO_CODEC static char *strcmd[] = { #ifdef CONFIG_AUDIO_CODEC_CAP_WOV_LANG_SHM [EC_CODEC_WOV_SET_LANG_SHM] = "EC_CODEC_WOV_SET_LANG_SHM", #else [EC_CODEC_WOV_SET_LANG] = "EC_CODEC_WOV_SET_LANG", #endif [EC_CODEC_WOV_GET_LANG] = "EC_CODEC_WOV_GET_LANG", [EC_CODEC_WOV_ENABLE] = "EC_CODEC_WOV_ENABLE", [EC_CODEC_WOV_DISABLE] = "EC_CODEC_WOV_DISABLE", #ifdef CONFIG_AUDIO_CODEC_CAP_WOV_AUDIO_SHM [EC_CODEC_WOV_READ_AUDIO_SHM] = "EC_CODEC_WOV_READ_AUDIO_SHM", #else [EC_CODEC_WOV_READ_AUDIO] = "EC_CODEC_WOV_READ_AUDIO", #endif }; BUILD_ASSERT(ARRAY_SIZE(sub_cmds) == ARRAY_SIZE(strcmd)); #endif static enum ec_status wov_host_command(struct host_cmd_handler_args *args) { const struct ec_param_ec_codec_wov *p = args->params; #ifdef DEBUG_AUDIO_CODEC CPRINTS("WoV subcommand: %s", strcmd[p->cmd]); #endif if (p->cmd < EC_CODEC_WOV_SUBCMD_COUNT && sub_cmds[p->cmd]) return sub_cmds[p->cmd](args); return EC_RES_INVALID_PARAM; } DECLARE_HOST_COMMAND(EC_CMD_EC_CODEC_WOV, wov_host_command, EC_VER_MASK(0)); /* * Exported interfaces. */ void audio_codec_wov_task(void *arg) { uint32_t n, req; uint8_t *p; int r; while (1) { mutex_lock(&lock); if (!wov_enabled) { mutex_unlock(&lock); task_wait_event(-1); continue; } /* Clear the buffer if full. */ if (is_buf_full()) { audio_buf_wp = audio_buf_rp; #ifdef DEBUG_AUDIO_CODEC if (hotword_detected) CPRINTS("overrun detected"); #endif } /* * Note: sample width is 16-bit. * * The linear ring buffer wastes one sample bytes to * detect buffer full. * * If buffer is empty, maximum req is BUF_LEN - 2. * If wp > rp, wp can fill to the end of linear buffer. * If wp < rp, wp can fill up to rp - 2. */ if (audio_buf_wp == audio_buf_rp) req = AUDIO_BUF_LEN - MAX(audio_buf_wp, 2); else if (audio_buf_wp > audio_buf_rp) req = AUDIO_BUF_LEN - audio_buf_wp; else req = audio_buf_rp - audio_buf_wp - 2; p = (uint8_t *)audio_codec_wov_audio_buf_addr + audio_buf_wp; mutex_unlock(&lock); n = audio_codec_wov_read(p, req); if (n < 0) { CPRINTS("failed to read: %d", n); break; } else if (n == 0) { if (audio_codec_wov_enable_notifier() != EC_SUCCESS) { CPRINTS("failed to enable_notifier"); break; } task_wait_event(-1); continue; } mutex_lock(&lock); audio_buf_wp += n; if (audio_buf_wp == AUDIO_BUF_LEN) audio_buf_wp = 0; mutex_unlock(&lock); /* * GoogleHotwordDspProcess() needs number of samples. In the * case, sample is S16_LE. Thus, n / 2. */ if (!hotword_detected && GoogleHotwordDspProcess(p, n / 2, &r)) { CPRINTS("hotword detected"); mutex_lock(&lock); /* * Note: preserve 40% of buf size for AP to read * (see go/cros-ec-codec#heading=h.582ga6pgfl2g) */ audio_buf_rp = audio_buf_wp + (AUDIO_BUF_LEN * 2 / 5); if (audio_buf_rp >= AUDIO_BUF_LEN) audio_buf_rp -= AUDIO_BUF_LEN; hotword_detected = 1; mutex_unlock(&lock); host_set_single_event(EC_HOST_EVENT_WOV); } /* * Reasons to sleep here: * 1. read the audio data in a fixed pace (10ms) * 2. yield the processor in case of watchdog thought EC crashed */ task_wait_event(10 * MSEC); } }