[Core] Add partial Asr support
This commit is contained in:
parent
b1714199ce
commit
623fecd599
|
@ -68,6 +68,7 @@ typedef struct {
|
||||||
char *grammar;
|
char *grammar;
|
||||||
char *channel_uuid;
|
char *channel_uuid;
|
||||||
switch_vad_t *vad;
|
switch_vad_t *vad;
|
||||||
|
int partial;
|
||||||
} test_asr_t;
|
} test_asr_t;
|
||||||
|
|
||||||
|
|
||||||
|
@ -268,12 +269,17 @@ static switch_status_t test_asr_get_results(switch_asr_handle_t *ah, char **resu
|
||||||
}
|
}
|
||||||
|
|
||||||
if (switch_test_flag(context, ASRFLAG_RESULT)) {
|
if (switch_test_flag(context, ASRFLAG_RESULT)) {
|
||||||
|
int is_partial = context->partial-- > 0 ? 1 : 0;
|
||||||
|
|
||||||
*resultstr = switch_mprintf("{\"grammar\": \"%s\", \"text\": \"%s\", \"confidence\": %f}", context->grammar, context->result_text, context->result_confidence);
|
*resultstr = switch_mprintf("{\"grammar\": \"%s\", \"text\": \"%s\", \"confidence\": %f}", context->grammar, context->result_text, context->result_confidence);
|
||||||
|
|
||||||
switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_ERROR, "Result: %s\n", *resultstr);
|
switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_NOTICE, "%sResult: %s\n", is_partial ? "Partial " : "Final ", *resultstr);
|
||||||
|
|
||||||
status = SWITCH_STATUS_SUCCESS;
|
if (is_partial) {
|
||||||
|
status = SWITCH_STATUS_MORE_DATA;
|
||||||
|
} else {
|
||||||
|
status = SWITCH_STATUS_SUCCESS;
|
||||||
|
}
|
||||||
} else if (switch_test_flag(context, ASRFLAG_NOINPUT_TIMEOUT)) {
|
} else if (switch_test_flag(context, ASRFLAG_NOINPUT_TIMEOUT)) {
|
||||||
switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_DEBUG, "Result: NO INPUT\n");
|
switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_DEBUG, "Result: NO INPUT\n");
|
||||||
|
|
||||||
|
@ -361,6 +367,9 @@ static void test_asr_text_param(switch_asr_handle_t *ah, char *param, const char
|
||||||
} else if (!strcasecmp("confidence", param) && fval >= 0.0) {
|
} else if (!strcasecmp("confidence", param) && fval >= 0.0) {
|
||||||
context->result_confidence = fval;
|
context->result_confidence = fval;
|
||||||
switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_DEBUG, "confidence = %f\n", fval);
|
switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_DEBUG, "confidence = %f\n", fval);
|
||||||
|
} else if (!strcasecmp("partial", param) && switch_true(val)) {
|
||||||
|
context->partial = 3;
|
||||||
|
switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_DEBUG, "partial = %d\n", context->partial);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -1055,7 +1055,7 @@ SWITCH_DECLARE(char *) CoreSession::playAndDetectSpeech(char *file, char *engine
|
||||||
|
|
||||||
char *result = NULL;
|
char *result = NULL;
|
||||||
|
|
||||||
switch_status_t status = switch_ivr_play_and_detect_speech(session, file, engine, grammar, &result, 0, NULL);
|
switch_status_t status = switch_ivr_play_and_detect_speech(session, file, engine, grammar, &result, 0, ap);
|
||||||
if (status == SWITCH_STATUS_SUCCESS) {
|
if (status == SWITCH_STATUS_SUCCESS) {
|
||||||
// good
|
// good
|
||||||
} else if (status == SWITCH_STATUS_GENERR) {
|
} else if (status == SWITCH_STATUS_GENERR) {
|
||||||
|
@ -1063,12 +1063,12 @@ SWITCH_DECLARE(char *) CoreSession::playAndDetectSpeech(char *file, char *engine
|
||||||
} else if (status == SWITCH_STATUS_NOT_INITALIZED) {
|
} else if (status == SWITCH_STATUS_NOT_INITALIZED) {
|
||||||
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_ERROR, "ASR INIT ERROR\n");
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_ERROR, "ASR INIT ERROR\n");
|
||||||
} else {
|
} else {
|
||||||
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_ERROR, "ERROR\n");
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_ERROR, "ERROR status = %d\n", status);
|
||||||
}
|
}
|
||||||
|
|
||||||
end_allow_threads();
|
end_allow_threads();
|
||||||
|
|
||||||
return result; // remeber to free me
|
return result ? strdup(result) : NULL; // remeber to free me
|
||||||
}
|
}
|
||||||
|
|
||||||
SWITCH_DECLARE(void) CoreSession::say(const char *tosay, const char *module_name, const char *say_type, const char *say_method, const char *say_gender)
|
SWITCH_DECLARE(void) CoreSession::say(const char *tosay, const char *module_name, const char *say_type, const char *say_method, const char *say_gender)
|
||||||
|
|
|
@ -4696,8 +4696,16 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_bind_dtmf_meta_session(switch_core_se
|
||||||
typedef struct {
|
typedef struct {
|
||||||
int done;
|
int done;
|
||||||
char *result;
|
char *result;
|
||||||
|
switch_input_args_t *original_args;
|
||||||
} play_and_detect_speech_state_t;
|
} play_and_detect_speech_state_t;
|
||||||
|
|
||||||
|
static void deliver_asr_event(switch_core_session_t *session, switch_event_t *event, switch_input_args_t *args)
|
||||||
|
{
|
||||||
|
if (args && args->input_callback) {
|
||||||
|
args->input_callback(session, (void *)event, SWITCH_INPUT_TYPE_EVENT, args->buf, args->buflen);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
static switch_status_t play_and_detect_input_callback(switch_core_session_t *session, void *input, switch_input_type_t input_type, void *data, unsigned int len)
|
static switch_status_t play_and_detect_input_callback(switch_core_session_t *session, void *input, switch_input_type_t input_type, void *data, unsigned int len)
|
||||||
{
|
{
|
||||||
play_and_detect_speech_state_t *state = (play_and_detect_speech_state_t *)data;
|
play_and_detect_speech_state_t *state = (play_and_detect_speech_state_t *)data;
|
||||||
|
@ -4708,7 +4716,10 @@ static switch_status_t play_and_detect_input_callback(switch_core_session_t *ses
|
||||||
event = (switch_event_t *)input;
|
event = (switch_event_t *)input;
|
||||||
if (event->event_id == SWITCH_EVENT_DETECTED_SPEECH) {
|
if (event->event_id == SWITCH_EVENT_DETECTED_SPEECH) {
|
||||||
const char *speech_type = switch_event_get_header(event, "Speech-Type");
|
const char *speech_type = switch_event_get_header(event, "Speech-Type");
|
||||||
|
|
||||||
if (!zstr(speech_type)) {
|
if (!zstr(speech_type)) {
|
||||||
|
deliver_asr_event(session, event, state->original_args);
|
||||||
|
|
||||||
if (!strcasecmp(speech_type, "detected-speech")) {
|
if (!strcasecmp(speech_type, "detected-speech")) {
|
||||||
const char *result;
|
const char *result;
|
||||||
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) DETECTED SPEECH\n", switch_channel_get_name(channel));
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) DETECTED SPEECH\n", switch_channel_get_name(channel));
|
||||||
|
@ -4718,8 +4729,11 @@ static switch_status_t play_and_detect_input_callback(switch_core_session_t *ses
|
||||||
} else {
|
} else {
|
||||||
state->result = "";
|
state->result = "";
|
||||||
}
|
}
|
||||||
|
state->original_args = NULL;
|
||||||
state->done = PLAY_AND_DETECT_DONE_RECOGNIZING;
|
state->done = PLAY_AND_DETECT_DONE_RECOGNIZING;
|
||||||
return SWITCH_STATUS_BREAK;
|
return SWITCH_STATUS_BREAK;
|
||||||
|
} else if (!strcasecmp(speech_type, "detected-partial-speech")) {
|
||||||
|
// ok
|
||||||
} else if (!strcasecmp(speech_type, "begin-speaking")) {
|
} else if (!strcasecmp(speech_type, "begin-speaking")) {
|
||||||
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) START OF SPEECH\n", switch_channel_get_name(channel));
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) START OF SPEECH\n", switch_channel_get_name(channel));
|
||||||
return SWITCH_STATUS_BREAK;
|
return SWITCH_STATUS_BREAK;
|
||||||
|
@ -4727,6 +4741,8 @@ static switch_status_t play_and_detect_input_callback(switch_core_session_t *ses
|
||||||
state->done = PLAY_AND_DETECT_DONE_RECOGNIZING;
|
state->done = PLAY_AND_DETECT_DONE_RECOGNIZING;
|
||||||
state->result = "";
|
state->result = "";
|
||||||
return SWITCH_STATUS_BREAK;
|
return SWITCH_STATUS_BREAK;
|
||||||
|
} else {
|
||||||
|
switch_log_printf(SWITCH_CHANNEL_LOG, SWITCH_LOG_ERROR, "unhandled speech type %s\n", speech_type);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -4765,7 +4781,7 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_detect_speech(switch_core_se
|
||||||
switch_status_t status = SWITCH_STATUS_FALSE;
|
switch_status_t status = SWITCH_STATUS_FALSE;
|
||||||
int recognizing = 0;
|
int recognizing = 0;
|
||||||
switch_input_args_t myargs = { 0 };
|
switch_input_args_t myargs = { 0 };
|
||||||
play_and_detect_speech_state_t state = { 0, "" };
|
play_and_detect_speech_state_t state = { 0, "", NULL };
|
||||||
switch_channel_t *channel = switch_core_session_get_channel(session);
|
switch_channel_t *channel = switch_core_session_get_channel(session);
|
||||||
|
|
||||||
arg_recursion_check_start(args);
|
arg_recursion_check_start(args);
|
||||||
|
@ -4776,10 +4792,6 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_detect_speech(switch_core_se
|
||||||
|
|
||||||
if (!input_timeout) input_timeout = 5000;
|
if (!input_timeout) input_timeout = 5000;
|
||||||
|
|
||||||
if (!args) {
|
|
||||||
args = &myargs;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* start speech detection */
|
/* start speech detection */
|
||||||
if ((status = switch_ivr_detect_speech(session, mod_name, grammar, "", NULL, NULL)) != SWITCH_STATUS_SUCCESS) {
|
if ((status = switch_ivr_detect_speech(session, mod_name, grammar, "", NULL, NULL)) != SWITCH_STATUS_SUCCESS) {
|
||||||
/* map SWITCH_STATUS_FALSE to SWITCH_STATUS_GENERR to indicate grammar load failed
|
/* map SWITCH_STATUS_FALSE to SWITCH_STATUS_GENERR to indicate grammar load failed
|
||||||
|
@ -4792,12 +4804,19 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_detect_speech(switch_core_se
|
||||||
recognizing = 1;
|
recognizing = 1;
|
||||||
|
|
||||||
/* play the prompt, looking for detection result */
|
/* play the prompt, looking for detection result */
|
||||||
args->input_callback = play_and_detect_input_callback;
|
|
||||||
args->buf = &state;
|
|
||||||
args->buflen = sizeof(state);
|
|
||||||
status = switch_ivr_play_file(session, NULL, file, args);
|
|
||||||
|
|
||||||
if (args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
|
if (args) {
|
||||||
|
state.original_args = args;
|
||||||
|
myargs.dmachine = args->dmachine;
|
||||||
|
}
|
||||||
|
|
||||||
|
myargs.input_callback = play_and_detect_input_callback;
|
||||||
|
myargs.buf = &state;
|
||||||
|
myargs.buflen = sizeof(state);
|
||||||
|
|
||||||
|
status = switch_ivr_play_file(session, NULL, file, &myargs);
|
||||||
|
|
||||||
|
if (args && args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
|
||||||
state.done |= PLAY_AND_DETECT_DONE;
|
state.done |= PLAY_AND_DETECT_DONE;
|
||||||
goto done;
|
goto done;
|
||||||
}
|
}
|
||||||
|
@ -4812,9 +4831,9 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_detect_speech(switch_core_se
|
||||||
switch_ivr_detect_speech_start_input_timers(session);
|
switch_ivr_detect_speech_start_input_timers(session);
|
||||||
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) WAITING FOR RESULT\n", switch_channel_get_name(channel));
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) WAITING FOR RESULT\n", switch_channel_get_name(channel));
|
||||||
while (!state.done && switch_channel_ready(channel)) {
|
while (!state.done && switch_channel_ready(channel)) {
|
||||||
status = switch_ivr_sleep(session, input_timeout, SWITCH_FALSE, args);
|
status = switch_ivr_sleep(session, input_timeout, SWITCH_FALSE, &myargs);
|
||||||
|
|
||||||
if (args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
|
if (args && args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
|
||||||
state.done |= PLAY_AND_DETECT_DONE;
|
state.done |= PLAY_AND_DETECT_DONE;
|
||||||
goto done;
|
goto done;
|
||||||
}
|
}
|
||||||
|
@ -4826,8 +4845,6 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_detect_speech(switch_core_se
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
done:
|
done:
|
||||||
if (recognizing && !(state.done & PLAY_AND_DETECT_DONE_RECOGNIZING)) {
|
if (recognizing && !(state.done & PLAY_AND_DETECT_DONE_RECOGNIZING)) {
|
||||||
switch_ivr_pause_detect_speech(session);
|
switch_ivr_pause_detect_speech(session);
|
||||||
|
|
|
@ -3192,8 +3192,16 @@ typedef struct {
|
||||||
char terminator;
|
char terminator;
|
||||||
switch_time_t last_digit_time;
|
switch_time_t last_digit_time;
|
||||||
switch_bool_t is_speech;
|
switch_bool_t is_speech;
|
||||||
|
switch_input_args_t *original_args;
|
||||||
} switch_collect_input_state_t;
|
} switch_collect_input_state_t;
|
||||||
|
|
||||||
|
static void deliver_asr_event(switch_core_session_t *session, switch_event_t *event, switch_input_args_t *args)
|
||||||
|
{
|
||||||
|
if (args && args->input_callback) {
|
||||||
|
args->input_callback(session, (void *)event, SWITCH_INPUT_TYPE_EVENT, args->buf, args->buflen);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
static switch_status_t switch_collect_input_callback(switch_core_session_t *session, void *input, switch_input_type_t input_type, void *data, unsigned int len)
|
static switch_status_t switch_collect_input_callback(switch_core_session_t *session, void *input, switch_input_type_t input_type, void *data, unsigned int len)
|
||||||
{
|
{
|
||||||
switch_collect_input_state_t *state = (switch_collect_input_state_t *)data;
|
switch_collect_input_state_t *state = (switch_collect_input_state_t *)data;
|
||||||
|
@ -3209,13 +3217,15 @@ static switch_status_t switch_collect_input_callback(switch_core_session_t *sess
|
||||||
|
|
||||||
if (zstr(speech_type)) return SWITCH_STATUS_SUCCESS;
|
if (zstr(speech_type)) return SWITCH_STATUS_SUCCESS;
|
||||||
|
|
||||||
|
deliver_asr_event(session, event, state->original_args);
|
||||||
|
|
||||||
if (!strcasecmp(speech_type, "detected-speech")) {
|
if (!strcasecmp(speech_type, "detected-speech")) {
|
||||||
const char *result = switch_event_get_body(event);
|
const char *result = switch_event_get_body(event);
|
||||||
|
|
||||||
/* stop waiting for speech */
|
/* stop waiting for speech */
|
||||||
switch_set_flag(state, SWITCH_COLLECT_INPUT_SPEECH_DONE);
|
switch_set_flag(state, SWITCH_COLLECT_INPUT_SPEECH_DONE);
|
||||||
|
|
||||||
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) DETECTED SPEECH\n", switch_channel_get_name(channel));
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) DETECTED SPEECH %s\n", switch_channel_get_name(channel), speech_type);
|
||||||
|
|
||||||
if (!zstr(result)) {
|
if (!zstr(result)) {
|
||||||
state->recognition_result = cJSON_Parse(result);
|
state->recognition_result = cJSON_Parse(result);
|
||||||
|
@ -3230,15 +3240,12 @@ static switch_status_t switch_collect_input_callback(switch_core_session_t *sess
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
return SWITCH_STATUS_BREAK;
|
return SWITCH_STATUS_BREAK;
|
||||||
}
|
} else if (!strcasecmp(speech_type, "detected-partial-speech")) {
|
||||||
|
} else if (!strcasecmp("closed", speech_type)) {
|
||||||
if (!strcasecmp("closed", speech_type)) {
|
|
||||||
/* stop waiting for speech */
|
/* stop waiting for speech */
|
||||||
switch_set_flag(state, SWITCH_COLLECT_INPUT_SPEECH_DONE);
|
switch_set_flag(state, SWITCH_COLLECT_INPUT_SPEECH_DONE);
|
||||||
return SWITCH_STATUS_BREAK;
|
return SWITCH_STATUS_BREAK;
|
||||||
}
|
} else if (!strcasecmp(speech_type, "begin-speaking")) {
|
||||||
|
|
||||||
if (!strcasecmp(speech_type, "begin-speaking")) {
|
|
||||||
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) START OF SPEECH\n", switch_channel_get_name(channel));
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) START OF SPEECH\n", switch_channel_get_name(channel));
|
||||||
state->is_speech = SWITCH_TRUE;
|
state->is_speech = SWITCH_TRUE;
|
||||||
|
|
||||||
|
@ -3246,6 +3253,8 @@ static switch_status_t switch_collect_input_callback(switch_core_session_t *sess
|
||||||
/* barge in on prompt */
|
/* barge in on prompt */
|
||||||
return SWITCH_STATUS_BREAK;
|
return SWITCH_STATUS_BREAK;
|
||||||
}
|
}
|
||||||
|
} else {
|
||||||
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "Unhandled Speech-Type %s\n", speech_type);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -3360,10 +3369,6 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_collect_input(switch_core_se
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if (!args) {
|
|
||||||
args = &myargs;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* start speech recognition, if enabled */
|
/* start speech recognition, if enabled */
|
||||||
if (recognizer_grammar && recognizer_mod_name) {
|
if (recognizer_grammar && recognizer_mod_name) {
|
||||||
if ((status = switch_ivr_detect_speech(session, recognizer_mod_name, recognizer_grammar, "", NULL, NULL)) != SWITCH_STATUS_SUCCESS) {
|
if ((status = switch_ivr_detect_speech(session, recognizer_mod_name, recognizer_grammar, "", NULL, NULL)) != SWITCH_STATUS_SUCCESS) {
|
||||||
|
@ -3380,14 +3385,22 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_collect_input(switch_core_se
|
||||||
}
|
}
|
||||||
|
|
||||||
/* play the prompt, looking for input result */
|
/* play the prompt, looking for input result */
|
||||||
args->input_callback = switch_collect_input_callback;
|
|
||||||
args->buf = &state;
|
if (args) {
|
||||||
args->buflen = sizeof(state);
|
state.original_args = args;
|
||||||
|
myargs.dmachine = args->dmachine;
|
||||||
|
}
|
||||||
|
|
||||||
|
myargs.input_callback = switch_collect_input_callback;
|
||||||
|
myargs.buf = &state;
|
||||||
|
myargs.buflen = sizeof(state);
|
||||||
|
|
||||||
|
|
||||||
switch_set_flag(&state, SWITCH_COLLECT_INPUT_PROMPT);
|
switch_set_flag(&state, SWITCH_COLLECT_INPUT_PROMPT);
|
||||||
status = switch_ivr_play_file(session, NULL, prompt, args);
|
status = switch_ivr_play_file(session, NULL, prompt, &myargs);
|
||||||
switch_clear_flag(&state, SWITCH_COLLECT_INPUT_PROMPT);
|
switch_clear_flag(&state, SWITCH_COLLECT_INPUT_PROMPT);
|
||||||
|
|
||||||
if (args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
|
if (args && args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
|
||||||
switch_set_flag(&state, SWITCH_COLLECT_INPUT_DIGITS_DONE);
|
switch_set_flag(&state, SWITCH_COLLECT_INPUT_DIGITS_DONE);
|
||||||
switch_set_flag(&state, SWITCH_COLLECT_INPUT_SPEECH_DONE);
|
switch_set_flag(&state, SWITCH_COLLECT_INPUT_SPEECH_DONE);
|
||||||
status = SWITCH_STATUS_SUCCESS;
|
status = SWITCH_STATUS_SUCCESS;
|
||||||
|
@ -3412,9 +3425,9 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_collect_input(switch_core_se
|
||||||
while ((!switch_test_flag(&state, SWITCH_COLLECT_INPUT_DIGITS_DONE) || !switch_test_flag(&state, SWITCH_COLLECT_INPUT_SPEECH_DONE))
|
while ((!switch_test_flag(&state, SWITCH_COLLECT_INPUT_DIGITS_DONE) || !switch_test_flag(&state, SWITCH_COLLECT_INPUT_SPEECH_DONE))
|
||||||
&& switch_channel_ready(channel)) {
|
&& switch_channel_ready(channel)) {
|
||||||
|
|
||||||
status = switch_ivr_sleep(session, sleep_time, SWITCH_FALSE, args);
|
status = switch_ivr_sleep(session, sleep_time, SWITCH_FALSE, &myargs);
|
||||||
|
|
||||||
if (args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
|
if (args && args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
|
||||||
// dmachine done
|
// dmachine done
|
||||||
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_DEBUG, "(%s) DMACHINE DONE\n", switch_channel_get_name(channel));
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_DEBUG, "(%s) DMACHINE DONE\n", switch_channel_get_name(channel));
|
||||||
switch_set_flag(&state, SWITCH_COLLECT_INPUT_DIGITS_DONE);
|
switch_set_flag(&state, SWITCH_COLLECT_INPUT_DIGITS_DONE);
|
||||||
|
|
|
@ -33,6 +33,34 @@
|
||||||
|
|
||||||
#include <test/switch_test.h>
|
#include <test/switch_test.h>
|
||||||
|
|
||||||
|
static switch_status_t partial_play_and_collect_input_callback(switch_core_session_t *session, void *input, switch_input_type_t input_type, void *data, __attribute__((unused))unsigned int len)
|
||||||
|
{
|
||||||
|
switch_status_t status = SWITCH_STATUS_SUCCESS;
|
||||||
|
int *count = (int *)data;
|
||||||
|
|
||||||
|
if (input_type == SWITCH_INPUT_TYPE_EVENT) {
|
||||||
|
switch_event_t *event = (switch_event_t *)input;
|
||||||
|
|
||||||
|
if (event->event_id == SWITCH_EVENT_DETECTED_SPEECH) {
|
||||||
|
const char *speech_type = switch_event_get_header(event, "Speech-Type");
|
||||||
|
|
||||||
|
if (zstr(speech_type) || strcmp(speech_type, "detected-partial-speech")) {
|
||||||
|
return status;
|
||||||
|
}
|
||||||
|
|
||||||
|
(*count)++;
|
||||||
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "partial events count: %d\n", *count);
|
||||||
|
|
||||||
|
char *body = switch_event_get_body(event);
|
||||||
|
switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_NOTICE, "body=[%s]\n", body);
|
||||||
|
}
|
||||||
|
} else if (input_type == SWITCH_INPUT_TYPE_DTMF) {
|
||||||
|
// never mind
|
||||||
|
}
|
||||||
|
|
||||||
|
return status;
|
||||||
|
}
|
||||||
|
|
||||||
FST_CORE_BEGIN("./conf_playsay")
|
FST_CORE_BEGIN("./conf_playsay")
|
||||||
{
|
{
|
||||||
FST_SUITE_BEGIN(switch_ivr_play_say)
|
FST_SUITE_BEGIN(switch_ivr_play_say)
|
||||||
|
@ -77,15 +105,16 @@ FST_CORE_BEGIN("./conf_playsay")
|
||||||
fst_sched_recv_dtmf("+2", "2");
|
fst_sched_recv_dtmf("+2", "2");
|
||||||
fst_sched_recv_dtmf("+3", "3");
|
fst_sched_recv_dtmf("+3", "3");
|
||||||
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
||||||
|
fst_check(recognition_result == NULL);
|
||||||
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
fst_check_string_equals(cJSON_GetObjectCstr(recognition_result, "text"), NULL);
|
fst_check_string_equals(cJSON_GetObjectCstr(recognition_result, "text"), NULL);
|
||||||
fst_check_string_equals(digits_collected, "123");
|
fst_check_string_equals(digits_collected, "123");
|
||||||
fst_check(terminator_collected == 0);
|
fst_check(terminator_collected == 0);
|
||||||
|
cJSON_Delete(recognition_result);
|
||||||
}
|
}
|
||||||
FST_SESSION_END()
|
FST_SESSION_END()
|
||||||
|
|
||||||
FST_SESSION_BEGIN(play_and_collect_input)
|
FST_SESSION_BEGIN(play_and_collect_input_success)
|
||||||
{
|
{
|
||||||
char terminator_collected = 0;
|
char terminator_collected = 0;
|
||||||
char *digits_collected = NULL;
|
char *digits_collected = NULL;
|
||||||
|
@ -113,7 +142,7 @@ FST_CORE_BEGIN("./conf_playsay")
|
||||||
recognition_result = NULL;
|
recognition_result = NULL;
|
||||||
fst_time_mark();
|
fst_time_mark();
|
||||||
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
||||||
|
fst_check(recognition_result == NULL);
|
||||||
// check results
|
// check results
|
||||||
fst_check_duration(2500, 1000); // should return immediately when term digit is received
|
fst_check_duration(2500, 1000); // should return immediately when term digit is received
|
||||||
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
|
@ -145,7 +174,7 @@ FST_CORE_BEGIN("./conf_playsay")
|
||||||
recognition_result = NULL;
|
recognition_result = NULL;
|
||||||
fst_time_mark();
|
fst_time_mark();
|
||||||
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
||||||
|
fst_check(recognition_result == NULL);
|
||||||
// check results
|
// check results
|
||||||
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
fst_check_duration(7000, 1000); // should return after timeout when prompt finishes playing
|
fst_check_duration(7000, 1000); // should return after timeout when prompt finishes playing
|
||||||
|
@ -161,7 +190,7 @@ FST_CORE_BEGIN("./conf_playsay")
|
||||||
recognition_result = NULL;
|
recognition_result = NULL;
|
||||||
fst_time_mark();
|
fst_time_mark();
|
||||||
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
||||||
|
fst_check(recognition_result == NULL);
|
||||||
// check results
|
// check results
|
||||||
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
fst_check_duration(2500, 1000); // should return after timeout when prompt finishes playing
|
fst_check_duration(2500, 1000); // should return after timeout when prompt finishes playing
|
||||||
|
@ -182,7 +211,7 @@ FST_CORE_BEGIN("./conf_playsay")
|
||||||
recognition_result = NULL;
|
recognition_result = NULL;
|
||||||
fst_time_mark();
|
fst_time_mark();
|
||||||
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
||||||
|
fst_check(recognition_result == NULL);
|
||||||
// check results
|
// check results
|
||||||
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
fst_check_duration(10000, 1000); // should return when dtmf terminator is pressed
|
fst_check_duration(10000, 1000); // should return when dtmf terminator is pressed
|
||||||
|
@ -201,7 +230,7 @@ FST_CORE_BEGIN("./conf_playsay")
|
||||||
recognition_result = NULL;
|
recognition_result = NULL;
|
||||||
fst_time_mark();
|
fst_time_mark();
|
||||||
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
||||||
|
fst_requires(recognition_result);
|
||||||
// check results
|
// check results
|
||||||
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
fst_check_duration(2500, 1000); // returns when utterance is done
|
fst_check_duration(2500, 1000); // returns when utterance is done
|
||||||
|
@ -218,7 +247,7 @@ FST_CORE_BEGIN("./conf_playsay")
|
||||||
recognition_result = NULL;
|
recognition_result = NULL;
|
||||||
fst_time_mark();
|
fst_time_mark();
|
||||||
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
||||||
|
fst_check(recognition_result == NULL);
|
||||||
// check results
|
// check results
|
||||||
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
fst_check_duration(2500, 1000); // returns when single digit is pressed
|
fst_check_duration(2500, 1000); // returns when single digit is pressed
|
||||||
|
@ -236,7 +265,7 @@ FST_CORE_BEGIN("./conf_playsay")
|
||||||
recognition_result = NULL;
|
recognition_result = NULL;
|
||||||
fst_time_mark();
|
fst_time_mark();
|
||||||
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
||||||
|
fst_check(recognition_result == NULL);
|
||||||
// check results
|
// check results
|
||||||
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
fst_check_duration(2000, 1000); // returns when single digit is pressed
|
fst_check_duration(2000, 1000); // returns when single digit is pressed
|
||||||
|
@ -254,7 +283,7 @@ FST_CORE_BEGIN("./conf_playsay")
|
||||||
recognition_result = NULL;
|
recognition_result = NULL;
|
||||||
fst_time_mark();
|
fst_time_mark();
|
||||||
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
||||||
|
fst_requires(recognition_result);
|
||||||
// check results
|
// check results
|
||||||
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
fst_check_duration(7000, 1000); // inter-digit timeout after 2nd digit pressed
|
fst_check_duration(7000, 1000); // inter-digit timeout after 2nd digit pressed
|
||||||
|
@ -265,6 +294,72 @@ FST_CORE_BEGIN("./conf_playsay")
|
||||||
recognition_result = NULL;
|
recognition_result = NULL;
|
||||||
}
|
}
|
||||||
FST_SESSION_END()
|
FST_SESSION_END()
|
||||||
|
|
||||||
|
FST_SESSION_BEGIN(play_and_collect_input_partial)
|
||||||
|
{
|
||||||
|
char terminator_collected = 0;
|
||||||
|
char *digits_collected = NULL;
|
||||||
|
cJSON *recognition_result = NULL;
|
||||||
|
|
||||||
|
// args
|
||||||
|
const char *play_files = "silence_stream://1000";
|
||||||
|
const char *speech_engine = "test";
|
||||||
|
const char *terminators = "#";
|
||||||
|
int min_digits = 1;
|
||||||
|
int max_digits = 99;
|
||||||
|
int digit_timeout = 500;
|
||||||
|
int no_input_timeout = digit_timeout;
|
||||||
|
int speech_complete_timeout = digit_timeout;
|
||||||
|
int speech_recognition_timeout = 60000;
|
||||||
|
char *speech_grammar_args = switch_core_session_sprintf(fst_session, "{start-input-timers=false,no-input-timeout=%d,vad-silence-ms=%d,speech-timeout=%d,language=en-US,partial=true}default",
|
||||||
|
no_input_timeout, speech_complete_timeout, speech_recognition_timeout);
|
||||||
|
switch_status_t status;
|
||||||
|
|
||||||
|
switch_ivr_displace_session(fst_session, "file_string://silence_stream://500,0!tone_stream://%%(2000,0,350,440)", 0, "r");
|
||||||
|
terminator_collected = 0;
|
||||||
|
digits_collected = NULL;
|
||||||
|
if (recognition_result) cJSON_Delete(recognition_result);
|
||||||
|
recognition_result = NULL;
|
||||||
|
fst_time_mark();
|
||||||
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
|
||||||
|
fst_requires(recognition_result);
|
||||||
|
// check results
|
||||||
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
|
fst_check_duration(2500, 1000); // returns when utterance is done
|
||||||
|
fst_check_string_equals(cJSON_GetObjectCstr(recognition_result, "text"), "agent");
|
||||||
|
fst_check_string_equals(digits_collected, NULL);
|
||||||
|
fst_check(terminator_collected == 0);
|
||||||
|
|
||||||
|
|
||||||
|
switch_ivr_displace_session(fst_session, "file_string://silence_stream://500,0!tone_stream://%%(2000,0,350,440)", 0, "r");
|
||||||
|
terminator_collected = 0;
|
||||||
|
digits_collected = NULL;
|
||||||
|
if (recognition_result) cJSON_Delete(recognition_result);
|
||||||
|
recognition_result = NULL;
|
||||||
|
|
||||||
|
switch_input_args_t collect_input_args = { 0 };
|
||||||
|
switch_input_args_t *args = NULL;
|
||||||
|
int count = 0;
|
||||||
|
|
||||||
|
args = &collect_input_args;
|
||||||
|
args->input_callback = partial_play_and_collect_input_callback;
|
||||||
|
args->buf = &count;
|
||||||
|
args->buflen = sizeof(int);
|
||||||
|
|
||||||
|
fst_time_mark();
|
||||||
|
status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, args);
|
||||||
|
fst_requires(recognition_result);
|
||||||
|
// check results
|
||||||
|
fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
|
||||||
|
fst_check_duration(2500, 1000); // returns when utterance is done
|
||||||
|
fst_check_string_equals(cJSON_GetObjectCstr(recognition_result, "text"), "agent");
|
||||||
|
fst_check_string_equals(digits_collected, NULL);
|
||||||
|
fst_check(terminator_collected == 0);
|
||||||
|
switch_log_printf(SWITCH_CHANNEL_LOG, SWITCH_LOG_INFO, "xxx count = %d\n", count);
|
||||||
|
fst_check(count == 3); // 3 partial results
|
||||||
|
cJSON_Delete(recognition_result);
|
||||||
|
}
|
||||||
|
FST_SESSION_END()
|
||||||
}
|
}
|
||||||
FST_SUITE_END()
|
FST_SUITE_END()
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue