[Core] Add partial Asr support

author Seven Du <seven@signalwire.com>

Wed, 12 Feb 2020 16:34:59 +0000 (00:34 +0800)

committer Andrey Volk <andywolk@gmail.com>

Sat, 23 Oct 2021 18:59:49 +0000 (21:59 +0300)
author Seven Du <seven@signalwire.com>
Wed, 12 Feb 2020 16:34:59 +0000 (00:34 +0800)
committer Andrey Volk <andywolk@gmail.com>
Sat, 23 Oct 2021 18:59:49 +0000 (21:59 +0300)
diff --git a/src/mod/applications/mod_test/mod_test.c b/src/mod/applications/mod_test/mod_test.c

index 9791d7a611614e5b56c37b25b6024f9c6cd1bb7c..02292a7a3b48d9db64ab54c02447f8d60c185387 100644 (file)
--- a/src/mod/applications/mod_test/mod_test.c
+++ b/src/mod/applications/mod_test/mod_test.c
@@ -68,6 +68,7 @@ typedef struct {
         char *grammar;
         char *channel_uuid;
         switch_vad_t *vad;
+       int partial;
  } test_asr_t;
  
  
@@ -268,12 +269,17 @@ static switch_status_t test_asr_get_results(switch_asr_handle_t *ah, char **resu
         }
  
         if (switch_test_flag(context, ASRFLAG_RESULT)) {
+               int is_partial = context->partial-- > 0 ? 1 : 0;
  
                 *resultstr = switch_mprintf("{\"grammar\": \"%s\", \"text\": \"%s\", \"confidence\": %f}", context->grammar, context->result_text, context->result_confidence);
  
-               switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_ERROR, "Result: %s\n", *resultstr);
+               switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_NOTICE, "%sResult: %s\n", is_partial ? "Partial " : "Final ", *resultstr);
  
-               status = SWITCH_STATUS_SUCCESS;
+               if (is_partial) {
+                       status = SWITCH_STATUS_MORE_DATA;
+               } else {
+                       status = SWITCH_STATUS_SUCCESS;
+               }
         } else if (switch_test_flag(context, ASRFLAG_NOINPUT_TIMEOUT)) {
                 switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_DEBUG, "Result: NO INPUT\n");
  
@@ -361,6 +367,9 @@ static void test_asr_text_param(switch_asr_handle_t *ah, char *param, const char
                 } else if (!strcasecmp("confidence", param) && fval >= 0.0) {
                         context->result_confidence = fval;
                         switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_DEBUG, "confidence = %f\n", fval);
+               } else if (!strcasecmp("partial", param) && switch_true(val)) {
+                       context->partial = 3;
+                       switch_log_printf(SWITCH_CHANNEL_UUID_LOG(context->channel_uuid), SWITCH_LOG_DEBUG, "partial = %d\n", context->partial);
                 }
         }
  }
diff --git a/src/switch_cpp.cpp b/src/switch_cpp.cpp

index c412f2b7dcbcf3e7e1c00623907f7cc375abb51a..fe71a6400ad4a562a832f833f77bc7f3047f916f 100644 (file)
--- a/src/switch_cpp.cpp
+++ b/src/switch_cpp.cpp
@@ -1055,7 +1055,7 @@ SWITCH_DECLARE(char *) CoreSession::playAndDetectSpeech(char *file, char *engine
  
         char *result = NULL;
  
-       switch_status_t status = switch_ivr_play_and_detect_speech(session, file, engine, grammar, &result, 0, NULL);
+       switch_status_t status = switch_ivr_play_and_detect_speech(session, file, engine, grammar, &result, 0, ap);
         if (status == SWITCH_STATUS_SUCCESS) {
                 // good
         } else if (status == SWITCH_STATUS_GENERR) {
@@ -1063,12 +1063,12 @@ SWITCH_DECLARE(char *) CoreSession::playAndDetectSpeech(char *file, char *engine
         } else if (status == SWITCH_STATUS_NOT_INITALIZED) {
                 switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_ERROR, "ASR INIT ERROR\n");
         } else {
-               switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_ERROR, "ERROR\n");
+               switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_ERROR, "ERROR status = %d\n", status);
         }
  
         end_allow_threads();
  
-       return result; // remeber to free me
+       return result ? strdup(result) : NULL; // remeber to free me
  }
  
  SWITCH_DECLARE(void) CoreSession::say(const char *tosay, const char *module_name, const char *say_type, const char *say_method, const char *say_gender)
diff --git a/src/switch_ivr_async.c b/src/switch_ivr_async.c

index 07f28a36e8f5b5898ed608b85a39ab29a2edb829..a08223393c7160e12cd70f7e6fc7389a4d42a439 100644 (file)
--- a/src/switch_ivr_async.c
+++ b/src/switch_ivr_async.c
@@ -4696,8 +4696,16 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_bind_dtmf_meta_session(switch_core_se
  typedef struct {
         int done;
         char *result;
+       switch_input_args_t *original_args;
  } play_and_detect_speech_state_t;
  
+static void deliver_asr_event(switch_core_session_t *session, switch_event_t *event, switch_input_args_t *args)
+{
+       if (args && args->input_callback) {
+               args->input_callback(session, (void *)event, SWITCH_INPUT_TYPE_EVENT, args->buf, args->buflen);
+       }
+}
+
  static switch_status_t play_and_detect_input_callback(switch_core_session_t *session, void *input, switch_input_type_t input_type, void *data, unsigned int len)
  {
         play_and_detect_speech_state_t *state = (play_and_detect_speech_state_t *)data;
@@ -4708,7 +4716,10 @@ static switch_status_t play_and_detect_input_callback(switch_core_session_t *ses
                         event = (switch_event_t *)input;
                         if (event->event_id == SWITCH_EVENT_DETECTED_SPEECH) {
                                 const char *speech_type = switch_event_get_header(event, "Speech-Type");
+
                                 if (!zstr(speech_type)) {
+                                       deliver_asr_event(session, event, state->original_args);
+
                                         if (!strcasecmp(speech_type, "detected-speech")) {
                                                 const char *result;
                                                 switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) DETECTED SPEECH\n", switch_channel_get_name(channel));
@@ -4718,8 +4729,11 @@ static switch_status_t play_and_detect_input_callback(switch_core_session_t *ses
                                                 } else {
                                                         state->result = "";
                                                 }
+                                               state->original_args = NULL;
                                                 state->done = PLAY_AND_DETECT_DONE_RECOGNIZING;
                                                 return SWITCH_STATUS_BREAK;
+                                       } else if (!strcasecmp(speech_type, "detected-partial-speech")) {
+                                               // ok
                                         } else if (!strcasecmp(speech_type, "begin-speaking")) {
                                                 switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) START OF SPEECH\n", switch_channel_get_name(channel));
                                                 return SWITCH_STATUS_BREAK;
@@ -4727,6 +4741,8 @@ static switch_status_t play_and_detect_input_callback(switch_core_session_t *ses
                                                 state->done = PLAY_AND_DETECT_DONE_RECOGNIZING;
                                                 state->result = "";
                                                 return SWITCH_STATUS_BREAK;
+                                       } else {
+                                               switch_log_printf(SWITCH_CHANNEL_LOG, SWITCH_LOG_ERROR, "unhandled speech type %s\n", speech_type);
                                         }
                                 }
                         }
@@ -4765,7 +4781,7 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_detect_speech(switch_core_se
         switch_status_t status = SWITCH_STATUS_FALSE;
         int recognizing = 0;
         switch_input_args_t myargs = { 0 };
-       play_and_detect_speech_state_t state = { 0, "" };
+       play_and_detect_speech_state_t state = { 0, "", NULL };
         switch_channel_t *channel = switch_core_session_get_channel(session);
  
         arg_recursion_check_start(args);
@@ -4776,10 +4792,6 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_detect_speech(switch_core_se
  
         if (!input_timeout) input_timeout = 5000;
  
-       if (!args) {
-               args = &myargs;
-       }
-
         /* start speech detection */
         if ((status = switch_ivr_detect_speech(session, mod_name, grammar, "", NULL, NULL)) != SWITCH_STATUS_SUCCESS) {
                 /* map SWITCH_STATUS_FALSE to SWITCH_STATUS_GENERR to indicate grammar load failed
@@ -4792,12 +4804,19 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_detect_speech(switch_core_se
         recognizing = 1;
  
         /* play the prompt, looking for detection result */
-       args->input_callback = play_and_detect_input_callback;
-       args->buf = &state;
-       args->buflen = sizeof(state);
-       status = switch_ivr_play_file(session, NULL, file, args);
  
-       if (args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
+       if (args) {
+               state.original_args = args;
+               myargs.dmachine = args->dmachine;
+       }
+
+       myargs.input_callback = play_and_detect_input_callback;
+       myargs.buf = &state;
+       myargs.buflen = sizeof(state);
+
+       status = switch_ivr_play_file(session, NULL, file, &myargs);
+
+       if (args && args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
                 state.done |= PLAY_AND_DETECT_DONE;
                 goto done;
         }
@@ -4812,9 +4831,9 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_detect_speech(switch_core_se
                 switch_ivr_detect_speech_start_input_timers(session);
                 switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) WAITING FOR RESULT\n", switch_channel_get_name(channel));
                 while (!state.done && switch_channel_ready(channel)) {
-                       status = switch_ivr_sleep(session, input_timeout, SWITCH_FALSE, args);
+                       status = switch_ivr_sleep(session, input_timeout, SWITCH_FALSE, &myargs);
  
-                       if (args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
+                       if (args && args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
                                 state.done |= PLAY_AND_DETECT_DONE;
                                 goto done;
                         }
@@ -4826,8 +4845,6 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_detect_speech(switch_core_se
                 }
         }
  
-
-
  done:
         if (recognizing && !(state.done & PLAY_AND_DETECT_DONE_RECOGNIZING)) {
                 switch_ivr_pause_detect_speech(session);
diff --git a/src/switch_ivr_play_say.c b/src/switch_ivr_play_say.c

index 091c76f982ac08d2bb749a22e6f0b3a37577e4c4..b27a56bda43f3c0ec46ea5a70e810f4a16a47a60 100644 (file)
--- a/src/switch_ivr_play_say.c
+++ b/src/switch_ivr_play_say.c
@@ -3192,8 +3192,16 @@ typedef struct {
         char terminator;
         switch_time_t last_digit_time;
         switch_bool_t is_speech;
+       switch_input_args_t *original_args;
  } switch_collect_input_state_t;
  
+static void deliver_asr_event(switch_core_session_t *session, switch_event_t *event, switch_input_args_t *args)
+{
+       if (args && args->input_callback) {
+               args->input_callback(session, (void *)event, SWITCH_INPUT_TYPE_EVENT, args->buf, args->buflen);
+       }
+}
+
  static switch_status_t switch_collect_input_callback(switch_core_session_t *session, void *input, switch_input_type_t input_type, void *data, unsigned int len)
  {
         switch_collect_input_state_t *state = (switch_collect_input_state_t *)data;
@@ -3209,13 +3217,15 @@ static switch_status_t switch_collect_input_callback(switch_core_session_t *sess
  
                 if (zstr(speech_type)) return SWITCH_STATUS_SUCCESS;
  
+               deliver_asr_event(session, event, state->original_args);
+
                 if (!strcasecmp(speech_type, "detected-speech")) {
                         const char *result = switch_event_get_body(event);
  
                         /* stop waiting for speech */
                         switch_set_flag(state, SWITCH_COLLECT_INPUT_SPEECH_DONE);
  
-                       switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) DETECTED SPEECH\n", switch_channel_get_name(channel));
+                       switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) DETECTED SPEECH %s\n", switch_channel_get_name(channel), speech_type);
  
                         if (!zstr(result)) {
                                 state->recognition_result = cJSON_Parse(result);
@@ -3230,15 +3240,12 @@ static switch_status_t switch_collect_input_callback(switch_core_session_t *sess
                                 }
                         }
                         return SWITCH_STATUS_BREAK;
-               }
-
-               if (!strcasecmp("closed", speech_type)) {
+               } else if (!strcasecmp(speech_type, "detected-partial-speech")) {
+               } else if (!strcasecmp("closed", speech_type)) {
                         /* stop waiting for speech */
                         switch_set_flag(state, SWITCH_COLLECT_INPUT_SPEECH_DONE);
                         return SWITCH_STATUS_BREAK;
-               }
-
-               if (!strcasecmp(speech_type, "begin-speaking")) {
+               } else if (!strcasecmp(speech_type, "begin-speaking")) {
                         switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "(%s) START OF SPEECH\n", switch_channel_get_name(channel));
                         state->is_speech = SWITCH_TRUE;
  
@@ -3246,6 +3253,8 @@ static switch_status_t switch_collect_input_callback(switch_core_session_t *sess
                                 /* barge in on prompt */
                                 return SWITCH_STATUS_BREAK;
                         }
+               } else {
+                       switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "Unhandled Speech-Type %s\n", speech_type);
                 }
         }
  
@@ -3360,10 +3369,6 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_collect_input(switch_core_se
                 }
         }
  
-       if (!args) {
-               args = &myargs;
-       }
-
         /* start speech recognition, if enabled */
         if (recognizer_grammar && recognizer_mod_name) {
                 if ((status = switch_ivr_detect_speech(session, recognizer_mod_name, recognizer_grammar, "", NULL, NULL)) != SWITCH_STATUS_SUCCESS) {
@@ -3380,14 +3385,22 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_collect_input(switch_core_se
         }
  
         /* play the prompt, looking for input result */
-       args->input_callback = switch_collect_input_callback;
-       args->buf = &state;
-       args->buflen = sizeof(state);
+
+       if (args) {
+               state.original_args = args;
+               myargs.dmachine = args->dmachine;
+       }
+
+       myargs.input_callback = switch_collect_input_callback;
+       myargs.buf = &state;
+       myargs.buflen = sizeof(state);
+
+
         switch_set_flag(&state, SWITCH_COLLECT_INPUT_PROMPT);
-       status = switch_ivr_play_file(session, NULL, prompt, args);
+       status = switch_ivr_play_file(session, NULL, prompt, &myargs);
         switch_clear_flag(&state, SWITCH_COLLECT_INPUT_PROMPT);
  
-       if (args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
+       if (args && args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
                 switch_set_flag(&state, SWITCH_COLLECT_INPUT_DIGITS_DONE);
                 switch_set_flag(&state, SWITCH_COLLECT_INPUT_SPEECH_DONE);
                 status = SWITCH_STATUS_SUCCESS;
@@ -3412,9 +3425,9 @@ SWITCH_DECLARE(switch_status_t) switch_ivr_play_and_collect_input(switch_core_se
                 while ((!switch_test_flag(&state, SWITCH_COLLECT_INPUT_DIGITS_DONE) || !switch_test_flag(&state, SWITCH_COLLECT_INPUT_SPEECH_DONE))
                            && switch_channel_ready(channel)) {
  
-                       status = switch_ivr_sleep(session, sleep_time, SWITCH_FALSE, args);
+                       status = switch_ivr_sleep(session, sleep_time, SWITCH_FALSE, &myargs);
  
-                       if (args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
+                       if (args && args->dmachine && switch_ivr_dmachine_last_ping(args->dmachine) != SWITCH_STATUS_SUCCESS) {
                                 // dmachine done
                                 switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_DEBUG, "(%s) DMACHINE DONE\n", switch_channel_get_name(channel));
                                 switch_set_flag(&state, SWITCH_COLLECT_INPUT_DIGITS_DONE);
diff --git a/tests/unit/switch_ivr_play_say.c b/tests/unit/switch_ivr_play_say.c

index 6dd1c524f50b963acd57c2372626a57abbca1553..1d0bab84f1c41c5214e63e7257837a8d407c9ba0 100644 (file)
--- a/tests/unit/switch_ivr_play_say.c
+++ b/tests/unit/switch_ivr_play_say.c
@@ -33,6 +33,34 @@
  
  #include <test/switch_test.h>
  
+static switch_status_t partial_play_and_collect_input_callback(switch_core_session_t *session, void *input, switch_input_type_t input_type, void *data, __attribute__((unused))unsigned int len)
+{
+       switch_status_t status = SWITCH_STATUS_SUCCESS;
+       int *count = (int *)data;
+
+       if (input_type == SWITCH_INPUT_TYPE_EVENT) {
+               switch_event_t *event = (switch_event_t *)input;
+
+               if (event->event_id == SWITCH_EVENT_DETECTED_SPEECH) {
+                       const char *speech_type = switch_event_get_header(event, "Speech-Type");
+
+                       if (zstr(speech_type) || strcmp(speech_type, "detected-partial-speech")) {
+                               return status;
+                       }
+
+                       (*count)++;
+                       switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_INFO, "partial events count: %d\n", *count);
+
+                       char *body = switch_event_get_body(event);
+                       switch_log_printf(SWITCH_CHANNEL_SESSION_LOG(session), SWITCH_LOG_NOTICE, "body=[%s]\n", body);
+               }
+       } else if (input_type == SWITCH_INPUT_TYPE_DTMF) {
+               // never mind
+       }
+
+       return status;
+}
+
  FST_CORE_BEGIN("./conf_playsay")
  {
         FST_SUITE_BEGIN(switch_ivr_play_say)
@@ -77,15 +105,16 @@ FST_CORE_BEGIN("./conf_playsay")
                         fst_sched_recv_dtmf("+2", "2");
                         fst_sched_recv_dtmf("+3", "3");
                         status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
-
+                       fst_check(recognition_result == NULL);
                         fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
                         fst_check_string_equals(cJSON_GetObjectCstr(recognition_result, "text"), NULL);
                         fst_check_string_equals(digits_collected, "123");
                         fst_check(terminator_collected == 0);
+                       cJSON_Delete(recognition_result);
                 }
                 FST_SESSION_END()
  
-               FST_SESSION_BEGIN(play_and_collect_input)
+               FST_SESSION_BEGIN(play_and_collect_input_success)
                 {
                         char terminator_collected = 0;
                         char *digits_collected = NULL;
@@ -113,7 +142,7 @@ FST_CORE_BEGIN("./conf_playsay")
                         recognition_result = NULL;
                         fst_time_mark();
                         status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
-
+                       fst_check(recognition_result == NULL);
                         // check results
                         fst_check_duration(2500, 1000); // should return immediately when term digit is received
                         fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
@@ -145,7 +174,7 @@ FST_CORE_BEGIN("./conf_playsay")
                         recognition_result = NULL;
                         fst_time_mark();
                         status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
-
+                       fst_check(recognition_result == NULL);
                         // check results
                         fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
                         fst_check_duration(7000, 1000); // should return after timeout when prompt finishes playing
@@ -161,7 +190,7 @@ FST_CORE_BEGIN("./conf_playsay")
                         recognition_result = NULL;
                         fst_time_mark();
                         status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
-
+                       fst_check(recognition_result == NULL);
                         // check results
                         fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
                         fst_check_duration(2500, 1000); // should return after timeout when prompt finishes playing
@@ -182,7 +211,7 @@ FST_CORE_BEGIN("./conf_playsay")
                         recognition_result = NULL;
                         fst_time_mark();
                         status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
-
+                       fst_check(recognition_result == NULL);
                         // check results
                         fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
                         fst_check_duration(10000, 1000); // should return when dtmf terminator is pressed
@@ -201,7 +230,7 @@ FST_CORE_BEGIN("./conf_playsay")
                         recognition_result = NULL;
                         fst_time_mark();
                         status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
-
+                       fst_requires(recognition_result);
                         // check results
                         fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
                         fst_check_duration(2500, 1000); // returns when utterance is done
@@ -218,7 +247,7 @@ FST_CORE_BEGIN("./conf_playsay")
                         recognition_result = NULL;
                         fst_time_mark();
                         status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
-
+                       fst_check(recognition_result == NULL);
                         // check results
                         fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
                         fst_check_duration(2500, 1000); // returns when single digit is pressed
@@ -236,7 +265,7 @@ FST_CORE_BEGIN("./conf_playsay")
                         recognition_result = NULL;
                         fst_time_mark();
                         status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
-
+                       fst_check(recognition_result == NULL);
                         // check results
                         fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
                         fst_check_duration(2000, 1000); // returns when single digit is pressed
@@ -254,7 +283,7 @@ FST_CORE_BEGIN("./conf_playsay")
                         recognition_result = NULL;
                         fst_time_mark();
                         status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
-
+                       fst_requires(recognition_result);
                         // check results
                         fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
                         fst_check_duration(7000, 1000); // inter-digit timeout after 2nd digit pressed
@@ -265,6 +294,72 @@ FST_CORE_BEGIN("./conf_playsay")
                         recognition_result = NULL;
                 }
                 FST_SESSION_END()
+
+               FST_SESSION_BEGIN(play_and_collect_input_partial)
+               {
+                       char terminator_collected = 0;
+                       char *digits_collected = NULL;
+                       cJSON *recognition_result = NULL;
+
+                       // args
+                       const char *play_files = "silence_stream://1000";
+                       const char *speech_engine = "test";
+                       const char *terminators = "#";
+                       int min_digits = 1;
+                       int max_digits = 99;
+                       int digit_timeout = 500;
+                       int no_input_timeout = digit_timeout;
+                       int speech_complete_timeout = digit_timeout;
+                       int speech_recognition_timeout = 60000;
+                       char *speech_grammar_args = switch_core_session_sprintf(fst_session, "{start-input-timers=false,no-input-timeout=%d,vad-silence-ms=%d,speech-timeout=%d,language=en-US,partial=true}default",
+                                                                                       no_input_timeout, speech_complete_timeout, speech_recognition_timeout);
+                       switch_status_t status;
+
+                       switch_ivr_displace_session(fst_session, "file_string://silence_stream://500,0!tone_stream://%%(2000,0,350,440)", 0, "r");
+                       terminator_collected = 0;
+                       digits_collected = NULL;
+                       if (recognition_result) cJSON_Delete(recognition_result);
+                       recognition_result = NULL;
+                       fst_time_mark();
+                       status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, NULL);
+                       fst_requires(recognition_result);
+                       // check results
+                       fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
+                       fst_check_duration(2500, 1000); // returns when utterance is done
+                       fst_check_string_equals(cJSON_GetObjectCstr(recognition_result, "text"), "agent");
+                       fst_check_string_equals(digits_collected, NULL);
+                       fst_check(terminator_collected == 0);
+
+
+                       switch_ivr_displace_session(fst_session, "file_string://silence_stream://500,0!tone_stream://%%(2000,0,350,440)", 0, "r");
+                       terminator_collected = 0;
+                       digits_collected = NULL;
+                       if (recognition_result) cJSON_Delete(recognition_result);
+                       recognition_result = NULL;
+
+                       switch_input_args_t collect_input_args = { 0 };
+                       switch_input_args_t *args = NULL;
+                       int count = 0;
+
+                       args = &collect_input_args;
+                       args->input_callback = partial_play_and_collect_input_callback;
+                       args->buf = &count;
+                       args->buflen = sizeof(int);
+
+                       fst_time_mark();
+                       status = switch_ivr_play_and_collect_input(fst_session, play_files, speech_engine, speech_grammar_args, min_digits, max_digits, terminators, digit_timeout, &recognition_result, &digits_collected, &terminator_collected, args);
+                       fst_requires(recognition_result);
+                       // check results
+                       fst_check(status == SWITCH_STATUS_SUCCESS); // might be break?
+                       fst_check_duration(2500, 1000); // returns when utterance is done
+                       fst_check_string_equals(cJSON_GetObjectCstr(recognition_result, "text"), "agent");
+                       fst_check_string_equals(digits_collected, NULL);
+                       fst_check(terminator_collected == 0);
+                       switch_log_printf(SWITCH_CHANNEL_LOG, SWITCH_LOG_INFO, "xxx count = %d\n", count);
+                       fst_check(count == 3); // 3 partial results
+                       cJSON_Delete(recognition_result);
+               }
+               FST_SESSION_END()
         }
         FST_SUITE_END()
  }
author	Seven Du <seven@signalwire.com>
	Wed, 12 Feb 2020 16:34:59 +0000 (00:34 +0800)
committer	Andrey Volk <andywolk@gmail.com>
	Sat, 23 Oct 2021 18:59:49 +0000 (21:59 +0300)
src/mod/applications/mod_test/mod_test.c		patch \| blob \| blame \| history
src/switch_cpp.cpp		patch \| blob \| blame \| history
src/switch_ivr_async.c		patch \| blob \| blame \| history
src/switch_ivr_play_say.c		patch \| blob \| blame \| history
tests/unit/switch_ivr_play_say.c		patch \| blob \| blame \| history