/**
 * Create demo synthesizer channel
 *
 * Allocates the application channel object from the session pool, attaches
 * a send-mode audio stream to it, wraps that stream in a raw media
 * termination and finally creates the MRCP synthesizer channel.
 *
 * @param session the session the channel belongs to
 * @return whatever mrcp_application_channel_create() returns
 */
static mrcp_channel_t* synth_application_channel_create(mrcp_session_t *session)
{
	mpf_termination_t *raw_termination;

	/* application-side channel object, associated with stream and channel */
	synth_app_channel_t *synth = apr_palloc(session->pool,sizeof(synth_app_channel_t));
	synth->audio_out = NULL;

	/* audio stream: object, vtable, direction, pool */
	synth->audio_stream = mpf_audio_stream_create(
			synth,
			&audio_stream_vtable,
			STREAM_MODE_SEND,
			session->pool);

	/* raw termination: no associated object, audio only (no video stream) */
	raw_termination = mpf_raw_termination_create(
			NULL,
			synth->audio_stream,
			NULL,
			session->pool);

	/* no RTP descriptor is supplied (NULL by default) */
	return mrcp_application_channel_create(
			session,
			MRCP_SYNTHESIZER_RESOURCE,
			raw_termination,
			NULL,
			synth);
}
/**
 * Create an MRCP channel that belongs to this session's MRCP session.
 *
 * @param resource_id    MRCP resource identifier
 * @param pTermination   media termination, used to terminate audio stream
 * @param pRtpDescriptor RTP descriptor, used to create RTP termination
 *                       (may be NULL, which was previously always the case)
 * @param pObj           object to associate with the channel
 * @return the result of mrcp_application_channel_create()
 */
mrcp_channel_t* UmcSession::CreateMrcpChannel(
	mrcp_resource_id resource_id,
	mpf_termination_t* pTermination,
	mpf_rtp_termination_descriptor_t* pRtpDescriptor,
	void* pObj)
{
	/* Forward the caller's RTP descriptor instead of discarding it;
	 * callers that pass NULL get exactly the former behaviour. */
	return mrcp_application_channel_create(
			m_pMrcpSession,       /* session, channel belongs to */
			resource_id,          /* MRCP resource identifier */
			pTermination,         /* media termination, used to terminate audio stream */
			pRtpDescriptor,       /* RTP descriptor, used to create RTP termination */
			pObj);                /* object to associate */
}
/**
 * Create demo channel
 *
 * Builds a synthesizer channel that carries an RTP descriptor and no media
 * termination (internal media processing is not used).
 *
 * @param session the session the channel belongs to
 * @return whatever mrcp_application_channel_create() returns
 */
static mrcp_channel_t* demo_application_channel_create(mrcp_session_t *session)
{
	/* application object to associate with the channel (session pool memory) */
	demo_app_channel_t *app_channel = apr_palloc(session->pool,sizeof(demo_app_channel_t));
	/* descriptor from which the RTP termination is created */
	mpf_rtp_termination_descriptor_t *descriptor = demo_rtp_descriptor_create(session->pool);

	return mrcp_application_channel_create(
			session,
			MRCP_SYNTHESIZER_RESOURCE,
			NULL,          /* no termination */
			descriptor,
			app_channel);
}
/**
 * Create demo recognizer channel
 *
 * Allocates and resets the application channel object, declares Linear PCM
 * source capabilities at 8 and 16 kHz, creates an audio termination bound
 * to the object and then the MRCP recognizer channel.
 *
 * @param session the session the channel belongs to
 * @return whatever mrcp_application_channel_create() returns
 */
static mrcp_channel_t* recog_application_channel_create(mrcp_session_t *session)
{
	mpf_stream_capabilities_t *source_caps;
	mpf_termination_t *audio_termination;

	/* application-side channel object, taken from the session pool */
	recog_app_channel_t *recog = apr_palloc(session->pool,sizeof(recog_app_channel_t));
	recog->streaming = FALSE;
	recog->audio_in = NULL;
	recog->time_to_complete = 0;

	/* source stream capabilities: Linear PCM */
	source_caps = mpf_source_stream_capabilities_create(session->pool);
	mpf_codec_capabilities_add(
			&source_caps->codecs,
			MPF_SAMPLE_RATE_8000 | MPF_SAMPLE_RATE_16000,
			"LPCM");

#if 0
	/* more capabilities can be added or replaced */
	mpf_codec_capabilities_add(
			&source_caps->codecs,
			MPF_SAMPLE_RATE_8000 | MPF_SAMPLE_RATE_16000,
			"PCMU");
#endif

	/* audio termination: session, stream vtable, capabilities, object */
	audio_termination = mrcp_application_audio_termination_create(
			session,
			&audio_stream_vtable,
			source_caps,
			recog);

	/* no RTP descriptor is supplied (NULL by default) */
	return mrcp_application_channel_create(
			session,
			MRCP_RECOGNIZER_RESOURCE,
			audio_termination,
			NULL,
			recog);
}
/**
 * Create demo synthesizer channel
 *
 * Allocates the application channel object from the session's pool,
 * declares Linear PCM sink capabilities at 8 and 16 kHz, creates an audio
 * termination bound to the object and then the MRCP synthesizer channel.
 *
 * @param session the session the channel belongs to
 * @return whatever mrcp_application_channel_create() returns
 */
static mrcp_channel_t* synth_application_channel_create(mrcp_session_t *session)
{
	apr_pool_t *session_pool = mrcp_application_session_pool_get(session);
	mpf_stream_capabilities_t *sink_caps;
	mpf_termination_t *audio_termination;

	/* application-side channel object */
	synth_app_channel_t *synth = apr_palloc(session_pool,sizeof(synth_app_channel_t));
	synth->audio_out = NULL;

	/* sink stream capabilities: Linear PCM */
	sink_caps = mpf_sink_stream_capabilities_create(session_pool);
	mpf_codec_capabilities_add(
			&sink_caps->codecs,
			MPF_SAMPLE_RATE_8000 | MPF_SAMPLE_RATE_16000,
			"LPCM");

#if 0
	/* more capabilities can be added or replaced */
	mpf_codec_capabilities_add(
			&sink_caps->codecs,
			MPF_SAMPLE_RATE_8000 | MPF_SAMPLE_RATE_16000,
			"PCMU");
#endif

	/* audio termination: session, stream vtable, capabilities, object */
	audio_termination = mrcp_application_audio_termination_create(
			session,
			&audio_stream_vtable,
			sink_caps,
			synth);

	/* no RTP descriptor is supplied (NULL by default) */
	return mrcp_application_channel_create(
			session,
			MRCP_SYNTHESIZER_RESOURCE,
			audio_termination,
			NULL,
			synth);
}
/**
 * \brief Create recognition channel
 *
 * Declares 8 kHz Linear PCM source capabilities, creates an audio
 * termination and an MRCP recognizer channel for uni_speech->session, both
 * associated with uni_speech. On success the channel is stored in
 * uni_speech->channel; on failure that field is left untouched.
 *
 * \param uni_speech speech object owning the MRCP session
 * \param format     not referenced by this function
 * \return TRUE if the channel was created, FALSE otherwise
 */
static apt_bool_t uni_recog_channel_create(uni_speech_t *uni_speech, ast_format_compat *format)
{
	apr_pool_t *session_pool = mrcp_application_session_pool_get(uni_speech->session);
	mpf_stream_capabilities_t *source_caps;
	mpf_termination_t *audio_termination;
	mrcp_channel_t *recog_channel;

	/* Source stream capabilities: Linear PCM */
	source_caps = mpf_source_stream_capabilities_create(session_pool);
	mpf_codec_capabilities_add(&source_caps->codecs, MPF_SAMPLE_RATE_8000, "LPCM");

	/* Media termination: session, stream vtable, capabilities, object */
	audio_termination = mrcp_application_audio_termination_create(
			uni_speech->session,
			&audio_stream_vtable,
			source_caps,
			uni_speech);

	/* MRCP channel; no RTP descriptor is supplied (NULL by default) */
	recog_channel = mrcp_application_channel_create(
			uni_speech->session,
			MRCP_RECOGNIZER_RESOURCE,
			audio_termination,
			NULL,
			uni_speech);

	if(recog_channel) {
		uni_speech->channel = recog_channel;
		return TRUE;
	}
	return FALSE;
}
/**
 * Create ASR session
 *
 * Creates an MRCP session for the given profile, attaches an audio
 * termination (8 kHz Linear PCM source) and a recognizer channel to it,
 * initialises the asr_session_t bookkeeping, then sends the add-channel
 * request and blocks until the response is signalled on the session's
 * condition variable.
 *
 * @param engine  ASR engine whose MRCP application is used
 * @param profile name of the profile passed to session creation
 * @return the new session, or NULL if the MRCP session or channel could not
 *         be created, the mutex/condition variable could not be created, or
 *         the add-channel response did not pass sig_response_check()
 */
ASR_CLIENT_DECLARE(asr_session_t*) asr_session_create(asr_engine_t *engine, const char *profile)
{
	mpf_termination_t *termination;
	mrcp_channel_t *channel;
	mrcp_session_t *session;
	const mrcp_app_message_t *app_message;
	apr_pool_t *pool;
	asr_session_t *asr_session;
	mpf_stream_capabilities_t *capabilities;

	/* create session */
	session = mrcp_application_session_create(engine->mrcp_app,profile,NULL);
	if(!session) {
		return NULL;
	}
	pool = mrcp_application_session_pool_get(session);

	asr_session = apr_palloc(pool,sizeof(asr_session_t));
	mrcp_application_session_object_set(session,asr_session);

	/* create source stream capabilities */
	capabilities = mpf_source_stream_capabilities_create(pool);
	/* add codec capabilities (Linear PCM) */
	mpf_codec_capabilities_add(
			&capabilities->codecs,
			MPF_SAMPLE_RATE_8000,
			"LPCM");

	termination = mrcp_application_audio_termination_create(
			session,                   /* session, termination belongs to */
			&audio_stream_vtable,      /* virtual methods table of audio stream */
			capabilities,              /* capabilities of audio stream */
			asr_session);              /* object to associate */

	channel = mrcp_application_channel_create(
			session,                   /* session, channel belongs to */
			MRCP_RECOGNIZER_RESOURCE,  /* MRCP resource identifier */
			termination,               /* media termination, used to terminate audio stream */
			NULL,                      /* RTP descriptor, used to create RTP termination (NULL by default) */
			asr_session);              /* object to associate */
	if(!channel) {
		mrcp_application_session_destroy(session);
		return NULL;
	}

	asr_session->engine = engine;
	asr_session->mrcp_session = session;
	asr_session->mrcp_channel = channel;
	asr_session->recog_complete = NULL;
	asr_session->input_mode = INPUT_MODE_NONE;
	asr_session->streaming = FALSE;
	asr_session->audio_in = NULL;
	asr_session->media_buffer = NULL;
	asr_session->mutex = NULL;
	asr_session->wait_object = NULL;
	asr_session->app_message = NULL;

	/* Create cond wait object and mutex. Both are locked/waited on below,
	 * so a failed creation must not be ignored: release the session the
	 * same way the channel-creation failure path does. */
	if(apr_thread_mutex_create(&asr_session->mutex,APR_THREAD_MUTEX_DEFAULT,pool) != APR_SUCCESS ||
	   apr_thread_cond_create(&asr_session->wait_object,pool) != APR_SUCCESS) {
		mrcp_application_session_destroy(session);
		return NULL;
	}

	/* Create media buffer */
	asr_session->media_buffer = mpf_frame_buffer_create(160,20,pool);

	/* Send add channel request and wait for the response */
	apr_thread_mutex_lock(asr_session->mutex);
	app_message = NULL;
	if(mrcp_application_channel_add(asr_session->mrcp_session,asr_session->mrcp_channel) == TRUE) {
		/* NOTE(review): single wait without a predicate loop; presumably the
		 * message handler stores app_message before signalling - confirm */
		apr_thread_cond_wait(asr_session->wait_object,asr_session->mutex);
		app_message = asr_session->app_message;
		asr_session->app_message = NULL;
	}
	apr_thread_mutex_unlock(asr_session->mutex);

	if(sig_response_check(app_message) == FALSE) {
		asr_session_destroy_ex(asr_session,TRUE);
		return NULL;
	}
	return asr_session;
}
int main(int argc, char const* argv[]) { apr_pool_t* pool = NULL; apr_pool_t* spool = NULL; int i; struct iovec cattext[101]; static char const SP = ' '; char const* outfile; apr_status_t status; apt_dir_layout_t* dirLayout = NULL; mrcp_client_t* client = NULL; mrcp_application_t* app = NULL; mrcp_session_t* sess = NULL; mpf_stream_capabilities_t* caps = NULL; mpf_termination_t* term = NULL; mrcp_channel_t* chan = NULL; struct stat info; if (argc < 2) { puts("Usage:"); printf("\t%s \"This is a synthetic voice.\"", argv[0]); exit(1); } /* Just detect various directory layout constellations */ if (stat(ROOT_DIR, &info)) ROOT_DIR = ROOT_DIR2; if (stat(ROOT_DIR, &info)) ROOT_DIR = ROOT_DIR3; /* Initialize platform first */ if (apr_initialize() != APR_SUCCESS) FAIL("Cannot initialize APR platform"); pool = apt_pool_create(); if (!pool) FAIL("Not enough memory"); for (i = 0; (i < argc - 2) && (i < 50); i += 2) { cattext[2 * i].iov_base = (void*) argv[i + 1]; cattext[2 * i].iov_len = strlen(argv[i + 1]); cattext[2 * i + 1].iov_base = (void*) &SP; cattext[2 * i + 1].iov_len = 1; } cattext[2 * i].iov_base = (void*) argv[i + 1]; cattext[2 * i].iov_len = strlen(argv[i + 1]); text = apr_pstrcatv(pool, cattext, 2 * i + 1, NULL); if (!text) FAIL("Not enough memory"); outfile = apr_pstrcat(pool, ROOT_DIR, "/data/", PCM_OUT_FILE, NULL); printf("This is a sample C UniMRCP client synthesizer scenario.\n"); printf("Use client configuration from %s/conf/unimrcpclient.xml\n", ROOT_DIR); printf("Use profile %s\n", MRCP_PROFILE); printf("Synthesize text: `%s'\n", text); printf("Write output to file: %s\n", outfile); printf("\n"); printf("Press enter to start the session...\n"); (void) getchar(); apt_log_instance_create(APT_LOG_OUTPUT_NONE, APT_PRIO_DEBUG, pool); apt_log_ext_handler_set(UniSynth_logger); dirLayout = apt_default_dir_layout_create(ROOT_DIR, pool); /* Create and start the client in a root dir */ client = unimrcp_client_create(dirLayout); if (!client) FAIL("Cannot create 
UniMRCP client"); app = mrcp_application_create(UniSynthAppMsgHandler, NULL, mrcp_client_memory_pool_get(client)); if (!app) FAIL("Cannot create MRCP application"); if (!mrcp_client_application_register(client, app, "Sample C app")) FAIL("Cannot register MRCP application"); if (!mrcp_client_start(client)) FAIL("Cannot start MRCP client"); /* Create a session using MRCP profile MRCP_PROFILE */ sess = mrcp_application_session_create(app, MRCP_PROFILE, NULL); if (!sess) FAIL("Cannot create session"); spool = mrcp_application_session_pool_get(sess); /* Create audio termination with capabilities */ caps = mpf_stream_capabilities_create(STREAM_DIRECTION_SEND, spool); if (!caps) FAIL("Error creating capabilities"); if (!mpf_codec_capabilities_add(&caps->codecs, MPF_SAMPLE_RATE_8000, "LPCM")) FAIL("Error adding codec capabilities"); term = mrcp_application_audio_termination_create(sess, &stream_vtable, caps, NULL); if (!term) FAIL("Cannot create audio termination"); /* Add signaling channel (and start processing in OnAdd method */ f = fopen(outfile, "wb"); if (!f) FAIL("Cannot open output file"); status = apr_thread_mutex_create(&mutex, APR_THREAD_MUTEX_DEFAULT, pool); if (status != APR_SUCCESS) FAIL("Cannot create mutex"); status = apr_thread_cond_create(&cond, pool); if (status != APR_SUCCESS) FAIL("Cannot create condition variable"); chan = mrcp_application_channel_create(sess, MRCP_SYNTHESIZER_RESOURCE, term, NULL, NULL); if (!chan) FAIL("Cannot create channel"); if (!mrcp_application_channel_add(sess, chan)) FAIL("Cannot add channel"); /* Now wait until the processing finishes */ apr_thread_mutex_lock(mutex); while (err < 0) apr_thread_cond_wait(cond, mutex); apr_thread_mutex_unlock(mutex); cleanup: if (sess) mrcp_application_session_terminate(sess); if (f) fclose(f); if (client) mrcp_client_shutdown(client); if (app) mrcp_application_destroy(app); if (client) mrcp_client_destroy(client); apt_log_instance_destroy(); if (pool) apr_pool_destroy(pool); apr_terminate(); 
puts("Program finished, memory released. Press any key to exit."); (void) getchar(); return err; }
/*
 * Open the speech channel.
 *
 * Creates an MRCP session for the given profile, attaches an audio
 * termination and a synthesizer or recognizer channel (depending on
 * schannel->type), adds the channel to the session and waits for the
 * channel state to leave SPEECH_CHANNEL_CLOSED. For recognizer channels the
 * per-channel recognizer data and its grammar hash are allocated from
 * schannel->pool. schannel->mutex, when non-NULL, is held for the whole
 * call and released before every return.
 *
 * Returns 0 on success, 2 when the session could not be created or the
 * channel went from ERROR back to CLOSED (retry is allowed), and -1 for
 * every other failure, including NULL arguments and a channel that is not
 * in the CLOSED state on entry.
 */
int speech_channel_open(speech_channel_t *schannel, ast_mrcp_profile_t *profile)
{
	int status = 0;
	mpf_termination_t *termination = NULL;
	mrcp_resource_type_e resource_type;

	if ((schannel == NULL) || (profile == NULL))
		return -1;

	if (schannel->mutex != NULL)
		apr_thread_mutex_lock(schannel->mutex);

	/* Make sure we can open channel. */
	if (schannel->state != SPEECH_CHANNEL_CLOSED) {
		if (schannel->mutex != NULL)
			apr_thread_mutex_unlock(schannel->mutex);

		return -1;
	}

	schannel->profile = profile;

	/* Create MRCP session. */
	if ((schannel->unimrcp_session = mrcp_application_session_create(schannel->application->app, profile->name, schannel)) == NULL) {
		/* Profile doesn't exist? */
		ast_log(LOG_ERROR, "(%s) Unable to create session with %s\n", schannel->name, profile->name);

		if (schannel->mutex != NULL)
			apr_thread_mutex_unlock(schannel->mutex);

		return 2;
	}

	/* Set session name for logging purposes. */
	mrcp_application_session_name_set(schannel->unimrcp_session, schannel->name);

	/* Create audio termination and add to channel. */
	if ((termination = speech_channel_create_mpf_termination(schannel)) == NULL) {
		ast_log(LOG_ERROR, "(%s) Unable to create termination with %s\n", schannel->name, profile->name);

		if (!mrcp_application_session_destroy(schannel->unimrcp_session))
			ast_log(LOG_WARNING, "(%s) Unable to destroy application session for %s\n", schannel->name, profile->name);

		if (schannel->mutex != NULL)
			apr_thread_mutex_unlock(schannel->mutex);

		return -1;
	}

	if (schannel->type == SPEECH_CHANNEL_SYNTHESIZER)
		resource_type = MRCP_SYNTHESIZER_RESOURCE;
	else
		resource_type = MRCP_RECOGNIZER_RESOURCE;

	if ((schannel->unimrcp_channel = mrcp_application_channel_create(schannel->unimrcp_session, resource_type, termination, NULL, schannel)) == NULL) {
		ast_log(LOG_ERROR, "(%s) Unable to create channel with %s\n", schannel->name, profile->name);

		if (!mrcp_application_session_destroy(schannel->unimrcp_session))
			ast_log(LOG_WARNING, "(%s) Unable to destroy application session for %s\n", schannel->name, profile->name);

		if (schannel->mutex != NULL)
			apr_thread_mutex_unlock(schannel->mutex);

		return -1;
	}

	/* Add channel to session. This establishes the connection to the MRCP server. */
	if (mrcp_application_channel_add(schannel->unimrcp_session, schannel->unimrcp_channel) != TRUE) {
		ast_log(LOG_ERROR, "(%s) Unable to add channel to session with %s\n", schannel->name, profile->name);

		if (!mrcp_application_session_destroy(schannel->unimrcp_session))
			ast_log(LOG_WARNING, "(%s) Unable to destroy application session for %s\n", schannel->name, profile->name);

		if (schannel->mutex != NULL)
			apr_thread_mutex_unlock(schannel->mutex);

		return -1;
	}

	/* Wait for channel to be ready.
	 * NOTE(review): the timed-wait result is ignored, so after a timeout the
	 * loop simply waits again for as long as the state stays CLOSED. */
	while ((schannel->mutex != NULL) && (schannel->cond != NULL) && (schannel->state == SPEECH_CHANNEL_CLOSED))
		apr_thread_cond_timedwait(schannel->cond, schannel->mutex, SPEECH_CHANNEL_TIMEOUT_USEC);

	if (schannel->state == SPEECH_CHANNEL_READY) {
		ast_log(LOG_DEBUG, "(%s) channel is ready\n", schannel->name);
	} else if (schannel->state == SPEECH_CHANNEL_CLOSED) {
		ast_log(LOG_ERROR, "(%s) Timed out waiting for channel to be ready\n", schannel->name);
		/* Can't retry. */
		status = -1;
	} else if (schannel->state == SPEECH_CHANNEL_ERROR) {
		/* Wait for session to be cleaned up. The wait needs the mutex as
		 * well as the condition variable, so require both (the mutex is
		 * treated as optional everywhere else in this function). */
		if ((schannel->mutex != NULL) && (schannel->cond != NULL))
			apr_thread_cond_timedwait(schannel->cond, schannel->mutex, SPEECH_CHANNEL_TIMEOUT_USEC);

		if (schannel->state != SPEECH_CHANNEL_CLOSED) {
			/* Major issue. Can't retry. */
			status = -1;
		} else {
			/* Failed to open profile, retry is allowed. */
			status = 2;
		}
	}

	/* Recognizer channels carry zeroed per-channel data with a grammar hash. */
	if (schannel->type == SPEECH_CHANNEL_RECOGNIZER) {
		recognizer_data_t *r = (recognizer_data_t *)apr_palloc(schannel->pool, sizeof(recognizer_data_t));

		if (r != NULL) {
			schannel->data = r;
			memset(r, 0, sizeof(recognizer_data_t));

			if ((r->grammars = apr_hash_make(schannel->pool)) == NULL) {
				ast_log(LOG_ERROR, "Unable to allocate hash for grammars\n");
				status = -1;
			}
		} else {
			ast_log(LOG_ERROR, "Unable to allocate recognizer data structure\n");
			status = -1;
		}
	}

	if (schannel->mutex != NULL)
		apr_thread_mutex_unlock(schannel->mutex);

	return status;
}