2 * Copyright (c) 2011-2014 Samsung Electronics Co., Ltd All Rights Reserved
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at
6 * http://www.apache.org/licenses/LICENSE-2.0
7 * Unless required by applicable law or agreed to in writing, software
8 * distributed under the License is distributed on an "AS IS" BASIS,
9 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
10 * See the License for the specific language governing permissions and
11 * limitations under the License.
18 #include <sound_manager.h>
21 #include "sttd_dbus.h"
22 #include "sttd_recorder.h"
23 #include "sttd_main.h"
/* Frame size the read buffer is derived from; presumably counted in 16-bit samples (TODO confirm). */
#define FRAME_LENGTH 160
/* Size in bytes of the buffer handed to audio_in_read(). Parenthesized so the
 * macro behaves as a single value inside larger expressions such as x / BUFFER_LENGTH. */
#define BUFFER_LENGTH (FRAME_LENGTH * 2)
/* Mutex taken on entry to sttd_recorder_destroy() and released before it returns. */
30 static pthread_mutex_t sttd_audio_in_handle_mutex = PTHREAD_MUTEX_INITIALIZER;
/* Recorder lifecycle states. NOTE(review): the opening line of this enum is not visible in this extract. */
33 STTD_RECORDER_STATE_NONE = -1,
34 STTD_RECORDER_STATE_READY = 0, /**< Recorder is ready to start */
35 STTD_RECORDER_STATE_RECORDING /**< In the middle of recording */
36 } sttd_recorder_state;
/* Member of the per-engine recorder record (stt_recorder_s): the STT audio type given to sttd_recorder_create(). */
42 sttp_audio_type_e audio_type;
/* List of stt_recorder_s records; sttd_recorder_create() appends one per engine id. */
45 static GSList *g_recorder_list;
/* Engine id being recorded; set in sttd_recorder_start(), reset to -1 by initialize and stop. */
47 static int g_recording_engine_id;
/* Callback that receives each buffer read from the audio input together with the read result. */
49 static stt_recorder_audio_cb g_audio_cb;
/* Sound-manager stream info created in sttd_recorder_initialize() and used to acquire/release recording focus. */
51 static sound_stream_info_h g_stream_info_h;
/* Callback consulted when recording focus is released while recording is in progress. */
53 static stt_recorder_interrupt_cb g_interrupt_cb;
/* Current lifecycle state; starts as NONE. */
55 static sttd_recorder_state g_recorder_state = STTD_RECORDER_STATE_NONE;
/* Counter used by __read_audio_func() to pace volume reports (every 30) and progress logs (every 50). */
57 static int g_buffer_count;
59 /* Sound buf save for test */
/* Path of the PCM dump file; filled in by sttd_recorder_start(). */
64 static char g_temp_file_name[128] = {'\0',};
/* Sequence number embedded in the dump file name. */
68 static int g_count = 1;
/*
 * Returns the enumerator name of a focus-change reason as a string literal,
 * for use in log messages. Values not listed below yield
 * "Undefined reason code".
 * NOTE(review): the switch header and closing braces are not visible in this extract.
 */
71 const char* __stt_get_focus_changed_reason_code(sound_stream_focus_change_reason_e reason)
74 case SOUND_STREAM_FOCUS_CHANGED_BY_MEDIA: return "SOUND_STREAM_FOCUS_CHANGED_BY_MEDIA";
75 case SOUND_STREAM_FOCUS_CHANGED_BY_SYSTEM: return "SOUND_STREAM_FOCUS_CHANGED_BY_SYSTEM";
76 case SOUND_STREAM_FOCUS_CHANGED_BY_ALARM: return "SOUND_STREAM_FOCUS_CHANGED_BY_ALARM";
77 case SOUND_STREAM_FOCUS_CHANGED_BY_NOTIFICATION: return "SOUND_STREAM_FOCUS_CHANGED_BY_NOTIFICATION";
78 case SOUND_STREAM_FOCUS_CHANGED_BY_EMERGENCY: return "SOUND_STREAM_FOCUS_CHANGED_BY_EMERGENCY";
79 case SOUND_STREAM_FOCUS_CHANGED_BY_VOICE_INFORMATION: return "SOUND_STREAM_FOCUS_CHANGED_BY_VOICE_INFORMATION";
80 case SOUND_STREAM_FOCUS_CHANGED_BY_VOICE_RECOGNITION: return "SOUND_STREAM_FOCUS_CHANGED_BY_VOICE_RECOGNITION";
81 case SOUND_STREAM_FOCUS_CHANGED_BY_RINGTONE: return "SOUND_STREAM_FOCUS_CHANGED_BY_RINGTONE";
82 case SOUND_STREAM_FOCUS_CHANGED_BY_VOIP: return "SOUND_STREAM_FOCUS_CHANGED_BY_VOIP";
83 case SOUND_STREAM_FOCUS_CHANGED_BY_CALL: return "SOUND_STREAM_FOCUS_CHANGED_BY_CALL";
84 case SOUND_STREAM_FOCUS_CHANGED_BY_MEDIA_EXTERNAL_ONLY: return "SOUND_STREAM_FOCUS_CHANGED_BY_MEDIA_EXTERNAL_ONLY";
/* Fallback for any reason value without a case above. */
85 default: return "Undefined reason code";
/*
 * Focus-change callback passed to sound_manager_create_stream_information()
 * by sttd_recorder_initialize().
 *
 * stream_info : handle the notification is for; must equal g_stream_info_h.
 * reason      : why focus changed; only used for logging.
 * extra_info, user_data : not referenced in the visible lines.
 */
89 void __recorder_focus_state_cb(sound_stream_info_h stream_info, sound_stream_focus_change_reason_e reason, const char *extra_info, void *user_data)
91 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder] Focus state changed cb");
/* Reject notifications for any stream other than the recorder's own. */
93 if (stream_info != g_stream_info_h) {
94 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Invalid stream info handle");
/* Only the recording-side focus state is queried; the playback slot is passed as NULL. */
99 sound_stream_focus_state_e state_for_recording;
100 ret = sound_manager_get_focus_state(g_stream_info_h, NULL, &state_for_recording);
101 if (SOUND_MANAGER_ERROR_NONE != ret) {
102 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to get focus state");
106 SLOG(LOG_WARN, TAG_STTD, "[Recorder] focus state changed to (%d) with reason(%s)", (int)state_for_recording, __stt_get_focus_changed_reason_code(reason));
/* Losing recording focus while a recording is running is treated as an interrupt. */
108 if (STTD_RECORDER_STATE_RECORDING == g_recorder_state && SOUND_STREAM_FOCUS_STATE_RELEASED == state_for_recording) {
109 SLOG(LOG_WARN, TAG_STTD, "[Recorder] Focus released as interrupt");
/* NOTE(review): the statement guarded by this check is not visible here; presumably it invokes g_interrupt_cb. */
110 if (NULL != g_interrupt_cb) {
/*
 * Prepares the recorder module: stores the two callbacks, resets module
 * state and creates the voice-recognition stream info.
 *
 * audio_cb     : receives recorded buffers; must not be NULL.
 * interrupt_cb : consulted when recording focus is lost; must not be NULL.
 *
 * Returns STTD_ERROR_INVALID_PARAMETER when either callback is NULL and
 * STTD_ERROR_INVALID_STATE when the recorder state is not NONE.
 * NOTE(review): the success return value is not visible in this extract.
 */
117 int sttd_recorder_initialize(stt_recorder_audio_cb audio_cb, stt_recorder_interrupt_cb interrupt_cb)
119 if (NULL == audio_cb || NULL == interrupt_cb) {
120 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Input param is NOT valid");
121 return STTD_ERROR_INVALID_PARAMETER;
/* NOTE(review): the message says "recording" but the check fires for any state other than NONE (READY included). */
124 if (STTD_RECORDER_STATE_NONE != g_recorder_state) {
125 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Current state of recorder is recording");
126 return STTD_ERROR_INVALID_STATE;
/* A mutex init failure is only logged; no return is visible after the log line. */
129 if (0 != pthread_mutex_init(&sttd_audio_in_handle_mutex, NULL)) {
130 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to initialize audio in handle mutex.");
133 g_audio_cb = audio_cb;
134 g_interrupt_cb = interrupt_cb;
135 g_recorder_state = STTD_RECORDER_STATE_NONE;
/* -1 marks "no engine is recording". */
136 g_recording_engine_id = -1;
/* Register __recorder_focus_state_cb for focus changes on a voice-recognition stream; failure is only logged. */
138 if (0 != sound_manager_create_stream_information(SOUND_STREAM_TYPE_VOICE_RECOGNITION, __recorder_focus_state_cb, NULL, &g_stream_info_h)) {
139 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to create stream info");
/*
 * Tears the recorder module down: destroys the handle mutex and the stream
 * info, removes every recorder record from g_recorder_list while destroying
 * its audio input handle, and sets the state back to NONE.
 * Failures of the destroy calls are logged only.
 * NOTE(review): the return statement is not visible in this extract.
 */
145 int sttd_recorder_deinitialize()
147 if (0 != pthread_mutex_destroy(&sttd_audio_in_handle_mutex)) {
148 SLOG(LOG_ERROR, TAG_STTD, "[Server ERROR] Fail to destroy audio in handle mutex.");
151 if (0 != sound_manager_destroy_stream_information(g_stream_info_h)) {
152 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to destroy stream info");
155 /* Remove all recorder */
157 stt_recorder_s *recorder = NULL;
/* Always work on the current head of the list. */
159 iter = g_slist_nth(g_recorder_list, 0);
161 while (NULL != iter) {
162 recorder = iter->data;
/*
 * NOTE(review): in the visible lines a head node whose data is NULL is not
 * removed, so the head would never change and the loop would not end.
 * Confirm that NULL entries cannot occur. Freeing of the record itself is
 * also not visible in this extract.
 */
164 if (NULL != recorder) {
165 g_recorder_list = g_slist_remove(g_recorder_list, recorder);
166 audio_in_destroy(recorder->audio_h);
/* Re-read the head, which changed when the previous record was removed. */
171 iter = g_slist_nth(g_recorder_list, 0);
174 g_recorder_state = STTD_RECORDER_STATE_NONE;
/*
 * Walks g_recorder_list from the head looking for the record whose
 * engine_id equals the argument.
 * NOTE(review): the return statements are not visible in this extract;
 * callers compare the result against NULL, so presumably the match is
 * returned and NULL signals "not found".
 */
179 static stt_recorder_s* __get_recorder(int engine_id)
182 stt_recorder_s *recorder = NULL;
184 iter = g_slist_nth(g_recorder_list, 0);
186 while (NULL != iter) {
187 recorder = iter->data;
/* NOTE(review): recorder is dereferenced without a NULL check on the node's data. */
189 if (recorder->engine_id == engine_id) {
193 iter = g_slist_next(iter);
/* Takes no arguments and returns int. NOTE(review): the body is not visible in this extract, so its behaviour is unconfirmed. */
199 int sttd_recorder_set_audio_session()
/* Takes no arguments and returns int. NOTE(review): the body is not visible in this extract, so its behaviour is unconfirmed. */
204 int sttd_recorder_unset_audio_session()
/*
 * Creates an audio input handle for an engine and registers a recorder
 * record for it in g_recorder_list.
 *
 * engine_id   : key of the new record; must not already be registered.
 * uid         : NOTE(review): not referenced in the visible lines; presumably
 *               stored in the record, since __read_audio_func() reads recorder->uid.
 * type        : STT audio type; PCM_S16_LE and PCM_U8 are mapped to audio-io sample types.
 * channel     : 1 (mono) or 2 (stereo).
 * sample_rate : passed through to audio_in_create().
 *
 * Returns STTD_ERROR_INVALID_PARAMETER for a duplicate engine id,
 * STTD_ERROR_OPERATION_FAILED for an unsupported channel/type or a failed
 * audio_in_create(), and STTD_ERROR_OUT_OF_MEMORY when the record cannot
 * be allocated. NOTE(review): the success return is not visible here.
 */
209 int sttd_recorder_create(int engine_id, int uid, sttp_audio_type_e type, int channel, unsigned int sample_rate)
211 /* Check engine id is valid */
212 if (NULL != __get_recorder(engine_id)) {
213 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Engine id is already registered");
214 return STTD_ERROR_INVALID_PARAMETER;
217 audio_channel_e audio_ch;
218 audio_sample_type_e audio_type;
219 audio_in_h temp_in_h;
/* Translate the channel count into the audio-io channel constant. */
222 case 1: audio_ch = AUDIO_CHANNEL_MONO; break;
223 case 2: audio_ch = AUDIO_CHANNEL_STEREO; break;
225 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Input channel is not supported");
226 return STTD_ERROR_OPERATION_FAILED;
/* Translate the STT audio type into the audio-io sample type. */
231 case STTP_AUDIO_TYPE_PCM_S16_LE: audio_type = AUDIO_SAMPLE_TYPE_S16_LE; break;
232 case STTP_AUDIO_TYPE_PCM_U8: audio_type = AUDIO_SAMPLE_TYPE_U8; break;
234 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Invalid Audio Type");
235 return STTD_ERROR_OPERATION_FAILED;
240 ret = audio_in_create(sample_rate, audio_ch, audio_type, &temp_in_h);
241 if (AUDIO_IO_ERROR_NONE != ret) {
242 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to create audio handle : %d", ret);
243 return STTD_ERROR_OPERATION_FAILED;
246 stt_recorder_s* recorder;
247 recorder = (stt_recorder_s*)calloc(1, sizeof(stt_recorder_s));
248 if (NULL == recorder) {
/* Do not leak the audio handle created above when the record cannot be allocated. */
249 audio_in_destroy(temp_in_h);
250 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to allocate memory");
251 return STTD_ERROR_OUT_OF_MEMORY;
254 recorder->engine_id = engine_id;
256 recorder->audio_h = temp_in_h;
257 recorder->audio_type = type;
259 g_recorder_list = g_slist_append(g_recorder_list, recorder);
/* The module state becomes READY once a recorder exists. */
261 g_recorder_state = STTD_RECORDER_STATE_READY;
/*
 * Destroys the audio input handle of an engine and removes its record from
 * g_recorder_list, all while holding sttd_audio_in_handle_mutex.
 *
 * engine_id : key of the record to remove.
 *
 * Returns STTD_ERROR_INVALID_PARAMETER (after unlocking) when no record
 * matches. Failures of unprepare/destroy are logged only.
 * NOTE(review): freeing of the record and the success return are not
 * visible in this extract.
 */
266 int sttd_recorder_destroy(int engine_id)
268 // critical section required because this function can be called from stt engine thread context
269 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Enter critical section");
270 pthread_mutex_lock(&sttd_audio_in_handle_mutex);
272 /* Check engine id is valid */
273 stt_recorder_s* recorder;
274 recorder = __get_recorder(engine_id);
275 if (NULL == recorder) {
276 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Engine id is not valid");
/* Release the mutex on the early-exit path as well. */
277 pthread_mutex_unlock(&sttd_audio_in_handle_mutex);
278 return STTD_ERROR_INVALID_PARAMETER;
/* If a recording is in progress, unprepare the input first and fall back to READY. */
282 if (STTD_RECORDER_STATE_RECORDING == g_recorder_state) {
283 ret = audio_in_unprepare(recorder->audio_h);
284 if (AUDIO_IO_ERROR_NONE != ret) {
285 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to unprepare audioin : %d", ret);
288 g_recorder_state = STTD_RECORDER_STATE_READY;
291 ret = audio_in_destroy(recorder->audio_h);
292 if (AUDIO_IO_ERROR_NONE != ret) {
293 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to destroy audioin : %d", ret);
296 g_recorder_list = g_slist_remove(g_recorder_list, recorder);
300 pthread_mutex_unlock(&sttd_audio_in_handle_mutex);
301 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Leave critical section");
306 static float get_volume_decibel(char* data, int size, sttp_audio_type_e type)
308 #define MAX_AMPLITUDE_MEAN_16 32768
309 #define MAX_AMPLITUDE_MEAN_08 128
316 unsigned long long square_sum = 0;
318 if (type == STTP_AUDIO_TYPE_PCM_S16_LE)
323 for (i = 0; i < size; i += (depthByte<<1)) {
324 if (depthByte == 2) {
326 memcpy(&pcm16, data + i, sizeof(short));
327 square_sum += pcm16 * pcm16;
330 memcpy(&pcm8, data + i, sizeof(char));
331 square_sum += pcm8 * pcm8;
339 rms = sqrt(square_sum/count);
342 db = 20 * log10(rms/MAX_AMPLITUDE_MEAN_16);
344 db = 20 * log10(rms/MAX_AMPLITUDE_MEAN_08);
/*
 * Timer callback installed by sttd_recorder_start() via ecore_timer_add().
 * Each run reads one buffer from the recording engine's audio input, hands
 * it to g_audio_cb, periodically reports the volume to the client and logs
 * progress, and writes the buffer to the dump file.
 *
 * data : timer user data; not referenced in the visible lines.
 *
 * NOTE(review): the return statements (which decide whether the timer keeps
 * firing) are not visible in this extract.
 */
349 Eina_Bool __read_audio_func(void *data)
/* Static storage: the buffer is reused across timer ticks. */
352 static char g_buffer[BUFFER_LENGTH];
354 /* Check engine id is valid */
355 stt_recorder_s* recorder;
356 recorder = __get_recorder(g_recording_engine_id);
357 if (NULL == recorder) {
/* State READY here means recording was stopped between ticks. */
361 if (STTD_RECORDER_STATE_READY == g_recorder_state) {
362 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder] Exit audio reading func");
/* NOTE(review): the condition that classifies read_byte as a failure is not visible in this extract. */
366 read_byte = audio_in_read(recorder->audio_h, g_buffer, BUFFER_LENGTH);
368 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Fail to read audio : %d", read_byte);
369 g_recorder_state = STTD_RECORDER_STATE_READY;
/* A non-zero result from the consumer stops the recording. */
373 if (0 != g_audio_cb(g_buffer, read_byte)) {
374 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Fail audio callback");
375 sttd_recorder_stop(g_recording_engine_id);
/* Volume is sent when g_buffer_count is a multiple of 30. */
/* NOTE(review): the level is computed over BUFFER_LENGTH bytes rather than read_byte; confirm reads are always full. */
379 if (0 == g_buffer_count % 30) {
380 float vol_db = get_volume_decibel(g_buffer, BUFFER_LENGTH, recorder->audio_type);
381 if (0 != sttdc_send_set_volume(recorder->uid, vol_db)) {
382 SLOG(LOG_ERROR, TAG_STTD, "[Recorder] Fail to send recording volume(%f)", vol_db);
/* Progress is logged when g_buffer_count is a multiple of 50. */
387 if (0 == g_buffer_count % 50) {
388 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder][%d] Recording... : read_size(%d)", g_buffer_count, read_byte);
/* NOTE(review): the body of this check is not visible; presumably the counter is reset here. */
390 if (100000 == g_buffer_count) {
398 /* write pcm buffer */
/* NOTE(review): writes BUFFER_LENGTH bytes regardless of read_byte, and the fwrite result is not checked. */
399 fwrite(g_buffer, 1, BUFFER_LENGTH, g_pFile);
/*
 * Starts recording for an engine: acquires recording focus, attaches the
 * stream info to the engine's audio input, prepares the input and installs
 * the __read_audio_func timer. Also opens a PCM dump file under /tmp.
 *
 * engine_id : key of a record created by sttd_recorder_create().
 *
 * Returns STTD_ERROR_INVALID_PARAMETER when the engine id is unknown and
 * STTD_ERROR_RECORDER_BUSY when audio_in_prepare() fails.
 * NOTE(review): the action taken when already RECORDING and the success
 * return are not visible in this extract.
 */
405 int sttd_recorder_start(int engine_id)
407 if (STTD_RECORDER_STATE_RECORDING == g_recorder_state)
410 /* Check engine id is valid */
411 stt_recorder_s* recorder;
412 recorder = __get_recorder(engine_id);
413 if (NULL == recorder) {
414 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Engine id is not valid");
415 return STTD_ERROR_INVALID_PARAMETER;
/* Focus acquisition failure is logged; no return is visible after the log line. */
419 ret = sound_manager_acquire_focus(g_stream_info_h, SOUND_STREAM_FOCUS_FOR_RECORDING, NULL);
420 if (SOUND_MANAGER_ERROR_NONE != ret) {
421 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to acquire focus : %d", ret);
423 ret = audio_in_set_stream_info(recorder->audio_h, g_stream_info_h);
424 if (AUDIO_IO_ERROR_NONE != ret) {
425 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to set stream info");
/* NOTE(review): on this failure path the focus acquired above is not released before returning. */
429 ret = audio_in_prepare(recorder->audio_h);
430 if (AUDIO_IO_ERROR_NONE != ret) {
431 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to start audio : %d", ret);
432 return STTD_ERROR_RECORDER_BUSY;
435 /* Add ecore timer to read audio data */
/* Interval 0; the returned timer handle is not kept. */
436 ecore_timer_add(0, __read_audio_func, NULL);
438 g_recorder_state = STTD_RECORDER_STATE_RECORDING;
439 g_recording_engine_id = engine_id;
/* Dump file name is built from the process id and g_count. */
446 snprintf(g_temp_file_name, sizeof(g_temp_file_name), "/tmp/stt_temp_%d_%d", getpid(), g_count);
447 SECURE_SLOG(LOG_DEBUG, TAG_STTD, "[Recorder] Temp file name=[%s]", g_temp_file_name);
/* NOTE(review): the check guarding the error log below is not visible; presumably it tests g_pFile for NULL. */
450 g_pFile = fopen(g_temp_file_name, "wb+");
452 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] File not found!");
/*
 * Stops recording for an engine: unprepares its audio input, sets the state
 * back to READY, clears the recording engine id and releases recording focus.
 *
 * engine_id : key of a record created by sttd_recorder_create().
 *
 * Returns STTD_ERROR_INVALID_PARAMETER when the engine id is unknown.
 * Failures of unprepare and focus release are logged only.
 * NOTE(review): the action taken when already READY and the end of the
 * function (including the success return) are not visible in this extract.
 */
460 int sttd_recorder_stop(int engine_id)
462 if (STTD_RECORDER_STATE_READY == g_recorder_state)
465 /* Check engine id is valid */
466 stt_recorder_s* recorder;
467 recorder = __get_recorder(engine_id);
468 if (NULL == recorder) {
469 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Engine id is not valid");
470 return STTD_ERROR_INVALID_PARAMETER;
474 ret = audio_in_unprepare(recorder->audio_h);
475 if (AUDIO_IO_ERROR_NONE != ret) {
476 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to unprepare audioin : %d", ret);
/* State and engine id are reset even when unprepare reported an error. */
479 g_recorder_state = STTD_RECORDER_STATE_READY;
480 g_recording_engine_id = -1;
/* Give back the recording focus taken in sttd_recorder_start(). */
482 ret = sound_manager_release_focus(g_stream_info_h, SOUND_STREAM_FOCUS_FOR_RECORDING, NULL);
483 if (SOUND_MANAGER_ERROR_NONE != ret) {
484 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to release focus :%d", ret);