2 * Copyright (c) 2011-2016 Samsung Electronics Co., Ltd All Rights Reserved
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at
6 * http://www.apache.org/licenses/LICENSE-2.0
7 * Unless required by applicable law or agreed to in writing, software
8 * distributed under the License is distributed on an "AS IS" BASIS,
9 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
10 * See the License for the specific language governing permissions and
11 * limitations under the License.
22 #include <sound_manager.h>
23 #include <sound_manager_internal.h>
25 #include <bluetooth_product.h>
29 #include "sttd_dbus.h"
30 #include "sttd_recorder.h"
31 #include "sttd_main.h"
/* Length of one audio frame. NOTE(review): the unit (samples vs. bytes) is
 * inferred from the "* 2" below - confirm. */
#define FRAME_LENGTH 320
/* Size in bytes of the char buffers used for one audio read. The expansion is
 * parenthesized so the macro behaves as a single value inside larger
 * expressions (e.g. x / BUFFER_LENGTH or BUFFER_LENGTH % n). */
#define BUFFER_LENGTH (FRAME_LENGTH * 2)
/* Mutex taken by sttd_recorder_destroy() and sttd_recorder_stop() while they
 * operate on the recorder and its audio-in handle. */
37 static pthread_mutex_t sttd_audio_in_handle_mutex = PTHREAD_MUTEX_INITIALIZER;
/* Ecore timer that runs __read_audio_func(); added in sttd_recorder_start()
 * and deleted in sttd_recorder_stop(). NULL when no timer is registered. */
39 static Ecore_Timer* g_audio_timer = NULL;
/* Recorder life-cycle states.
 * NOTE(review): the opening line of this enum declaration is not visible in
 * this excerpt. */
/* Initial value of g_recorder_state; also set again by sttd_recorder_deinitialize(). */
42 STTD_RECORDER_STATE_NONE = -1,
43 STTD_RECORDER_STATE_READY = 0, /**< Recorder is ready to start */
44 STTD_RECORDER_STATE_RECORDING /**< In the middle of recording */
45 } sttd_recorder_state;
/* Sample format of the recorder; written by sttd_recorder_create() and passed
 * to get_volume_decibel(). Accessed as g_recorder->audio_type, so this is a
 * member of stt_recorder_s.
 * NOTE(review): the rest of the struct declaration (e.g. the audio_h and uid
 * members used elsewhere) is not visible in this excerpt. */
50 stte_audio_type_e audio_type;
/* The single recorder instance; allocated by sttd_recorder_create(), NULL when
 * no recorder exists. */
53 static stt_recorder_s* g_recorder = NULL;
/* Callback that receives each captured audio buffer; set in sttd_recorder_initialize(). */
55 static stt_recorder_audio_cb g_audio_cb;
/* Sound stream info created in sttd_recorder_initialize(), attached to the
 * audio-in handle in sttd_recorder_start() and destroyed in
 * sttd_recorder_deinitialize(). */
57 static sound_stream_info_h g_stream_info_h;
/* Interrupt callback stored by sttd_recorder_initialize() and checked in
 * __recorder_focus_state_watch_cb(). */
59 static stt_recorder_interrupt_cb g_interrupt_cb;
/* Current life-cycle state of the recorder. */
61 static sttd_recorder_state g_recorder_state = STTD_RECORDER_STATE_NONE;
/* Buffer counter consulted to throttle progress logging and volume updates.
 * NOTE(review): where it is incremented/reset is not visible in this excerpt. */
63 static int g_buffer_count;
/* Id of the focus watch callback registered in sttd_recorder_initialize() and
 * removed in sttd_recorder_deinitialize(). */
65 static int g_stream_focus_id;
67 /* Sound buf save for test */
/* Path of the PCM dump file; formatted in sttd_recorder_start(). */
72 static char g_temp_file_name[128] = {'\0',};
/* Number used as the last component of the dump file name. */
76 static int g_count = 1;
/* Forward declaration: the function is defined further down in this file but
 * is already called by the Bluetooth audio callback above its definition. */
80 static float get_volume_decibel(char* data, int size, stte_audio_type_e type);
82 //static stt_recorder_s* __get_recorder(int engine_id);
/* NOTE(review): neither macro is referenced in the visible code; presumably
 * command codes for the Bluetooth smart-control remote - confirm or remove. */
84 #define SMART_CONTROL_EXTEND_CMD 0x03
85 #define SMART_CONTROL_START_CMD 0x04
/*
 * Bluetooth HID host state callback, registered through
 * bt_hid_host_initialize() in sttd_recorder_initialize().
 * The visible body only logs the result code and the remote address;
 * connected and user_data are not referenced in the visible line.
 */
87 static void _bt_cb_hid_state_changed(int result, bool connected, const char *remote_address, void *user_data)
89 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder] Bluetooth Event [%d] Received address [%s]", result, remote_address);
/*
 * Bluetooth HID voice-data callback, registered through
 * bt_hid_set_audio_data_receive_cb() in sttd_recorder_create().
 * Hands the received chunk to g_audio_cb, reports the chunk's volume to the
 * client and logs progress.
 *
 * voice_data: incoming chunk; its audio_buf and length members are read here.
 * user_data:  not referenced in the visible lines.
 */
92 static void _bt_hid_audio_data_receive_cb(bt_hid_voice_data_s *voice_data, void *user_data)
/* Data arriving while the recorder is not RECORDING takes this branch;
 * presumably an early return (the branch body is not visible here). */
94 if (STTD_RECORDER_STATE_RECORDING != g_recorder_state) {
95 /* SLOG(LOG_DEBUG, TAG_STTD, "[Recorder] Exit audio reading normal func"); */
99 if (NULL != g_audio_cb) {
/* A non-zero result from the audio callback is logged as a read failure and
 * the recorder is stopped. */
100 if (0 != g_audio_cb((void*)voice_data->audio_buf, (unsigned int)voice_data->length)) {
101 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to read audio");
102 sttd_recorder_stop();
/* g_recorder is re-checked before it is dereferenced below. */
105 if (NULL == g_recorder) {
/* Compute the level of this chunk and send it to the client identified by
 * g_recorder->uid; a send failure is only logged. */
109 float vol_db = get_volume_decibel((char*)voice_data->audio_buf, (int)voice_data->length, g_recorder->audio_type);
110 if (0 != sttdc_send_set_volume(g_recorder->uid, vol_db)) {
111 SLOG(LOG_ERROR, TAG_STTD, "[Recorder] Fail to send recording volume(%f)", vol_db);
/* Progress log for the first buffer and every 50th buffer after it. */
115 if (0 == g_buffer_count || 0 == g_buffer_count % 50) {
116 SLOG(LOG_WARN, TAG_STTD, "[Recorder][%d] Recording... : read_size(%d)", g_buffer_count, voice_data->length);
/* NOTE(review): the body of this branch is not visible; presumably the
 * counter is wrapped here - confirm. */
118 if (100000 == g_buffer_count) {
126 /* write pcm buffer */
/* NOTE(review): data and len are not declared in any visible line of this
 * function; voice_data->audio_buf and voice_data->length look like the
 * intended arguments - confirm this line builds when the dump code is enabled. */
127 fwrite(data, 1, len, g_pFile);
/*
 * Map a sound_stream_focus_change_reason_e value to a printable name for
 * logging.
 *
 * reason: focus change reason reported by the sound manager.
 *
 * Returns a string literal with the enumerator's name, or
 * "Undefined reason code" for any value without a case below.
 */
134 const char* __stt_get_focus_changed_reason_code(sound_stream_focus_change_reason_e reason)
137 case SOUND_STREAM_FOCUS_CHANGED_BY_MEDIA: return "SOUND_STREAM_FOCUS_CHANGED_BY_MEDIA";
138 case SOUND_STREAM_FOCUS_CHANGED_BY_SYSTEM: return "SOUND_STREAM_FOCUS_CHANGED_BY_SYSTEM";
139 case SOUND_STREAM_FOCUS_CHANGED_BY_ALARM: return "SOUND_STREAM_FOCUS_CHANGED_BY_ALARM";
140 case SOUND_STREAM_FOCUS_CHANGED_BY_NOTIFICATION: return "SOUND_STREAM_FOCUS_CHANGED_BY_NOTIFICATION";
141 case SOUND_STREAM_FOCUS_CHANGED_BY_EMERGENCY: return "SOUND_STREAM_FOCUS_CHANGED_BY_EMERGENCY";
142 case SOUND_STREAM_FOCUS_CHANGED_BY_VOICE_INFORMATION: return "SOUND_STREAM_FOCUS_CHANGED_BY_VOICE_INFORMATION";
143 case SOUND_STREAM_FOCUS_CHANGED_BY_VOICE_RECOGNITION: return "SOUND_STREAM_FOCUS_CHANGED_BY_VOICE_RECOGNITION";
144 case SOUND_STREAM_FOCUS_CHANGED_BY_RINGTONE: return "SOUND_STREAM_FOCUS_CHANGED_BY_RINGTONE";
145 case SOUND_STREAM_FOCUS_CHANGED_BY_VOIP: return "SOUND_STREAM_FOCUS_CHANGED_BY_VOIP";
146 case SOUND_STREAM_FOCUS_CHANGED_BY_CALL: return "SOUND_STREAM_FOCUS_CHANGED_BY_CALL";
147 case SOUND_STREAM_FOCUS_CHANGED_BY_MEDIA_EXTERNAL_ONLY: return "SOUND_STREAM_FOCUS_CHANGED_BY_MEDIA_EXTERNAL_ONLY";
148 default: return "Undefined reason code";
/*
 * Focus watch callback, registered through
 * sound_manager_add_focus_state_watch_cb() in sttd_recorder_initialize().
 * Logs every notification; when it reports an ACQUIRED focus state while the
 * recorder is RECORDING, the event is treated as an interruption.
 *
 * Only focus_state and reason are read in the visible lines; id, focus_mask,
 * extra_info and user_data are not referenced there.
 */
152 void __recorder_focus_state_watch_cb(int id, sound_stream_focus_mask_e focus_mask, sound_stream_focus_state_e focus_state,
153 sound_stream_focus_change_reason_e reason, const char *extra_info, void *user_data)
155 SLOG(LOG_WARN, TAG_STTD, "[Recorder] focus_state_watch_cb is called, focus_state(%d), reason(%s)", (int)focus_state, __stt_get_focus_changed_reason_code(reason));
/* NOTE(review): the condition tests ACQUIRED while the message says
 * "released"; presumably a watch callback reports another stream acquiring
 * focus, which means this recorder loses it - confirm against the sound
 * manager documentation. */
157 if (STTD_RECORDER_STATE_RECORDING == g_recorder_state && SOUND_STREAM_FOCUS_STATE_ACQUIRED == focus_state) {
158 SLOG(LOG_WARN, TAG_STTD, "[Recorder] Focus released as interrupt");
/* The action taken when an interrupt callback is set is not visible in this
 * excerpt; presumably g_interrupt_cb is invoked. */
159 if (NULL != g_interrupt_cb) {
/*
 * Set up the recorder module: store the audio and interrupt callbacks, create
 * the voice-recognition stream info, register the focus watch callback and
 * initialize the Bluetooth product/HID host layers.
 *
 * audio_cb:     callback that will receive captured audio; must not be NULL.
 * interrupt_cb: callback stored in g_interrupt_cb; must not be NULL.
 *
 * Returns STTD_ERROR_INVALID_PARAMETER when either callback is NULL,
 * STTD_ERROR_INVALID_STATE when the state is not STTD_RECORDER_STATE_NONE and
 * STTD_ERROR_OPERATION_FAILED when a Bluetooth initialization step fails.
 * The success return is not visible in this excerpt.
 */
165 int sttd_recorder_initialize(stt_recorder_audio_cb audio_cb, stt_recorder_interrupt_cb interrupt_cb)
167 if (NULL == audio_cb || NULL == interrupt_cb) {
168 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Input param is NOT valid");
169 return STTD_ERROR_INVALID_PARAMETER;
/* NOTE(review): this rejects every state other than NONE, although the log
 * message only mentions "recording". */
172 if (STTD_RECORDER_STATE_NONE != g_recorder_state) {
173 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Current state of recorder is recording");
174 return STTD_ERROR_INVALID_STATE;
/* NOTE(review): the mutex is already initialized statically with
 * PTHREAD_MUTEX_INITIALIZER at its definition; initializing it again here
 * should be confirmed as intended. A failure is only logged. */
177 if (0 != pthread_mutex_init(&sttd_audio_in_handle_mutex, NULL)) {
178 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to initialize audio in handle mutex.");
181 g_audio_cb = audio_cb;
182 g_interrupt_cb = interrupt_cb;
/* The state is already NONE at this point because of the check above. */
183 g_recorder_state = STTD_RECORDER_STATE_NONE;
/* Failures of the two sound manager calls below are logged; no return is
 * visible for them in this excerpt. */
186 if (0 != sound_manager_create_stream_information_internal(SOUND_STREAM_TYPE_VOICE_RECOGNITION_SERVICE, NULL, NULL, &g_stream_info_h)) {
187 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to create stream info");
190 if (0 != sound_manager_add_focus_state_watch_cb(SOUND_STREAM_FOCUS_FOR_BOTH, __recorder_focus_state_watch_cb, NULL, &g_stream_focus_id)) {
191 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to add focus state watch callback");
/* NOTE(review): the early returns below happen after the stream info and the
 * focus watch callback were set up; no cleanup of those is visible here. */
195 if (BT_ERROR_NONE != bt_product_init()) {
196 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to init bt");
197 return STTD_ERROR_OPERATION_FAILED;
200 if (BT_ERROR_NONE != bt_hid_host_initialize(_bt_cb_hid_state_changed, NULL)) {
201 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail bt_hid_host_initialize()");
202 return STTD_ERROR_OPERATION_FAILED;
/*
 * Tear down the recorder module: destroy the mutex, remove the focus watch
 * callback, destroy the stream info, destroy the recorder's audio-in handle,
 * deinitialize the Bluetooth HID host and reset the state to
 * STTD_RECORDER_STATE_NONE. Failures of the first three steps are logged and
 * no early return is visible for them.
 * The return statement is not visible in this excerpt.
 */
209 int sttd_recorder_deinitialize()
211 if (0 != pthread_mutex_destroy(&sttd_audio_in_handle_mutex)) {
212 SLOG(LOG_ERROR, TAG_STTD, "[Server ERROR] Fail to destroy audio in handle mutex.");
215 if (0 != sound_manager_remove_focus_state_watch_cb(g_stream_focus_id)) {
216 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to remove focus state watch callback");
219 if (0 != sound_manager_destroy_stream_information(g_stream_info_h)) {
220 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to destroy stream info");
/* NOTE(review): the audio handle is destroyed here; whether g_recorder itself
 * is freed and reset afterwards is not visible in this excerpt. */
223 if (NULL != g_recorder) {
224 audio_in_destroy(g_recorder->audio_h);
225 g_recorder->audio_h = NULL;
/* Compiled only when __UNUSED_CODES__ is defined: repeatedly takes the first
 * element of g_recorder_list, removes it from the list and destroys its
 * audio-in handle. */
230 #ifdef __UNUSED_CODES__
231 /* Remove all recorder */
233 stt_recorder_s *recorder = NULL;
235 iter = g_slist_nth(g_recorder_list, 0);
237 while (NULL != iter) {
238 recorder = iter->data;
240 if (NULL != recorder) {
241 g_recorder_list = g_slist_remove(g_recorder_list, recorder);
242 if (recorder->audio_h) {
243 audio_in_destroy(recorder->audio_h);
244 recorder->audio_h = NULL;
249 iter = g_slist_nth(g_recorder_list, 0);
254 bt_hid_host_deinitialize();
259 g_recorder_state = STTD_RECORDER_STATE_NONE;
/* NOTE(review): only the signature is visible in this excerpt; the body (and
 * therefore the behaviour and return value) cannot be documented from here. */
264 int sttd_recorder_set_audio_session()
/* NOTE(review): only the signature is visible in this excerpt; the body (and
 * therefore the behaviour and return value) cannot be documented from here. */
269 int sttd_recorder_unset_audio_session()
/*
 * Create the single recorder instance: open an audio-in handle, register the
 * Bluetooth voice-data callback and allocate the recorder record.
 *
 * type:        STT engine sample format; PCM_S16_LE and PCM_U8 are mapped to
 *              the corresponding audio_io sample types.
 * channel:     presumably the value switched on for the 1 (mono) / 2 (stereo)
 *              cases below; the switch header is not visible - confirm.
 * sample_rate: passed to audio_in_create().
 *
 * On the visible success path g_recorder holds the new audio-in handle and
 * the state becomes STTD_RECORDER_STATE_READY.
 * Returns STTD_ERROR_INVALID_PARAMETER when a recorder already exists,
 * STTD_ERROR_OPERATION_FAILED for an unsupported channel or sample type or
 * when audio_in_create() / bt_hid_set_audio_data_receive_cb() fail, and
 * STTD_ERROR_OUT_OF_MEMORY when the allocation fails. The success return is
 * not visible in this excerpt.
 */
274 int sttd_recorder_create(stte_audio_type_e type, int channel, unsigned int sample_rate)
276 /* Check engine id is valid */
277 if (NULL != g_recorder) {
278 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Engine id is already registered");
279 return STTD_ERROR_INVALID_PARAMETER;
282 audio_in_h temp_in_h = NULL;
285 audio_channel_e audio_ch;
286 audio_sample_type_e audio_type;
289 case 1: audio_ch = AUDIO_CHANNEL_MONO; break;
290 case 2: audio_ch = AUDIO_CHANNEL_STEREO; break;
292 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Input channel is not supported");
293 return STTD_ERROR_OPERATION_FAILED;
298 case STTE_AUDIO_TYPE_PCM_S16_LE: audio_type = AUDIO_SAMPLE_TYPE_S16_LE; break;
299 case STTE_AUDIO_TYPE_PCM_U8: audio_type = AUDIO_SAMPLE_TYPE_U8; break;
301 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Invalid Audio Type");
302 return STTD_ERROR_OPERATION_FAILED;
307 ret = audio_in_create(sample_rate, audio_ch, audio_type, &temp_in_h);
308 if (AUDIO_IO_ERROR_NONE != ret) {
309 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to create audio handle : %d", ret);
310 return STTD_ERROR_OPERATION_FAILED;
/* NOTE(review): temp_in_h has been created at this point, but no
 * audio_in_destroy() is visible on this failure path - possible handle leak,
 * confirm. */
313 if (BT_ERROR_NONE != bt_hid_set_audio_data_receive_cb(_bt_hid_audio_data_receive_cb, NULL)) {
314 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail bt_hid_set_audio_data_receive_cb()");
315 return STTD_ERROR_OPERATION_FAILED;
319 stt_recorder_s* recorder;
/* calloc() zero-fills the record, so members not assigned below start at 0. */
320 recorder = (stt_recorder_s*)calloc(1, sizeof(stt_recorder_s));
321 if (NULL == recorder) {
/* Release the audio-in handle created above before reporting the failure. */
324 audio_in_destroy(temp_in_h);
328 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to allocate memory");
329 return STTD_ERROR_OUT_OF_MEMORY;
333 recorder->audio_h = temp_in_h;
334 recorder->audio_type = type;
336 g_recorder = recorder;
338 g_recorder_state = STTD_RECORDER_STATE_READY;
/*
 * Destroy the recorder created by sttd_recorder_create(). The work is done
 * while holding sttd_audio_in_handle_mutex. If the recorder is still
 * RECORDING the audio-in handle is unprepared first; then the handle is
 * destroyed and the Bluetooth voice-data callback is unset.
 *
 * Returns STTD_ERROR_INVALID_PARAMETER when no recorder exists. Freeing of
 * g_recorder and the success return are not visible in this excerpt.
 */
343 int sttd_recorder_destroy()
345 // critical section required because this function can be called from stt engine thread context
346 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Enter critical section");
347 pthread_mutex_lock(&sttd_audio_in_handle_mutex);
349 /* Check engine id is valid */
350 if (NULL == g_recorder) {
351 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Engine id is not valid");
/* Release the mutex before the early return. */
352 pthread_mutex_unlock(&sttd_audio_in_handle_mutex);
353 return STTD_ERROR_INVALID_PARAMETER;
/* Stop an ongoing capture; an unprepare failure is only logged. */
358 if (STTD_RECORDER_STATE_RECORDING == g_recorder_state) {
359 if (g_recorder->audio_h) {
360 ret = audio_in_unprepare(g_recorder->audio_h);
361 if (AUDIO_IO_ERROR_NONE != ret) {
362 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to unprepare audioin : %d", ret);
366 g_recorder_state = STTD_RECORDER_STATE_READY;
/* Destroy the handle; a failure is only logged and the pointer is cleared. */
369 if (g_recorder->audio_h) {
370 ret = audio_in_destroy(g_recorder->audio_h);
371 if (AUDIO_IO_ERROR_NONE != ret) {
372 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to destroy audioin : %d", ret);
374 g_recorder->audio_h = NULL;
/* NOTE(review): the state was already tested for RECORDING above; whether
 * this second check sits in a separate conditional-compilation branch is not
 * visible in this excerpt. */
378 if (STTD_RECORDER_STATE_RECORDING == g_recorder_state) {
379 g_recorder_state = STTD_RECORDER_STATE_READY;
382 bt_hid_unset_audio_data_receive_cb();
388 pthread_mutex_unlock(&sttd_audio_in_handle_mutex);
389 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Leave critical section");
/*
 * Estimate the level of a PCM buffer in decibels: the root mean square of the
 * visited samples is divided by the maximum amplitude of the sample format
 * and converted with 20 * log10().
 *
 * data: raw sample bytes.
 * size: number of bytes of data to consider.
 * type: sample format; STTE_AUDIO_TYPE_PCM_S16_LE selects the first branch
 *       below (its body is not visible; presumably depthByte = 2, otherwise 1
 *       - confirm).
 *
 * The declarations of i, depthByte, count, rms and db, the handling of an
 * empty buffer and the return statement are not visible in this excerpt.
 */
394 float get_volume_decibel(char* data, int size, stte_audio_type_e type)
/* Maximum sample magnitudes used as the 0 dB reference for 16-bit and 8-bit data. */
396 #define MAX_AMPLITUDE_MEAN_16 32768
397 #define MAX_AMPLITUDE_MEAN_08 128
404 unsigned long long square_sum = 0;
406 if (type == STTE_AUDIO_TYPE_PCM_S16_LE)
/* The index advances by twice the sample width, so only every second sample
 * position is visited.
 * NOTE(review): for 16-bit data the memcpy below reads sizeof(short) bytes at
 * data + i; if size leaves a single trailing byte at a visited position this
 * reads one byte past size - confirm callers never pass such sizes. */
411 for (i = 0; i < size; i += (depthByte<<1)) {
412 if (depthByte == 2) {
/* memcpy avoids an unaligned or aliasing access to the byte buffer. */
414 memcpy(&pcm16, data + i, sizeof(short));
415 square_sum += pcm16 * pcm16;
418 memcpy(&pcm8, data + i, sizeof(char));
419 square_sum += pcm8 * pcm8;
/* NOTE(review): count is presumably the number of visited samples; a guard
 * against count == 0 is not visible here - confirm. */
427 rms = sqrt((double)square_sum/count);
430 db = 20 * log10(rms/MAX_AMPLITUDE_MEAN_16);
432 db = 20 * log10(rms/MAX_AMPLITUDE_MEAN_08);
/*
 * Ecore timer callback added by sttd_recorder_start(). Each call reads one
 * buffer from the audio-in handle, passes it to g_audio_cb, and periodically
 * sends the buffer's volume to the client and logs progress.
 *
 * data: timer user data; not referenced in the visible lines.
 *
 * The Eina_Bool return values (which decide whether the timer keeps running)
 * are not visible in this excerpt.
 */
438 Eina_Bool __read_audio_func(void *data)
/* Static buffer reused across timer invocations. */
441 static char g_buffer[BUFFER_LENGTH];
443 /* Check engine id is valid */
444 if (NULL == g_recorder) {
/* A READY state means recording was stopped; this branch logs the exit. */
448 if (STTD_RECORDER_STATE_READY == g_recorder_state) {
449 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder] Exit audio reading func");
453 read_byte = audio_in_read(g_recorder->audio_h, g_buffer, BUFFER_LENGTH);
/* Read failure path (the condition line is not visible): log and fall back
 * to the READY state. */
455 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Fail to read audio : %d", read_byte);
456 g_recorder_state = STTD_RECORDER_STATE_READY;
/* A non-zero result from the audio callback stops the recorder. */
460 if (0 != g_audio_cb(g_buffer, read_byte)) {
461 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Fail audio callback");
462 sttd_recorder_stop();
/* The audio callback may have led to the recorder being destroyed, so
 * g_recorder is checked again before it is used. */
466 if (NULL == g_recorder)
467 SLOG(LOG_WARN, TAG_STTD, "[Recorder] g_recorder is NULL. It is already stopped and destroyed.");
/* Volume is reported on every 30th buffer.
 * NOTE(review): the level is computed over BUFFER_LENGTH bytes although only
 * read_byte bytes were just read - confirm whether read_byte was intended. */
469 if (0 == g_buffer_count % 30 && NULL != g_recorder) {
470 float vol_db = get_volume_decibel(g_buffer, BUFFER_LENGTH, g_recorder->audio_type);
471 if (0 != sttdc_send_set_volume(g_recorder->uid, vol_db)) {
472 SLOG(LOG_ERROR, TAG_STTD, "[Recorder] Fail to send recording volume(%f)", vol_db);
/* Progress log on every 50th buffer. */
477 if (0 == g_buffer_count % 50) {
478 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder][%d] Recording... : read_size(%d)", g_buffer_count, read_byte);
/* NOTE(review): branch body not visible; presumably the counter is wrapped
 * here - confirm. */
480 if (100000 == g_buffer_count) {
488 /* write pcm buffer */
/* NOTE(review): writes BUFFER_LENGTH bytes rather than read_byte, and the
 * fwrite result is not checked in the visible line. */
489 fwrite(g_buffer, 1, BUFFER_LENGTH, g_pFile);
/*
 * Start capturing audio for a client: attach the stream info to the audio-in
 * handle, prepare the handle, (re)create the Ecore timer that runs
 * __read_audio_func(), switch to the RECORDING state and remember the client.
 *
 * uid: client id stored in g_recorder->uid.
 *
 * Returns STTD_ERROR_INVALID_PARAMETER when no recorder exists,
 * STTD_ERROR_RECORDER_BUSY when audio_in_prepare() fails and
 * STTD_ERROR_OPERATION_FAILED when the timer cannot be created. The result
 * for an already-recording recorder and the success return are not visible
 * in this excerpt.
 */
496 int sttd_recorder_start(int uid)
498 if (STTD_RECORDER_STATE_RECORDING == g_recorder_state)
503 /* Check engine id is valid */
504 if (NULL == g_recorder) {
505 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Engine id is not valid");
506 return STTD_ERROR_INVALID_PARAMETER;
/* A failure to set the stream info is logged; no return is visible for it. */
509 ret = audio_in_set_sound_stream_info(g_recorder->audio_h, g_stream_info_h);
510 if (AUDIO_IO_ERROR_NONE != ret) {
511 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to set stream info");
514 ret = audio_in_prepare(g_recorder->audio_h);
515 if (AUDIO_IO_ERROR_NONE != ret) {
516 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to start audio : %d", ret);
517 return STTD_ERROR_RECORDER_BUSY;
520 /* Add ecore timer to read audio data */
/* Drop a timer left over from an earlier start before adding a new one. */
521 if (NULL != g_audio_timer) {
522 ecore_timer_del(g_audio_timer);
523 g_audio_timer = NULL;
526 g_audio_timer = ecore_timer_add(0, __read_audio_func, NULL);
/* NOTE(review): the handle was prepared above, but no audio_in_unprepare()
 * is visible on this failure path - confirm. */
527 if (NULL == g_audio_timer) {
528 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Fail to create timer of read_audio");
529 return STTD_ERROR_OPERATION_FAILED;
533 g_recorder_state = STTD_RECORDER_STATE_RECORDING;
534 g_recorder->uid = uid;
/* PCM dump support: build a per-process file name, remove a stale file of
 * that name and open a new one.
 * NOTE(review): the conditional-compilation guard around this part is not
 * visible in this excerpt. */
542 snprintf(g_temp_file_name, sizeof(g_temp_file_name), "/tmp/stt_temp_%d_%d", getpid(), g_count);
543 ret = access(g_temp_file_name, 0);
546 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] File is already exist");
547 if (0 == remove(g_temp_file_name)) {
548 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder] Remove file");
558 SECURE_SLOG(LOG_DEBUG, TAG_STTD, "[Recorder] Temp file name=[%s]", g_temp_file_name);
/* NOTE(review): "wb+x" is the C11 exclusive-create mode; the log text below
 * ("File not found!") does not describe a failed create - confirm wording. */
561 g_pFile = fopen(g_temp_file_name, "wb+x");
563 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] File not found!");
/*
 * Stop an ongoing recording while holding sttd_audio_in_handle_mutex: clear
 * the client id, delete the read timer, unprepare the audio-in handle, ask
 * the Bluetooth remote to stop sending voice data and switch to the READY
 * state.
 *
 * Returns STTD_ERROR_INVALID_PARAMETER when no recorder exists. The result
 * for an already-READY recorder and the success return are not visible in
 * this excerpt.
 */
571 int sttd_recorder_stop()
/* Checked before the mutex is taken; presumably an early return (the branch
 * body is not visible here). */
573 if (STTD_RECORDER_STATE_READY == g_recorder_state)
576 // critical section required because this function can be called from stt engine thread context
577 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Enter critical section");
578 pthread_mutex_lock(&sttd_audio_in_handle_mutex);
580 /* Check engine id is valid */
581 if (NULL == g_recorder) {
582 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Engine id is not valid");
/* Release the mutex before the early return. */
583 pthread_mutex_unlock(&sttd_audio_in_handle_mutex);
584 return STTD_ERROR_INVALID_PARAMETER;
587 g_recorder->uid = -1;
591 if (NULL != g_audio_timer) {
592 ecore_timer_del(g_audio_timer);
593 g_audio_timer = NULL;
/* An unprepare failure is logged; no return is visible for it. */
596 ret = audio_in_unprepare(g_recorder->audio_h);
597 if (AUDIO_IO_ERROR_NONE != ret) {
598 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to unprepare audioin : %d", ret);
/* Retry loop for stopping the Bluetooth voice stream, bounded by bt_retry < 5.
 * NOTE(review): the bt_retry declaration/increment, any delay between
 * attempts and the assignment of stopped are not visible in this excerpt. */
602 bool stopped = false;
603 while (5 > bt_retry) {
604 ret = bt_hid_rc_stop_sending_voice(NULL);
605 if (BT_ERROR_NONE == ret) {
606 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder] Stop bt audio");
609 } else if (BT_ERROR_NOW_IN_PROGRESS == ret) {
610 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail bt_hid_rc_stop_sending_voice()");
614 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] bt_hid_rc_stop_sending_voice(): ret(%d)", ret);
/* A failed Bluetooth stop is only logged; the return that would abort here
 * is commented out, so the function carries on to the READY state. */
618 if (false == stopped) {
619 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to stop bt audio(%d)", ret);
620 // return STTD_ERROR_OPERATION_FAILED;
624 g_recorder_state = STTD_RECORDER_STATE_READY;
629 pthread_mutex_unlock(&sttd_audio_in_handle_mutex);
630 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Leave critical section");
/*
 * Feed the contents of a PCM file to the audio callback instead of capturing
 * from a device: the file is read in BUFFER_LENGTH-byte chunks, each chunk is
 * passed to g_audio_cb, and volume/progress information is emitted along the
 * way.
 *
 * uid:      client id stored in g_recorder->uid.
 * filepath: path of the file opened with fopen(filepath, "rb").
 *
 * Returns STTD_ERROR_INVALID_PARAMETER when no recorder exists. The result
 * for an already-recording recorder, the handling of a file that cannot be
 * opened and the success return are not visible in this excerpt.
 */
635 int sttd_recorder_start_file(int uid, const char *filepath)
637 if (STTD_RECORDER_STATE_RECORDING == g_recorder_state)
640 /* Check engine id is valid */
641 if (NULL == g_recorder) {
642 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Engine id is not valid");
643 return STTD_ERROR_INVALID_PARAMETER;
645 g_recorder_state = STTD_RECORDER_STATE_RECORDING;
646 g_recorder->uid = uid;
649 int totalReadBytes = 0;
/* NOTE(review): no fclose(infile) is visible in this excerpt - confirm the
 * stream is closed on every path. */
651 FILE *infile = fopen(filepath, "rb");
654 if (infile != NULL) {
/* NOTE(review): feof() only becomes true after a read has hit end-of-file,
 * so the final iteration can see a zero-length read; the read_byte check
 * below covers that case. A read error (ferror) is not checked in the
 * visible lines. */
655 while (!feof(infile)) {
656 static char pcm_buff[BUFFER_LENGTH];
657 int read_byte = fread(pcm_buff, 1, BUFFER_LENGTH, infile);
658 totalReadBytes += read_byte;
659 if (0 != read_byte) {
660 if (0 != g_audio_cb(pcm_buff, read_byte)) {
661 SLOG(LOG_ERROR, TAG_STTD, "[Recorder ERROR] Fail to call audio callback");
/* NOTE(review): the level is computed over BUFFER_LENGTH bytes; after a
 * short final read the tail of pcm_buff still holds data from the previous
 * chunk - confirm whether read_byte was intended. */
666 float vol_db = get_volume_decibel(pcm_buff, BUFFER_LENGTH, g_recorder->audio_type);
667 if (0 != sttdc_send_set_volume(g_recorder->uid, vol_db)) {
668 SLOG(LOG_ERROR, TAG_STTD, "[Recorder] Fail to send recording volume(%f)", vol_db);
/* cnt is a chunk counter whose declaration and update are not visible here. */
674 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder][%d] Recording... : read_size(%d)", cnt, read_byte);
681 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder][%d] total bytes(%d)", cnt, totalReadBytes);
/*
 * Counterpart of sttd_recorder_start_file(): clears the client id and puts
 * the recorder back into the READY state. No audio-in handle, timer or
 * Bluetooth call is involved in the visible lines.
 *
 * Returns STTD_ERROR_INVALID_PARAMETER when no recorder exists. The result
 * for an already-READY recorder and the success return are not visible in
 * this excerpt.
 */
685 int sttd_recorder_stop_file()
687 if (STTD_RECORDER_STATE_READY == g_recorder_state)
690 /* Check engine id is valid */
691 if (NULL == g_recorder) {
692 SLOG(LOG_WARN, TAG_STTD, "[Recorder WARNING] Engine id is not valid");
693 return STTD_ERROR_INVALID_PARAMETER;
696 g_recorder->uid = -1;
697 g_recorder_state = STTD_RECORDER_STATE_READY;
/*
 * Bring the recorder down from whatever state it is in: stop it if it is
 * RECORDING, then destroy it if it is READY. The results of
 * sttd_recorder_stop() and sttd_recorder_destroy() are not checked in the
 * visible lines.
 *
 * Returns STTD_ERROR_NONE.
 */
702 int sttd_recorder_clear()
705 SLOG(LOG_DEBUG, TAG_STTD, "[Recorder DEBUG] Clear recorder on TV");
707 if (STTD_RECORDER_STATE_RECORDING == g_recorder_state) {
708 sttd_recorder_stop();
/* Evaluated after the stop above, so a recorder that was just stopped
 * (now READY) is destroyed in the same call. */
710 if (STTD_RECORDER_STATE_READY == g_recorder_state) {
711 sttd_recorder_destroy();
715 return STTD_ERROR_NONE;