ailia_speech  1.3.0.0
ailia_speech.h
[詳解]
1 
9 #ifndef INCLUDED_AILIA_SPEECH
10 #define INCLUDED_AILIA_SPEECH
11 
12 /* エラーコードと構造体 */
13 
14 #include "ailia.h"
15 #include "ailia_tokenizer.h"
16 
17 /* 呼び出し規約 */
18 
19 #if defined(_WIN64) || defined(_M_X64) || defined(__amd64__) || defined(__x86_64__) || defined(__APPLE__) || \
20  defined(__ANDROID__) || defined(ANDROID) || defined(__linux__) || defined(NN_NINTENDO_SDK)
21 #define AILIA_API
22 #else
23 #define AILIA_API __stdcall
24 #endif
25 
26 #ifdef __cplusplus
27 extern "C" {
28 #endif
29 
30 /****************************************************************
31  * モデルタイプ定義
32  **/
33 
43 #define AILIA_SPEECH_MODEL_TYPE_WHISPER_MULTILINGUAL_TINY (0)
44 
54 #define AILIA_SPEECH_MODEL_TYPE_WHISPER_MULTILINGUAL_BASE (1)
55 
65 #define AILIA_SPEECH_MODEL_TYPE_WHISPER_MULTILINGUAL_SMALL (2)
66 
76 #define AILIA_SPEECH_MODEL_TYPE_WHISPER_MULTILINGUAL_MEDIUM (3)
77 
87 #define AILIA_SPEECH_MODEL_TYPE_WHISPER_MULTILINGUAL_LARGE (4)
88 
98 #define AILIA_SPEECH_MODEL_TYPE_WHISPER_MULTILINGUAL_LARGE_V3 (5)
99 
100 /****************************************************************
101  * タスク定義
102  **/
103 
113 #define AILIA_SPEECH_TASK_TRANSCRIBE (0)
114 
124 #define AILIA_SPEECH_TASK_TRANSLATE (1)
125 
126 /****************************************************************
127  * 制約定義
128  **/
129 
139 #define AILIA_SPEECH_CONSTRAINT_CHARACTERS (0)
140 
150 #define AILIA_SPEECH_CONSTRAINT_WORDS (1)
151 
152 /****************************************************************
153  * フラグ定義
154  **/
155 
165 #define AILIA_SPEECH_FLAG_NONE (0)
166 
176 #define AILIA_SPEECH_FLAG_LIVE (1)
177 
178 /****************************************************************
179  * VAD定義
180  **/
181 
191 #define AILIA_SPEECH_VAD_TYPE_SILERO (0)
192 
193 /****************************************************************
194  * 辞書定義
195  **/
196 
206 #define AILIA_SPEECH_DICTIONARY_TYPE_REPLACE (0)
207 
208 /****************************************************************
209  * 後処理定義
210  **/
211 
221 #define AILIA_SPEECH_POST_PROCESS_TYPE_T5 (0)
222 
236 #define AILIA_SPEECH_POST_PROCESS_TYPE_FUGUMT_EN_JA (1)
237 
251 #define AILIA_SPEECH_POST_PROCESS_TYPE_FUGUMT_JA_EN (2)
252 
253 /****************************************************************
254  * APIコールバック定義
255  **/
256 
257 //接続が必要なAPI
258 
259 #if defined(_WIN32) && !defined(_WIN64)
260  #define AILIA_SPEECH_USER_API __stdcall
261 #else
262  #define AILIA_SPEECH_USER_API
263 #endif
264 
265 // ailia.audio API
267 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_AUDIO_GET_MEL_SPECTROGRAM)(void*, const void*, int, int, int, int, int, int, int, int, float, int, float, float, int, int, int);
268 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_AUDIO_RESAMPLE)(void*, const void*, int, int, int, int);
270 
271 // ailia.tokenizer API
272 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_CREATE)(struct AILIATokenizer** , int, int);
273 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_OPEN_MODEL_FILE_A)(struct AILIATokenizer* , const char *);
274 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_OPEN_MODEL_FILE_W)(struct AILIATokenizer* , const wchar_t *);
275 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_ENCODE)(struct AILIATokenizer* , const char *);
276 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TOKEN_COUNT)(struct AILIATokenizer* , unsigned int*);
277 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TOKENS)(struct AILIATokenizer* , int* , unsigned int);
278 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_DECODE)(struct AILIATokenizer* , const int *, unsigned int);
279 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TEXT_LENGTH)(struct AILIATokenizer* , unsigned int*);
280 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TEXT)(struct AILIATokenizer* , char* , unsigned int);
282 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_UTF8_TO_UTF32)(unsigned int* , unsigned int* , const char* , unsigned int);
283 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_TOKENIZER_UTF32_TO_UTF8)(char* , unsigned int* , unsigned int);
284 
285 // ailia API
286 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_CREATE)(struct AILIANetwork **, int, int);
287 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_FILE_A)(struct AILIANetwork *, const char *);
288 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_FILE_W)(struct AILIANetwork *, const wchar_t *);
289 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_MEM)(struct AILIANetwork *, const void *, unsigned int);
290 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_SET_MEMORY_MODE)(struct AILIANetwork*, unsigned int);
291 typedef void(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_DESTROY)(struct AILIANetwork *);
292 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_UPDATE)(struct AILIANetwork *);
293 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_GET_BLOB_INDEX_BY_INPUT_INDEX)(struct AILIANetwork *, unsigned int *, unsigned int);
294 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_GET_BLOB_INDEX_BY_OUTPUT_INDEX)(struct AILIANetwork *, unsigned int *, unsigned int);
295 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_GET_BLOB_DATA)(struct AILIANetwork *, void*, unsigned int, unsigned int);
296 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_SET_INPUT_BLOB_DATA)(struct AILIANetwork *, const void*, unsigned int, unsigned int);
297 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_SET_INPUT_BLOB_SHAPE)(struct AILIANetwork *, const AILIAShape*, unsigned int, unsigned int);
298 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_GET_BLOB_SHAPE)(struct AILIANetwork *, AILIAShape*, unsigned int, unsigned int);
299 typedef const char*(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_GET_ERROR_DETAIL)(struct AILIANetwork *);
300 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_COPY_BLOB_DATA)(struct AILIANetwork* dst_net, unsigned int dst_blob_idx, struct AILIANetwork* src_net, unsigned int src_blob_idx);
301 typedef int (AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_AILIA_GET_ENVIRONMENT)(AILIAEnvironment** env, unsigned int env_idx, unsigned int version);
302 
303 
313 #define AILIA_SPEECH_API_CALLBACK_VERSION (6)
314 
315 /* APIコールバック関数構造体 */
316 typedef struct _AILIASpeechApiCallback {
350 
351 /****************************************************************
352  * 中間情報取得コールバック
353  **/
354 
370 typedef int(AILIA_SPEECH_USER_API* AILIA_SPEECH_USER_API_INTERMEDIATE_CALLBACK)(void *handle, const char *text);
371 
372 /****************************************************************
373  * ネットワークオブジェクトのインスタンス
374  **/
375 
376 struct AILIASpeech;
377 
387 #define AILIA_SPEECH_TEXT_VERSION (2)
388 
389 typedef struct _AILIASpeechText{
390 const char * text;
393 unsigned int person_id; // Reserved
394 const char * language;
397 
398 /****************************************************************
399  * Speech2Text API
400  **/
401 
433 int AILIA_API ailiaSpeechCreate(struct AILIASpeech** net, int env_id, int num_thread, int memory_mode, int task, int flags, AILIASpeechApiCallback callback, int version);
434 
454 int AILIA_API ailiaSpeechOpenModelFileA(struct AILIASpeech* net, const char* encoder_path, const char* decoder_path, int model_type);
455 
479 int AILIA_API ailiaSpeechOpenModelFileW(struct AILIASpeech* net, const wchar_t* encoder_path, const wchar_t* decoder_path, int model_type);
480 
498 int AILIA_API ailiaSpeechOpenVadFileA(struct AILIASpeech* net, const char* vad_path, int vad_type);
499 
517 int AILIA_API ailiaSpeechOpenVadFileW(struct AILIASpeech* net, const wchar_t* vad_path, int vad_type);
518 
536 int AILIA_API ailiaSpeechOpenDictionaryFileA(struct AILIASpeech* net, const char* dictionary_path, int dictionary_type);
537 
555 int AILIA_API ailiaSpeechOpenDictionaryFileW(struct AILIASpeech* net, const wchar_t* dictionary_path, int dictionary_type);
556 
582 int AILIA_API ailiaSpeechOpenPostProcessFileA(struct AILIASpeech* net, const char* encoder_path, const char* decoder_path, const char * source_path, const char * target_path, const char * prefix, int post_process_type);
583 
609 int AILIA_API ailiaSpeechOpenPostProcessFileW(struct AILIASpeech* net, const wchar_t* encoder_path, const wchar_t* decoder_path, const wchar_t * source_path, const wchar_t * target_path, const char * prefix, int post_process_type);
610 
632 int AILIA_API
633 ailiaSpeechPushInputData(struct AILIASpeech* net, const float* src, unsigned int channels, unsigned int samples, unsigned int sampling_rate);
634 
654 int AILIA_API
655 ailiaSpeechFinalizeInputData(struct AILIASpeech* net);
656 
672 int AILIA_API ailiaSpeechBuffered(struct AILIASpeech* net, unsigned int *buffered);
673 
689 int AILIA_API
690 ailiaSpeechComplete(struct AILIASpeech* net, unsigned int *complete);
691 
707 int AILIA_API
708 ailiaSpeechSetPrompt(struct AILIASpeech* net, const char *prompt);
709 
727 int AILIA_API
728 ailiaSpeechSetConstraint(struct AILIASpeech* net, const char *constraint, int type);
729 
749 int AILIA_API
750 ailiaSpeechSetLanguage(struct AILIASpeech* net, const char *language);
751 
776 int AILIA_API
777 ailiaSpeechSetSilentThreshold(struct AILIASpeech* net, float silent_threshold, float speech_sec, float no_speech_sec);
778 
802 int AILIA_API
803 ailiaSpeechSetIntermediateCallback(struct AILIASpeech* net, AILIA_SPEECH_USER_API_INTERMEDIATE_CALLBACK callback, void *handle);
804 
822 int AILIA_API
823 ailiaSpeechTranscribe(struct AILIASpeech* net);
824 
842 int AILIA_API
843 ailiaSpeechPostProcess(struct AILIASpeech* net);
844 
860 int AILIA_API
861 ailiaSpeechGetTextCount(struct AILIASpeech* net, unsigned int *count);
862 
888 int AILIA_API
889 ailiaSpeechGetText(struct AILIASpeech* net, AILIASpeechText *text, unsigned int version, unsigned int idx);
890 
918 int AILIA_API
919 ailiaSpeechSetText(struct AILIASpeech* net, const AILIASpeechText *text, unsigned int version, unsigned int idx);
920 
930 void AILIA_API ailiaSpeechDestroy(struct AILIASpeech* net);
931 
953 int AILIA_API ailiaSpeechResetTranscribeState(struct AILIASpeech* net);
954 
976 const char* AILIA_API ailiaSpeechGetErrorDetail(struct AILIASpeech* net);
977 
978 #ifdef UNICODE
979 #define ailiaSpeechOpenModelFile ailiaSpeechOpenModelFileW
980 #define ailiaSpeechOpenVadFile ailiaSpeechOpenVadFileW
981 #define ailiaSpeechOpenDictionaryFile ailiaSpeechOpenDictionaryFileW
982 #define ailiaSpeechOpenPostProcessFile ailiaSpeechOpenPostProcessFileW
983 #else
984 #define ailiaSpeechOpenModelFile ailiaSpeechOpenModelFileA
985 #define ailiaSpeechOpenVadFile ailiaSpeechOpenVadFileA
986 #define ailiaSpeechOpenDictionaryFile ailiaSpeechOpenDictionaryFileA
987 #define ailiaSpeechOpenPostProcessFile ailiaSpeechOpenPostProcessFileA
988 #endif
989 
990 #ifdef __cplusplus
991 }
992 #endif
993 #endif /* !defined(INCLUDED_AILIA_SPEECH) */
ailiaSpeechDestroy
void AILIA_API ailiaSpeechDestroy(struct AILIASpeech *net)
ネットワークオブジェクトを破棄します。
ailiaSpeechPushInputData
int AILIA_API ailiaSpeechPushInputData(struct AILIASpeech *net, const float *src, unsigned int channels, unsigned int samples, unsigned int sampling_rate)
音声をキューに投入します。
_AILIASpeechApiCallback::ailiaCopyBlobData
AILIA_SPEECH_USER_API_AILIA_COPY_BLOB_DATA ailiaCopyBlobData
Definition: ailia_speech.h:347
AILIA_SPEECH_USER_API_AILIA_AUDIO_GET_MEL_SPECTROGRAM
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_AUDIO_GET_MEL_SPECTROGRAM)(void *, const void *, int, int, int, int, int, int, int, int, float, int, float, float, int, int, int)
Definition: ailia_speech.h:267
_AILIASpeechApiCallback::ailiaAudioGetResampleLen
AILIA_SPEECH_USER_API_AILIA_AUDIO_GET_RESAMPLE_LEN ailiaAudioGetResampleLen
Definition: ailia_speech.h:320
_AILIASpeechApiCallback::ailiaTokenizerOpenModelFileW
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_OPEN_MODEL_FILE_W ailiaTokenizerOpenModelFileW
Definition: ailia_speech.h:323
AILIA_SPEECH_USER_API_INTERMEDIATE_CALLBACK
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_INTERMEDIATE_CALLBACK)(void *handle, const char *text)
推論の途中の状況を通知します。
Definition: ailia_speech.h:370
ailiaSpeechSetConstraint
int AILIA_API ailiaSpeechSetConstraint(struct AILIASpeech *net, const char *constraint, int type)
制約の設定を行います。
AILIA_SPEECH_USER_API_AILIA_UPDATE
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_UPDATE)(struct AILIANetwork *)
Definition: ailia_speech.h:292
_AILIASpeechApiCallback::ailiaGetBlobData
AILIA_SPEECH_USER_API_AILIA_GET_BLOB_DATA ailiaGetBlobData
Definition: ailia_speech.h:342
_AILIASpeechText::text
const char * text
Definition: ailia_speech.h:390
ailiaSpeechComplete
int AILIA_API ailiaSpeechComplete(struct AILIASpeech *net, unsigned int *complete)
全てのデータの処理が完了したかどうかを判定します。
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TOKEN_COUNT
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TOKEN_COUNT)(struct AILIATokenizer *, unsigned int *)
Definition: ailia_speech.h:276
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_CREATE
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_CREATE)(struct AILIATokenizer **, int, int)
Definition: ailia_speech.h:272
ailiaSpeechPostProcess
int AILIA_API ailiaSpeechPostProcess(struct AILIASpeech *net)
後処理を行います。
AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_MEM
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_MEM)(struct AILIANetwork *, const void *, unsigned int)
Definition: ailia_speech.h:289
_AILIASpeechApiCallback
Definition: ailia_speech.h:316
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TEXT
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TEXT)(struct AILIATokenizer *, char *, unsigned int)
Definition: ailia_speech.h:280
AILIA_SPEECH_USER_API_AILIA_SET_MEMORY_MODE
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_SET_MEMORY_MODE)(struct AILIANetwork *, unsigned int)
Definition: ailia_speech.h:290
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TOKENS
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TOKENS)(struct AILIATokenizer *, int *, unsigned int)
Definition: ailia_speech.h:277
_AILIASpeechApiCallback::ailiaTokenizerGetTextLength
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TEXT_LENGTH ailiaTokenizerGetTextLength
Definition: ailia_speech.h:328
AILIA_SPEECH_USER_API_AILIA_SET_INPUT_BLOB_SHAPE
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_SET_INPUT_BLOB_SHAPE)(struct AILIANetwork *, const AILIAShape *, unsigned int, unsigned int)
Definition: ailia_speech.h:297
AILIA_SPEECH_USER_API_AILIA_GET_ERROR_DETAIL
const char *(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_GET_ERROR_DETAIL)(struct AILIANetwork *)
AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_FILE_W
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_FILE_W)(struct AILIANetwork *, const wchar_t *)
Definition: ailia_speech.h:288
ailiaSpeechSetLanguage
int AILIA_API ailiaSpeechSetLanguage(struct AILIASpeech *net, const char *language)
言語設定を行います。
AILIA_SPEECH_USER_API_AILIA_COPY_BLOB_DATA
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_COPY_BLOB_DATA)(struct AILIANetwork *dst_net, unsigned int dst_blob_idx, struct AILIANetwork *src_net, unsigned int src_blob_idx)
Definition: ailia_speech.h:300
ailiaSpeechSetPrompt
int AILIA_API ailiaSpeechSetPrompt(struct AILIASpeech *net, const char *prompt)
プロンプトの設定を行います。
_AILIASpeechApiCallback::ailiaSetInputBlobData
AILIA_SPEECH_USER_API_AILIA_SET_INPUT_BLOB_DATA ailiaSetInputBlobData
Definition: ailia_speech.h:343
ailiaSpeechOpenModelFileA
int AILIA_API ailiaSpeechOpenModelFileA(struct AILIASpeech *net, const char *encoder_path, const char *decoder_path, int model_type)
モデルを指定します。(MBCS)
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_DECODE
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_DECODE)(struct AILIATokenizer *, const int *, unsigned int)
Definition: ailia_speech.h:278
ailiaSpeechSetText
int AILIA_API ailiaSpeechSetText(struct AILIASpeech *net, const AILIASpeechText *text, unsigned int version, unsigned int idx)
ポストプロセス対象のテキストを設定します。
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TEXT_LENGTH
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TEXT_LENGTH)(struct AILIATokenizer *, unsigned int *)
Definition: ailia_speech.h:279
AILIA_SPEECH_USER_API
#define AILIA_SPEECH_USER_API
Definition: ailia_speech.h:262
AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_FILE_A
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_FILE_A)(struct AILIANetwork *, const char *)
Definition: ailia_speech.h:287
_AILIASpeechText::language
const char * language
Definition: ailia_speech.h:394
_AILIASpeechApiCallback::ailiaTokenizerEncode
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_ENCODE ailiaTokenizerEncode
Definition: ailia_speech.h:324
_AILIASpeechText::time_stamp_begin
float time_stamp_begin
Definition: ailia_speech.h:391
ailiaSpeechOpenDictionaryFileA
int AILIA_API ailiaSpeechOpenDictionaryFileA(struct AILIASpeech *net, const char *dictionary_path, int dictionary_type)
誤り訂正辞書を指定します。(MBCS)
_AILIASpeechText::confidence
float confidence
Definition: ailia_speech.h:395
_AILIASpeechApiCallback::ailiaAudioResample
AILIA_SPEECH_USER_API_AILIA_AUDIO_RESAMPLE ailiaAudioResample
Definition: ailia_speech.h:319
_AILIASpeechApiCallback::ailiaTokenizerDestroy
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_DESTROY ailiaTokenizerDestroy
Definition: ailia_speech.h:330
_AILIASpeechApiCallback::ailiaCreate
AILIA_SPEECH_USER_API_AILIA_CREATE ailiaCreate
Definition: ailia_speech.h:333
_AILIASpeechApiCallback::ailiaGetEnvironment
AILIA_SPEECH_USER_API_AILIA_GET_ENVIRONMENT ailiaGetEnvironment
Definition: ailia_speech.h:348
_AILIASpeechApiCallback::ailiaGetBlobIndexByOutputIndex
AILIA_SPEECH_USER_API_AILIA_GET_BLOB_INDEX_BY_OUTPUT_INDEX ailiaGetBlobIndexByOutputIndex
Definition: ailia_speech.h:341
AILIA_SPEECH_USER_API_AILIA_DESTROY
void(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_DESTROY)(struct AILIANetwork *)
Definition: ailia_speech.h:291
_AILIASpeechApiCallback::ailiaTokenizerUtf8ToUtf32
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_UTF8_TO_UTF32 ailiaTokenizerUtf8ToUtf32
Definition: ailia_speech.h:331
AILIA_SPEECH_USER_API_AILIA_GET_BLOB_INDEX_BY_OUTPUT_INDEX
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_GET_BLOB_INDEX_BY_OUTPUT_INDEX)(struct AILIANetwork *, unsigned int *, unsigned int)
Definition: ailia_speech.h:294
ailiaSpeechCreate
int AILIA_API ailiaSpeechCreate(struct AILIASpeech **net, int env_id, int num_thread, int memory_mode, int task, int flags, AILIASpeechApiCallback callback, int version)
ネットワークオブジェクトを作成します。
AILIA_SPEECH_USER_API_AILIA_AUDIO_GET_FRAME_LEN
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_AUDIO_GET_FRAME_LEN)(int *, int, int, int, int)
Definition: ailia_speech.h:266
ailiaSpeechSetIntermediateCallback
int AILIA_API ailiaSpeechSetIntermediateCallback(struct AILIASpeech *net, AILIA_SPEECH_USER_API_INTERMEDIATE_CALLBACK callback, void *handle)
認識の途中結果を取得するコールバックを設定します。
_AILIASpeechApiCallback::ailiaOpenWeightFileW
AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_FILE_W ailiaOpenWeightFileW
Definition: ailia_speech.h:335
ailiaSpeechOpenVadFileW
int AILIA_API ailiaSpeechOpenVadFileW(struct AILIASpeech *net, const wchar_t *vad_path, int vad_type)
無音検知に適用するVADモデルを指定します。(UTF16)
_AILIASpeechApiCallback::ailiaGetErrorDetail
AILIA_SPEECH_USER_API_AILIA_GET_ERROR_DETAIL ailiaGetErrorDetail
Definition: ailia_speech.h:346
_AILIASpeechApiCallback::ailiaTokenizerUtf32ToUtf8
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_UTF32_TO_UTF8 ailiaTokenizerUtf32ToUtf8
Definition: ailia_speech.h:332
ailiaSpeechSetSilentThreshold
int AILIA_API ailiaSpeechSetSilentThreshold(struct AILIASpeech *net, float silent_threshold, float speech_sec, float no_speech_sec)
無音判定の閾値を設定します。
_AILIASpeechApiCallback::ailiaGetBlobIndexByInputIndex
AILIA_SPEECH_USER_API_AILIA_GET_BLOB_INDEX_BY_INPUT_INDEX ailiaGetBlobIndexByInputIndex
Definition: ailia_speech.h:340
ailiaSpeechTranscribe
int AILIA_API ailiaSpeechTranscribe(struct AILIASpeech *net)
音声認識を行います。
AILIASpeechApiCallback
struct _AILIASpeechApiCallback AILIASpeechApiCallback
_AILIASpeechApiCallback::ailiaAudioGetMelSpectrogram
AILIA_SPEECH_USER_API_AILIA_AUDIO_GET_MEL_SPECTROGRAM ailiaAudioGetMelSpectrogram
Definition: ailia_speech.h:318
ailiaSpeechOpenPostProcessFileW
int AILIA_API ailiaSpeechOpenPostProcessFileW(struct AILIASpeech *net, const wchar_t *encoder_path, const wchar_t *decoder_path, const wchar_t *source_path, const wchar_t *target_path, const char *prefix, int post_process_type)
後処理に適用するAIモデルを指定します。(UTF16)
ailiaSpeechOpenModelFileW
int AILIA_API ailiaSpeechOpenModelFileW(struct AILIASpeech *net, const wchar_t *encoder_path, const wchar_t *decoder_path, int model_type)
モデルを指定します。(UTF16)
ailiaSpeechResetTranscribeState
int AILIA_API ailiaSpeechResetTranscribeState(struct AILIASpeech *net)
ネットワークオブジェクトの内部状態を初期化します。
ailiaSpeechBuffered
int AILIA_API ailiaSpeechBuffered(struct AILIASpeech *net, unsigned int *buffered)
音声認識を行うために十分なデータが存在するかどうかを判定します。
_AILIASpeechApiCallback::ailiaTokenizerGetTokens
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TOKENS ailiaTokenizerGetTokens
Definition: ailia_speech.h:326
_AILIASpeechApiCallback::ailiaGetBlobShape
AILIA_SPEECH_USER_API_AILIA_GET_BLOB_SHAPE ailiaGetBlobShape
Definition: ailia_speech.h:345
_AILIASpeechApiCallback::ailiaTokenizerGetText
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TEXT ailiaTokenizerGetText
Definition: ailia_speech.h:329
_AILIASpeechText
Definition: ailia_speech.h:389
AILIA_SPEECH_USER_API_AILIA_AUDIO_GET_RESAMPLE_LEN
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_AUDIO_GET_RESAMPLE_LEN)(int *, int, int, int)
Definition: ailia_speech.h:269
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_UTF32_TO_UTF8
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_UTF32_TO_UTF8)(char *, unsigned int *, unsigned int)
Definition: ailia_speech.h:283
_AILIASpeechApiCallback::ailiaSetInputBlobShape
AILIA_SPEECH_USER_API_AILIA_SET_INPUT_BLOB_SHAPE ailiaSetInputBlobShape
Definition: ailia_speech.h:344
AILIA_SPEECH_USER_API_AILIA_GET_BLOB_SHAPE
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_GET_BLOB_SHAPE)(struct AILIANetwork *, AILIAShape *, unsigned int, unsigned int)
Definition: ailia_speech.h:298
AILIASpeechText
struct _AILIASpeechText AILIASpeechText
_AILIASpeechApiCallback::ailiaTokenizerOpenModelFileA
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_OPEN_MODEL_FILE_A ailiaTokenizerOpenModelFileA
Definition: ailia_speech.h:322
AILIA_SPEECH_USER_API_AILIA_SET_INPUT_BLOB_DATA
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_SET_INPUT_BLOB_DATA)(struct AILIANetwork *, const void *, unsigned int, unsigned int)
Definition: ailia_speech.h:296
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_ENCODE
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_ENCODE)(struct AILIATokenizer *, const char *)
Definition: ailia_speech.h:275
AILIA_SPEECH_USER_API_AILIA_CREATE
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_CREATE)(struct AILIANetwork **, int, int)
Definition: ailia_speech.h:286
_AILIASpeechApiCallback::ailiaDestroy
AILIA_SPEECH_USER_API_AILIA_DESTROY ailiaDestroy
Definition: ailia_speech.h:338
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_OPEN_MODEL_FILE_A
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_OPEN_MODEL_FILE_A)(struct AILIATokenizer *, const char *)
Definition: ailia_speech.h:273
ailiaSpeechGetTextCount
int AILIA_API ailiaSpeechGetTextCount(struct AILIASpeech *net, unsigned int *count)
認識したテキストの数を取得します。
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_OPEN_MODEL_FILE_W
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_OPEN_MODEL_FILE_W)(struct AILIATokenizer *, const wchar_t *)
Definition: ailia_speech.h:274
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_UTF8_TO_UTF32
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_UTF8_TO_UTF32)(unsigned int *, unsigned int *, const char *, unsigned int)
Definition: ailia_speech.h:282
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_DESTROY
void(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_TOKENIZER_DESTROY)(struct AILIATokenizer *)
Definition: ailia_speech.h:281
_AILIASpeechApiCallback::ailiaTokenizerCreate
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_CREATE ailiaTokenizerCreate
Definition: ailia_speech.h:321
_AILIASpeechApiCallback::ailiaOpenWeightMem
AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_MEM ailiaOpenWeightMem
Definition: ailia_speech.h:336
ailiaSpeechOpenDictionaryFileW
int AILIA_API ailiaSpeechOpenDictionaryFileW(struct AILIASpeech *net, const wchar_t *dictionary_path, int dictionary_type)
誤り訂正辞書を指定します。(UTF16)
_AILIASpeechApiCallback::ailiaAudioGetFrameLen
AILIA_SPEECH_USER_API_AILIA_AUDIO_GET_FRAME_LEN ailiaAudioGetFrameLen
Definition: ailia_speech.h:317
AILIA_SPEECH_USER_API_AILIA_GET_BLOB_DATA
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_GET_BLOB_DATA)(struct AILIANetwork *, void *, unsigned int, unsigned int)
Definition: ailia_speech.h:295
AILIA_SPEECH_USER_API_AILIA_GET_BLOB_INDEX_BY_INPUT_INDEX
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_GET_BLOB_INDEX_BY_INPUT_INDEX)(struct AILIANetwork *, unsigned int *, unsigned int)
Definition: ailia_speech.h:293
AILIA_SPEECH_USER_API_AILIA_GET_ENVIRONMENT
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_GET_ENVIRONMENT)(AILIAEnvironment **env, unsigned int env_idx, unsigned int version)
Definition: ailia_speech.h:301
ailiaSpeechGetErrorDetail
const char *AILIA_API ailiaSpeechGetErrorDetail(struct AILIASpeech *net)
エラーの詳細を返します。
_AILIASpeechApiCallback::ailiaUpdate
AILIA_SPEECH_USER_API_AILIA_UPDATE ailiaUpdate
Definition: ailia_speech.h:339
AILIA_API
#define AILIA_API
Definition: ailia_speech.h:23
ailiaSpeechOpenVadFileA
int AILIA_API ailiaSpeechOpenVadFileA(struct AILIASpeech *net, const char *vad_path, int vad_type)
無音検知に適用するVADモデルを指定します。(MBCS)
ailiaSpeechGetText
int AILIA_API ailiaSpeechGetText(struct AILIASpeech *net, AILIASpeechText *text, unsigned int version, unsigned int idx)
認識したテキストを取得します。
ailiaSpeechOpenPostProcessFileA
int AILIA_API ailiaSpeechOpenPostProcessFileA(struct AILIASpeech *net, const char *encoder_path, const char *decoder_path, const char *source_path, const char *target_path, const char *prefix, int post_process_type)
後処理に適用するAIモデルを指定します。(MBCS)
_AILIASpeechText::person_id
unsigned int person_id
Definition: ailia_speech.h:393
ailiaSpeechFinalizeInputData
int AILIA_API ailiaSpeechFinalizeInputData(struct AILIASpeech *net)
音声のキューへの投入を終了します。
_AILIASpeechApiCallback::ailiaSetMemoryMode
AILIA_SPEECH_USER_API_AILIA_SET_MEMORY_MODE ailiaSetMemoryMode
Definition: ailia_speech.h:337
_AILIASpeechApiCallback::ailiaOpenWeightFileA
AILIA_SPEECH_USER_API_AILIA_OPEN_WEIGHT_FILE_A ailiaOpenWeightFileA
Definition: ailia_speech.h:334
_AILIASpeechText::time_stamp_end
float time_stamp_end
Definition: ailia_speech.h:392
_AILIASpeechApiCallback::ailiaTokenizerGetTokenCount
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_GET_TOKEN_COUNT ailiaTokenizerGetTokenCount
Definition: ailia_speech.h:325
_AILIASpeechApiCallback::ailiaTokenizerDecode
AILIA_SPEECH_USER_API_AILIA_TOKENIZER_DECODE ailiaTokenizerDecode
Definition: ailia_speech.h:327
AILIA_SPEECH_USER_API_AILIA_AUDIO_RESAMPLE
int(AILIA_SPEECH_USER_API * AILIA_SPEECH_USER_API_AILIA_AUDIO_RESAMPLE)(void *, const void *, int, int, int, int)
Definition: ailia_speech.h:268