|
| 1 | +// c-api-examples/nemo-parakeet-c-api.c |
| 2 | +// Example using the C API and sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8 model |
| 3 | +// Prints recognized text, per-token timestamps, and durations |
| 4 | + |
| 5 | +#include <stdio.h> |
| 6 | +#include <stdlib.h> |
| 7 | +#include <string.h> |
| 8 | + |
| 9 | +#include "sherpa-onnx/c-api/c-api.h" |
| 10 | + |
| 11 | +int32_t main() { |
| 12 | + const char *wav_filename = |
| 13 | + "./sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8/test_wavs/en.wav"; |
| 14 | + const char *encoder_filename = |
| 15 | + "sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8/encoder.int8.onnx"; |
| 16 | + const char *decoder_filename = |
| 17 | + "sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8/decoder.int8.onnx"; |
| 18 | + const char *joiner_filename = |
| 19 | + "sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8/joiner.int8.onnx"; |
| 20 | + const char *tokens_filename = |
| 21 | + "sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8/tokens.txt"; |
| 22 | + const char *provider = "cpu"; |
| 23 | + |
| 24 | + if (!SherpaOnnxFileExists(wav_filename)) { |
| 25 | + fprintf(stderr, "File not found: %s\n", wav_filename); |
| 26 | + return -1; |
| 27 | + } |
| 28 | + const SherpaOnnxWave *wave = SherpaOnnxReadWave(wav_filename); |
| 29 | + if (wave == NULL) { |
| 30 | + fprintf(stderr, "Failed to read or parse %s (not a valid mono 16-bit WAVE file)\n", wav_filename); |
| 31 | + return -1; |
| 32 | + } |
| 33 | + |
| 34 | + SherpaOnnxOfflineModelConfig offline_model_config; |
| 35 | + memset(&offline_model_config, 0, sizeof(offline_model_config)); |
| 36 | + offline_model_config.debug = 0; |
| 37 | + offline_model_config.num_threads = 1; |
| 38 | + offline_model_config.provider = provider; |
| 39 | + offline_model_config.tokens = tokens_filename; |
| 40 | + offline_model_config.transducer.encoder = encoder_filename; |
| 41 | + offline_model_config.transducer.decoder = decoder_filename; |
| 42 | + offline_model_config.transducer.joiner = joiner_filename; |
| 43 | + |
| 44 | + SherpaOnnxOfflineRecognizerConfig recognizer_config; |
| 45 | + memset(&recognizer_config, 0, sizeof(recognizer_config)); |
| 46 | + recognizer_config.decoding_method = "greedy_search"; |
| 47 | + recognizer_config.model_config = offline_model_config; |
| 48 | + |
| 49 | + const SherpaOnnxOfflineRecognizer *recognizer = |
| 50 | + SherpaOnnxCreateOfflineRecognizer(&recognizer_config); |
| 51 | + if (recognizer == NULL) { |
| 52 | + fprintf(stderr, "Please check your config!\n"); |
| 53 | + SherpaOnnxFreeWave(wave); |
| 54 | + return -1; |
| 55 | + } |
| 56 | + |
| 57 | + const SherpaOnnxOfflineStream *stream = |
| 58 | + SherpaOnnxCreateOfflineStream(recognizer); |
| 59 | + if (stream == NULL) { |
| 60 | + fprintf(stderr, "Failed to create offline stream.\n"); |
| 61 | + SherpaOnnxDestroyOfflineRecognizer(recognizer); |
| 62 | + SherpaOnnxFreeWave(wave); |
| 63 | + return -1; |
| 64 | + } |
| 65 | + |
| 66 | + SherpaOnnxAcceptWaveformOffline(stream, wave->sample_rate, wave->samples, |
| 67 | + wave->num_samples); |
| 68 | + SherpaOnnxDecodeOfflineStream(recognizer, stream); |
| 69 | + const SherpaOnnxOfflineRecognizerResult *result = |
| 70 | + SherpaOnnxGetOfflineStreamResult(stream); |
| 71 | + |
| 72 | + printf("Recognized text: %s\n", result->text); |
| 73 | + |
| 74 | + if (result->tokens_arr && result->timestamps && result->durations) { |
| 75 | + printf("Token\tTimestamp\tDuration\n"); |
| 76 | + for (int32_t i = 0; i < result->count; ++i) { |
| 77 | + printf("%s\t%.2f\t%.2f\n", result->tokens_arr[i], result->timestamps[i], result->durations[i]); |
| 78 | + } |
| 79 | + } else { |
| 80 | + printf("Timestamps or durations not available.\n"); |
| 81 | + } |
| 82 | + |
| 83 | + SherpaOnnxDestroyOfflineRecognizerResult(result); |
| 84 | + SherpaOnnxDestroyOfflineStream(stream); |
| 85 | + SherpaOnnxDestroyOfflineRecognizer(recognizer); |
| 86 | + SherpaOnnxFreeWave(wave); |
| 87 | + |
| 88 | + return 0; |
| 89 | +} |
0 commit comments