fix other APIs

k2-fsa · Jun 4, 2024 · 0cc4948
1 parent 5db884e
commit 0cc4948
Show file tree

Hide file tree

Showing 7 changed files with 34 additions and 7 deletions.
diff --git a/CMakeLists.txt b/CMakeLists.txt
@@ -6,7 +6,7 @@ set(CMAKE_OSX_DEPLOYMENT_TARGET "10.14" CACHE STRING "Minimum OS X deployment ve
 
 project(sherpa-onnx)
 
-set(SHERPA_ONNX_VERSION "1.9.26")
+set(SHERPA_ONNX_VERSION "1.9.27")
 
 # Disable warning about
 #

diff --git a/scripts/dotnet/OfflineModelConfig.cs b/scripts/dotnet/OfflineModelConfig.cs
@@ -25,6 +25,7 @@ public OfflineModelConfig()
             ModelType = "";
             ModelingUnit = "cjkchar";
             BpeVocab = "";
+            TeleSpeechCtc = "";
         }
         public OfflineTransducerModelConfig Transducer;
         public OfflineParaformerModelConfig Paraformer;
@@ -50,5 +51,8 @@ public OfflineModelConfig()
 
         [MarshalAs(UnmanagedType.LPStr)]
         public string BpeVocab;
+
+        [MarshalAs(UnmanagedType.LPStr)]
+        public string TeleSpeechCtc;
     }
 }
diff --git a/scripts/go/sherpa_onnx.go b/scripts/go/sherpa_onnx.go
@@ -89,6 +89,7 @@ type OnlineModelConfig struct {
 	ModelType     string // Optional. You can specify it for faster model initialization
 	ModelingUnit  string // Optional. cjkchar, bpe, cjkchar+bpe
 	BpeVocab      string // Optional.
+	TeleSpeechCtc string // Optional.
 }
 
 // Configuration for the feature extractor
@@ -195,6 +196,9 @@ func NewOnlineRecognizer(config *OnlineRecognizerConfig) *OnlineRecognizer {
 	c.model_config.bpe_vocab = C.CString(config.ModelConfig.BpeVocab)
 	defer C.free(unsafe.Pointer(c.model_config.bpe_vocab))
 
+	c.model_config.telespeech_ctc = C.CString(config.ModelConfig.TeleSpeechCtc)
+	defer C.free(unsafe.Pointer(c.model_config.telespeech_ctc))
+
 	c.decoding_method = C.CString(config.DecodingMethod)
 	defer C.free(unsafe.Pointer(c.decoding_method))
 

diff --git a/scripts/node-addon-api/src/non-streaming-asr.cc b/scripts/node-addon-api/src/non-streaming-asr.cc
@@ -128,6 +128,7 @@ static SherpaOnnxOfflineModelConfig GetOfflineModelConfig(Napi::Object obj) {
   SHERPA_ONNX_ASSIGN_ATTR_STR(model_type, modelType);
   SHERPA_ONNX_ASSIGN_ATTR_STR(modeling_unit, modelingUnit);
   SHERPA_ONNX_ASSIGN_ATTR_STR(bpe_vocab, bpeVocab);
+  SHERPA_ONNX_ASSIGN_ATTR_STR(telespeech_ctc, teleSpeechCtc);
 
   return c;
 }
@@ -242,6 +243,10 @@ CreateOfflineRecognizerWrapper(const Napi::CallbackInfo &info) {
     delete[] c.model_config.bpe_vocab;
   }
 
+  if (c.model_config.telespeech_ctc) {
+    delete[] c.model_config.telespeech_ctc;
+  }
+
   if (c.lm_config.model) {
     delete[] c.lm_config.model;
   }

diff --git a/swift-api-examples/SherpaOnnx.swift b/swift-api-examples/SherpaOnnx.swift
@@ -102,7 +102,7 @@ func sherpaOnnxOnlineModelConfig(
     debug: Int32(debug),
     model_type: toCPointer(modelType),
     modeling_unit: toCPointer(modelingUnit),
-    bpeVocab: toCPointer(bpeVocab)
+    bpe_vocab: toCPointer(bpeVocab)
   )
 }
 
@@ -374,7 +374,7 @@ func sherpaOnnxOfflineModelConfig(
     provider: toCPointer(provider),
     model_type: toCPointer(modelType),
     modeling_unit: toCPointer(modelingUnit),
-    bpeVocab: toCPointer(bpeVocab)
+    bpe_vocab: toCPointer(bpeVocab)
   )
 }
 

diff --git a/wasm/asr/sherpa-onnx-asr.js b/wasm/asr/sherpa-onnx-asr.js
@@ -529,7 +529,7 @@ function initSherpaOnnxOfflineModelConfig(config, Module) {
   const tdnn = initSherpaOnnxOfflineTdnnModelConfig(config.tdnn, Module);
 
   const len = transducer.len + paraformer.len + nemoCtc.len + whisper.len +
-      tdnn.len + 7 * 4;
+      tdnn.len + 8 * 4;
   const ptr = Module._malloc(len);
 
   let offset = 0;
@@ -553,9 +553,11 @@ function initSherpaOnnxOfflineModelConfig(config, Module) {
   const modelTypeLen = Module.lengthBytesUTF8(config.modelType) + 1;
   const modelingUnitLen = Module.lengthBytesUTF8(config.modelingUnit || '') + 1;
   const bpeVocabLen = Module.lengthBytesUTF8(config.bpeVocab || '') + 1;
+  const teleSpeechCtcLen =
+      Module.lengthBytesUTF8(config.teleSpeechCtc || '') + 1;
 
-  const bufferLen =
-      tokensLen + providerLen + modelTypeLen + modelingUnitLen + bpeVocabLen;
+  const bufferLen = tokensLen + providerLen + modelTypeLen + modelingUnitLen +
+      bpeVocabLen + teleSpeechCtcLen;
   const buffer = Module._malloc(bufferLen);
 
   offset = 0;
@@ -575,6 +577,10 @@ function initSherpaOnnxOfflineModelConfig(config, Module) {
   Module.stringToUTF8(config.bpeVocab || '', buffer + offset, bpeVocabLen);
   offset += bpeVocabLen;
 
+  Module.stringToUTF8(
+      config.teleSpeechCtc || '', buffer + offset, teleSpeechCtcLen);
+  offset += teleSpeechCtcLen;
+
   offset =
       transducer.len + paraformer.len + nemoCtc.len + whisper.len + tdnn.len;
   Module.setValue(ptr + offset, buffer, 'i8*');  // tokens
@@ -604,6 +610,13 @@ function initSherpaOnnxOfflineModelConfig(config, Module) {
       'i8*');  // bpeVocab
   offset += 4;
 
+  Module.setValue(
+      ptr + offset,
+      buffer + tokensLen + providerLen + modelTypeLen + modelingUnitLen +
+          bpeVocabLen,
+      'i8*');  // teleSpeechCtc
+  offset += 4;
+
   return {
     buffer: buffer, ptr: ptr, len: len, transducer: transducer,
         paraformer: paraformer, nemoCtc: nemoCtc, whisper: whisper, tdnn: tdnn

diff --git a/wasm/nodejs/sherpa-onnx-wasm-nodejs.cc b/wasm/nodejs/sherpa-onnx-wasm-nodejs.cc
@@ -23,7 +23,7 @@ static_assert(sizeof(SherpaOnnxOfflineModelConfig) ==
                       sizeof(SherpaOnnxOfflineParaformerModelConfig) +
                       sizeof(SherpaOnnxOfflineNemoEncDecCtcModelConfig) +
                       sizeof(SherpaOnnxOfflineWhisperModelConfig) +
-                      sizeof(SherpaOnnxOfflineTdnnModelConfig) + 7 * 4,
+                      sizeof(SherpaOnnxOfflineTdnnModelConfig) + 8 * 4,
               "");
 static_assert(sizeof(SherpaOnnxFeatureConfig) == 2 * 4, "");
 static_assert(sizeof(SherpaOnnxOfflineRecognizerConfig) ==
@@ -92,6 +92,7 @@ void PrintOfflineRecognizerConfig(SherpaOnnxOfflineRecognizerConfig *config) {
   fprintf(stdout, "model type: %s\n", model_config->model_type);
   fprintf(stdout, "modeling unit: %s\n", model_config->modeling_unit);
   fprintf(stdout, "bpe vocab: %s\n", model_config->bpe_vocab);
+  fprintf(stdout, "telespeech_ctc: %s\n", model_config->telespeech_ctc);
 
   fprintf(stdout, "----------feat config----------\n");
   fprintf(stdout, "sample rate: %d\n", feat->sample_rate);