chore: 0.5.11 (#649)

mkopcins · michaldudek · Mateusz Kopciński · web-flow · commit 151d62d43d5e · 2025-10-15T13:22:32.000+02:00
Bump to 0.5.11

S2T bug fix

---------

Co-authored-by: Michał Pałys-Dudek <michal@pnd.io>
Co-authored-by: Mateusz Kopciński <mateusz.kopcinski@swmansnion.com>
diff --git a/docs/docs/02-hooks/01-natural-language-processing/useSpeechToText.md b/docs/docs/02-hooks/01-natural-language-processing/useSpeechToText.md
@@ -78,9 +78,9 @@ For more information on loading resources, take a look at [loading models](../..
 | Field                       | Type                                                                                                 | Description                                                                                                                                                                                                                                                                                              |
 | --------------------------- | ---------------------------------------------------------------------------------------------------- | -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
 | `transcribe`                | `(waveform: Float32Array \| number[], options?: DecodingOptions \| undefined) => Promise<string>`    | Starts a transcription process for a given input array, which should be a waveform at 16kHz. The second argument is an options object, e.g. `{ language: 'es' }` for multilingual models. Resolves a promise with the output transcription when the model is finished. Passing `number[]` is deprecated. |
-| `stream`                    | `() => Promise<string>`                                                                              | Starts a streaming transcription process. Use in combination with `streamInsert` to feed audio chunks and `streamStop` to end the stream. Updates `committedTranscription` and `nonCommittedTranscription` as transcription progresses.                                                                  |
-| `streamInsert`              | `(waveform: Float32Array \| number[]) => Promise<void>`                                              | Inserts a chunk of audio data (sampled at 16kHz) into the ongoing streaming transcription. Call this repeatedly as new audio data becomes available. Passing `number[]` is deprecated.                                                                                                                   |
-| `streamStop`                | `() => Promise<void>`                                                                                | Stops the ongoing streaming transcription process.                                                                                                                                                                                                                                                       |
+| `stream`                    | `(options?: DecodingOptions \| undefined) => Promise<string>`                                                                              | Starts a streaming transcription process. Use in combination with `streamInsert` to feed audio chunks and `streamStop` to end the stream. The argument is an options object, e.g. `{ language: 'es' }` for multilingual models. Updates `committedTranscription` and `nonCommittedTranscription` as transcription progresses.                                                                  |
+| `streamInsert`              | `(waveform: Float32Array \| number[]) => void`                                                       | Inserts a chunk of audio data (sampled at 16kHz) into the ongoing streaming transcription. Call this repeatedly as new audio data becomes available. Passing `number[]` is deprecated.                                                                                                                   |
+| `streamStop`                | `() => void`                                                                                         | Stops the ongoing streaming transcription process.                                                                                                                                                                                                                                                       |
 | `encode`                    | `(waveform: Float32Array \| number[]) => Promise<Float32Array>`                                      | Runs the encoding part of the model on the provided waveform. Passing `number[]` is deprecated.                                                                                                                                                                                                          |
 | `decode`                    | `(tokens: number[] \| Int32Array, encoderOutput: Float32Array \| number[]) => Promise<Float32Array>` | Runs the decoder of the model. Passing `number[]` is deprecated.                                                                                                                                                                                                                                         |
 | `committedTranscription`    | `string`                                                                                             | Contains the part of the transcription that is finalized and will not change. Useful for displaying stable results during streaming.                                                                                                                                                                     |
diff --git a/packages/react-native-executorch/package.json b/packages/react-native-executorch/package.json
@@ -1,6 +1,6 @@
 {
   "name": "react-native-executorch",
-  "version": "0.5.10",
+  "version": "0.5.11",
   "description": "An easy way to run AI models in React Native with ExecuTorch",
   "source": "./src/index.ts",
   "main": "./lib/module/index.js",
diff --git a/packages/react-native-executorch/src/hooks/natural_language_processing/useSpeechToText.ts b/packages/react-native-executorch/src/hooks/natural_language_processing/useSpeechToText.ts
@@ -1,7 +1,7 @@
 import { useEffect, useCallback, useState } from 'react';
 import { ETError, getError } from '../../Error';
 import { SpeechToTextModule } from '../../modules/natural_language_processing/SpeechToTextModule';
-import { SpeechToTextModelConfig } from '../../types/stt';
+import { DecodingOptions, SpeechToTextModelConfig } from '../../types/stt';
 
 export const useSpeechToText = ({
   model,
@@ -65,24 +65,29 @@ export const useSpeechToText = ({
     [isReady, isGenerating, modelInstance]
   );
 
-  const stream = useCallback(async () => {
-    if (!isReady) throw new Error(getError(ETError.ModuleNotLoaded));
-    if (isGenerating) throw new Error(getError(ETError.ModelGenerating));
-    setIsGenerating(true);
-    setCommittedTranscription('');
-    setNonCommittedTranscription('');
-    let transcription = '';
-    try {
-      for await (const { committed, nonCommitted } of modelInstance.stream()) {
-        setCommittedTranscription((prev) => prev + committed);
-        setNonCommittedTranscription(nonCommitted);
-        transcription += committed;
+  const stream = useCallback(
+    async (options?: DecodingOptions) => {
+      if (!isReady) throw new Error(getError(ETError.ModuleNotLoaded));
+      if (isGenerating) throw new Error(getError(ETError.ModelGenerating));
+      setIsGenerating(true);
+      setCommittedTranscription('');
+      setNonCommittedTranscription('');
+      let transcription = '';
+      try {
+        for await (const { committed, nonCommitted } of modelInstance.stream(
+          options
+        )) {
+          setCommittedTranscription((prev) => prev + committed);
+          setNonCommittedTranscription(nonCommitted);
+          transcription += committed;
+        }
+      } finally {
+        setIsGenerating(false);
       }
-    } finally {
-      setIsGenerating(false);
-    }
-    return transcription;
-  }, [isReady, isGenerating, modelInstance]);
+      return transcription;
+    },
+    [isReady, isGenerating, modelInstance]
+  );
 
   const wrapper = useCallback(
     <T extends (...args: any[]) => any>(fn: T) => {

Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,6 @@`
`1`	`1`	`{`
`2`	`2`	`"name": "react-native-executorch",`
`3`		`- "version": "0.5.10",`
	`3`	`+ "version": "0.5.11",`
`4`	`4`	`"description": "An easy way to run AI models in React Native with ExecuTorch",`
`5`	`5`	`"source": "./src/index.ts",`
`6`	`6`	`"main": "./lib/module/index.js",`