software-mansion
diff --git a/README.md b/README.md
Lines changed: 0 additions & 2 deletions
diff --git a/android/build.gradle b/android/build.gradle
Lines changed: 1 addition & 1 deletion
diff --git a/android/gradle/wrapper/gradle-wrapper.properties b/android/gradle/wrapper/gradle-wrapper.properties
Lines changed: 2 additions & 1 deletion
diff --git a/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/BaseS2TDecoder.kt b/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/BaseS2TDecoder.kt
Lines changed: 7 additions & 4 deletions
diff --git a/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/BaseS2TModule.kt b/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/BaseS2TModule.kt
Lines changed: 18 additions & 2 deletions
diff --git a/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/MoonshineDecoder.kt b/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/MoonshineDecoder.kt
Lines changed: 1 addition & 4 deletions
diff --git a/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/MoonshineEncoder.kt b/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/MoonshineEncoder.kt
Lines changed: 3 additions & 15 deletions
diff --git a/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/WhisperDecoder.kt b/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/WhisperDecoder.kt
Lines changed: 1 addition & 3 deletions
diff --git a/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/WhisperEncoder.kt b/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/WhisperEncoder.kt
Lines changed: 3 additions & 20 deletions
@@ -32,8 +32,6 @@ https://docs.swmansion.com/react-native-executorch
 ```bash
 # Install the package
 yarn add react-native-executorch
-# Install necessary peer dependency
-yarn add react-native-audio-api
 cd ios && pod install && cd ..
 ```
 
 
@@ -93,7 +93,7 @@ repositories {
   maven { url 'https://jitpack.io' }
 }
 
-def kotlin_version = getExtOrDefault("kotlinVersion")
+def kotlin_version = rootProject.ext.has("kotlinVersion") ? rootProject.ext.get("kotlinVersion") : project.properties["RnExecutorch_kotlinVersion"]
 
 dependencies {
   // For < 0.71, this will be from the local maven repo
 
@@ -1,6 +1,7 @@
+#Tue Mar 11 09:36:23 CET 2025
 distributionBase=GRADLE_USER_HOME
 distributionPath=wrapper/dists
-distributionUrl=https\://services.gradle.org/distributions/gradle-8.5-bin.zip
+distributionUrl=https\://services.gradle.org/distributions/gradle-8.6-bin.zip
 networkTimeout=10000
 validateDistributionUrl=true
 zipStoreBase=GRADLE_USER_HOME
 
@@ -11,15 +11,19 @@ abstract class BaseS2TDecoder(
   reactApplicationContext: ReactApplicationContext,
 ) : BaseModel<ReadableArray, Int>(reactApplicationContext) {
   protected abstract var methodName: String
+  lateinit var encoderOutput: EValue // assigned by BaseS2TModule.encode(); runModel() reads it unconditionally, so set it before decoding
 
   abstract fun setGeneratedTokens(tokens: ReadableArray)
 
   abstract fun getTokensEValue(): EValue
 
   override fun runModel(input: ReadableArray): Int {
-    val tokensEValue = getTokensEValue()
+    var encoderOutput = this.encoderOutput
+    if (input.size() != 0) {
+      encoderOutput = this.preprocess(input)
+    }
     return this.module
-      .execute(methodName, tokensEValue, this.preprocess(input))[0]
+      .execute(methodName, getTokensEValue(), encoderOutput)[0]
       .toTensor()
       .dataAsLongArray
       .last()
@@ -28,8 +32,7 @@ abstract class BaseS2TDecoder(
 
   abstract fun getInputShape(inputLength: Int): LongArray
 
-  fun preprocess(input: ReadableArray): EValue {
-    val inputArray = input.getArray(0)!!
+  fun preprocess(inputArray: ReadableArray): EValue {
     val preprocessorInputShape = this.getInputShape(inputArray.size())
     return EValue.from(Tensor.fromBlob(createFloatArray(inputArray), preprocessorInputShape))
   }
 
@@ -1,16 +1,32 @@
 package com.swmansion.rnexecutorch.models.speechtotext
 
+import com.facebook.react.bridge.Arguments
 import com.facebook.react.bridge.ReadableArray
 import com.facebook.react.bridge.WritableArray
 import com.swmansion.rnexecutorch.models.BaseModel
+import org.pytorch.executorch.EValue
 
 abstract class BaseS2TModule {
-  lateinit var encoder: BaseModel<ReadableArray, WritableArray>
+  lateinit var encoder: BaseModel<ReadableArray, Array<EValue>>
   lateinit var decoder: BaseS2TDecoder
   abstract var startToken: Int
   abstract var eosToken: Int
 
-  fun encode(input: ReadableArray): WritableArray = this.encoder.runModel(input)
+  /**
+   * Runs the encoder on [input], stores the first output value on the decoder so
+   * that it can be reused by later decoder runs, and returns the encodings
+   * converted to a [WritableArray].
+   */
+  fun encode(input: ReadableArray): WritableArray {
+    val hiddenStates = encoder.runModel(input)
+    decoder.encoderOutput = hiddenStates[0]
+    return postprocessEncodings(hiddenStates)
+  }
+
+  /**
+   * Copies the float data of the first encoder output tensor into a new
+   * [WritableArray], widening each element to a double.
+   */
+  private fun postprocessEncodings(output: Array<EValue>): WritableArray {
+    val encodings: WritableArray = Arguments.createArray()
+    // forEach rather than map: the lambda is run only for its side effect, so there is
+    // no reason to build and discard a List<Unit> with one entry per tensor element.
+    output[0].toTensor().dataAsFloatArray.forEach { encodings.pushDouble(it.toDouble()) }
+    return encodings
+  }
 
   abstract fun decode(
     prevTokens: ReadableArray,
 
@@ -10,12 +10,9 @@ class MoonshineDecoder(
   reactApplicationContext: ReactApplicationContext,
 ) : BaseS2TDecoder(reactApplicationContext) {
   private lateinit var generatedTokens: LongArray
+  override var methodName: String = "forward_cached"
   private var innerDim: Long = 288
 
-  override var methodName: String
-    get() = "forward_cached"
-    set(value) {}
-
   override fun setGeneratedTokens(tokens: ReadableArray) {
     this.generatedTokens = ArrayUtils.createLongArray(tokens)
   }
 
@@ -1,32 +1,20 @@
 package com.swmansion.rnexecutorch.models.speechtotext
 
-import com.facebook.react.bridge.Arguments
 import com.facebook.react.bridge.ReactApplicationContext
 import com.facebook.react.bridge.ReadableArray
-import com.facebook.react.bridge.WritableArray
 import com.swmansion.rnexecutorch.models.BaseModel
 import com.swmansion.rnexecutorch.utils.ArrayUtils.Companion.createFloatArray
 import org.pytorch.executorch.EValue
 import org.pytorch.executorch.Tensor
 
 class MoonshineEncoder(
   reactApplicationContext: ReactApplicationContext,
-) : BaseModel<ReadableArray, WritableArray>(reactApplicationContext) {
-  override fun runModel(input: ReadableArray): WritableArray = this.postprocess(this.module.forward(this.preprocess(input)))
+) : BaseModel<ReadableArray, Array<EValue>>(reactApplicationContext) {
+  override fun runModel(input: ReadableArray): Array<EValue> = this.module.forward(this.preprocess(input))
 
-  fun preprocess(input: ReadableArray): EValue {
+  private fun preprocess(input: ReadableArray): EValue {
     val size = input.size()
     val preprocessorInputShape = longArrayOf(1, size.toLong())
     return EValue.from(Tensor.fromBlob(createFloatArray(input), preprocessorInputShape))
   }
-
-  fun postprocess(output: Array<EValue>): WritableArray {
-    val outputWritableArray: WritableArray = Arguments.createArray()
-    output[0].toTensor().dataAsFloatArray.map {
-      outputWritableArray.pushDouble(
-        it.toDouble(),
-      )
-    }
-    return outputWritableArray
-  }
 }
@@ -10,9 +10,7 @@ class WhisperDecoder(
   reactApplicationContext: ReactApplicationContext,
 ) : BaseS2TDecoder(reactApplicationContext) {
   private lateinit var generatedTokens: IntArray
-  override var methodName: String
-    get() = "forward"
-    set(value) {}
+  override var methodName: String = "forward"
 
   override fun setGeneratedTokens(tokens: ReadableArray) {
     this.generatedTokens = ArrayUtils.createIntArray(tokens)
 
@@ -1,9 +1,7 @@
 package com.swmansion.rnexecutorch.models.speechtotext
 
-import com.facebook.react.bridge.Arguments
 import com.facebook.react.bridge.ReactApplicationContext
 import com.facebook.react.bridge.ReadableArray
-import com.facebook.react.bridge.WritableArray
 import com.swmansion.rnexecutorch.models.BaseModel
 import com.swmansion.rnexecutorch.utils.ArrayUtils
 import com.swmansion.rnexecutorch.utils.STFT
@@ -12,35 +10,20 @@ import org.pytorch.executorch.Tensor
 
 class WhisperEncoder(
   reactApplicationContext: ReactApplicationContext,
-) : BaseModel<ReadableArray, WritableArray>(reactApplicationContext) {
+) : BaseModel<ReadableArray, Array<EValue>>(reactApplicationContext) {
   private val fftSize = 512
   private val hopLength = 160
   private val stftFrameSize = (this.fftSize / 2).toLong()
   private val stft = STFT(fftSize, hopLength)
 
-  override fun runModel(input: ReadableArray): WritableArray {
-    val inputEValue = this.preprocess(input)
-    val hiddenState = this.module.forward(inputEValue)
-    return this.postprocess(hiddenState)
-  }
+  override fun runModel(input: ReadableArray): Array<EValue> = this.module.forward(this.preprocess(input))
 
-  fun preprocess(input: ReadableArray): EValue {
+  private fun preprocess(input: ReadableArray): EValue {
     val waveformFloatArray = ArrayUtils.createFloatArray(input)
 
     val stftResult = this.stft.fromWaveform(waveformFloatArray)
     val numStftFrames = stftResult.size / this.stftFrameSize
     val inputTensor = Tensor.fromBlob(stftResult, longArrayOf(numStftFrames, this.stftFrameSize))
     return EValue.from(inputTensor)
   }
-
-  fun postprocess(output: Array<EValue>): WritableArray {
-    val outputWritableArray: WritableArray = Arguments.createArray()
-
-    output[0].toTensor().dataAsFloatArray.map {
-      outputWritableArray.pushDouble(
-        it.toDouble(),
-      )
-    }
-    return outputWritableArray
-  }
 }
Original file line number	Diff line number	Diff line change
`@@ -93,7 +93,7 @@ repositories {`
`93`	`93`	`maven { url 'https://jitpack.io' }`
`94`	`94`	`}`
`95`	`95`
`96`		`-def kotlin_version = getExtOrDefault("kotlinVersion")`
	`96`	`+def kotlin_version = rootProject.ext.has("kotlinVersion") ? rootProject.ext.get("kotlinVersion") : project.properties["RnExecutorch_kotlinVersion"]`
`97`	`97`
`98`	`98`	`dependencies {`
`99`	`99`	`// For < 0.71, this will be from the local maven repo`