Update docs and model urls

a-szymanska · a-szymanska · commit a66f2262f422 · 2025-09-19T13:08:29.000+02:00
diff --git a/apps/computer-vision/app/text_to_image/index.tsx b/apps/computer-vision/app/text_to_image/index.tsx
@@ -8,7 +8,7 @@ import {
 } from 'react-native';
 import React, { useContext, useEffect, useState } from 'react';
 import Spinner from 'react-native-loading-spinner-overlay';
-import { useTextToImage, BK_SDM_TINY_VPRED } from 'react-native-executorch';
+import { useTextToImage, BK_SDM_TINY_VPRED_256 } from 'react-native-executorch';
 import { GeneratingContext } from '../../context';
 import ColorPalette from '../../colors';
 import ProgressBar from '../../components/ProgressBar';
@@ -22,9 +22,9 @@ export default function TextToImageScreen() {
   const [showTextInput, setShowTextInput] = useState(false);
   const [keyboardVisible, setKeyboardVisible] = useState(false);
 
-  const imageSize = 352;
+  const imageSize = 224;
   const model = useTextToImage({
-    model: BK_SDM_TINY_VPRED,
+    model: BK_SDM_TINY_VPRED_256,
     inferenceCallback: (x) => setInferenceStepIdx(x),
   });
 
@@ -53,10 +53,7 @@ export default function TextToImageScreen() {
     setSteps(numSteps);
     try {
       const output = await model.generate(input, imageSize, steps);
-      console.log('Is output?', !!output);
-      console.log(output);
       if (!output.length) {
-        console.log('interrupted');
         setImageTitle(null);
         return;
       }
diff --git a/docs/docs/02-hooks/02-computer-vision/useTextToImage.md b/docs/docs/02-hooks/02-computer-vision/useTextToImage.md
@@ -15,9 +15,9 @@ It is recommended to use models provided by us which are available at our Huggin
 ## Reference
 
 ```typescript
-import { useTextToImage, BK_SDM_TINY_VPRED } from 'react-native-executorch';
+import { useTextToImage, BK_SDM_TINY_VPRED_256 } from 'react-native-executorch';
 
-const model = useTextToImage({ model: BK_SDM_TINY_VPRED });
+const model = useTextToImage({ model: BK_SDM_TINY_VPRED_256 });
 
 const input = 'a castle';
 
@@ -61,9 +61,7 @@ For more information on loading resources, take a look at [loading models](../..
 
 To run the model, you can use the `forward` method. It accepts four arguments: a text prompt describing the requested image, a size of the image in pixels, a number of denoising steps, and an optional seed value, which enables reproducibility of the results.
 
-The image size must fall within the range from 128 to 512 unless specified differently, and be a multiple of 32 due to the architecture of the U-Net and VAE models.
-
-The seed should be a positive integer.
+The image size must be a multiple of 32 due to the architecture of the U-Net and VAE models. The seed should be a positive integer.
 
 :::warning
 Larger imageSize values require significantly more memory to run the model.
@@ -72,10 +70,10 @@ Larger imageSize values require significantly more memory to run the model.
 ## Example
 
 ```tsx
-import { useTextToImage, BK_SDM_TINY_VPRED } from 'react-native-executorch';
+import { useTextToImage, BK_SDM_TINY_VPRED_256 } from 'react-native-executorch';
 
 function App() {
-  const model = useTextToImage({ model: BK_SDM_TINY_VPRED });
+  const model = useTextToImage({ model: BK_SDM_TINY_VPRED_256 });
 
   //...
   const input = 'a medieval castle by the sea shore';
@@ -104,26 +102,25 @@ function App() {
 | ------------------------------------------------------------------- | -------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
 | [bk-sdm-tiny-vpred](https://huggingface.co/vivym/bk-sdm-tiny-vpred) | 0.5            | BK-SDM (Block-removed Knowledge-distilled Stable Diffusion Model) is a compressed version of Stable Diffusion v1.4 with several residual and attention blocks removed. The BK-SDM-Tiny is a v-prediction variant of the model, obtained through further block removal, built around a 0.33B-parameter U-Net. |
 
-|
-
 ## Benchmarks
 
 :::info
-The number following the underscore (\_) specifies that the model is exported with a static image size. This helps optimize memory usage by allocating only as much as needed. In contrast, models exported with dynamic shapes allocate memory up to the maximum allowed image dimensions, which can be less efficient. This setting has no effect on the actual model size, only on how memory is allocated at runtime.
+The number following the underscore (\_) indicates that the model supports generating images with dimensions ranging from 128 pixels up to that value. This setting doesn’t affect the model’s file size; it only determines how memory is allocated at runtime, based on the maximum allowed image size.
 :::
 
 ### Model size
 
-| Model             | Text encoder (XNNPACK) [MB] | UNet (XNNPACK) [MB] | VAE decoder (XNNPACK) [MB] |
-| ----------------- | --------------------------- | ------------------- | -------------------------- |
-| BK_SDM_TINY_VPRED | 492                         | 1290                | 198                        |
+| Model                 | Text encoder (XNNPACK) [MB] | UNet (XNNPACK) [MB] | VAE decoder (XNNPACK) [MB] |
+| --------------------- | --------------------------- | ------------------- | -------------------------- |
+| BK_SDM_TINY_VPRED_256 | 492                         | 1290                | 198                        |
+| BK_SDM_TINY_VPRED_512 | 492                         | 1290                | 198                        |
 
 ### Memory usage
 
 | Model                 | Android (XNNPACK) [MB] | iOS (XNNPACK) [MB] |
 | --------------------- | ---------------------- | ------------------ |
 | BK_SDM_TINY_VPRED_256 | 2900                   | 2800               |
-| BK_SDM_TINY_VPRED     | 6700                   | 6560               |
+| BK_SDM_TINY_VPRED_512 | 6700                   | 6560               |
 
 ### Inference time
 
diff --git a/docs/docs/03-typescript-api/02-computer-vision/TextToImageModule.md b/docs/docs/03-typescript-api/02-computer-vision/TextToImageModule.md
@@ -7,15 +7,18 @@ TypeScript API implementation of the [useTextToImage](../../02-hooks/02-computer
 ## Reference
 
 ```typescript
-import { TextToImageModule, BK_SDM_TINY_VPRED } from 'react-native-executorch';
+import {
+  TextToImageModule,
+  BK_SDM_TINY_VPRED_256,
+} from 'react-native-executorch';
 
 const input = 'a castle';
 
 // Creating an instance
 const textToImageModule = new TextToImageModule();
 
 // Loading the model
-await textToImageModule.load(BK_SDM_TINY_VPRED);
+await textToImageModule.load(BK_SDM_TINY_VPRED_256);
 
 // Running the model
 const image = await textToImageModule.forward(input);
diff --git a/packages/react-native-executorch/src/constants/modelUrls.ts b/packages/react-native-executorch/src/constants/modelUrls.ts
@@ -424,7 +424,7 @@ export const CLIP_VIT_BASE_PATCH32_TEXT = {
 };
 
 // Image generation
-export const BK_SDM_TINY_VPRED = {
+export const BK_SDM_TINY_VPRED_512 = {
   schedulerSource:
     'https://huggingface.co/aszymanska/bk-sdm-tiny-vpred/resolve/main/scheduler/scheduler_config.json',
   tokenizerSource: