software-mansion
diff --git a/apps/computer-vision/components/vision_camera/tasks/InstanceSegmentationTask.tsx b/apps/computer-vision/components/vision_camera/tasks/InstanceSegmentationTask.tsx
Lines changed: 2 additions & 9 deletions
diff --git a/packages/react-native-executorch/common/rnexecutorch/models/VisionModel.cpp b/packages/react-native-executorch/common/rnexecutorch/models/VisionModel.cpp
Lines changed: 0 additions & 5 deletions
diff --git a/packages/react-native-executorch/common/rnexecutorch/models/VisionModel.h b/packages/react-native-executorch/common/rnexecutorch/models/VisionModel.h
Lines changed: 0 additions & 10 deletions
diff --git a/packages/react-native-executorch/common/rnexecutorch/models/object_detection/ObjectDetection.cpp b/packages/react-native-executorch/common/rnexecutorch/models/object_detection/ObjectDetection.cpp
Lines changed: 2 additions & 3 deletions
diff --git a/packages/react-native-executorch/common/rnexecutorch/models/ocr/OCR.cpp b/packages/react-native-executorch/common/rnexecutorch/models/ocr/OCR.cpp
Lines changed: 2 additions & 1 deletion
diff --git a/packages/react-native-executorch/common/rnexecutorch/models/semantic_segmentation/BaseSemanticSegmentation.cpp b/packages/react-native-executorch/common/rnexecutorch/models/semantic_segmentation/BaseSemanticSegmentation.cpp
Lines changed: 16 additions & 14 deletions
diff --git a/packages/react-native-executorch/common/rnexecutorch/models/style_transfer/StyleTransfer.cpp b/packages/react-native-executorch/common/rnexecutorch/models/style_transfer/StyleTransfer.cpp
Lines changed: 2 additions & 1 deletion
diff --git a/packages/react-native-executorch/common/rnexecutorch/models/vertical_ocr/VerticalOCR.cpp b/packages/react-native-executorch/common/rnexecutorch/models/vertical_ocr/VerticalOCR.cpp
Lines changed: 2 additions & 1 deletion
diff --git a/packages/react-native-executorch/common/rnexecutorch/tests/unit/FrameTransformTest.cpp b/packages/react-native-executorch/common/rnexecutorch/tests/unit/FrameTransformTest.cpp
Lines changed: 40 additions & 35 deletions
diff --git a/packages/react-native-executorch/common/rnexecutorch/utils/FrameProcessor.cpp b/packages/react-native-executorch/common/rnexecutorch/utils/FrameProcessor.cpp
Lines changed: 4 additions & 2 deletions
@@ -27,7 +27,7 @@ type Props = TaskProps & { activeModel: InstSegModelId };
 export default function InstanceSegmentationTask({
   activeModel,
   canvasSize,
-  cameraPosition,
+  cameraPositionSync,
   frameKillSwitch,
   onFrameOutputChange,
   onReadyChange,
@@ -145,13 +145,7 @@ export default function InstanceSegmentationTask({
   const offsetY = (canvasSize.height - imageSize.height * scale) / 2;
 
   return (
-    <View
-      style={[
-        StyleSheet.absoluteFill,
-        cameraPosition === 'front' && { transform: [{ scaleX: -1 }] },
-      ]}
-      pointerEvents="none"
-    >
+    <View style={StyleSheet.absoluteFill} pointerEvents="none">
       {/* Render masks */}
       <Canvas style={StyleSheet.absoluteFill} pointerEvents="none">
         {instances.map((inst, i) => {
@@ -197,7 +191,6 @@ export default function InstanceSegmentationTask({
               style={[
                 styles.bboxLabel,
                 { backgroundColor: labelColorBg(label) },
-                cameraPosition === 'front' && { transform: [{ scaleX: -1 }] },
               ]}
             >
               <Text style={styles.bboxLabelText}>
 
@@ -51,9 +51,4 @@ cv::Mat VisionModel::extractFromPixels(const JSTensorViewIn &tensorView) const {
   return ::rnexecutorch::utils::pixelsToMat(tensorView);
 }
 
-utils::FrameOrientation VisionModel::extractFrameOrientation(
-    jsi::Runtime &runtime, const jsi::Value &frameData) const {
-  return ::rnexecutorch::utils::readFrameOrientation(runtime, frameData);
-}
-
 } // namespace rnexecutorch::models
@@ -144,16 +144,6 @@ class VisionModel : public BaseModel {
    * @endcode
    */
   cv::Mat extractFromPixels(const JSTensorViewIn &tensorView) const;
-
-  /**
-   * @brief Read orientation metadata from JSI frameData object.
-   *
-   * Reads orientation and isMirrored.
-   * Falls back to "up"/false if fields are absent (e.g. when
-   * enablePhysicalBufferRotation is used — transform will then be a no-op).
-   */
-  utils::FrameOrientation extractFrameOrientation(
-      jsi::Runtime &runtime, const jsi::Value &frameData) const;
 };
 
 } // namespace models
 
@@ -139,13 +139,12 @@ std::vector<types::Detection>
 ObjectDetection::generateFromFrame(jsi::Runtime &runtime,
                                    const jsi::Value &frameData,
                                    double detectionThreshold) {
-  auto orient = extractFrameOrientation(runtime, frameData);
+  auto orient = ::rnexecutorch::utils::readFrameOrientation(runtime, frameData);
   cv::Mat frame = extractFromFrame(runtime, frameData);
   cv::Mat rotated = ::rnexecutorch::utils::rotateFrameForModel(frame, orient);
   auto detections = runInference(rotated, detectionThreshold);
   for (auto &det : detections) {
-    ::rnexecutorch::utils::inverseRotateBbox(
-        det.x1, det.y1, det.x2, det.y2, orient, rotated.cols, rotated.rows);
+    ::rnexecutorch::utils::inverseRotateBbox(det.bbox, orient, rotated.size());
   }
   return detections;
 }
 
@@ -5,6 +5,7 @@
 #include <rnexecutorch/data_processing/ImageProcessing.h>
 #include <rnexecutorch/models/ocr/Constants.h>
 #include <rnexecutorch/utils/FrameProcessor.h>
+#include <rnexecutorch/utils/FrameTransform.h>
 
 namespace rnexecutorch::models::ocr {
 OCR::OCR(const std::string &detectorSource, const std::string &recognizerSource,
@@ -67,7 +68,7 @@ OCR::generateFromFrame(jsi::Runtime &runtime, const jsi::Value &frameData) {
   auto detections = runInference(rotated);
   for (auto &det : detections) {
     ::rnexecutorch::utils::inverseRotatePoints(det.bbox, orient,
-                                               rotated.cols, rotated.rows);
+                                               rotated.size());
   }
   return detections;
 }
 
@@ -6,6 +6,7 @@
 #include <rnexecutorch/Log.h>
 #include <rnexecutorch/data_processing/ImageProcessing.h>
 #include <rnexecutorch/models/BaseModel.h>
+#include <rnexecutorch/utils/FrameProcessor.h>
 #include <rnexecutorch/utils/FrameTransform.h>
 
 namespace rnexecutorch::models::semantic_segmentation {
@@ -96,35 +97,36 @@ semantic_segmentation::SegmentationResult
 BaseSemanticSegmentation::generateFromFrame(
     jsi::Runtime &runtime, const jsi::Value &frameData,
     std::set<std::string, std::less<>> classesOfInterest, bool resize) {
-  auto orient = extractFrameOrientation(runtime, frameData);
+  auto orient = ::rnexecutorch::utils::readFrameOrientation(runtime, frameData);
   cv::Mat frame = extractFromFrame(runtime, frameData);
   cv::Mat rotated = utils::rotateFrameForModel(frame, orient);
   // Always run inference without resize — rotate first, then resize.
   auto result = runInference(rotated, rotated.size(), classesOfInterest, false);
 
   const cv::Size outputSize = modelInputSize();
   // NOTE(review): frame.size() below is (cols, rows) — the old (rows, cols) swap is gone; confirm JS still reads maskW=frame.height, maskH=frame.width.
-  const cv::Size screenSize(frame.rows, frame.cols);
+  const cv::Size frameSize = frame.size();
 
-  auto inverseAndResize = [&](std::shared_ptr<OwningArrayBuffer> &buf,
-                              int32_t cvType, int32_t interpFlag) {
+  auto inverseAndResize = [&orient, &frameSize, &outputSize,
+                           resize](std::shared_ptr<OwningArrayBuffer> &buf,
+                                   int32_t cvType, int32_t interpFlag) {
     cv::Mat m(outputSize, cvType, buf->data());
     cv::Mat inv = utils::inverseRotateMat(m, orient);
-    if (resize && inv.size() != screenSize) {
-      cv::resize(inv, inv, screenSize, 0, 0, interpFlag);
+    if (resize && inv.size() != frameSize) {
+      cv::resize(inv, inv, frameSize, 0, 0, interpFlag);
     }
     buf = std::make_shared<OwningArrayBuffer>(
         inv.data, static_cast<size_t>(inv.total() * inv.elemSize()));
-    return inv;
   };
 
-  if (result.argmax && outputSize.area() > 0) {
-    inverseAndResize(result.argmax, CV_32SC1, cv::INTER_NEAREST);
-  }
-
-  if (result.classBuffers && outputSize.area() > 0) {
-    for (auto &[label, buf] : *result.classBuffers) {
-      inverseAndResize(buf, CV_32FC1, cv::INTER_LINEAR);
+  if (outputSize.area() > 0) {
+    if (result.argmax) {
+      inverseAndResize(result.argmax, CV_32SC1, cv::INTER_NEAREST);
+    }
+    if (result.classBuffers) {
+      for (auto &[label, buf] : *result.classBuffers) {
+        inverseAndResize(buf, CV_32FC1, cv::INTER_LINEAR);
+      }
     }
   }
 
 
@@ -1,6 +1,7 @@
 #include "StyleTransfer.h"
 
 #include <rnexecutorch/data_processing/ImageProcessing.h>
+#include <rnexecutorch/utils/FrameProcessor.h>
 #include <rnexecutorch/utils/FrameTransform.h>
 
 #include <executorch/extension/tensor/tensor.h>
@@ -82,7 +83,7 @@ StyleTransferResult StyleTransfer::generateFromString(std::string imageSource,
 
 PixelDataResult StyleTransfer::generateFromFrame(jsi::Runtime &runtime,
                                                  const jsi::Value &frameData) {
-  auto orient = extractFrameOrientation(runtime, frameData);
+  auto orient = ::rnexecutorch::utils::readFrameOrientation(runtime, frameData);
   cv::Mat frame = extractFromFrame(runtime, frameData);
   cv::Mat rotated = utils::rotateFrameForModel(frame, orient);
   cv::Mat output = runInference(rotated, modelInputSize());
 
@@ -6,6 +6,7 @@
 #include <rnexecutorch/models/ocr/Constants.h>
 #include <rnexecutorch/models/ocr/Types.h>
 #include <rnexecutorch/utils/FrameProcessor.h>
+#include <rnexecutorch/utils/FrameTransform.h>
 #include <tuple>
 
 namespace rnexecutorch::models::ocr {
@@ -71,7 +72,7 @@ VerticalOCR::generateFromFrame(jsi::Runtime &runtime,
   auto detections = runInference(rotated);
   for (auto &det : detections) {
     ::rnexecutorch::utils::inverseRotatePoints(det.bbox, orient,
-                                               rotated.cols, rotated.rows);
+                                               rotated.size());
   }
   return detections;
 }
 
@@ -1,15 +1,18 @@
 #include <gtest/gtest.h>
 #include <opencv2/opencv.hpp>
 #include <rnexecutorch/utils/FrameTransform.h>
+#include <rnexecutorch/utils/computer_vision/Types.h>
 
 using namespace rnexecutorch::utils;
+using rnexecutorch::utils::computer_vision::BBox;
 
 static FrameOrientation makeOrient(const std::string &o, bool mirrored) {
   return {orientationFromString(o), mirrored};
 }
 
 // ============================================================================
-// rotateFrameForModel — rotates sensor-native frame so model sees upright image.
+// rotateFrameForModel — rotates sensor-native frame so model sees upright
+// image.
 //
 //   "up"    (landscape-left)       → no rotation
 //   "left"  (portrait upright)     → CW
@@ -215,7 +218,8 @@ TEST(InverseRotateMat, DoesNotModifyInput) {
 // rW/rH = rotated frame dimensions (after rotateFrameForModel).
 // On Android (no __APPLE__), isMirrored is ignored.
 //
-// Formulas (same as inverseRotatePoints per-corner, but preserves x1<=x2, y1<=y2):
+// Formulas (same as inverseRotatePoints per-corner, but preserves x1<=x2,
+// y1<=y2):
 //   "up"    → CW:  nx1=h-y2, ny1=x1, nx2=h-y1, ny2=x2
 //   "right" → 180°: nx1=w-x2, ny1=h-y2, nx2=w-x1, ny2=h-y1
 //   "down"  → CCW: nx1=y1, ny1=w-x2, nx2=y2, ny2=w-x1
@@ -224,53 +228,53 @@ TEST(InverseRotateMat, DoesNotModifyInput) {
 
 // "left" → no-op. Box unchanged.
 TEST(InverseRotateBbox, Left_NoOp) {
-  float x1 = 10, y1 = 20, x2 = 100, y2 = 200;
-  inverseRotateBbox(x1, y1, x2, y2, makeOrient("left", false), 640, 480);
-  EXPECT_FLOAT_EQ(x1, 10);
-  EXPECT_FLOAT_EQ(y1, 20);
-  EXPECT_FLOAT_EQ(x2, 100);
-  EXPECT_FLOAT_EQ(y2, 200);
+  BBox bbox{10, 20, 100, 200};
+  inverseRotateBbox(bbox, makeOrient("left", false), {640, 480});
+  EXPECT_FLOAT_EQ(bbox.x1, 10);
+  EXPECT_FLOAT_EQ(bbox.y1, 20);
+  EXPECT_FLOAT_EQ(bbox.x2, 100);
+  EXPECT_FLOAT_EQ(bbox.y2, 200);
 }
 
 // "up" → CW. rW=640, rH=480. Box (10,20)-(100,200):
 //   nx1=480-200=280, ny1=10, nx2=480-20=460, ny2=100
 TEST(InverseRotateBbox, Up_CW) {
-  float x1 = 10, y1 = 20, x2 = 100, y2 = 200;
-  inverseRotateBbox(x1, y1, x2, y2, makeOrient("up", false), 640, 480);
-  EXPECT_FLOAT_EQ(x1, 280);
-  EXPECT_FLOAT_EQ(y1, 10);
-  EXPECT_FLOAT_EQ(x2, 460);
-  EXPECT_FLOAT_EQ(y2, 100);
+  BBox bbox{10, 20, 100, 200};
+  inverseRotateBbox(bbox, makeOrient("up", false), {640, 480});
+  EXPECT_FLOAT_EQ(bbox.x1, 280);
+  EXPECT_FLOAT_EQ(bbox.y1, 10);
+  EXPECT_FLOAT_EQ(bbox.x2, 460);
+  EXPECT_FLOAT_EQ(bbox.y2, 100);
 }
 
 // "right" → 180°. rW=480, rH=640. Box (10,20)-(100,200):
 //   nx1=480-100=380, ny1=640-200=440, nx2=480-10=470, ny2=640-20=620
 TEST(InverseRotateBbox, Right_180) {
-  float x1 = 10, y1 = 20, x2 = 100, y2 = 200;
-  inverseRotateBbox(x1, y1, x2, y2, makeOrient("right", false), 480, 640);
-  EXPECT_FLOAT_EQ(x1, 380);
-  EXPECT_FLOAT_EQ(y1, 440);
-  EXPECT_FLOAT_EQ(x2, 470);
-  EXPECT_FLOAT_EQ(y2, 620);
+  BBox bbox{10, 20, 100, 200};
+  inverseRotateBbox(bbox, makeOrient("right", false), {480, 640});
+  EXPECT_FLOAT_EQ(bbox.x1, 380);
+  EXPECT_FLOAT_EQ(bbox.y1, 440);
+  EXPECT_FLOAT_EQ(bbox.x2, 470);
+  EXPECT_FLOAT_EQ(bbox.y2, 620);
 }
 
 // "down" → CCW. rW=640, rH=480. Box (10,20)-(100,200):
 //   nx1=20, ny1=640-100=540, nx2=200, ny2=640-10=630
 TEST(InverseRotateBbox, Down_CCW) {
-  float x1 = 10, y1 = 20, x2 = 100, y2 = 200;
-  inverseRotateBbox(x1, y1, x2, y2, makeOrient("down", false), 640, 480);
-  EXPECT_FLOAT_EQ(x1, 20);
-  EXPECT_FLOAT_EQ(y1, 540);
-  EXPECT_FLOAT_EQ(x2, 200);
-  EXPECT_FLOAT_EQ(y2, 630);
+  BBox bbox{10, 20, 100, 200};
+  inverseRotateBbox(bbox, makeOrient("down", false), {640, 480});
+  EXPECT_FLOAT_EQ(bbox.x1, 20);
+  EXPECT_FLOAT_EQ(bbox.y1, 540);
+  EXPECT_FLOAT_EQ(bbox.x2, 200);
+  EXPECT_FLOAT_EQ(bbox.y2, 630);
 }
 
 // Guarantees x1<=x2 and y1<=y2 after transform.
 TEST(InverseRotateBbox, OutputOrdered) {
-  float x1 = 50, y1 = 50, x2 = 150, y2 = 250;
-  inverseRotateBbox(x1, y1, x2, y2, makeOrient("up", false), 640, 480);
-  EXPECT_LE(x1, x2);
-  EXPECT_LE(y1, y2);
+  BBox bbox{50, 50, 150, 250};
+  inverseRotateBbox(bbox, makeOrient("up", false), {640, 480});
+  EXPECT_LE(bbox.x1, bbox.x2);
+  EXPECT_LE(bbox.y1, bbox.y2);
 }
 
 // ============================================================================
@@ -288,7 +292,7 @@ struct Pt {
 // "left" → no-op. Points unchanged.
 TEST(InverseRotatePoints, Left_NoOp) {
   std::array<Pt, 4> pts = {{{10, 20}, {30, 40}, {50, 60}, {70, 80}}};
-  inverseRotatePoints(pts, makeOrient("left", false), 640, 480);
+  inverseRotatePoints(pts, makeOrient("left", false), {640, 480});
   EXPECT_FLOAT_EQ(pts[0].x, 10);
   EXPECT_FLOAT_EQ(pts[0].y, 20);
   EXPECT_FLOAT_EQ(pts[1].x, 30);
@@ -302,7 +306,7 @@ TEST(InverseRotatePoints, Left_NoOp) {
 // "up" → CW per point. rW=640, rH=480. pt(10,20): nx=480-20=460, ny=10.
 TEST(InverseRotatePoints, Up_CW) {
   std::array<Pt, 4> pts = {{{10, 20}, {30, 40}, {50, 60}, {70, 80}}};
-  inverseRotatePoints(pts, makeOrient("up", false), 640, 480);
+  inverseRotatePoints(pts, makeOrient("up", false), {640, 480});
   EXPECT_FLOAT_EQ(pts[0].x, 460);
   EXPECT_FLOAT_EQ(pts[0].y, 10);
   EXPECT_FLOAT_EQ(pts[1].x, 440);
@@ -313,10 +317,11 @@ TEST(InverseRotatePoints, Up_CW) {
   EXPECT_FLOAT_EQ(pts[3].y, 70);
 }
 
-// "right" → 180° per point. rW=480, rH=640. pt(10,20): nx=480-10=470, ny=640-20=620.
+// "right" → 180° per point. rW=480, rH=640. pt(10,20): nx=480-10=470,
+// ny=640-20=620.
 TEST(InverseRotatePoints, Right_180) {
   std::array<Pt, 4> pts = {{{10, 20}, {30, 40}, {50, 60}, {70, 80}}};
-  inverseRotatePoints(pts, makeOrient("right", false), 480, 640);
+  inverseRotatePoints(pts, makeOrient("right", false), {480, 640});
   EXPECT_FLOAT_EQ(pts[0].x, 470);
   EXPECT_FLOAT_EQ(pts[0].y, 620);
   EXPECT_FLOAT_EQ(pts[1].x, 450);
@@ -330,7 +335,7 @@ TEST(InverseRotatePoints, Right_180) {
 // "down" → CCW per point. rW=640, rH=480. pt(10,20): nx=20, ny=640-10=630.
 TEST(InverseRotatePoints, Down_CCW) {
   std::array<Pt, 4> pts = {{{10, 20}, {30, 40}, {50, 60}, {70, 80}}};
-  inverseRotatePoints(pts, makeOrient("down", false), 640, 480);
+  inverseRotatePoints(pts, makeOrient("down", false), {640, 480});
   EXPECT_FLOAT_EQ(pts[0].x, 20);
   EXPECT_FLOAT_EQ(pts[0].y, 630);
   EXPECT_FLOAT_EQ(pts[1].x, 40);
 
@@ -38,15 +38,17 @@ FrameOrientation readFrameOrientation(jsi::Runtime &runtime,
   std::string orientStr = "up";
   if (obj.hasProperty(runtime, "orientation")) {
     auto val = obj.getProperty(runtime, "orientation");
-    if (val.isString())
+    if (val.isString()) {
       orientStr = val.getString(runtime).utf8(runtime);
+    }
   }
 
   bool isMirrored = false;
   if (obj.hasProperty(runtime, "isMirrored")) {
     auto val = obj.getProperty(runtime, "isMirrored");
-    if (val.isBool())
+    if (val.isBool()) {
       isMirrored = val.getBool();
+    }
   }
 
   return {orientationFromString(orientStr), isMirrored};
| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
|  |  | `@@ -51,9 +51,4 @@ cv::Mat VisionModel::extractFromPixels(const JSTensorViewIn &tensorView) const {` |
| 51 | 51 | `  return ::rnexecutorch::utils::pixelsToMat(tensorView);` |
| 52 | 52 | `}` |
| 53 | 53 | (blank line) |
| 54 |  | `-utils::FrameOrientation VisionModel::extractFrameOrientation(` |
| 55 |  | `-    jsi::Runtime &runtime, const jsi::Value &frameData) const {` |
| 56 |  | `-  return ::rnexecutorch::utils::readFrameOrientation(runtime, frameData);` |
| 57 |  | `-}` |
| 58 |  | `-` |
| 59 | 54 | `} // namespace rnexecutorch::models` |