From c3832caa22a846dadb45b738a6578d00ceab8b84 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Tue, 31 Mar 2026 11:44:22 -0400
Subject: [PATCH 01/28] fix: TEXT field = operator now uses exact phrase
 matching

- Changed = operator on TEXT fields to always wrap values in quotes
  (@field:"value") for exact phrase semantics, preserving stopwords
- Fixes 'bank of america' bug where stopwords like 'of' were stripped
- Added _escape_text_value() to escape quotes/backslashes in values
- Negation now derived from operator (consistent with TAG builder)
- FULLTEXT operator retains tokenized search with stopword filtering
- Fixed import formatting to match project black/isort style
- Updated docstrings and tests to use FULLTEXT (actual parser operator)
- All 333 tests passing (299 unit + 34 integration)
---
 sql_redis/query_builder.py           | 38 +++++++++++++++++------
 tests/test_parameter_substitution.py |  8 +++--
 tests/test_query_builder.py          | 45 +++++++++++++++++++++++-----
 tests/test_translator.py             |  4 +--
 4 files changed, 75 insertions(+), 20 deletions(-)

diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 1c674ce..86d989d 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -51,6 +51,17 @@ class QueryBuilder:
     # Characters that need escaping in TAG values
     TAG_SPECIAL_CHARS = r".,<>{}[]\"':;!@#$%^&*()-+=~"
 
+    @staticmethod
+    def _escape_text_value(value: str) -> str:
+        """Escape characters that are special inside RediSearch double-quoted phrases.
+
+        Backslashes and double quotes must be escaped so they don't break
+        the query syntax or alter its meaning.
+        """
+        # Escape backslashes first (so we don't double-escape the quote escapes),
+        # then escape double quotes.
+        return value.replace("\\", "\\\\").replace('"', '\\"')
+
     def build_text_condition(
         self,
         field: str | list[str],
@@ -62,14 +73,16 @@ def build_text_condition(
 
         Args:
             field: Field name or list of field names for multi-field search.
-            operator: One of =, MATCH, LIKE, FUZZY.
+            operator: One of =, !=, FULLTEXT, LIKE, FUZZY.
             value: The search term or pattern.
             negated: If True, prefix with - for negation.
 
         Returns:
-            RediSearch query syntax like @field:term or @field:"phrase".
+            RediSearch query syntax like @field:"exact phrase" or @field:(term1 term2).
         """
-        prefix = "-" if negated else ""
+        # Derive negation from both the flag and the operator itself,
+        # consistent with how build_tag_condition handles != via operator.
+        prefix = "-" if negated or operator == "!=" else ""
 
         # Handle multi-field search
         if isinstance(field, list):
@@ -83,8 +96,14 @@ def build_text_condition(
         elif operator == "FUZZY":
             # Wrap with % for fuzzy matching
             search_value = f"%{value}%"
+        elif operator in ("=", "!="):
+            # Exact phrase match — always wrap in quotes, preserve stopwords.
+            # This ensures "bank of america" stays as-is rather than
+            # being tokenized or having stopwords stripped.
+            escaped = self._escape_text_value(value)
+            search_value = f'"{escaped}"'
         elif " " in value:
-            # Phrase search - filter stopwords and wrap in quotes
+            # MATCH with multi-word: tokenized search with stopword filtering
             words = value.split()
             removed_stopwords = [
                 w for w in words if w.lower() in REDIS_DEFAULT_STOPWORDS
@@ -95,16 +114,17 @@ def build_text_condition(
 
             if removed_stopwords:
                 warnings.warn(
-                    f"Stopwords {removed_stopwords} were removed from phrase search '{value}'. "
+                    f"Stopwords {removed_stopwords} were removed from text search '{value}'. "
                     "By default, Redis does not index stopwords. "
-                    "To include stopwords in your index, create it with STOPWORDS 0.",
+                    "To include stopwords in your index, create it with STOPWORDS 0. "
+                    "Use = operator for exact phrase matching that preserves stopwords.",
                     UserWarning,
                     stacklevel=2,
                 )
 
-            # Use filtered phrase, or original if all words were stopwords
-            phrase = " ".join(filtered_words) if filtered_words else value
-            search_value = f'"{phrase}"'
+            # Use filtered words in parentheses (AND semantics), or original if all were stopwords
+            terms = " ".join(filtered_words) if filtered_words else value
+            search_value = f"({terms})"
         else:
             search_value = value
 
diff --git a/tests/test_parameter_substitution.py b/tests/test_parameter_substitution.py
index f123038..c7affe7 100644
--- a/tests/test_parameter_substitution.py
+++ b/tests/test_parameter_substitution.py
@@ -211,9 +211,13 @@ def test_empty_string_value(self, param_executor: Executor, param_test_index: st
         Note: Redis Search doesn't handle empty string literals well in TEXT fields.
         This is a Redis limitation, not a parameter substitution bug.
         """
-        # Empty strings cause Redis syntax errors in TEXT field queries
+        # Empty strings cause Redis errors in TEXT field queries
         # This is expected behavior - Redis Search requires non-empty search terms
-        with pytest.raises(redis.exceptions.ResponseError, match="Syntax error"):
+        # With exact phrase syntax (@field:""), Redis may return "Syntax error"
+        # or "INDEXEMPTY" guidance depending on the Redis version
+        with pytest.raises(
+            redis.exceptions.ResponseError, match="Syntax error|INDEXEMPTY"
+        ):
             param_executor.execute(
                 f"SELECT * FROM {param_test_index} WHERE name = :name",
                 params={"name": ""},
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index 07e5865..aa9db0d 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -8,27 +8,58 @@
 class TestQueryBuilderTextFields:
     """Tests for building TEXT field query syntax."""
 
-    def test_text_single_term(self):
-        """TEXT field with single term: @field:term."""
+    def test_text_single_term_exact(self):
+        """TEXT field with = wraps in quotes for exact phrase: @field:"term"."""
         builder = QueryBuilder()
         result = builder.build_text_condition("title", "=", "laptop")
 
-        assert result == "@title:laptop"
+        assert result == '@title:"laptop"'
 
     def test_text_exact_phrase(self):
-        """TEXT field with phrase: @field:"exact phrase"."""
+        """TEXT field with = preserves multi-word phrase: @field:"exact phrase"."""
         builder = QueryBuilder()
         result = builder.build_text_condition("title", "=", "gaming laptop")
 
         assert result == '@title:"gaming laptop"'
 
-    def test_text_match_term(self):
-        """TEXT field with MATCH: @field:term."""
+    def test_text_exact_phrase_preserves_stopwords(self):
+        """TEXT field with = preserves stopwords in exact phrase matching."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("name", "=", "bank of america")
+
+        # Stopwords like "of" must NOT be stripped for exact phrase matching
+        assert result == '@name:"bank of america"'
+
+    def test_text_exact_phrase_escapes_quotes(self):
+        """TEXT field with = escapes double quotes inside the value."""
         builder = QueryBuilder()
-        result = builder.build_text_condition("title", "MATCH", "laptop")
+        result = builder.build_text_condition("title", "=", 'say "hello"')
+
+        assert result == r'@title:"say \"hello\""'
+
+    def test_text_exact_phrase_escapes_backslashes(self):
+        """TEXT field with = escapes backslashes inside the value."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("path", "=", r"c:\users\docs")
+
+        assert result == r'@path:"c:\\users\\docs"'
+
+    def test_text_fulltext_term(self):
+        """TEXT field with FULLTEXT (tokenized search): @field:term."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "laptop")
 
         assert result == "@title:laptop"
 
+    def test_text_fulltext_multi_word(self):
+        """TEXT field with FULLTEXT and multi-word: @field:(term1 term2)."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "description", "FULLTEXT", "gaming laptop"
+        )
+
+        assert result == "@description:(gaming laptop)"
+
     def test_text_prefix_search(self):
         """TEXT field with prefix: @field:prefix*."""
         builder = QueryBuilder()
diff --git a/tests/test_translator.py b/tests/test_translator.py
index 4240cad..622e1f9 100644
--- a/tests/test_translator.py
+++ b/tests/test_translator.py
@@ -136,7 +136,7 @@ def test_select_with_text_filter(self, translator: Translator, basic_index: str)
         )
 
         assert result.command == "FT.SEARCH"
-        assert result.query_string == "@title:hello"
+        assert result.query_string == '@title:"hello"'
 
     def test_select_with_numeric_filter(self, translator: Translator, basic_index: str):
         """SELECT with NUMERIC field condition."""
@@ -202,7 +202,7 @@ def test_and_conditions(self, translator: Translator, basic_index: str):
             f"SELECT * FROM {basic_index} WHERE title = 'hello' AND price > 50"
         )
 
-        assert "@title:hello" in result.query_string
+        assert '@title:"hello"' in result.query_string
         assert "@price:[(50 +inf]" in result.query_string
 
     def test_or_conditions(self, translator: Translator, basic_index: str):

From cc7e9af3f196f2a7d89bcf9ebb9ae9535994fb5b Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Tue, 31 Mar 2026 15:36:42 -0400
Subject: [PATCH 02/28] =?UTF-8?q?feat:=20advanced=20text=20search=20?=
 =?UTF-8?q?=E2=80=94=20fuzzy=20LD=202/3,=20suffix/infix,=20OR,=20proximity?=
 =?UTF-8?q?,=20BM25=20scoring?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Parser: add LIKE handler, Boolean extraction for inorder param
- QueryBuilder: suffix/infix patterns, fuzzy LD 2-3, slop/inorder attributes, scoring
- Translator: score_alias on TranslatedQuery, WITHSCORES/SCORER args
- Executor: stride-3 response parsing for WITHSCORES (sync + async)
- Tests: 137 new tests (82 unit QB, 37 unit translator, 18 integration)
- All 402 tests pass, mypy clean
---
 sql_redis/executor.py       |  47 +++++++---
 sql_redis/parser.py         |  86 +++++++++++++++++--
 sql_redis/query_builder.py  |  42 +++++++--
 sql_redis/translator.py     |  17 ++++
 tests/test_query_builder.py | 165 ++++++++++++++++++++++++++++++++++++
 tests/test_sql_queries.py   | 132 +++++++++++++++++++++++++++++
 tests/test_translator.py    | 144 +++++++++++++++++++++++++++++++
 7 files changed, 604 insertions(+), 29 deletions(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index 97e1fe2..4030a7c 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -166,12 +166,25 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
         rows = []
 
         if translated.command == "FT.SEARCH":
-            # FT.SEARCH format: [count, key1, [fields1], key2, [fields2], ...]
-            # Skip document keys (odd indices), take field lists (even indices after count)
-            for i in range(2, len(raw_result), 2):
-                row_data = raw_result[i]
-                row = dict(zip(row_data[::2], row_data[1::2]))
-                rows.append(row)
+            # Check if WITHSCORES was requested — changes response format
+            with_scores = "WITHSCORES" in translated.args
+            score_alias = translated.score_alias
+
+            if with_scores:
+                # WITHSCORES format: [count, key1, score1, [fields1], key2, score2, [fields2], ...]
+                # Stride of 3: key, score, field_list
+                for i in range(1, len(raw_result) - 2, 3):
+                    score = raw_result[i + 1]
+                    row_data = raw_result[i + 2]
+                    row = dict(zip(row_data[::2], row_data[1::2]))
+                    row[score_alias or "__score"] = score
+                    rows.append(row)
+            else:
+                # Standard format: [count, key1, [fields1], key2, [fields2], ...]
+                for i in range(2, len(raw_result), 2):
+                    row_data = raw_result[i]
+                    row = dict(zip(row_data[::2], row_data[1::2]))
+                    rows.append(row)
         else:
             # FT.AGGREGATE format: [count, [fields1], [fields2], ...]
             for row_data in raw_result[1:]:
@@ -258,11 +271,23 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
         rows = []
 
         if translated.command == "FT.SEARCH":
-            # FT.SEARCH format: [count, key1, [fields1], key2, [fields2], ...]
-            for i in range(2, len(raw_result), 2):
-                row_data = raw_result[i]
-                row = dict(zip(row_data[::2], row_data[1::2]))
-                rows.append(row)
+            with_scores = "WITHSCORES" in translated.args
+            score_alias = translated.score_alias
+
+            if with_scores:
+                # WITHSCORES format: [count, key1, score1, [fields1], ...]
+                for i in range(1, len(raw_result) - 2, 3):
+                    score = raw_result[i + 1]
+                    row_data = raw_result[i + 2]
+                    row = dict(zip(row_data[::2], row_data[1::2]))
+                    row[score_alias or "__score"] = score
+                    rows.append(row)
+            else:
+                # Standard format: [count, key1, [fields1], key2, [fields2], ...]
+                for i in range(2, len(raw_result), 2):
+                    row_data = raw_result[i]
+                    row = dict(zip(row_data[::2], row_data[1::2]))
+                    rows.append(row)
         else:
             # FT.AGGREGATE format: [count, [fields1], [fields2], ...]
             for row_data in raw_result[1:]:
diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index e37cfcd..4343342 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -164,6 +164,9 @@ class Condition:
     operator: str
     value: object
     negated: bool = False
+    fuzzy_level: int | None = None  # Levenshtein distance for FUZZY (1, 2, or 3)
+    slop: int | None = None  # Max distance between terms for proximity search
+    inorder: bool = False  # Require terms in order (used with slop)
 
 
 @dataclass
@@ -196,6 +199,17 @@ class GeoDistanceSelect:
     unit: str = "m"  # m, km, mi, ft (default: meters)
 
 
+@dataclass
+class ScoringSpec:
+    """Specification for relevance scoring.
+
+    Triggers WITHSCORES and optional SCORER on FT.SEARCH.
+    """
+
+    alias: str = "score"  # Column alias for the score
+    scorer: str = "BM25"  # Scorer algorithm (BM25, TFIDF, DISMAX, etc.)
+
+
 @dataclass
 class ParsedQuery:
     """Result of parsing a SQL query."""
@@ -219,6 +233,9 @@ class ParsedQuery:
     limit: int | None = None
     offset: int | None = None
     filters: list[str] = dataclasses.field(default_factory=list)
+    scoring: ScoringSpec | None = None  # Relevance scoring config
+    verbatim: bool = False  # If True, add VERBATIM to FT.SEARCH
+    nostopwords: bool = False  # If True, add NOSTOPWORDS to FT.SEARCH
 
 
 class SQLParser:
@@ -441,6 +458,17 @@ def _process_select_expression_inner(
             elif func_name_lower == "geo_distance":
                 # geo_distance(field, POINT(lon, lat), unit) in SELECT
                 self._process_geo_distance_select(expression, result, alias)
+            elif func_name_lower == "score":
+                # score() or score('BM25') — triggers WITHSCORES + SCORER
+                scorer = "BM25"
+                if expression.expressions:
+                    scorer_val = self._extract_literal_value(expression.expressions[0])
+                    if scorer_val is not None:
+                        scorer = str(scorer_val).upper()
+                result.scoring = ScoringSpec(
+                    alias=alias or "score",
+                    scorer=scorer,
+                )
             elif func_name_lower in redis_reducers:
                 # Redis-specific reducer functions
                 field_name = None
@@ -656,6 +684,9 @@ def _process_where_clause(
             self._add_between_condition(expression, result, negated)
         elif isinstance(expression, exp.In):
             self._add_in_condition(expression, result, negated)
+        elif isinstance(expression, exp.Like):
+            # LIKE 'pattern%' / '%pattern' / '%pattern%'
+            self._add_condition(expression, "LIKE", result, negated)
         elif isinstance(expression, exp.And):
             result.boolean_operator = "AND"
             self._process_where_clause(expression.this, result, negated)
@@ -938,25 +969,59 @@ def _add_in_condition(self, expression, result: ParsedQuery, negated: bool) -> N
     def _add_function_condition(
         self, expression, result: ParsedQuery, negated: bool
     ) -> None:
-        """Add a condition from a function call like fulltext(field, value)."""
+        """Add a condition from a function call like fulltext(field, value) or fuzzy(field, value, level)."""
         func_name = expression.name.upper()
-        if func_name == "FULLTEXT" and len(expression.expressions) >= 2:
-            first_arg = expression.expressions[0]
-            second_arg = expression.expressions[1]
+        args = expression.expressions
+
+        if func_name == "FULLTEXT" and len(args) >= 2:
+            field_name = args[0].name if isinstance(args[0], exp.Column) else None
+            value = self._extract_literal_value(args[1])
+
+            # Optional 3rd arg: slop (int)
+            slop = None
+            if len(args) >= 3:
+                slop_val = self._extract_literal_value(args[2])
+                if slop_val is not None:
+                    slop = int(slop_val)
+
+            # Optional 4th arg: inorder (boolean-like: 1/0 or true/false)
+            inorder = False
+            if len(args) >= 4:
+                inorder_val = self._extract_literal_value(args[3])
+                if inorder_val is not None:
+                    inorder = str(inorder_val).lower() in ("1", "true")
 
-            field_name = None
-            if isinstance(first_arg, exp.Column):
-                field_name = first_arg.name
+            if field_name is not None:
+                result.conditions.append(
+                    Condition(
+                        field=field_name,
+                        operator="FULLTEXT",
+                        value=value,
+                        negated=negated,
+                        slop=slop,
+                        inorder=inorder,
+                    )
+                )
 
-            value = self._extract_literal_value(second_arg)
+        elif func_name == "FUZZY" and len(args) >= 2:
+            field_name = args[0].name if isinstance(args[0], exp.Column) else None
+            value = self._extract_literal_value(args[1])
+
+            # Optional 3rd arg: fuzzy level (1, 2, or 3)
+            fuzzy_level = None
+            if len(args) >= 3:
+                level_val = self._extract_literal_value(args[2])
+                if level_val is not None:
+                    fuzzy_level = int(level_val)
 
             if field_name is not None:
                 result.conditions.append(
                     Condition(
                         field=field_name,
-                        operator="FULLTEXT",
+                        operator="FUZZY",
                         value=value,
                         negated=negated,
+                        fuzzy_level=fuzzy_level,
                     )
                 )
 
@@ -983,6 +1048,9 @@ def _extract_literal_value(self, expression, convert_dates: bool = False):
                 if timestamp is not None:
                     return timestamp
             return value
+        elif isinstance(expression, exp.Boolean):
+            # Handle TRUE/FALSE keywords parsed by sqlglot
+            return expression.this
         elif isinstance(expression, exp.Neg):
             # Handle negative numbers: Neg(Literal(122.4)) -> -122.4
             inner_value = self._extract_literal_value(expression.this)
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 86d989d..5a51eea 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -68,6 +68,10 @@ def build_text_condition(
         operator: str,
         value: str,
         negated: bool = False,
+        *,
+        fuzzy_level: int | None = None,
+        slop: int | None = None,
+        inorder: bool = False,
     ) -> str:
         """Build query syntax for TEXT field conditions.
 
@@ -76,6 +80,9 @@ def build_text_condition(
             operator: One of =, !=, FULLTEXT, LIKE, FUZZY.
             value: The search term or pattern.
             negated: If True, prefix with - for negation.
+            fuzzy_level: Levenshtein distance for FUZZY (1, 2, or 3). Default 1.
+            slop: Maximum distance between terms for proximity search.
+            inorder: If True with slop, require terms in order.
 
         Returns:
             RediSearch query syntax like @field:"exact phrase" or @field:(term1 term2).
@@ -91,19 +98,24 @@ def build_text_condition(
 
         # Handle different operators
         if operator == "LIKE":
-            # Convert SQL LIKE pattern (%) to RediSearch prefix (*)
+            # Convert SQL LIKE pattern (%) to RediSearch prefix/suffix/infix (*)
             search_value = value.replace("%", "*")
         elif operator == "FUZZY":
-            # Wrap with % for fuzzy matching
-            search_value = f"%{value}%"
+            # Wrap with % signs — count determined by fuzzy_level
+            level = fuzzy_level if fuzzy_level is not None else 1
+            if level not in (1, 2, 3):
+                raise ValueError(
+                    f"Fuzzy level must be 1, 2, or 3 (got {level}). "
+                    "RediSearch supports a maximum Levenshtein distance of 3."
+                )
+            pct = "%" * level
+            search_value = f"{pct}{value}{pct}"
         elif operator in ("=", "!="):
             # Exact phrase match — always wrap in quotes, preserve stopwords.
-            # This ensures "bank of america" stays as-is rather than
-            # being tokenized or having stopwords stripped.
             escaped = self._escape_text_value(value)
             search_value = f'"{escaped}"'
-        elif " " in value:
-            # MATCH with multi-word: tokenized search with stopword filtering
+        elif " " in value and " OR " not in value:
+            # FULLTEXT/MATCH with multi-word: tokenized search with stopword filtering
             words = value.split()
             removed_stopwords = [
                 w for w in words if w.lower() in REDIS_DEFAULT_STOPWORDS
@@ -122,13 +134,25 @@ def build_text_condition(
                     stacklevel=2,
                 )
 
-            # Use filtered words in parentheses (AND semantics), or original if all were stopwords
             terms = " ".join(filtered_words) if filtered_words else value
             search_value = f"({terms})"
+        elif " OR " in value:
+            # OR union within text field: split on ' OR ' and join with |
+            or_terms = [t.strip() for t in value.split(" OR ")]
+            search_value = f"({'|'.join(or_terms)})"
         else:
             search_value = value
 
-        return f"{prefix}@{field}:{search_value}"
+        base = f"{prefix}@{field}:{search_value}"
+
+        # Append query attributes (slop, inorder) if specified
+        if slop is not None:
+            attrs = f"$slop: {slop};"
+            if inorder:
+                attrs += " $inorder: true;"
+            base = f"{base} => {{ {attrs} }}"
+
+        return base
 
     def _escape_tag_value(self, value: str) -> str:
         """Escape special characters in TAG values."""
diff --git a/sql_redis/translator.py b/sql_redis/translator.py
index b594362..ced3753 100644
--- a/sql_redis/translator.py
+++ b/sql_redis/translator.py
@@ -28,6 +28,7 @@ class TranslatedQuery:
     query_string: str
     args: list[str] = field(default_factory=list)
     params: dict[str, object] = field(default_factory=dict)  # Named parameters
+    score_alias: str | None = None  # Alias for score column when WITHSCORES is used
 
     def to_command_list(self) -> list[str]:
         """Return as a list suitable for redis.execute_command()."""
@@ -230,6 +231,9 @@ def _build_condition(self, condition: Condition, field_type: str | None) -> str:
                 operator,
                 str(condition.value),
                 is_negated,
+                fuzzy_level=condition.fuzzy_level,
+                slop=condition.slop,
+                inorder=condition.inorder,
             )
         elif field_type == "TAG":
             # Keep list value for IN clauses, convert scalar to string
@@ -334,6 +338,18 @@ def _build_search(
             offset = parsed.offset or 0
             args.extend(["LIMIT", str(offset), str(parsed.limit)])
 
+        # Scoring — WITHSCORES and SCORER
+        if parsed.scoring is not None:
+            args.append("WITHSCORES")
+            if parsed.scoring.scorer:
+                args.extend(["SCORER", parsed.scoring.scorer])
+
+        # Verbatim / nostopwords flags
+        if parsed.verbatim:
+            args.append("VERBATIM")
+        if parsed.nostopwords:
+            args.append("NOSTOPWORDS")
+
         # DIALECT 2 — unconditionally appended as the last arguments
         args.extend(["DIALECT", "2"])
 
@@ -343,6 +359,7 @@ def _build_search(
             query_string=query_string,
             args=args,
             params=params,
+            score_alias=(parsed.scoring.alias if parsed.scoring is not None else None),
         )
 
     def _build_geo_filter_args(self, geo_cond: GeoDistanceCondition) -> list[str]:
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index aa9db0d..48b3e49 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -345,6 +345,171 @@ def test_wildcard_query(self):
         assert result == "*"
 
 
+class TestQueryBuilderFuzzyLevels:
+    """Tests for fuzzy matching with Levenshtein distance levels 1-3."""
+
+    def test_fuzzy_ld1_default(self):
+        """Fuzzy LD=1 (default): @field:%term%."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FUZZY", "laptap")
+        assert result == "@title:%laptap%"
+
+    def test_fuzzy_ld1_explicit(self):
+        """Fuzzy LD=1 (explicit): @field:%term%."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FUZZY", "laptap", fuzzy_level=1)
+        assert result == "@title:%laptap%"
+
+    def test_fuzzy_ld2(self):
+        """Fuzzy LD=2: @field:%%term%%."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FUZZY", "laptap", fuzzy_level=2)
+        assert result == "@title:%%laptap%%"
+
+    def test_fuzzy_ld3(self):
+        """Fuzzy LD=3: @field:%%%term%%%."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FUZZY", "laptap", fuzzy_level=3)
+        assert result == "@title:%%%laptap%%%"
+
+    def test_fuzzy_negated(self):
+        """Fuzzy with negation: -@field:%term%."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "title", "FUZZY", "laptap", negated=True, fuzzy_level=2
+        )
+        assert result == "-@title:%%laptap%%"
+
+    def test_fuzzy_invalid_level_raises(self):
+        """Fuzzy level outside 1-3 raises ValueError."""
+        builder = QueryBuilder()
+        with pytest.raises(ValueError, match="Fuzzy level must be 1, 2, or 3"):
+            builder.build_text_condition("title", "FUZZY", "laptap", fuzzy_level=4)
+
+    def test_fuzzy_level_zero_raises(self):
+        """Fuzzy level 0 raises ValueError."""
+        builder = QueryBuilder()
+        with pytest.raises(ValueError, match="Fuzzy level must be 1, 2, or 3"):
+            builder.build_text_condition("title", "FUZZY", "laptap", fuzzy_level=0)
+
+
+class TestQueryBuilderSuffixInfix:
+    """Tests for suffix and infix (contains) matching."""
+
+    def test_suffix_match(self):
+        """LIKE '%term' -> suffix match: @field:*term."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "LIKE", "%phone")
+        assert result == "@title:*phone"
+
+    def test_infix_match(self):
+        """LIKE '%term%' -> infix/contains match: @field:*term*."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "LIKE", "%phone%")
+        assert result == "@title:*phone*"
+
+    def test_prefix_match_still_works(self):
+        """LIKE 'term%' -> prefix match: @field:term* (unchanged)."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "LIKE", "lap%")
+        assert result == "@title:lap*"
+
+    def test_suffix_negated(self):
+        """Suffix match with negation."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "LIKE", "%phone", negated=True)
+        assert result == "-@title:*phone"
+
+
+class TestQueryBuilderORInText:
+    """Tests for OR/union within text field searches."""
+
+    def test_fulltext_or_terms(self):
+        """FULLTEXT with OR: @field:(term1|term2)."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "laptop OR tablet")
+        assert result == "@title:(laptop|tablet)"
+
+    def test_fulltext_or_multiple_terms(self):
+        """FULLTEXT with multiple OR: @field:(t1|t2|t3)."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "title", "FULLTEXT", "laptop OR tablet OR phone"
+        )
+        assert result == "@title:(laptop|tablet|phone)"
+
+    def test_fulltext_or_negated(self):
+        """FULLTEXT OR with negation: -@field:(term1|term2)."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "title", "FULLTEXT", "laptop OR tablet", negated=True
+        )
+        assert result == "-@title:(laptop|tablet)"
+
+    def test_fulltext_and_still_works(self):
+        """FULLTEXT without OR: @field:(term1 term2) (AND semantics, unchanged)."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "gaming laptop")
+        assert result == "@title:(gaming laptop)"
+
+
+class TestQueryBuilderProximity:
+    """Tests for proximity search (slop and inorder)."""
+
+    def test_fulltext_with_slop(self):
+        """FULLTEXT with slop: @field:(term1 term2) => {$slop: N}."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "title", "FULLTEXT", "gaming laptop", slop=2
+        )
+        assert result == "@title:(gaming laptop) => { $slop: 2; }"
+
+    def test_fulltext_with_slop_and_inorder(self):
+        """FULLTEXT with slop and inorder."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "title", "FULLTEXT", "gaming laptop", slop=2, inorder=True
+        )
+        assert result == "@title:(gaming laptop) => { $slop: 2; $inorder: true; }"
+
+    def test_exact_phrase_with_slop(self):
+        """Exact phrase with slop appended."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "=", "gaming laptop", slop=1)
+        assert result == '@title:"gaming laptop" => { $slop: 1; }'
+
+    def test_slop_negated(self):
+        """Proximity with negation."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "title", "FULLTEXT", "gaming laptop", negated=True, slop=3
+        )
+        assert result == "-@title:(gaming laptop) => { $slop: 3; }"
+
+
+class TestQueryBuilderVerbatim:
+    """Tests for verbatim and nostopwords flags."""
+
+    def test_fulltext_with_verbatim(self):
+        """FULLTEXT search term is not affected by verbatim (query-level flag)."""
+        # verbatim is a query-level flag, not part of the condition string
+        # This test just ensures normal behavior is preserved
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "running")
+        assert result == "@title:running"
+
+
+class TestQueryBuilderOptionalTerms:
+    """Tests for optional term (~) syntax."""
+
+    def test_fulltext_optional_term(self):
+        """FULLTEXT with optional terms using ~ prefix in value."""
+        builder = QueryBuilder()
+        # User writes: fulltext(field, 'required ~optional')
+        result = builder.build_text_condition("title", "FULLTEXT", "laptop ~gaming")
+        assert result == "@title:(laptop ~gaming)"
+
+
 class TestQueryBuilderMissingCondition:
     """Tests for ismissing() query syntax."""
 
diff --git a/tests/test_sql_queries.py b/tests/test_sql_queries.py
index 5758349..0fb7b9b 100644
--- a/tests/test_sql_queries.py
+++ b/tests/test_sql_queries.py
@@ -340,3 +340,135 @@ def test_limit_with_offset(self, executor: Executor, products_data: str):
         if len(all_books.rows) > 1 and len(paginated.rows) >= 1:
             # Second item from all_books should be first in paginated result
             assert all_books.rows[1]["title"] == paginated.rows[0]["title"]
+
+
+class TestFuzzySearch:
+    """Integration tests for fuzzy text search with Levenshtein distance levels."""
+
+    def test_fuzzy_ld1_finds_misspelled(self, executor: Executor, products_data: str):
+        """fuzzy(field, 'laptap') at LD=1 should find 'laptop' titles."""
+        result = executor.execute(
+            f"SELECT title FROM {products_data} WHERE fuzzy(title, 'laptap')"
+        )
+        assert len(result.rows) >= 1, "Fuzzy LD=1 should match 'laptop' from 'laptap'"
+        for row in result.rows:
+            assert "laptop" in row["title"].lower()
+
+    def test_fuzzy_ld2(self, executor: Executor, products_data: str):
+        """fuzzy(field, 'laptep', 2) at LD=2 should still find 'laptop'."""
+        result = executor.execute(
+            f"SELECT title FROM {products_data} WHERE fuzzy(title, 'laptep', 2)"
+        )
+        assert len(result.rows) >= 1, "Fuzzy LD=2 should match 'laptop' from 'laptep'"
+
+    def test_fuzzy_ld3(self, executor: Executor, products_data: str):
+        """fuzzy(field, 'loptep', 3) at LD=3 should find 'laptop'."""
+        result = executor.execute(
+            f"SELECT title FROM {products_data} WHERE fuzzy(title, 'loptep', 3)"
+        )
+        assert len(result.rows) >= 1, "Fuzzy LD=3 should match 'laptop' from 'loptep'"
+
+
+class TestSuffixInfixSearch:
+    """Integration tests for suffix and infix (contains) pattern matching."""
+
+    def test_prefix_search(self, executor: Executor, products_data: str):
+        """LIKE 'lap%' should find laptop titles (prefix match)."""
+        result = executor.execute(
+            f"SELECT title FROM {products_data} WHERE title LIKE 'lap%'"
+        )
+        assert len(result.rows) >= 1, "Prefix 'lap%' should match laptop titles"
+
+    def test_suffix_search(self, executor: Executor, products_data: str):
+        """LIKE '%board' should find keyboard titles (suffix match)."""
+        result = executor.execute(
+            f"SELECT title FROM {products_data} WHERE title LIKE '%board'"
+        )
+        # "Mechanical Keyboard" has 'board' at end of 'Keyboard'
+        assert len(result.rows) >= 1, "Suffix '%board' should match 'Keyboard'"
+
+    def test_infix_search(self, executor: Executor, products_data: str):
+        """LIKE '%ouse%' should find 'Wireless Mouse' (contains match)."""
+        result = executor.execute(
+            f"SELECT title FROM {products_data} WHERE title LIKE '%ouse%'"
+        )
+        assert len(result.rows) >= 1, "Infix '%ouse%' should match 'Mouse'"
+
+
+class TestORInTextSearch:
+    """Integration tests for OR/union within text field searches."""
+
+    def test_fulltext_or_two_terms(self, executor: Executor, products_data: str):
+        """fulltext(field, 'laptop OR keyboard') should find both."""
+        result = executor.execute(
+            f"SELECT title FROM {products_data} WHERE fulltext(title, 'laptop OR keyboard')"
+        )
+        titles = [row["title"].lower() for row in result.rows]
+        has_laptop = any("laptop" in t for t in titles)
+        has_keyboard = any("keyboard" in t for t in titles)
+        assert (
+            has_laptop and has_keyboard
+        ), f"Should find both laptop and keyboard titles, got: {titles}"
+
+    def test_fulltext_or_three_terms(self, executor: Executor, products_data: str):
+        """fulltext(field, 'laptop OR mouse OR lamp') should find all three."""
+        result = executor.execute(
+            f"SELECT title FROM {products_data} WHERE fulltext(title, 'laptop OR mouse OR lamp')"
+        )
+        assert (
+            len(result.rows) >= 3
+        ), f"Should find at least 3 products (laptop, mouse, lamp), got {len(result.rows)}"
+
+
+class TestProximitySearch:
+    """Integration tests for proximity search (slop + inorder)."""
+
+    def test_fulltext_with_slop(self, executor: Executor, products_data: str):
+        """fulltext(title, 'gaming pro', 2) should find 'Gaming laptop Pro'."""
+        result = executor.execute(
+            f"SELECT title FROM {products_data} WHERE fulltext(title, 'gaming pro', 2)"
+        )
+        assert (
+            len(result.rows) >= 1
+        ), "Slop=2 should find 'Gaming laptop Pro' (1 word between gaming and pro)"
+
+    def test_fulltext_with_slop_and_inorder(
+        self, executor: Executor, products_data: str
+    ):
+        """fulltext(title, 'gaming pro', 2, true) with inorder should match."""
+        result = executor.execute(
+            f"SELECT title FROM {products_data} WHERE fulltext(title, 'gaming pro', 2, true)"
+        )
+        assert (
+            len(result.rows) >= 1
+        ), "Slop=2 with inorder should find 'Gaming laptop Pro'"
+
+
+class TestBM25Scoring:
+    """Integration tests for relevance scoring with WITHSCORES."""
+
+    def test_score_returns_relevance(self, executor: Executor, products_data: str):
+        """score() in SELECT should return relevance scores."""
+        result = executor.execute(
+            f"""SELECT title, score() AS relevance
+            FROM {products_data}
+            WHERE fulltext(title, 'laptop')"""
+        )
+        assert len(result.rows) >= 1, "Should return results with scores"
+        for row in result.rows:
+            assert "relevance" in row, f"Row should have 'relevance' key: {row}"
+            score = float(row["relevance"])
+            assert score >= 0, f"Score should be non-negative, got {score}"
+
+    def test_score_custom_scorer(self, executor: Executor, products_data: str):
+        """score('TFIDF') should use TFIDF scorer."""
+        result = executor.execute(
+            f"""SELECT title, score('TFIDF') AS relevance
+            FROM {products_data}
+            WHERE fulltext(title, 'laptop')"""
+        )
+        assert len(result.rows) >= 1, "Should return results with TFIDF scores"
+        for row in result.rows:
+            assert "relevance" in row
+            score = float(row["relevance"])
+            assert score >= 0
diff --git a/tests/test_translator.py b/tests/test_translator.py
index 622e1f9..1c0c702 100644
--- a/tests/test_translator.py
+++ b/tests/test_translator.py
@@ -616,3 +616,147 @@ def test_select_star_with_having_uses_load_all(
         assert "LOAD" in result.args
         load_idx = result.args.index("LOAD")
         assert result.args[load_idx + 1] == "*"
+
+
+class TestTranslatorFuzzyLevels:
+    """Tests for FUZZY with Levenshtein distance levels.
+
+    Inspired by PostgreSQL's pg_trgm similarity threshold levels,
+    maps to RediSearch's %, %%, %%% fuzzy syntax.
+    """
+
+    def test_fuzzy_ld1_default(self, translator: Translator, basic_index: str):
+        """fuzzy(field, 'term') with no level → LD=1 (%term%)."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE fuzzy(title, 'laptap')"
+        )
+        assert result.command == "FT.SEARCH"
+        assert "@title:%laptap%" in result.query_string
+
+    def test_fuzzy_ld2(self, translator: Translator, basic_index: str):
+        """fuzzy(field, 'term', 2) → LD=2 (%%term%%)."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE fuzzy(title, 'laptap', 2)"
+        )
+        assert "@title:%%laptap%%" in result.query_string
+
+    def test_fuzzy_ld3(self, translator: Translator, basic_index: str):
+        """fuzzy(field, 'term', 3) → LD=3 (%%%term%%%)."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE fuzzy(title, 'laptap', 3)"
+        )
+        assert "@title:%%%laptap%%%" in result.query_string
+
+
+class TestTranslatorSuffixInfix:
+    """Tests for suffix and infix (contains) pattern matching.
+
+    PostgreSQL analogy: LIKE '%term' and LIKE '%term%'.
+    RediSearch uses *term and *term* respectively.
+    """
+
+    def test_suffix_match(self, translator: Translator, basic_index: str):
+        """LIKE '%phone' → suffix match @field:*phone."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE title LIKE '%phone'"
+        )
+        assert "@title:*phone" in result.query_string
+
+    def test_infix_match(self, translator: Translator, basic_index: str):
+        """LIKE '%phone%' → infix/contains match @field:*phone*."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE title LIKE '%phone%'"
+        )
+        assert "@title:*phone*" in result.query_string
+
+    def test_prefix_still_works(self, translator: Translator, basic_index: str):
+        """LIKE 'lap%' → prefix match @field:lap* (unchanged)."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE title LIKE 'lap%'"
+        )
+        assert "@title:lap*" in result.query_string
+
+
+class TestTranslatorORInText:
+    """Tests for OR/union within text field searches.
+
+    Inspired by PostgreSQL's to_tsquery('fat | rat') and
+    websearch_to_tsquery('fat OR rat') — natural OR syntax
+    maps to RediSearch's @field:(term1|term2).
+    """
+
+    def test_fulltext_or(self, translator: Translator, basic_index: str):
+        """fulltext(field, 'laptop OR tablet') → @field:(laptop|tablet)."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE fulltext(title, 'laptop OR tablet')"
+        )
+        assert "@title:(laptop|tablet)" in result.query_string
+
+    def test_fulltext_multiple_or(self, translator: Translator, basic_index: str):
+        """fulltext(field, 'a OR b OR c') → @field:(a|b|c)."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE fulltext(title, 'laptop OR tablet OR phone')"
+        )
+        assert "@title:(laptop|tablet|phone)" in result.query_string
+
+
+class TestTranslatorProximity:
+    """Tests for proximity search (slop + inorder).
+
+    Inspired by PostgreSQL's phraseto_tsquery / <N> FOLLOWED BY operator.
+    Maps to RediSearch query attributes: => { $slop: N; $inorder: true; }.
+    """
+
+    def test_fulltext_with_slop(self, translator: Translator, basic_index: str):
+        """fulltext(field, 'gaming laptop', 2) → slop=2 query attribute."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE fulltext(title, 'gaming laptop', 2)"
+        )
+        assert "$slop: 2;" in result.query_string
+
+    def test_fulltext_with_slop_and_inorder(
+        self, translator: Translator, basic_index: str
+    ):
+        """fulltext(field, 'gaming laptop', 2, true) → slop=2 + inorder."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE fulltext(title, 'gaming laptop', 2, true)"
+        )
+        assert "$slop: 2;" in result.query_string
+        assert "$inorder: true;" in result.query_string
+
+
+class TestTranslatorScoring:
+    """Tests for relevance scoring (WITHSCORES + SCORER).
+
+    Inspired by PostgreSQL's ts_rank(vector, query) AS rank in SELECT.
+    Maps to RediSearch's WITHSCORES and SCORER flags on FT.SEARCH.
+
+    SQL: SELECT name, score() AS relevance FROM idx WHERE fulltext(...)
+    Redis: FT.SEARCH idx "@field:(term)" WITHSCORES SCORER BM25
+    """
+
+    def test_score_default_bm25(self, translator: Translator, basic_index: str):
+        """score() in SELECT → WITHSCORES + SCORER BM25."""
+        result = translator.translate(
+            f"SELECT title, score() AS relevance FROM {basic_index} WHERE fulltext(title, 'laptop')"
+        )
+        assert "WITHSCORES" in result.args
+        assert "SCORER" in result.args
+        scorer_idx = result.args.index("SCORER")
+        assert result.args[scorer_idx + 1] == "BM25"
+
+    def test_score_custom_scorer(self, translator: Translator, basic_index: str):
+        """score('TFIDF') in SELECT → WITHSCORES + SCORER TFIDF."""
+        result = translator.translate(
+            f"SELECT title, score('TFIDF') AS relevance FROM {basic_index} WHERE fulltext(title, 'laptop')"
+        )
+        assert "WITHSCORES" in result.args
+        scorer_idx = result.args.index("SCORER")
+        assert result.args[scorer_idx + 1] == "TFIDF"
+
+    def test_no_score_no_withscores(self, translator: Translator, basic_index: str):
+        """Without score() → no WITHSCORES flag."""
+        result = translator.translate(
+            f"SELECT title FROM {basic_index} WHERE fulltext(title, 'laptop')"
+        )
+        assert "WITHSCORES" not in result.args

From 94c9d458d88dbbd7848a2afc3167dc676158af0f Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Tue, 31 Mar 2026 16:00:05 -0400
Subject: [PATCH 03/28] fix: multi-field text search applies escaping/negation
 for =/!= operators

Addresses Copilot review feedback:
- Multi-field early return now applies _escape_text_value and prefix for =/!=
- Documented MATCH as internal alias for FULLTEXT in docstring
---
 sql_redis/query_builder.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 5a51eea..3eb4de8 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -77,7 +77,7 @@ def build_text_condition(
 
         Args:
             field: Field name or list of field names for multi-field search.
-            operator: One of =, !=, FULLTEXT, LIKE, FUZZY.
+            operator: One of =, !=, FULLTEXT (or MATCH alias), LIKE, FUZZY.
             value: The search term or pattern.
             negated: If True, prefix with - for negation.
             fuzzy_level: Levenshtein distance for FUZZY (1, 2, or 3). Default 1.
@@ -91,10 +91,13 @@ def build_text_condition(
         # consistent with how build_tag_condition handles != via operator.
         prefix = "-" if negated or operator == "!=" else ""
 
-        # Handle multi-field search
+        # Handle multi-field search — apply same escaping/operator semantics
         if isinstance(field, list):
             field_str = "|".join(field)
-            return f"(@{field_str}:{value})"
+            if operator in ("=", "!="):
+                escaped = self._escape_text_value(value)
+                return f'{prefix}(@{field_str}:"{escaped}")'
+            return f"{prefix}(@{field_str}:{value})"
 
         # Handle different operators
         if operator == "LIKE":

From 1ec2b007498839e9c8bd3469b023745b4b918956 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 31 Mar 2026 20:08:50 +0000
Subject: [PATCH 04/28] =?UTF-8?q?fix:=20address=20review=20feedback=20?=
 =?UTF-8?q?=E2=80=94=20FULLTEXT=20consistency,=20term=20escaping,=20Black?=
 =?UTF-8?q?=20formatting?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Agent-Logs-Url: https://github.com/redis-developer/sql-redis/sessions/a931f501-2012-4aa2-8d18-2bca615d32be

Co-authored-by: nkanu17 <47899917+nkanu17@users.noreply.github.com>
---
 sql_redis/query_builder.py  |  51 +++++++++++++++--
 tests/test_query_builder.py |  11 +++-
 tests/test_sql_queries.py   | 108 ++++++++++++------------------------
 3 files changed, 90 insertions(+), 80 deletions(-)

diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 3eb4de8..41e8f22 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -51,6 +51,12 @@ class QueryBuilder:
     # Characters that need escaping in TAG values
     TAG_SPECIAL_CHARS = r".,<>{}[]\"':;!@#$%^&*()-+=~"
 
+    # Characters that have special meaning in RediSearch free-text queries
+    # (outside of double-quoted phrases) and must be escaped with a backslash.
+    # Only characters likely to appear accidentally in user data are included;
+    # intentional RediSearch features (~, *, %, ^) are intentionally excluded.
+    TEXT_QUERY_SPECIAL_CHARS = frozenset({"\\", "-", "@", "|", "(", ")"})
+
     @staticmethod
     def _escape_text_value(value: str) -> str:
         """Escape characters that are special inside RediSearch double-quoted phrases.
@@ -62,6 +68,23 @@ def _escape_text_value(value: str) -> str:
         # then escape double quotes.
         return value.replace("\\", "\\\\").replace('"', '\\"')
 
+    @classmethod
+    def _escape_fulltext_term(cls, term: str) -> str:
+        """Escape characters that have special meaning in RediSearch free-text queries.
+
+        Applied to individual terms used outside of double-quoted phrases (e.g.,
+        in parenthesized FULLTEXT expressions) so that user input containing
+        RediSearch operator characters like |, -, (, ), @ does not alter the
+        query semantics or produce syntax errors.
+        """
+        result = []
+        for char in term:
+            if char in cls.TEXT_QUERY_SPECIAL_CHARS:
+                result.append(f"\\{char}")
+            else:
+                result.append(char)
+        return "".join(result)
+
     def build_text_condition(
         self,
         field: str | list[str],
@@ -77,7 +100,11 @@ def build_text_condition(
 
         Args:
             field: Field name or list of field names for multi-field search.
-            operator: One of =, !=, FULLTEXT (or MATCH alias), LIKE, FUZZY.
+            operator: One of =, !=, FULLTEXT, LIKE, FUZZY.
+                - = / !=: exact phrase match, value wrapped in double quotes.
+                - FULLTEXT: tokenized keyword search with stopword filtering.
+                - LIKE: prefix/suffix/infix pattern (SQL % → RediSearch *).
+                - FUZZY: Levenshtein fuzzy match.
             value: The search term or pattern.
             negated: If True, prefix with - for negation.
             fuzzy_level: Levenshtein distance for FUZZY (1, 2, or 3). Default 1.
@@ -118,7 +145,9 @@ def build_text_condition(
             escaped = self._escape_text_value(value)
             search_value = f'"{escaped}"'
         elif " " in value and " OR " not in value:
-            # FULLTEXT/MATCH with multi-word: tokenized search with stopword filtering
+            # FULLTEXT with multi-word: tokenized search with stopword filtering.
+            # Each term is escaped to prevent RediSearch operator characters in
+            # user input from changing query semantics.
             words = value.split()
             removed_stopwords = [
                 w for w in words if w.lower() in REDIS_DEFAULT_STOPWORDS
@@ -137,14 +166,24 @@ def build_text_condition(
                     stacklevel=2,
                 )
 
-            terms = " ".join(filtered_words) if filtered_words else value
-            search_value = f"({terms})"
+            if filtered_words:
+                escaped_terms = " ".join(
+                    self._escape_fulltext_term(w) for w in filtered_words
+                )
+            else:
+                # All words were stopwords; pass them through (escaped) so the
+                # query doesn't become empty. RediSearch will still skip them at
+                # query time, but this avoids a syntax error from an empty clause.
+                escaped_terms = " ".join(self._escape_fulltext_term(w) for w in words)
+            search_value = f"({escaped_terms})"
         elif " OR " in value:
             # OR union within text field: split on ' OR ' and join with |
-            or_terms = [t.strip() for t in value.split(" OR ")]
+            or_terms = [
+                self._escape_fulltext_term(t.strip()) for t in value.split(" OR ")
+            ]
             search_value = f"({'|'.join(or_terms)})"
         else:
-            search_value = value
+            search_value = self._escape_fulltext_term(value)
 
         base = f"{prefix}@{field}:{search_value}"
 
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index 48b3e49..acac971 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -71,7 +71,7 @@ def test_text_negation(self):
         """TEXT field with NOT: -@field:term."""
         builder = QueryBuilder()
         result = builder.build_text_condition(
-            "title", "MATCH", "refurbished", negated=True
+            "title", "FULLTEXT", "refurbished", negated=True
         )
 
         assert result == "-@title:refurbished"
@@ -83,11 +83,18 @@ def test_text_fuzzy_match(self):
 
         assert result == "@title:%laptap%"
 
+    def test_text_fulltext_special_chars_escaped(self):
+        """FULLTEXT term with RediSearch operator chars is escaped to avoid injection."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("description", "FULLTEXT", "anti-virus")
+
+        assert result == r"@description:anti\-virus"
+
     def test_text_multi_field(self):
         """TEXT multi-field search: (@field1|field2:term)."""
         builder = QueryBuilder()
         result = builder.build_text_condition(
-            ["title", "description"], "MATCH", "wireless"
+            ["title", "description"], "FULLTEXT", "wireless"
         )
 
         assert result == "(@title|description:wireless)"
diff --git a/tests/test_sql_queries.py b/tests/test_sql_queries.py
index 0fb7b9b..87086e0 100644
--- a/tests/test_sql_queries.py
+++ b/tests/test_sql_queries.py
@@ -36,15 +36,13 @@ def test_match_with_price_filter_and_ordering(
     ):
         """SQL equivalent of FT.AGGREGATE with text match and numeric filter."""
         # For TEXT fields, = becomes a text search in Redis
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT title, price
             FROM {products_data}
             WHERE title = 'laptop' AND price < 1000
             ORDER BY price ASC
             LIMIT 10
-            """
-        )
+            """)
         assert len(result.rows) >= 1, "Should return at least one laptop under $1000"
         # Verify results are sorted by price ascending
         prices = [float(row["price"]) for row in result.rows]
@@ -94,15 +92,13 @@ class TestGroupByWithCount:
 
     def test_count_with_filter(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with GROUPBY and COUNT."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT category, COUNT(*) AS count
             FROM {products_data}
             WHERE price >= 50
             GROUP BY category
             ORDER BY count DESC
-            """
-        )
+            """)
         assert len(result.rows) >= 1, "Should return grouped results"
         for row in result.rows:
             assert "category" in row
@@ -114,15 +110,13 @@ class TestMultipleAggregations:
 
     def test_count_sum_avg_aggregations(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with multiple REDUCE operations."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT category, COUNT(*) AS product_count, SUM(price) AS total_price, AVG(rating) AS avg_rating
             FROM {products_data}
             GROUP BY category
             ORDER BY total_price DESC
             LIMIT 10
-            """
-        )
+            """)
         assert len(result.rows) >= 1, "Should return aggregated results"
         row = result.rows[0]
         assert "product_count" in row
@@ -135,13 +129,11 @@ class TestGlobalAggregation:
 
     def test_aggregation_without_group_by(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with GROUPBY 0 for global aggregation."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT COUNT(*) AS total_count, AVG(price) AS avg_price
             FROM {products_data}
             WHERE price > 100
-            """
-        )
+            """)
         assert len(result.rows) == 1, "Should return single aggregation row"
         row = result.rows[0]
         assert "total_count" in row
@@ -153,14 +145,12 @@ class TestApplyWithComputedFields:
 
     def test_computed_field_expression(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with APPLY for computed fields."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT price, price * 0.9 AS discounted_price
             FROM {products_data}
             WHERE price > 100
             ORDER BY discounted_price DESC
-            """
-        )
+            """)
         assert len(result.rows) >= 1, "Should return results with computed field"
         for row in result.rows:
             price = float(row["price"])
@@ -169,14 +159,12 @@ def test_computed_field_expression(self, executor: Executor, products_data: str)
 
     def test_computed_field_addition(self, executor: Executor, products_data: str):
         """Computed field with addition."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT price, price + 10 AS price_with_shipping
             FROM {products_data}
             WHERE price < 200
             LIMIT 5
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -185,14 +173,12 @@ def test_computed_field_addition(self, executor: Executor, products_data: str):
 
     def test_computed_field_division(self, executor: Executor, products_data: str):
         """Computed field with division for percentage."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT price, price / 100 AS price_in_hundreds
             FROM {products_data}
             WHERE price >= 100
             LIMIT 5
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -201,14 +187,12 @@ def test_computed_field_division(self, executor: Executor, products_data: str):
 
     def test_multiple_computed_fields(self, executor: Executor, products_data: str):
         """Multiple computed fields in one query."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT price, price * 0.9 AS sale_price, price * 1.1 AS markup_price
             FROM {products_data}
             WHERE price > 50
             LIMIT 5
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -223,13 +207,11 @@ class TestRangeQueryWithBetween:
 
     def test_between_and_greater_than(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with numeric range filters."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT title, price
             FROM {products_data}
             WHERE price BETWEEN 100 AND 500 AND stock >= 1
-            """
-        )
+            """)
         assert len(result.rows) >= 1, "Should return products in price range"
         for row in result.rows:
             price = float(row["price"])
@@ -241,52 +223,44 @@ class TestTagFieldMultiValueSearch:
 
     def test_in_clause_with_or(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with TAG field OR conditions."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT name
             FROM {products_data}
             WHERE tags IN ('sale', 'featured') OR category = 'electronics'
-            """
-        )
+            """)
         assert (
             len(result.rows) >= 1
         ), "Should return products matching tag OR conditions"
 
     def test_tag_in_clause_only(self, executor: Executor, products_data: str):
         """IN clause on TAG field without OR."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT name, category
             FROM {products_data}
             WHERE category IN ('electronics', 'books')
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] in ["electronics", "books"]
 
     def test_tag_equality(self, executor: Executor, products_data: str):
         """Simple TAG equality filter."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT name, category
             FROM {products_data}
             WHERE category = 'electronics'
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] == "electronics"
 
     def test_or_with_same_field_type(self, executor: Executor, products_data: str):
         """OR condition across same field type (TAG)."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT name, category
             FROM {products_data}
             WHERE category = 'electronics' OR category = 'books'
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] in ["electronics", "books"]
@@ -295,13 +269,11 @@ def test_or_with_different_field_types(
         self, executor: Executor, products_data: str
     ):
         """OR condition across different field types (TAG and NUMERIC)."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT name, category, price
             FROM {products_data}
             WHERE category = 'books' OR price > 800
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             is_book = row["category"] == "books"
@@ -315,25 +287,21 @@ class TestPaginationWithOffset:
     def test_limit_with_offset(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with LIMIT offset count."""
         # First get all books sorted
-        all_books = executor.execute(
-            f"""
+        all_books = executor.execute(f"""
             SELECT title, price
             FROM {products_data}
             WHERE category = 'books'
             ORDER BY price DESC
-            """
-        )
+            """)
 
         # Then get with offset (page 2, page size 1)
-        paginated = executor.execute(
-            f"""
+        paginated = executor.execute(f"""
             SELECT title, price
             FROM {products_data}
             WHERE category = 'books'
             ORDER BY price DESC
             LIMIT 1 OFFSET 1
-            """
-        )
+            """)
 
         assert len(paginated.rows) >= 1, "Should return paginated results"
         # If we have enough results, verify offset works
@@ -449,11 +417,9 @@ class TestBM25Scoring:
 
     def test_score_returns_relevance(self, executor: Executor, products_data: str):
         """score() in SELECT should return relevance scores."""
-        result = executor.execute(
-            f"""SELECT title, score() AS relevance
+        result = executor.execute(f"""SELECT title, score() AS relevance
             FROM {products_data}
-            WHERE fulltext(title, 'laptop')"""
-        )
+            WHERE fulltext(title, 'laptop')""")
         assert len(result.rows) >= 1, "Should return results with scores"
         for row in result.rows:
             assert "relevance" in row, f"Row should have 'relevance' key: {row}"
@@ -462,11 +428,9 @@ def test_score_returns_relevance(self, executor: Executor, products_data: str):
 
     def test_score_custom_scorer(self, executor: Executor, products_data: str):
         """score('TFIDF') should use TFIDF scorer."""
-        result = executor.execute(
-            f"""SELECT title, score('TFIDF') AS relevance
+        result = executor.execute(f"""SELECT title, score('TFIDF') AS relevance
             FROM {products_data}
-            WHERE fulltext(title, 'laptop')"""
-        )
+            WHERE fulltext(title, 'laptop')""")
         assert len(result.rows) >= 1, "Should return results with TFIDF scores"
         for row in result.rows:
             assert "relevance" in row

From 7fb840dfa6cb5a25864c1c5e0cd06e0103701f5b Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Tue, 31 Mar 2026 17:08:51 -0400
Subject: [PATCH 05/28] fix: address Codex/Copilot review feedback (cycle 2)

- score() only SELECT emits RETURN 0 to prevent full document payload leak
- score() with FT.AGGREGATE raises ValueError (WITHSCORES is FT.SEARCH-only)
- Score alias collision guard in executor (both sync/async)
- Add _escape_fulltext_term with double-quote escaping
- Apply escaping to LIKE and FUZZY operators for special chars
- Escape multi-field non-exact text search values
- Mark verbatim/nostopwords as API-only fields (no SQL parser path yet)
- 9 new tests (128 total QB+translator), 411 total pass
---
 sql_redis/executor.py       |  11 +++-
 sql_redis/parser.py         |   1 +
 sql_redis/query_builder.py  |  73 ++++++++++++------------
 sql_redis/translator.py     |  18 +++++-
 tests/test_query_builder.py |  48 ++++++++++++++++
 tests/test_sql_queries.py   | 108 ++++++++++++++++++++++++------------
 tests/test_translator.py    |  24 ++++++++
 7 files changed, 205 insertions(+), 78 deletions(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index 4030a7c..f90b518 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -177,7 +177,11 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    row[score_alias or "__score"] = score
+                    alias = score_alias or "__score"
+                    # Guard: if alias collides with a document field, prefix it
+                    if alias in row:
+                        alias = f"__score_{alias}"
+                    row[alias] = score
                     rows.append(row)
             else:
                 # Standard format: [count, key1, [fields1], key2, [fields2], ...]
@@ -280,7 +284,10 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    row[score_alias or "__score"] = score
+                    alias = score_alias or "__score"
+                    if alias in row:
+                        alias = f"__score_{alias}"
+                    row[alias] = score
                     rows.append(row)
             else:
                 # Standard format: [count, key1, [fields1], key2, [fields2], ...]
diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index 4343342..c154159 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -234,6 +234,7 @@ class ParsedQuery:
     offset: int | None = None
     filters: list[str] = dataclasses.field(default_factory=list)
     scoring: ScoringSpec | None = None  # Relevance scoring config
+    # API-only flags — not set by SQL parsing, available for programmatic use
     verbatim: bool = False  # If True, add VERBATIM to FT.SEARCH
     nostopwords: bool = False  # If True, add NOSTOPWORDS to FT.SEARCH
 
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 41e8f22..16c34a3 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -52,30 +52,18 @@ class QueryBuilder:
     TAG_SPECIAL_CHARS = r".,<>{}[]\"':;!@#$%^&*()-+=~"
 
     # Characters that have special meaning in RediSearch free-text queries
-    # (outside of double-quoted phrases) and must be escaped with a backslash.
-    # Only characters likely to appear accidentally in user data are included;
-    # intentional RediSearch features (~, *, %, ^) are intentionally excluded.
-    TEXT_QUERY_SPECIAL_CHARS = frozenset({"\\", "-", "@", "|", "(", ")"})
-
-    @staticmethod
-    def _escape_text_value(value: str) -> str:
-        """Escape characters that are special inside RediSearch double-quoted phrases.
-
-        Backslashes and double quotes must be escaped so they don't break
-        the query syntax or alter its meaning.
-        """
-        # Escape backslashes first (so we don't double-escape the quote escapes),
-        # then escape double quotes.
-        return value.replace("\\", "\\\\").replace('"', '\\"')
+    # (outside double-quoted phrases). Must be escaped with backslash.
+    # Includes double-quote to prevent starting/ending quoted phrases.
+    TEXT_QUERY_SPECIAL_CHARS = set('\\|-()"@~!{}[]^$><=;:')
 
     @classmethod
     def _escape_fulltext_term(cls, term: str) -> str:
         """Escape characters that have special meaning in RediSearch free-text queries.
 
         Applied to individual terms used outside of double-quoted phrases (e.g.,
-        in parenthesized FULLTEXT expressions) so that user input containing
-        RediSearch operator characters like |, -, (, ), @ does not alter the
-        query semantics or produce syntax errors.
+        in parenthesized FULLTEXT expressions, LIKE, FUZZY) so that user input
+        containing RediSearch operator characters does not alter query semantics
+        or produce syntax errors.
         """
         result = []
         for char in term:
@@ -85,6 +73,17 @@ def _escape_fulltext_term(cls, term: str) -> str:
                 result.append(char)
         return "".join(result)
 
+    @staticmethod
+    def _escape_text_value(value: str) -> str:
+        """Escape characters that are special inside RediSearch double-quoted phrases.
+
+        Backslashes and double quotes must be escaped so they don't break
+        the query syntax or alter its meaning.
+        """
+        # Escape backslashes first (so we don't double-escape the quote escapes),
+        # then escape double quotes.
+        return value.replace("\\", "\\\\").replace('"', '\\"')
+
     def build_text_condition(
         self,
         field: str | list[str],
@@ -124,14 +123,19 @@ def build_text_condition(
             if operator in ("=", "!="):
                 escaped = self._escape_text_value(value)
                 return f'{prefix}(@{field_str}:"{escaped}")'
-            return f"{prefix}(@{field_str}:{value})"
+            escaped = self._escape_fulltext_term(value)
+            return f"{prefix}(@{field_str}:{escaped})"
 
         # Handle different operators
         if operator == "LIKE":
-            # Convert SQL LIKE pattern (%) to RediSearch prefix/suffix/infix (*)
-            search_value = value.replace("%", "*")
+            # Escape special chars in the non-wildcard portion, then convert % → *
+            # Split on %, escape each segment, rejoin with *
+            parts = value.split("%")
+            escaped_parts = [self._escape_fulltext_term(p) for p in parts]
+            search_value = "*".join(escaped_parts)
         elif operator == "FUZZY":
-            # Wrap with % signs — count determined by fuzzy_level
+            # Escape special chars before wrapping with % markers
+            escaped = self._escape_fulltext_term(value)
             level = fuzzy_level if fuzzy_level is not None else 1
             if level not in (1, 2, 3):
                 raise ValueError(
@@ -139,15 +143,15 @@ def build_text_condition(
                     "RediSearch supports a maximum Levenshtein distance of 3."
                 )
             pct = "%" * level
-            search_value = f"{pct}{value}{pct}"
+            search_value = f"{pct}{escaped}{pct}"
         elif operator in ("=", "!="):
             # Exact phrase match — always wrap in quotes, preserve stopwords.
             escaped = self._escape_text_value(value)
             search_value = f'"{escaped}"'
         elif " " in value and " OR " not in value:
-            # FULLTEXT with multi-word: tokenized search with stopword filtering.
-            # Each term is escaped to prevent RediSearch operator characters in
-            # user input from changing query semantics.
+            # FULLTEXT/MATCH with multi-word: tokenized search with stopword filtering.
+            # FULLTEXT is intentionally pass-through — users craft RediSearch queries
+            # via fulltext(), so operator chars like ~, |, - are preserved.
             words = value.split()
             removed_stopwords = [
                 w for w in words if w.lower() in REDIS_DEFAULT_STOPWORDS
@@ -166,23 +170,14 @@ def build_text_condition(
                     stacklevel=2,
                 )
 
-            if filtered_words:
-                escaped_terms = " ".join(
-                    self._escape_fulltext_term(w) for w in filtered_words
-                )
-            else:
-                # All words were stopwords; pass them through (escaped) so the
-                # query doesn't become empty. RediSearch will still skip them at
-                # query time, but this avoids a syntax error from an empty clause.
-                escaped_terms = " ".join(self._escape_fulltext_term(w) for w in words)
-            search_value = f"({escaped_terms})"
+            terms = " ".join(filtered_words) if filtered_words else value
+            search_value = f"({terms})"
         elif " OR " in value:
             # OR union within text field: split on ' OR ' and join with |
-            or_terms = [
-                self._escape_fulltext_term(t.strip()) for t in value.split(" OR ")
-            ]
+            or_terms = [t.strip() for t in value.split(" OR ")]
             search_value = f"({'|'.join(or_terms)})"
         else:
+            # Single-word FULLTEXT — escape to prevent accidental operator injection
             search_value = self._escape_fulltext_term(value)
 
         base = f"{prefix}@{field}:{search_value}"
diff --git a/sql_redis/translator.py b/sql_redis/translator.py
index ced3753..e40948b 100644
--- a/sql_redis/translator.py
+++ b/sql_redis/translator.py
@@ -162,6 +162,13 @@ def _build_command(self, analyzed: AnalyzedQuery) -> TranslatedQuery:
         query_string = self._build_query_string(analyzed)
 
         if use_aggregate:
+            if parsed.scoring is not None:
+                raise ValueError(
+                    "score() is not supported with FT.AGGREGATE queries. "
+                    "WITHSCORES / SCORER are FT.SEARCH-only features. "
+                    "Remove score() or avoid GROUP BY / aggregation functions "
+                    "in the same query."
+                )
             return self._build_aggregate(analyzed, query_string)
         else:
             return self._build_search(analyzed, query_string)
@@ -323,7 +330,16 @@ def _build_search(
             if analyzed.vector_search.alias not in return_fields:
                 return_fields.append(analyzed.vector_search.alias)
 
-        if return_fields and return_fields != ["*"]:
+        # When score() is the only SELECT expression, parsed.fields is empty.
+        # We still need a RETURN clause to avoid leaking full document payloads.
+        # Score itself is delivered via WITHSCORES (not RETURN), but we must
+        # emit RETURN 0 so Redis returns no document attributes beyond the score.
+        score_only_select = parsed.scoring is not None and not return_fields
+
+        if score_only_select:
+            # RETURN 0 — suppress all document fields, score comes via WITHSCORES
+            args.extend(["RETURN", "0"])
+        elif return_fields and return_fields != ["*"]:
             args.append("RETURN")
             args.append(str(len(return_fields)))
             args.extend(return_fields)
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index acac971..ddd45e2 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -531,3 +531,51 @@ def test_build_missing_condition_is_not_null(self):
         builder = QueryBuilder()
         result = builder.build_missing_condition("email", is_missing=False)
         assert result == "-ismissing(@email)"
+
+
+class TestQueryBuilderEscaping:
+    """Tests for escaping special characters in text search values."""
+
+    def test_escape_fulltext_term_special_chars(self):
+        """_escape_fulltext_term escapes RediSearch operator characters."""
+        builder = QueryBuilder()
+        result = builder._escape_fulltext_term("hello|world")
+        assert result == "hello\\|world"
+
+    def test_escape_fulltext_term_double_quote(self):
+        """_escape_fulltext_term escapes double quotes."""
+        builder = QueryBuilder()
+        result = builder._escape_fulltext_term('say "hello"')
+        assert result == 'say \\"hello\\"'
+
+    def test_escape_fulltext_term_at_sign(self):
+        """_escape_fulltext_term escapes @ to prevent field injection."""
+        builder = QueryBuilder()
+        result = builder._escape_fulltext_term("user@email")
+        assert result == "user\\@email"
+
+    def test_like_escapes_special_chars(self):
+        """LIKE pattern escapes special chars in the non-wildcard portion."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "LIKE", "%hello|world%")
+        assert result == "@title:*hello\\|world*"
+
+    def test_fuzzy_escapes_special_chars(self):
+        """FUZZY escapes special chars in the term before wrapping with %."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FUZZY", "hello@world")
+        assert result == "@title:%hello\\@world%"
+
+    def test_fuzzy_escapes_double_quote(self):
+        """FUZZY escapes double quotes in term."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FUZZY", 'say"hi')
+        assert result == '@title:%say\\"hi%'
+
+    def test_multi_field_non_exact_escapes(self):
+        """Multi-field search with non-exact operator escapes special chars."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            ["title", "description"], "FULLTEXT", "hello|world"
+        )
+        assert result == "(@title|description:hello\\|world)"
diff --git a/tests/test_sql_queries.py b/tests/test_sql_queries.py
index 87086e0..0fb7b9b 100644
--- a/tests/test_sql_queries.py
+++ b/tests/test_sql_queries.py
@@ -36,13 +36,15 @@ def test_match_with_price_filter_and_ordering(
     ):
         """SQL equivalent of FT.AGGREGATE with text match and numeric filter."""
         # For TEXT fields, = becomes a text search in Redis
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT title, price
             FROM {products_data}
             WHERE title = 'laptop' AND price < 1000
             ORDER BY price ASC
             LIMIT 10
-            """)
+            """
+        )
         assert len(result.rows) >= 1, "Should return at least one laptop under $1000"
         # Verify results are sorted by price ascending
         prices = [float(row["price"]) for row in result.rows]
@@ -92,13 +94,15 @@ class TestGroupByWithCount:
 
     def test_count_with_filter(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with GROUPBY and COUNT."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT category, COUNT(*) AS count
             FROM {products_data}
             WHERE price >= 50
             GROUP BY category
             ORDER BY count DESC
-            """)
+            """
+        )
         assert len(result.rows) >= 1, "Should return grouped results"
         for row in result.rows:
             assert "category" in row
@@ -110,13 +114,15 @@ class TestMultipleAggregations:
 
     def test_count_sum_avg_aggregations(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with multiple REDUCE operations."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT category, COUNT(*) AS product_count, SUM(price) AS total_price, AVG(rating) AS avg_rating
             FROM {products_data}
             GROUP BY category
             ORDER BY total_price DESC
             LIMIT 10
-            """)
+            """
+        )
         assert len(result.rows) >= 1, "Should return aggregated results"
         row = result.rows[0]
         assert "product_count" in row
@@ -129,11 +135,13 @@ class TestGlobalAggregation:
 
     def test_aggregation_without_group_by(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with GROUPBY 0 for global aggregation."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT COUNT(*) AS total_count, AVG(price) AS avg_price
             FROM {products_data}
             WHERE price > 100
-            """)
+            """
+        )
         assert len(result.rows) == 1, "Should return single aggregation row"
         row = result.rows[0]
         assert "total_count" in row
@@ -145,12 +153,14 @@ class TestApplyWithComputedFields:
 
     def test_computed_field_expression(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with APPLY for computed fields."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT price, price * 0.9 AS discounted_price
             FROM {products_data}
             WHERE price > 100
             ORDER BY discounted_price DESC
-            """)
+            """
+        )
         assert len(result.rows) >= 1, "Should return results with computed field"
         for row in result.rows:
             price = float(row["price"])
@@ -159,12 +169,14 @@ def test_computed_field_expression(self, executor: Executor, products_data: str)
 
     def test_computed_field_addition(self, executor: Executor, products_data: str):
         """Computed field with addition."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT price, price + 10 AS price_with_shipping
             FROM {products_data}
             WHERE price < 200
             LIMIT 5
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -173,12 +185,14 @@ def test_computed_field_addition(self, executor: Executor, products_data: str):
 
     def test_computed_field_division(self, executor: Executor, products_data: str):
         """Computed field with division for percentage."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT price, price / 100 AS price_in_hundreds
             FROM {products_data}
             WHERE price >= 100
             LIMIT 5
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -187,12 +201,14 @@ def test_computed_field_division(self, executor: Executor, products_data: str):
 
     def test_multiple_computed_fields(self, executor: Executor, products_data: str):
         """Multiple computed fields in one query."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT price, price * 0.9 AS sale_price, price * 1.1 AS markup_price
             FROM {products_data}
             WHERE price > 50
             LIMIT 5
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -207,11 +223,13 @@ class TestRangeQueryWithBetween:
 
     def test_between_and_greater_than(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with numeric range filters."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT title, price
             FROM {products_data}
             WHERE price BETWEEN 100 AND 500 AND stock >= 1
-            """)
+            """
+        )
         assert len(result.rows) >= 1, "Should return products in price range"
         for row in result.rows:
             price = float(row["price"])
@@ -223,44 +241,52 @@ class TestTagFieldMultiValueSearch:
 
     def test_in_clause_with_or(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with TAG field OR conditions."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT name
             FROM {products_data}
             WHERE tags IN ('sale', 'featured') OR category = 'electronics'
-            """)
+            """
+        )
         assert (
             len(result.rows) >= 1
         ), "Should return products matching tag OR conditions"
 
     def test_tag_in_clause_only(self, executor: Executor, products_data: str):
         """IN clause on TAG field without OR."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT name, category
             FROM {products_data}
             WHERE category IN ('electronics', 'books')
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] in ["electronics", "books"]
 
     def test_tag_equality(self, executor: Executor, products_data: str):
         """Simple TAG equality filter."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT name, category
             FROM {products_data}
             WHERE category = 'electronics'
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] == "electronics"
 
     def test_or_with_same_field_type(self, executor: Executor, products_data: str):
         """OR condition across same field type (TAG)."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT name, category
             FROM {products_data}
             WHERE category = 'electronics' OR category = 'books'
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] in ["electronics", "books"]
@@ -269,11 +295,13 @@ def test_or_with_different_field_types(
         self, executor: Executor, products_data: str
     ):
         """OR condition across different field types (TAG and NUMERIC)."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT name, category, price
             FROM {products_data}
             WHERE category = 'books' OR price > 800
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             is_book = row["category"] == "books"
@@ -287,21 +315,25 @@ class TestPaginationWithOffset:
     def test_limit_with_offset(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with LIMIT offset count."""
         # First get all books sorted
-        all_books = executor.execute(f"""
+        all_books = executor.execute(
+            f"""
             SELECT title, price
             FROM {products_data}
             WHERE category = 'books'
             ORDER BY price DESC
-            """)
+            """
+        )
 
         # Then get with offset (page 2, page size 1)
-        paginated = executor.execute(f"""
+        paginated = executor.execute(
+            f"""
             SELECT title, price
             FROM {products_data}
             WHERE category = 'books'
             ORDER BY price DESC
             LIMIT 1 OFFSET 1
-            """)
+            """
+        )
 
         assert len(paginated.rows) >= 1, "Should return paginated results"
         # If we have enough results, verify offset works
@@ -417,9 +449,11 @@ class TestBM25Scoring:
 
     def test_score_returns_relevance(self, executor: Executor, products_data: str):
         """score() in SELECT should return relevance scores."""
-        result = executor.execute(f"""SELECT title, score() AS relevance
+        result = executor.execute(
+            f"""SELECT title, score() AS relevance
             FROM {products_data}
-            WHERE fulltext(title, 'laptop')""")
+            WHERE fulltext(title, 'laptop')"""
+        )
         assert len(result.rows) >= 1, "Should return results with scores"
         for row in result.rows:
             assert "relevance" in row, f"Row should have 'relevance' key: {row}"
@@ -428,9 +462,11 @@ def test_score_returns_relevance(self, executor: Executor, products_data: str):
 
     def test_score_custom_scorer(self, executor: Executor, products_data: str):
         """score('TFIDF') should use TFIDF scorer."""
-        result = executor.execute(f"""SELECT title, score('TFIDF') AS relevance
+        result = executor.execute(
+            f"""SELECT title, score('TFIDF') AS relevance
             FROM {products_data}
-            WHERE fulltext(title, 'laptop')""")
+            WHERE fulltext(title, 'laptop')"""
+        )
         assert len(result.rows) >= 1, "Should return results with TFIDF scores"
         for row in result.rows:
             assert "relevance" in row
diff --git a/tests/test_translator.py b/tests/test_translator.py
index 1c0c702..63a24d3 100644
--- a/tests/test_translator.py
+++ b/tests/test_translator.py
@@ -760,3 +760,27 @@ def test_no_score_no_withscores(self, translator: Translator, basic_index: str):
             f"SELECT title FROM {basic_index} WHERE fulltext(title, 'laptop')"
         )
         assert "WITHSCORES" not in result.args
+
+    def test_score_only_select_emits_return_0(
+        self, translator: Translator, basic_index: str
+    ):
+        """SELECT score() AS relevance (no other fields) → RETURN 0 to prevent payload leak."""
+        result = translator.translate(
+            f"SELECT score() AS relevance FROM {basic_index} WHERE fulltext(title, 'laptop')"
+        )
+        assert "RETURN" in result.args
+        ret_idx = result.args.index("RETURN")
+        assert result.args[ret_idx + 1] == "0"
+        assert "WITHSCORES" in result.args
+
+    def test_score_with_aggregate_raises(
+        self, translator: Translator, basic_index: str
+    ):
+        """score() combined with GROUP BY (forces FT.AGGREGATE) raises ValueError."""
+        import pytest
+
+        with pytest.raises(ValueError, match="score.*not supported.*FT.AGGREGATE"):
+            translator.translate(
+                f"SELECT COUNT(*), score() AS relevance FROM {basic_index} "
+                "WHERE fulltext(title, 'laptop') GROUP BY category"
+            )

From 3ffccb2adc3d8ba81afc2424ac911327cfc858e3 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 31 Mar 2026 21:20:01 +0000
Subject: [PATCH 06/28] fix: double-negation XOR semantics, remove dead
 verbatim/nostopwords fields

Agent-Logs-Url: https://github.com/redis-developer/sql-redis/sessions/d42f3789-3c56-4e27-ba5d-df016d816d6e

Co-authored-by: nkanu17 <47899917+nkanu17@users.noreply.github.com>
---
 sql_redis/parser.py         |   3 -
 sql_redis/translator.py     |  17 +++---
 tests/test_query_builder.py |  12 ----
 tests/test_sql_queries.py   | 108 ++++++++++++------------------------
 tests/test_translator.py    |   8 +++
 5 files changed, 51 insertions(+), 97 deletions(-)

diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index c154159..a2e52a3 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -234,9 +234,6 @@ class ParsedQuery:
     offset: int | None = None
     filters: list[str] = dataclasses.field(default_factory=list)
     scoring: ScoringSpec | None = None  # Relevance scoring config
-    # API-only flags — not set by SQL parsing, available for programmatic use
-    verbatim: bool = False  # If True, add VERBATIM to FT.SEARCH
-    nostopwords: bool = False  # If True, add NOSTOPWORDS to FT.SEARCH
 
 
 class SQLParser:
diff --git a/sql_redis/translator.py b/sql_redis/translator.py
index e40948b..6353b67 100644
--- a/sql_redis/translator.py
+++ b/sql_redis/translator.py
@@ -226,11 +226,14 @@ def _build_condition(self, condition: Condition, field_type: str | None) -> str:
                 condition.field, is_missing=(condition.operator == "IS_NULL")
             )
 
-        # Determine if this is a negation (either explicit or via != operator)
+        # Resolve negation using XOR so that double negation cancels out.
+        # e.g. NOT (field != 'x') → negated=True, op='!=' → is_negated=False.
         operator = condition.operator
-        is_negated = condition.negated or operator == "!="
-        if condition.negated and operator == "=":
-            operator = "!="
+        is_negated = condition.negated ^ (operator == "!=")
+        # Normalize = / != to match the resolved negation state so every
+        # downstream builder sees a consistent (operator, negated) pair.
+        if operator in ("=", "!="):
+            operator = "!=" if is_negated else "="
 
         if field_type == "TEXT":
             return self._query_builder.build_text_condition(
@@ -360,12 +363,6 @@ def _build_search(
             if parsed.scoring.scorer:
                 args.extend(["SCORER", parsed.scoring.scorer])
 
-        # Verbatim / nostopwords flags
-        if parsed.verbatim:
-            args.append("VERBATIM")
-        if parsed.nostopwords:
-            args.append("NOSTOPWORDS")
-
         # DIALECT 2 — unconditionally appended as the last arguments
         args.extend(["DIALECT", "2"])
 
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index ddd45e2..24a6ade 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -494,18 +494,6 @@ def test_slop_negated(self):
         assert result == "-@title:(gaming laptop) => { $slop: 3; }"
 
 
-class TestQueryBuilderVerbatim:
-    """Tests for verbatim and nostopwords flags."""
-
-    def test_fulltext_with_verbatim(self):
-        """FULLTEXT search term is not affected by verbatim (query-level flag)."""
-        # verbatim is a query-level flag, not part of the condition string
-        # This test just ensures normal behavior is preserved
-        builder = QueryBuilder()
-        result = builder.build_text_condition("title", "FULLTEXT", "running")
-        assert result == "@title:running"
-
-
 class TestQueryBuilderOptionalTerms:
     """Tests for optional term (~) syntax."""
 
diff --git a/tests/test_sql_queries.py b/tests/test_sql_queries.py
index 0fb7b9b..87086e0 100644
--- a/tests/test_sql_queries.py
+++ b/tests/test_sql_queries.py
@@ -36,15 +36,13 @@ def test_match_with_price_filter_and_ordering(
     ):
         """SQL equivalent of FT.AGGREGATE with text match and numeric filter."""
         # For TEXT fields, = becomes a text search in Redis
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT title, price
             FROM {products_data}
             WHERE title = 'laptop' AND price < 1000
             ORDER BY price ASC
             LIMIT 10
-            """
-        )
+            """)
         assert len(result.rows) >= 1, "Should return at least one laptop under $1000"
         # Verify results are sorted by price ascending
         prices = [float(row["price"]) for row in result.rows]
@@ -94,15 +92,13 @@ class TestGroupByWithCount:
 
     def test_count_with_filter(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with GROUPBY and COUNT."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT category, COUNT(*) AS count
             FROM {products_data}
             WHERE price >= 50
             GROUP BY category
             ORDER BY count DESC
-            """
-        )
+            """)
         assert len(result.rows) >= 1, "Should return grouped results"
         for row in result.rows:
             assert "category" in row
@@ -114,15 +110,13 @@ class TestMultipleAggregations:
 
     def test_count_sum_avg_aggregations(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with multiple REDUCE operations."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT category, COUNT(*) AS product_count, SUM(price) AS total_price, AVG(rating) AS avg_rating
             FROM {products_data}
             GROUP BY category
             ORDER BY total_price DESC
             LIMIT 10
-            """
-        )
+            """)
         assert len(result.rows) >= 1, "Should return aggregated results"
         row = result.rows[0]
         assert "product_count" in row
@@ -135,13 +129,11 @@ class TestGlobalAggregation:
 
     def test_aggregation_without_group_by(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with GROUPBY 0 for global aggregation."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT COUNT(*) AS total_count, AVG(price) AS avg_price
             FROM {products_data}
             WHERE price > 100
-            """
-        )
+            """)
         assert len(result.rows) == 1, "Should return single aggregation row"
         row = result.rows[0]
         assert "total_count" in row
@@ -153,14 +145,12 @@ class TestApplyWithComputedFields:
 
     def test_computed_field_expression(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with APPLY for computed fields."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT price, price * 0.9 AS discounted_price
             FROM {products_data}
             WHERE price > 100
             ORDER BY discounted_price DESC
-            """
-        )
+            """)
         assert len(result.rows) >= 1, "Should return results with computed field"
         for row in result.rows:
             price = float(row["price"])
@@ -169,14 +159,12 @@ def test_computed_field_expression(self, executor: Executor, products_data: str)
 
     def test_computed_field_addition(self, executor: Executor, products_data: str):
         """Computed field with addition."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT price, price + 10 AS price_with_shipping
             FROM {products_data}
             WHERE price < 200
             LIMIT 5
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -185,14 +173,12 @@ def test_computed_field_addition(self, executor: Executor, products_data: str):
 
     def test_computed_field_division(self, executor: Executor, products_data: str):
         """Computed field with division for percentage."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT price, price / 100 AS price_in_hundreds
             FROM {products_data}
             WHERE price >= 100
             LIMIT 5
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -201,14 +187,12 @@ def test_computed_field_division(self, executor: Executor, products_data: str):
 
     def test_multiple_computed_fields(self, executor: Executor, products_data: str):
         """Multiple computed fields in one query."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT price, price * 0.9 AS sale_price, price * 1.1 AS markup_price
             FROM {products_data}
             WHERE price > 50
             LIMIT 5
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -223,13 +207,11 @@ class TestRangeQueryWithBetween:
 
     def test_between_and_greater_than(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with numeric range filters."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT title, price
             FROM {products_data}
             WHERE price BETWEEN 100 AND 500 AND stock >= 1
-            """
-        )
+            """)
         assert len(result.rows) >= 1, "Should return products in price range"
         for row in result.rows:
             price = float(row["price"])
@@ -241,52 +223,44 @@ class TestTagFieldMultiValueSearch:
 
     def test_in_clause_with_or(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with TAG field OR conditions."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT name
             FROM {products_data}
             WHERE tags IN ('sale', 'featured') OR category = 'electronics'
-            """
-        )
+            """)
         assert (
             len(result.rows) >= 1
         ), "Should return products matching tag OR conditions"
 
     def test_tag_in_clause_only(self, executor: Executor, products_data: str):
         """IN clause on TAG field without OR."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT name, category
             FROM {products_data}
             WHERE category IN ('electronics', 'books')
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] in ["electronics", "books"]
 
     def test_tag_equality(self, executor: Executor, products_data: str):
         """Simple TAG equality filter."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT name, category
             FROM {products_data}
             WHERE category = 'electronics'
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] == "electronics"
 
     def test_or_with_same_field_type(self, executor: Executor, products_data: str):
         """OR condition across same field type (TAG)."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT name, category
             FROM {products_data}
             WHERE category = 'electronics' OR category = 'books'
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] in ["electronics", "books"]
@@ -295,13 +269,11 @@ def test_or_with_different_field_types(
         self, executor: Executor, products_data: str
     ):
         """OR condition across different field types (TAG and NUMERIC)."""
-        result = executor.execute(
-            f"""
+        result = executor.execute(f"""
             SELECT name, category, price
             FROM {products_data}
             WHERE category = 'books' OR price > 800
-            """
-        )
+            """)
         assert len(result.rows) >= 1
         for row in result.rows:
             is_book = row["category"] == "books"
@@ -315,25 +287,21 @@ class TestPaginationWithOffset:
     def test_limit_with_offset(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with LIMIT offset count."""
         # First get all books sorted
-        all_books = executor.execute(
-            f"""
+        all_books = executor.execute(f"""
             SELECT title, price
             FROM {products_data}
             WHERE category = 'books'
             ORDER BY price DESC
-            """
-        )
+            """)
 
         # Then get with offset (page 2, page size 1)
-        paginated = executor.execute(
-            f"""
+        paginated = executor.execute(f"""
             SELECT title, price
             FROM {products_data}
             WHERE category = 'books'
             ORDER BY price DESC
             LIMIT 1 OFFSET 1
-            """
-        )
+            """)
 
         assert len(paginated.rows) >= 1, "Should return paginated results"
         # If we have enough results, verify offset works
@@ -449,11 +417,9 @@ class TestBM25Scoring:
 
     def test_score_returns_relevance(self, executor: Executor, products_data: str):
         """score() in SELECT should return relevance scores."""
-        result = executor.execute(
-            f"""SELECT title, score() AS relevance
+        result = executor.execute(f"""SELECT title, score() AS relevance
             FROM {products_data}
-            WHERE fulltext(title, 'laptop')"""
-        )
+            WHERE fulltext(title, 'laptop')""")
         assert len(result.rows) >= 1, "Should return results with scores"
         for row in result.rows:
             assert "relevance" in row, f"Row should have 'relevance' key: {row}"
@@ -462,11 +428,9 @@ def test_score_returns_relevance(self, executor: Executor, products_data: str):
 
     def test_score_custom_scorer(self, executor: Executor, products_data: str):
         """score('TFIDF') should use TFIDF scorer."""
-        result = executor.execute(
-            f"""SELECT title, score('TFIDF') AS relevance
+        result = executor.execute(f"""SELECT title, score('TFIDF') AS relevance
             FROM {products_data}
-            WHERE fulltext(title, 'laptop')"""
-        )
+            WHERE fulltext(title, 'laptop')""")
         assert len(result.rows) >= 1, "Should return results with TFIDF scores"
         for row in result.rows:
             assert "relevance" in row
diff --git a/tests/test_translator.py b/tests/test_translator.py
index 63a24d3..64546f8 100644
--- a/tests/test_translator.py
+++ b/tests/test_translator.py
@@ -416,6 +416,14 @@ def test_not_condition(self, translator: Translator, basic_index: str):
 
         assert "-@title" in result.query_string
 
+    def test_double_negation_cancels(self, translator: Translator, basic_index: str):
+        """NOT (field != x) double negation resolves to positive match."""
+        result = translator.translate(
+            f"SELECT * FROM {basic_index} WHERE NOT title != 'good'"
+        )
+
+        assert result.query_string == '@title:"good"'
+
 
 class TestTranslatorOutput:
     """Tests for output format methods."""

From 33b2b9ed0f1ef478f9a7364297de208f9f1f0fc0 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 14:02:42 -0400
Subject: [PATCH 07/28] fix: WITHSCORES+RETURN0 parsing, OR operand escaping,
 slop validation

- Fix stride mismatch in executor when WITHSCORES + RETURN 0 (NOCONTENT)
  produces [count, id, score, ...] without field arrays
- Add _ScoreParseMixin with _has_return_0() helper for both sync/async executors
- Escape individual OR operands in fulltext() to prevent accidental
  negation (anti-virus) and field injection (@field)
- Validate slop >= 0 in parser, raise ValueError for negative values
- Add tests for all three fixes
---
 sql_redis/executor.py       | 42 ++++++++++++++++++++++++++++++++-----
 sql_redis/parser.py         |  6 +++++-
 sql_redis/query_builder.py  |  6 ++++--
 tests/test_query_builder.py | 15 +++++++++++++
 tests/test_sql_parser.py    | 10 +++++++++
 5 files changed, 71 insertions(+), 8 deletions(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index f90b518..f346f14 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -103,7 +103,20 @@ class QueryResult:
     count: int
 
 
-class Executor:
+class _ScoreParseMixin:
+    """Shared helper for detecting RETURN 0 (NOCONTENT) in translated args."""
+
+    @staticmethod
+    def _has_return_0(args: list[str]) -> bool:
+        """Return True when the args contain 'RETURN 0' (no document fields)."""
+        try:
+            idx = args.index("RETURN")
+            return args[idx + 1] == "0"
+        except (ValueError, IndexError):
+            return False
+
+
+class Executor(_ScoreParseMixin):
     """Executes SQL queries against Redis."""
 
     def __init__(self, client: redis.Redis, schema_registry: SchemaRegistry) -> None:
@@ -169,8 +182,19 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
             # Check if WITHSCORES was requested — changes response format
             with_scores = "WITHSCORES" in translated.args
             score_alias = translated.score_alias
-
-            if with_scores:
+            # RETURN 0 suppresses document fields (like NOCONTENT);
+            # with WITHSCORES the reply is [count, id, score, id, score, ...]
+            no_content = self._has_return_0(translated.args)
+
+            if with_scores and no_content:
+                # WITHSCORES + RETURN 0: [count, id1, score1, id2, score2, ...]
+                # Stride of 2: key, score (no field array)
+                for i in range(1, len(raw_result) - 1, 2):
+                    score = raw_result[i + 1]
+                    alias = score_alias or "__score"
+                    row = {alias: score}
+                    rows.append(row)
+            elif with_scores:
                 # WITHSCORES format: [count, key1, score1, [fields1], key2, score2, [fields2], ...]
                 # Stride of 3: key, score, field_list
                 for i in range(1, len(raw_result) - 2, 3):
@@ -198,7 +222,7 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
         return QueryResult(rows=rows, count=count)
 
 
-class AsyncExecutor:
+class AsyncExecutor(_ScoreParseMixin):
     """Async version of Executor for use with redis.asyncio clients."""
 
     def __init__(
@@ -277,8 +301,16 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
         if translated.command == "FT.SEARCH":
             with_scores = "WITHSCORES" in translated.args
             score_alias = translated.score_alias
+            no_content = self._has_return_0(translated.args)
 
-            if with_scores:
+            if with_scores and no_content:
+                # WITHSCORES + RETURN 0: [count, id1, score1, id2, score2, ...]
+                for i in range(1, len(raw_result) - 1, 2):
+                    score = raw_result[i + 1]
+                    alias = score_alias or "__score"
+                    row = {alias: score}
+                    rows.append(row)
+            elif with_scores:
                 # WITHSCORES format: [count, key1, score1, [fields1], ...]
                 for i in range(1, len(raw_result) - 2, 3):
                     score = raw_result[i + 1]
diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index a2e52a3..44014e5 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -975,12 +975,16 @@ def _add_function_condition(
             field_name = args[0].name if isinstance(args[0], exp.Column) else None
             value = self._extract_literal_value(args[1])
 
-            # Optional 3rd arg: slop (int)
+            # Optional 3rd arg: slop (non-negative int)
             slop = None
             if len(args) >= 3:
                 slop_val = self._extract_literal_value(args[2])
                 if slop_val is not None:
                     slop = int(slop_val)
+                    if slop < 0:
+                        raise ValueError(
+                            f"FULLTEXT slop argument must be a non-negative integer (got {slop})"
+                        )
 
             # Optional 4th arg: inorder (boolean-like: 1/0 or true/false)
             inorder = False
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 16c34a3..dcea4b3 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -173,8 +173,10 @@ def build_text_condition(
             terms = " ".join(filtered_words) if filtered_words else value
             search_value = f"({terms})"
         elif " OR " in value:
-            # OR union within text field: split on ' OR ' and join with |
-            or_terms = [t.strip() for t in value.split(" OR ")]
+            # OR union within text field: split on ' OR ', escape each term, join with |
+            or_terms = [
+                self._escape_fulltext_term(t.strip()) for t in value.split(" OR ")
+            ]
             search_value = f"({'|'.join(or_terms)})"
         else:
             # Single-word FULLTEXT — escape to prevent accidental operator injection
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index 24a6ade..fa2367b 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -567,3 +567,18 @@ def test_multi_field_non_exact_escapes(self):
             ["title", "description"], "FULLTEXT", "hello|world"
         )
         assert result == "(@title|description:hello\\|world)"
+
+    def test_or_terms_escape_special_chars(self):
+        """OR operands are escaped before joining with |."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "title", "FULLTEXT", "laptop OR anti-virus"
+        )
+        # '-' is a RediSearch operator and should be escaped in OR terms
+        assert result == "@title:(laptop|anti\\-virus)"
+
+    def test_or_terms_escape_at_sign(self):
+        """OR operands escape @ to prevent field injection."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "hello OR @world")
+        assert result == "@title:(hello|\\@world)"
diff --git a/tests/test_sql_parser.py b/tests/test_sql_parser.py
index 10e63cb..6d72b89 100644
--- a/tests/test_sql_parser.py
+++ b/tests/test_sql_parser.py
@@ -855,3 +855,13 @@ def test_exists_in_where_raises_error(self):
         parser = SQLParser()
         with pytest.raises(ValueError, match="exists.*aggregate"):
             parser.parse("SELECT * FROM idx WHERE exists(email)")
+
+
+class TestSQLParserFulltextValidation:
+    """Tests for fulltext() argument validation."""
+
+    def test_fulltext_negative_slop_raises(self):
+        """Negative slop in fulltext() raises ValueError."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="non-negative integer"):
+            parser.parse("SELECT * FROM idx WHERE fulltext(title, 'hello world', -1)")

From 4d5c093a6123697948d87a9b06f393ce97268cf3 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 14:28:33 -0400
Subject: [PATCH 08/28] fix: multi-word FULLTEXT escaping, stable score alias,
 slop float validation

- Escape individual terms in multi-word FULLTEXT branch while preserving
  ~ optional-term prefix (prevents @field injection and accidental negation)
- Move score alias collision check out of per-row loop into
  _resolve_score_alias() so all rows use the same column name
- Reject float slop values (e.g. 2.9) instead of silently truncating
- Add tests for all three fixes (350 total)
---
 sql_redis/executor.py       |  41 ++++++++++----
 sql_redis/parser.py         |   6 ++
 sql_redis/query_builder.py  |  15 ++++-
 tests/test_query_builder.py |  18 ++++++
 tests/test_sql_parser.py    |   6 ++
 tests/test_sql_queries.py   | 108 ++++++++++++++++++++++++------------
 6 files changed, 143 insertions(+), 51 deletions(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index f346f14..cbb6128 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -104,7 +104,7 @@ class QueryResult:
 
 
 class _ScoreParseMixin:
-    """Shared helper for detecting RETURN 0 (NOCONTENT) in translated args."""
+    """Shared helpers for score-related response parsing."""
 
     @staticmethod
     def _has_return_0(args: list[str]) -> bool:
@@ -115,6 +115,23 @@ def _has_return_0(args: list[str]) -> bool:
         except (ValueError, IndexError):
             return False
 
+    @staticmethod
+    def _resolve_score_alias(score_alias: str | None, args: list[str]) -> str:
+        """Determine a stable score column name that won't collide with
+        document fields.  The alias is decided once before iterating rows
+        so every row uses the same column name."""
+        alias = score_alias or "__score"
+        # Extract RETURN field names from args to detect collision
+        try:
+            idx = args.index("RETURN")
+            count = int(args[idx + 1])
+            return_fields = set(args[idx + 2 : idx + 2 + count])
+        except (ValueError, IndexError):
+            return_fields = set()
+        if alias in return_fields:
+            alias = f"__score_{alias}"
+        return alias
+
 
 class Executor(_ScoreParseMixin):
     """Executes SQL queries against Redis."""
@@ -181,17 +198,21 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
         if translated.command == "FT.SEARCH":
             # Check if WITHSCORES was requested — changes response format
             with_scores = "WITHSCORES" in translated.args
-            score_alias = translated.score_alias
             # RETURN 0 suppresses document fields (like NOCONTENT);
             # with WITHSCORES the reply is [count, id, score, id, score, ...]
             no_content = self._has_return_0(translated.args)
+            # Determine score column name once so every row is consistent
+            alias = (
+                self._resolve_score_alias(translated.score_alias, translated.args)
+                if with_scores
+                else ""
+            )
 
             if with_scores and no_content:
                 # WITHSCORES + RETURN 0: [count, id1, score1, id2, score2, ...]
                 # Stride of 2: key, score (no field array)
                 for i in range(1, len(raw_result) - 1, 2):
                     score = raw_result[i + 1]
-                    alias = score_alias or "__score"
                     row = {alias: score}
                     rows.append(row)
             elif with_scores:
@@ -201,10 +222,6 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    alias = score_alias or "__score"
-                    # Guard: if alias collides with a document field, prefix it
-                    if alias in row:
-                        alias = f"__score_{alias}"
                     row[alias] = score
                     rows.append(row)
             else:
@@ -300,14 +317,17 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
 
         if translated.command == "FT.SEARCH":
             with_scores = "WITHSCORES" in translated.args
-            score_alias = translated.score_alias
             no_content = self._has_return_0(translated.args)
+            alias = (
+                self._resolve_score_alias(translated.score_alias, translated.args)
+                if with_scores
+                else ""
+            )
 
             if with_scores and no_content:
                 # WITHSCORES + RETURN 0: [count, id1, score1, id2, score2, ...]
                 for i in range(1, len(raw_result) - 1, 2):
                     score = raw_result[i + 1]
-                    alias = score_alias or "__score"
                     row = {alias: score}
                     rows.append(row)
             elif with_scores:
@@ -316,9 +336,6 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    alias = score_alias or "__score"
-                    if alias in row:
-                        alias = f"__score_{alias}"
                     row[alias] = score
                     rows.append(row)
             else:
diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index 44014e5..c4a9b35 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -980,6 +980,12 @@ def _add_function_condition(
             if len(args) >= 3:
                 slop_val = self._extract_literal_value(args[2])
                 if slop_val is not None:
+                    # Reject non-integer values (e.g. 2.9) instead of
+                    # silently truncating via int().
+                    if isinstance(slop_val, float) and slop_val != int(slop_val):
+                        raise ValueError(
+                            f"FULLTEXT slop argument must be an integer (got {slop_val})"
+                        )
                     slop = int(slop_val)
                     if slop < 0:
                         raise ValueError(
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index dcea4b3..739b0f7 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -150,8 +150,9 @@ def build_text_condition(
             search_value = f'"{escaped}"'
         elif " " in value and " OR " not in value:
             # FULLTEXT/MATCH with multi-word: tokenized search with stopword filtering.
-            # FULLTEXT is intentionally pass-through — users craft RediSearch queries
-            # via fulltext(), so operator chars like ~, |, - are preserved.
+            # Each term is escaped to prevent accidental operator injection, but a
+            # leading ~ (optional-term modifier) is preserved as an intentional
+            # RediSearch operator.
             words = value.split()
             removed_stopwords = [
                 w for w in words if w.lower() in REDIS_DEFAULT_STOPWORDS
@@ -170,7 +171,15 @@ def build_text_condition(
                     stacklevel=2,
                 )
 
-            terms = " ".join(filtered_words) if filtered_words else value
+            escaped_words = []
+            for w in (filtered_words if filtered_words else words):
+                if w.startswith("~"):
+                    # Preserve ~ optional-term prefix, escape the rest
+                    escaped_words.append("~" + self._escape_fulltext_term(w[1:]))
+                else:
+                    escaped_words.append(self._escape_fulltext_term(w))
+
+            terms = " ".join(escaped_words)
             search_value = f"({terms})"
         elif " OR " in value:
             # OR union within text field: split on ' OR ', escape each term, join with |
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index fa2367b..a2cf8ce 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -582,3 +582,21 @@ def test_or_terms_escape_at_sign(self):
         builder = QueryBuilder()
         result = builder.build_text_condition("title", "FULLTEXT", "hello OR @world")
         assert result == "@title:(hello|\\@world)"
+
+    def test_multiword_fulltext_escapes_special_chars(self):
+        """Multi-word FULLTEXT escapes dangerous chars like @ and |."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "hello @world")
+        assert result == "@title:(hello \\@world)"
+
+    def test_multiword_fulltext_preserves_optional_prefix(self):
+        """Multi-word FULLTEXT preserves ~ optional-term prefix."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "laptop ~gaming")
+        assert result == "@title:(laptop ~gaming)"
+
+    def test_multiword_fulltext_escapes_dash(self):
+        """Multi-word FULLTEXT escapes - to prevent accidental negation."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "hello anti-virus")
+        assert result == "@title:(hello anti\\-virus)"
diff --git a/tests/test_sql_parser.py b/tests/test_sql_parser.py
index 6d72b89..1d228da 100644
--- a/tests/test_sql_parser.py
+++ b/tests/test_sql_parser.py
@@ -865,3 +865,9 @@ def test_fulltext_negative_slop_raises(self):
         parser = SQLParser()
         with pytest.raises(ValueError, match="non-negative integer"):
             parser.parse("SELECT * FROM idx WHERE fulltext(title, 'hello world', -1)")
+
+    def test_fulltext_float_slop_raises(self):
+        """Float slop in fulltext() raises ValueError instead of silently truncating."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="must be an integer"):
+            parser.parse("SELECT * FROM idx WHERE fulltext(title, 'hello world', 2.9)")
diff --git a/tests/test_sql_queries.py b/tests/test_sql_queries.py
index 87086e0..0fb7b9b 100644
--- a/tests/test_sql_queries.py
+++ b/tests/test_sql_queries.py
@@ -36,13 +36,15 @@ def test_match_with_price_filter_and_ordering(
     ):
         """SQL equivalent of FT.AGGREGATE with text match and numeric filter."""
         # For TEXT fields, = becomes a text search in Redis
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT title, price
             FROM {products_data}
             WHERE title = 'laptop' AND price < 1000
             ORDER BY price ASC
             LIMIT 10
-            """)
+            """
+        )
         assert len(result.rows) >= 1, "Should return at least one laptop under $1000"
         # Verify results are sorted by price ascending
         prices = [float(row["price"]) for row in result.rows]
@@ -92,13 +94,15 @@ class TestGroupByWithCount:
 
     def test_count_with_filter(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with GROUPBY and COUNT."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT category, COUNT(*) AS count
             FROM {products_data}
             WHERE price >= 50
             GROUP BY category
             ORDER BY count DESC
-            """)
+            """
+        )
         assert len(result.rows) >= 1, "Should return grouped results"
         for row in result.rows:
             assert "category" in row
@@ -110,13 +114,15 @@ class TestMultipleAggregations:
 
     def test_count_sum_avg_aggregations(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with multiple REDUCE operations."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT category, COUNT(*) AS product_count, SUM(price) AS total_price, AVG(rating) AS avg_rating
             FROM {products_data}
             GROUP BY category
             ORDER BY total_price DESC
             LIMIT 10
-            """)
+            """
+        )
         assert len(result.rows) >= 1, "Should return aggregated results"
         row = result.rows[0]
         assert "product_count" in row
@@ -129,11 +135,13 @@ class TestGlobalAggregation:
 
     def test_aggregation_without_group_by(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with GROUPBY 0 for global aggregation."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT COUNT(*) AS total_count, AVG(price) AS avg_price
             FROM {products_data}
             WHERE price > 100
-            """)
+            """
+        )
         assert len(result.rows) == 1, "Should return single aggregation row"
         row = result.rows[0]
         assert "total_count" in row
@@ -145,12 +153,14 @@ class TestApplyWithComputedFields:
 
     def test_computed_field_expression(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with APPLY for computed fields."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT price, price * 0.9 AS discounted_price
             FROM {products_data}
             WHERE price > 100
             ORDER BY discounted_price DESC
-            """)
+            """
+        )
         assert len(result.rows) >= 1, "Should return results with computed field"
         for row in result.rows:
             price = float(row["price"])
@@ -159,12 +169,14 @@ def test_computed_field_expression(self, executor: Executor, products_data: str)
 
     def test_computed_field_addition(self, executor: Executor, products_data: str):
         """Computed field with addition."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT price, price + 10 AS price_with_shipping
             FROM {products_data}
             WHERE price < 200
             LIMIT 5
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -173,12 +185,14 @@ def test_computed_field_addition(self, executor: Executor, products_data: str):
 
     def test_computed_field_division(self, executor: Executor, products_data: str):
         """Computed field with division for percentage."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT price, price / 100 AS price_in_hundreds
             FROM {products_data}
             WHERE price >= 100
             LIMIT 5
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -187,12 +201,14 @@ def test_computed_field_division(self, executor: Executor, products_data: str):
 
     def test_multiple_computed_fields(self, executor: Executor, products_data: str):
         """Multiple computed fields in one query."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT price, price * 0.9 AS sale_price, price * 1.1 AS markup_price
             FROM {products_data}
             WHERE price > 50
             LIMIT 5
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             price = float(row["price"])
@@ -207,11 +223,13 @@ class TestRangeQueryWithBetween:
 
     def test_between_and_greater_than(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with numeric range filters."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT title, price
             FROM {products_data}
             WHERE price BETWEEN 100 AND 500 AND stock >= 1
-            """)
+            """
+        )
         assert len(result.rows) >= 1, "Should return products in price range"
         for row in result.rows:
             price = float(row["price"])
@@ -223,44 +241,52 @@ class TestTagFieldMultiValueSearch:
 
     def test_in_clause_with_or(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with TAG field OR conditions."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT name
             FROM {products_data}
             WHERE tags IN ('sale', 'featured') OR category = 'electronics'
-            """)
+            """
+        )
         assert (
             len(result.rows) >= 1
         ), "Should return products matching tag OR conditions"
 
     def test_tag_in_clause_only(self, executor: Executor, products_data: str):
         """IN clause on TAG field without OR."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT name, category
             FROM {products_data}
             WHERE category IN ('electronics', 'books')
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] in ["electronics", "books"]
 
     def test_tag_equality(self, executor: Executor, products_data: str):
         """Simple TAG equality filter."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT name, category
             FROM {products_data}
             WHERE category = 'electronics'
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] == "electronics"
 
     def test_or_with_same_field_type(self, executor: Executor, products_data: str):
         """OR condition across same field type (TAG)."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT name, category
             FROM {products_data}
             WHERE category = 'electronics' OR category = 'books'
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             assert row["category"] in ["electronics", "books"]
@@ -269,11 +295,13 @@ def test_or_with_different_field_types(
         self, executor: Executor, products_data: str
     ):
         """OR condition across different field types (TAG and NUMERIC)."""
-        result = executor.execute(f"""
+        result = executor.execute(
+            f"""
             SELECT name, category, price
             FROM {products_data}
             WHERE category = 'books' OR price > 800
-            """)
+            """
+        )
         assert len(result.rows) >= 1
         for row in result.rows:
             is_book = row["category"] == "books"
@@ -287,21 +315,25 @@ class TestPaginationWithOffset:
     def test_limit_with_offset(self, executor: Executor, products_data: str):
         """SQL equivalent of FT.AGGREGATE with LIMIT offset count."""
         # First get all books sorted
-        all_books = executor.execute(f"""
+        all_books = executor.execute(
+            f"""
             SELECT title, price
             FROM {products_data}
             WHERE category = 'books'
             ORDER BY price DESC
-            """)
+            """
+        )
 
         # Then get with offset (page 2, page size 1)
-        paginated = executor.execute(f"""
+        paginated = executor.execute(
+            f"""
             SELECT title, price
             FROM {products_data}
             WHERE category = 'books'
             ORDER BY price DESC
             LIMIT 1 OFFSET 1
-            """)
+            """
+        )
 
         assert len(paginated.rows) >= 1, "Should return paginated results"
         # If we have enough results, verify offset works
@@ -417,9 +449,11 @@ class TestBM25Scoring:
 
     def test_score_returns_relevance(self, executor: Executor, products_data: str):
         """score() in SELECT should return relevance scores."""
-        result = executor.execute(f"""SELECT title, score() AS relevance
+        result = executor.execute(
+            f"""SELECT title, score() AS relevance
             FROM {products_data}
-            WHERE fulltext(title, 'laptop')""")
+            WHERE fulltext(title, 'laptop')"""
+        )
         assert len(result.rows) >= 1, "Should return results with scores"
         for row in result.rows:
             assert "relevance" in row, f"Row should have 'relevance' key: {row}"
@@ -428,9 +462,11 @@ def test_score_returns_relevance(self, executor: Executor, products_data: str):
 
     def test_score_custom_scorer(self, executor: Executor, products_data: str):
         """score('TFIDF') should use TFIDF scorer."""
-        result = executor.execute(f"""SELECT title, score('TFIDF') AS relevance
+        result = executor.execute(
+            f"""SELECT title, score('TFIDF') AS relevance
             FROM {products_data}
-            WHERE fulltext(title, 'laptop')""")
+            WHERE fulltext(title, 'laptop')"""
+        )
         assert len(result.rows) >= 1, "Should return results with TFIDF scores"
         for row in result.rows:
             assert "relevance" in row

From e43827aea9b08ba6fee2f5f0d4a0e52eab67d57f Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 14:46:12 -0400
Subject: [PATCH 09/28] fix: score alias collision for SELECT *, reject float
 fuzzy levels

- When no RETURN clause exists (SELECT *), use first row's field names
  to detect score alias collisions instead of skipping the check
- Reject non-integer fuzzy levels (e.g. 2.9) with ValueError, matching
  the slop validation behavior
- Add test for fuzzy float rejection (351 total)
---
 sql_redis/executor.py    | 59 ++++++++++++++++++++++++++++------------
 sql_redis/parser.py      |  4 +++
 tests/test_sql_parser.py |  6 ++++
 3 files changed, 51 insertions(+), 18 deletions(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index cbb6128..e3f29a8 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -116,10 +116,20 @@ def _has_return_0(args: list[str]) -> bool:
             return False
 
     @staticmethod
-    def _resolve_score_alias(score_alias: str | None, args: list[str]) -> str:
+    def _resolve_score_alias(
+        score_alias: str | None,
+        args: list[str],
+        first_row_fields: set[str] | None = None,
+    ) -> str:
         """Determine a stable score column name that won't collide with
         document fields.  The alias is decided once before iterating rows
-        so every row uses the same column name."""
+        so every row uses the same column name.
+
+        When a RETURN clause is present, the returned field names are used
+        for collision detection.  When RETURN is absent (SELECT *), the
+        caller should pass ``first_row_fields`` — the field names from the
+        first result row — so we can detect collisions even when all
+        document attributes are returned."""
         alias = score_alias or "__score"
         # Extract RETURN field names from args to detect collision
         try:
@@ -127,7 +137,7 @@ def _resolve_score_alias(score_alias: str | None, args: list[str]) -> str:
             count = int(args[idx + 1])
             return_fields = set(args[idx + 2 : idx + 2 + count])
         except (ValueError, IndexError):
-            return_fields = set()
+            return_fields = first_row_fields or set()
         if alias in return_fields:
             alias = f"__score_{alias}"
         return alias
@@ -201,28 +211,35 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
             # RETURN 0 suppresses document fields (like NOCONTENT);
             # with WITHSCORES the reply is [count, id, score, id, score, ...]
             no_content = self._has_return_0(translated.args)
-            # Determine score column name once so every row is consistent
-            alias = (
-                self._resolve_score_alias(translated.score_alias, translated.args)
-                if with_scores
-                else ""
-            )
+
+            # Pre-resolve score alias; may be deferred for SELECT *
+            score_alias: str | None = None
 
             if with_scores and no_content:
                 # WITHSCORES + RETURN 0: [count, id1, score1, id2, score2, ...]
                 # Stride of 2: key, score (no field array)
+                score_alias = self._resolve_score_alias(
+                    translated.score_alias, translated.args
+                )
                 for i in range(1, len(raw_result) - 1, 2):
                     score = raw_result[i + 1]
-                    row = {alias: score}
+                    row = {score_alias: score}
                     rows.append(row)
             elif with_scores:
                 # WITHSCORES format: [count, key1, score1, [fields1], key2, score2, [fields2], ...]
                 # Stride of 3: key, score, field_list
+                # Resolve alias using first row's fields for SELECT * (no RETURN)
                 for i in range(1, len(raw_result) - 2, 3):
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    row[alias] = score
+                    if score_alias is None:
+                        score_alias = self._resolve_score_alias(
+                            translated.score_alias,
+                            translated.args,
+                            first_row_fields=set(row.keys()),
+                        )
+                    row[score_alias] = score
                     rows.append(row)
             else:
                 # Standard format: [count, key1, [fields1], key2, [fields2], ...]
@@ -318,17 +335,17 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
         if translated.command == "FT.SEARCH":
             with_scores = "WITHSCORES" in translated.args
             no_content = self._has_return_0(translated.args)
-            alias = (
-                self._resolve_score_alias(translated.score_alias, translated.args)
-                if with_scores
-                else ""
-            )
+
+            score_alias: str | None = None
 
             if with_scores and no_content:
                 # WITHSCORES + RETURN 0: [count, id1, score1, id2, score2, ...]
+                score_alias = self._resolve_score_alias(
+                    translated.score_alias, translated.args
+                )
                 for i in range(1, len(raw_result) - 1, 2):
                     score = raw_result[i + 1]
-                    row = {alias: score}
+                    row = {score_alias: score}
                     rows.append(row)
             elif with_scores:
                 # WITHSCORES format: [count, key1, score1, [fields1], ...]
@@ -336,7 +353,13 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    row[alias] = score
+                    if score_alias is None:
+                        score_alias = self._resolve_score_alias(
+                            translated.score_alias,
+                            translated.args,
+                            first_row_fields=set(row.keys()),
+                        )
+                    row[score_alias] = score
                     rows.append(row)
             else:
                 # Standard format: [count, key1, [fields1], key2, [fields2], ...]
diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index c4a9b35..7dce26e 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -1020,6 +1020,10 @@ def _add_function_condition(
             if len(args) >= 3:
                 level_val = self._extract_literal_value(args[2])
                 if level_val is not None:
+                    if isinstance(level_val, float) and level_val != int(level_val):
+                        raise ValueError(
+                            f"FUZZY level argument must be an integer (got {level_val})"
+                        )
                     fuzzy_level = int(level_val)
 
             if field_name is not None:
diff --git a/tests/test_sql_parser.py b/tests/test_sql_parser.py
index 1d228da..f04a5fc 100644
--- a/tests/test_sql_parser.py
+++ b/tests/test_sql_parser.py
@@ -871,3 +871,9 @@ def test_fulltext_float_slop_raises(self):
         parser = SQLParser()
         with pytest.raises(ValueError, match="must be an integer"):
             parser.parse("SELECT * FROM idx WHERE fulltext(title, 'hello world', 2.9)")
+
+    def test_fuzzy_float_level_raises(self):
+        """Float fuzzy level raises ValueError instead of silently truncating."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="must be an integer"):
+            parser.parse("SELECT * FROM idx WHERE fuzzy(title, 'laptap', 2.9)")

From 2bc82aa2d39d4cc85ebe53bdfa9dcef66ac794f6 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 15:47:12 -0400
Subject: [PATCH 10/28] fix: multi-field FULLTEXT scoping, reject
 fuzzy/fulltext on non-TEXT, boolean validation

- Refactor build_text_condition so multi-field queries share the same
  operator-specific formatting as single-field (fixes multi-word and OR
  terms escaping the field scope in multi-field queries)
- Reject fuzzy() and fulltext() on non-TEXT fields (TAG, NUMERIC, etc.)
  with ValueError instead of silently producing incorrect queries
- Reject boolean values for slop and fuzzy level arguments (true/false
  would silently coerce to 1/0 via int())
- Add 7 new tests (358 total)
---
 sql_redis/parser.py         | 12 ++++++++++--
 sql_redis/query_builder.py  | 18 +++++++-----------
 sql_redis/translator.py     |  9 +++++++++
 tests/test_query_builder.py | 24 ++++++++++++++++++++++++
 tests/test_sql_parser.py    | 12 ++++++++++++
 tests/test_translator.py    | 16 ++++++++++++++++
 6 files changed, 78 insertions(+), 13 deletions(-)

diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index 7dce26e..d084f95 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -980,8 +980,12 @@ def _add_function_condition(
             if len(args) >= 3:
                 slop_val = self._extract_literal_value(args[2])
                 if slop_val is not None:
-                    # Reject non-integer values (e.g. 2.9) instead of
-                    # silently truncating via int().
+                    # Reject booleans and non-integer floats — only real
+                    # integers are valid for slop.
+                    if isinstance(slop_val, bool):
+                        raise ValueError(
+                            f"FULLTEXT slop argument must be an integer (got {slop_val})"
+                        )
                     if isinstance(slop_val, float) and slop_val != int(slop_val):
                         raise ValueError(
                             f"FULLTEXT slop argument must be an integer (got {slop_val})"
@@ -1020,6 +1024,10 @@ def _add_function_condition(
             if len(args) >= 3:
                 level_val = self._extract_literal_value(args[2])
                 if level_val is not None:
+                    if isinstance(level_val, bool):
+                        raise ValueError(
+                            f"FUZZY level argument must be an integer (got {level_val})"
+                        )
                     if isinstance(level_val, float) and level_val != int(level_val):
                         raise ValueError(
                             f"FUZZY level argument must be an integer (got {level_val})"
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 739b0f7..09dae6e 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -117,16 +117,7 @@ def build_text_condition(
         # consistent with how build_tag_condition handles != via operator.
         prefix = "-" if negated or operator == "!=" else ""
 
-        # Handle multi-field search — apply same escaping/operator semantics
-        if isinstance(field, list):
-            field_str = "|".join(field)
-            if operator in ("=", "!="):
-                escaped = self._escape_text_value(value)
-                return f'{prefix}(@{field_str}:"{escaped}")'
-            escaped = self._escape_fulltext_term(value)
-            return f"{prefix}(@{field_str}:{escaped})"
-
-        # Handle different operators
+        # Build search_value based on operator — shared by single- and multi-field paths
         if operator == "LIKE":
             # Escape special chars in the non-wildcard portion, then convert % → *
             # Split on %, escape each segment, rejoin with *
@@ -191,7 +182,12 @@ def build_text_condition(
             # Single-word FULLTEXT — escape to prevent accidental operator injection
             search_value = self._escape_fulltext_term(value)
 
-        base = f"{prefix}@{field}:{search_value}"
+        # Handle multi-field search — use computed search_value with multi-field syntax
+        if isinstance(field, list):
+            field_str = "|".join(field)
+            base = f"{prefix}(@{field_str}:{search_value})"
+        else:
+            base = f"{prefix}@{field}:{search_value}"
 
         # Append query attributes (slop, inorder) if specified
         if slop is not None:
diff --git a/sql_redis/translator.py b/sql_redis/translator.py
index 6353b67..3a25026 100644
--- a/sql_redis/translator.py
+++ b/sql_redis/translator.py
@@ -226,6 +226,15 @@ def _build_condition(self, condition: Condition, field_type: str | None) -> str:
                 condition.field, is_missing=(condition.operator == "IS_NULL")
             )
 
+        # Reject text-only operators on non-TEXT fields — fuzzy() and fulltext()
+        # only make sense for TEXT fields; silently falling through to TAG/NUMERIC
+        # would produce incorrect queries.
+        if condition.operator in ("FUZZY", "FULLTEXT") and field_type != "TEXT":
+            raise ValueError(
+                f"{condition.operator.lower()}() can only be used on TEXT fields, "
+                f"but '{condition.field}' is {field_type or 'unknown'}."
+            )
+
         # Resolve negation using XOR so that double negation cancels out.
         # e.g. NOT (field != 'x') → negated=True, op='!=' → is_negated=False.
         operator = condition.operator
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index a2cf8ce..dc2b2a5 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -600,3 +600,27 @@ def test_multiword_fulltext_escapes_dash(self):
         builder = QueryBuilder()
         result = builder.build_text_condition("title", "FULLTEXT", "hello anti-virus")
         assert result == "@title:(hello anti\\-virus)"
+
+    def test_multi_field_multiword_fulltext(self):
+        """Multi-field with multi-word FULLTEXT scopes all terms to fields."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            ["title", "description"], "FULLTEXT", "gaming laptop"
+        )
+        assert result == "(@title|description:(gaming laptop))"
+
+    def test_multi_field_or_fulltext(self):
+        """Multi-field with OR FULLTEXT uses pipe-separated terms."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            ["title", "description"], "FULLTEXT", "laptop OR tablet"
+        )
+        assert result == "(@title|description:(laptop|tablet))"
+
+    def test_multi_field_fuzzy(self):
+        """Multi-field with FUZZY wraps with % markers."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            ["title", "description"], "FUZZY", "laptap", fuzzy_level=2
+        )
+        assert result == "(@title|description:%%laptap%%)"
diff --git a/tests/test_sql_parser.py b/tests/test_sql_parser.py
index f04a5fc..47dad20 100644
--- a/tests/test_sql_parser.py
+++ b/tests/test_sql_parser.py
@@ -877,3 +877,15 @@ def test_fuzzy_float_level_raises(self):
         parser = SQLParser()
         with pytest.raises(ValueError, match="must be an integer"):
             parser.parse("SELECT * FROM idx WHERE fuzzy(title, 'laptap', 2.9)")
+
+    def test_fulltext_boolean_slop_raises(self):
+        """Boolean slop in fulltext() raises ValueError."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="must be an integer"):
+            parser.parse("SELECT * FROM idx WHERE fulltext(title, 'hello world', true)")
+
+    def test_fuzzy_boolean_level_raises(self):
+        """Boolean fuzzy level raises ValueError."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="must be an integer"):
+            parser.parse("SELECT * FROM idx WHERE fuzzy(title, 'laptap', true)")
diff --git a/tests/test_translator.py b/tests/test_translator.py
index 64546f8..452b480 100644
--- a/tests/test_translator.py
+++ b/tests/test_translator.py
@@ -655,6 +655,22 @@ def test_fuzzy_ld3(self, translator: Translator, basic_index: str):
         )
         assert "@title:%%%laptap%%%" in result.query_string
 
+    def test_fuzzy_on_tag_field_raises(self, translator: Translator, basic_index: str):
+        """fuzzy() on a TAG field raises ValueError."""
+        with pytest.raises(ValueError, match="can only be used on TEXT fields"):
+            translator.translate(
+                f"SELECT * FROM {basic_index} WHERE fuzzy(category, 'laptap')"
+            )
+
+    def test_fulltext_on_numeric_field_raises(
+        self, translator: Translator, basic_index: str
+    ):
+        """fulltext() on a NUMERIC field raises ValueError."""
+        with pytest.raises(ValueError, match="can only be used on TEXT fields"):
+            translator.translate(
+                f"SELECT * FROM {basic_index} WHERE fulltext(price, 'laptop')"
+            )
+
 
 class TestTranslatorSuffixInfix:
     """Tests for suffix and infix (contains) pattern matching.

From 354111f42a50963fd385d60fbabf58f1ace79fec Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 16:53:24 -0400
Subject: [PATCH 11/28] fix: case-insensitive OR, escape */+, LIKE guard,
 inorder validation, alias loop

- OR parsing now case-insensitive and whitespace-tolerant (regex split)
- Escape * and + in TEXT_QUERY_SPECIAL_CHARS to prevent wildcard/mandatory
  injection in FULLTEXT/FUZZY terms
- Add LIKE to the non-TEXT field guard (alongside FUZZY/FULLTEXT)
- Validate inorder argument strictly: reject values like 'yes', 2, etc.
- Score alias collision uses while loop for repeated prefix collisions
- Add 7 new tests (365 total)
---
 sql_redis/executor.py       |  2 +-
 sql_redis/parser.py         | 12 ++++++++++--
 sql_redis/query_builder.py  | 19 +++++++++++--------
 sql_redis/translator.py     |  2 +-
 tests/test_query_builder.py | 32 ++++++++++++++++++++++++++++++++
 tests/test_sql_parser.py    |  8 ++++++++
 tests/test_translator.py    |  7 +++++++
 7 files changed, 70 insertions(+), 12 deletions(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index e3f29a8..f7078dc 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -138,7 +138,7 @@ def _resolve_score_alias(
             return_fields = set(args[idx + 2 : idx + 2 + count])
         except (ValueError, IndexError):
             return_fields = first_row_fields or set()
-        if alias in return_fields:
+        while alias in return_fields:
             alias = f"__score_{alias}"
         return alias
 
diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index d084f95..f5c9890 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -996,12 +996,20 @@ def _add_function_condition(
                             f"FULLTEXT slop argument must be a non-negative integer (got {slop})"
                         )
 
-            # Optional 4th arg: inorder (boolean-like: 1/0 or true/false)
+            # Optional 4th arg: inorder (boolean-like: true/false or 1/0)
             inorder = False
             if len(args) >= 4:
                 inorder_val = self._extract_literal_value(args[3])
                 if inorder_val is not None:
-                    inorder = str(inorder_val).lower() in ("1", "true")
+                    if isinstance(inorder_val, bool):
+                        inorder = inorder_val
+                    elif str(inorder_val).lower() in ("1", "0", "true", "false"):
+                        inorder = str(inorder_val).lower() in ("1", "true")
+                    else:
+                        raise ValueError(
+                            f"FULLTEXT inorder argument must be a boolean "
+                            f"(true/false or 1/0), got {inorder_val!r}"
+                        )
 
             if field_name is not None:
                 result.conditions.append(
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 09dae6e..fc2e317 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -2,6 +2,7 @@
 
 from __future__ import annotations
 
+import re
 import warnings
 
 # Redis default stopwords - these are not indexed by default
@@ -54,7 +55,7 @@ class QueryBuilder:
     # Characters that have special meaning in RediSearch free-text queries
     # (outside double-quoted phrases). Must be escaped with backslash.
     # Includes double-quote to prevent starting/ending quoted phrases.
-    TEXT_QUERY_SPECIAL_CHARS = set('\\|-()"@~!{}[]^$><=;:')
+    TEXT_QUERY_SPECIAL_CHARS = set('\\|-()"@~!{}[]^$><=;:*+')
 
     @classmethod
     def _escape_fulltext_term(cls, term: str) -> str:
@@ -139,7 +140,15 @@ def build_text_condition(
             # Exact phrase match — always wrap in quotes, preserve stopwords.
             escaped = self._escape_text_value(value)
             search_value = f'"{escaped}"'
-        elif " " in value and " OR " not in value:
+        elif re.search(r"\s+[Oo][Rr]\s+", value):
+            # OR union within text field: split on case-insensitive OR with
+            # flexible whitespace, escape each term, join with |
+            or_terms = [
+                self._escape_fulltext_term(t.strip())
+                for t in re.split(r"\s+[Oo][Rr]\s+", value)
+            ]
+            search_value = f"({'|'.join(or_terms)})"
+        elif " " in value:
             # FULLTEXT/MATCH with multi-word: tokenized search with stopword filtering.
             # Each term is escaped to prevent accidental operator injection, but a
             # leading ~ (optional-term modifier) is preserved as an intentional
@@ -172,12 +181,6 @@ def build_text_condition(
 
             terms = " ".join(escaped_words)
             search_value = f"({terms})"
-        elif " OR " in value:
-            # OR union within text field: split on ' OR ', escape each term, join with |
-            or_terms = [
-                self._escape_fulltext_term(t.strip()) for t in value.split(" OR ")
-            ]
-            search_value = f"({'|'.join(or_terms)})"
         else:
             # Single-word FULLTEXT — escape to prevent accidental operator injection
             search_value = self._escape_fulltext_term(value)
diff --git a/sql_redis/translator.py b/sql_redis/translator.py
index 3a25026..a7346f4 100644
--- a/sql_redis/translator.py
+++ b/sql_redis/translator.py
@@ -229,7 +229,7 @@ def _build_condition(self, condition: Condition, field_type: str | None) -> str:
         # Reject text-only operators on non-TEXT fields — fuzzy() and fulltext()
         # only make sense for TEXT fields; silently falling through to TAG/NUMERIC
         # would produce incorrect queries.
-        if condition.operator in ("FUZZY", "FULLTEXT") and field_type != "TEXT":
+        if condition.operator in ("FUZZY", "FULLTEXT", "LIKE") and field_type != "TEXT":
             raise ValueError(
                 f"{condition.operator.lower()}() can only be used on TEXT fields, "
                 f"but '{condition.field}' is {field_type or 'unknown'}."
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index dc2b2a5..5a301ac 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -624,3 +624,35 @@ def test_multi_field_fuzzy(self):
             ["title", "description"], "FUZZY", "laptap", fuzzy_level=2
         )
         assert result == "(@title|description:%%laptap%%)"
+
+    def test_or_case_insensitive_lowercase(self):
+        """OR parsing is case-insensitive: 'laptop or tablet' works."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "laptop or tablet")
+        assert result == "@title:(laptop|tablet)"
+
+    def test_or_case_insensitive_mixed(self):
+        """OR parsing is case-insensitive: 'laptop Or tablet' works."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "laptop Or tablet")
+        assert result == "@title:(laptop|tablet)"
+
+    def test_or_extra_whitespace(self):
+        """OR parsing tolerates extra whitespace."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "title", "FULLTEXT", "laptop  OR   tablet"
+        )
+        assert result == "@title:(laptop|tablet)"
+
+    def test_escape_asterisk_in_fulltext(self):
+        """Literal * in FULLTEXT is escaped to prevent wildcard."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "hello*world")
+        assert result == r"@title:hello\*world"
+
+    def test_escape_plus_in_fulltext(self):
+        """Literal + in FULLTEXT is escaped to prevent mandatory-term."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "C++")
+        assert result == r"@title:C\+\+"
diff --git a/tests/test_sql_parser.py b/tests/test_sql_parser.py
index 47dad20..4d4f7f0 100644
--- a/tests/test_sql_parser.py
+++ b/tests/test_sql_parser.py
@@ -889,3 +889,11 @@ def test_fuzzy_boolean_level_raises(self):
         parser = SQLParser()
         with pytest.raises(ValueError, match="must be an integer"):
             parser.parse("SELECT * FROM idx WHERE fuzzy(title, 'laptap', true)")
+
+    def test_fulltext_invalid_inorder_raises(self):
+        """Invalid inorder value (e.g., 'yes') raises ValueError."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="inorder argument must be a boolean"):
+            parser.parse(
+                "SELECT * FROM idx WHERE fulltext(title, 'hello world', 0, 'yes')"
+            )
diff --git a/tests/test_translator.py b/tests/test_translator.py
index 452b480..8cf75f8 100644
--- a/tests/test_translator.py
+++ b/tests/test_translator.py
@@ -671,6 +671,13 @@ def test_fulltext_on_numeric_field_raises(
                 f"SELECT * FROM {basic_index} WHERE fulltext(price, 'laptop')"
             )
 
+    def test_like_on_tag_field_raises(self, translator: Translator, basic_index: str):
+        """LIKE on a TAG field raises ValueError."""
+        with pytest.raises(ValueError, match="can only be used on TEXT fields"):
+            translator.translate(
+                f"SELECT * FROM {basic_index} WHERE category LIKE '%phone%'"
+            )
+
 
 class TestTranslatorSuffixInfix:
     """Tests for suffix and infix (contains) pattern matching.

From 20abd76e057f71e75f3a28505e27255e5a029648 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 17:48:55 -0400
Subject: [PATCH 12/28] docs: add TEXT search section to README

- Feature reference table with SQL syntax and RediSearch output
- Examples for exact phrase, fuzzy, OR, proximity, LIKE patterns, scoring
- Notes on operator restrictions and auto-escaping
---
 README.md | 55 ++++++++++++++++++++++++++++++++++++++++++++++++++++++-
 1 file changed, 54 insertions(+), 1 deletion(-)

diff --git a/README.md b/README.md
index b3d5c98..3650498 100644
--- a/README.md
+++ b/README.md
@@ -154,7 +154,7 @@ The layered approach emerged from TDD — writing tests first revealed natural b
 - [x] Computed fields: `price * 0.9 AS discounted`
 - [x] Vector KNN search: `vector_distance(field, :param)`
 - [x] Hybrid search (filters + vector)
-- [x] Full-text search: `LIKE 'prefix%'` (prefix), `fulltext(field, 'terms')` function
+- [x] Full-text search: exact phrase, fuzzy, proximity, OR/union, LIKE patterns, BM25 scoring (see below)
 - [x] GEO field queries with full operator support (see below)
 - [x] Date functions: `YEAR()`, `MONTH()`, `DAY()`, `DATE_FORMAT()`, etc. (see below)
 
@@ -166,6 +166,59 @@ The layered approach emerged from TDD — writing tests first revealed natural b
 - [ ] DISTINCT
 - [ ] Index creation from SQL (CREATE INDEX)
 
+### TEXT Search
+
+Full-text search on TEXT fields with multiple search modes:
+
+| Feature | SQL Syntax | RediSearch Output |
+|---------|-----------|-------------------|
+| Exact phrase | `title = 'gaming laptop'` | `@title:"gaming laptop"` |
+| Tokenized search | `fulltext(title, 'gaming laptop')` | `@title:(gaming laptop)` |
+| Fuzzy LD=1 | `fuzzy(title, 'laptap')` | `@title:%laptap%` |
+| Fuzzy LD=2 | `fuzzy(title, 'laptap', 2)` | `@title:%%laptap%%` |
+| Fuzzy LD=3 | `fuzzy(title, 'laptap', 3)` | `@title:%%%laptap%%%` |
+| OR / union | `fulltext(title, 'laptop OR tablet')` | `@title:(laptop\|tablet)` |
+| Prefix | `title LIKE 'lap%'` | `@title:lap*` |
+| Suffix | `title LIKE '%top'` | `@title:*top` |
+| Contains | `title LIKE '%apt%'` | `@title:*apt*` |
+| Proximity (slop) | `fulltext(title, 'gaming laptop', 2)` | `@title:(gaming laptop) => { $slop: 2; }` |
+| Proximity + order | `fulltext(title, 'gaming laptop', 2, true)` | `@title:(gaming laptop) => { $slop: 2; $inorder: true; }` |
+| Optional term | `fulltext(title, 'laptop ~gaming')` | `@title:(laptop ~gaming)` |
+| BM25 score | `SELECT score() AS relevance FROM idx` | `FT.SEARCH ... WITHSCORES` |
+| Negation | `NOT fulltext(title, 'refurbished')` | `-@title:(refurbished)` |
+
+**Examples:**
+
+```sql
+-- Exact phrase match (stopwords preserved)
+SELECT * FROM products WHERE title = 'bank of america'
+
+-- Fuzzy search for typos (Levenshtein distance 2)
+SELECT * FROM products WHERE fuzzy(title, 'laptap', 2)
+
+-- OR search across terms
+SELECT * FROM products WHERE fulltext(title, 'laptop OR tablet OR phone')
+
+-- Proximity: terms within 3 words of each other, in order
+SELECT * FROM products WHERE fulltext(title, 'gaming laptop', 3, true)
+
+-- Suffix/contains pattern matching
+SELECT * FROM products WHERE title LIKE '%phone%'
+
+-- BM25 relevance scoring
+SELECT title, score() AS relevance FROM products WHERE fulltext(title, 'laptop')
+
+-- Multi-field search
+SELECT * FROM products WHERE fulltext(title, 'laptop') OR fulltext(description, 'laptop')
+```
+
+**Notes:**
+- `=` on TEXT fields performs **exact phrase** matching (preserves stopwords)
+- `fulltext()` performs **tokenized** search (stopwords are filtered with a warning)
+- `fuzzy()` and `fulltext()` only work on TEXT fields — using them on TAG or NUMERIC raises `ValueError`
+- OR is case-insensitive: `'laptop OR tablet'`, `'laptop or tablet'`, and `'laptop Or tablet'` all work
+- Special characters (`@`, `|`, `-`, `*`, `+`, etc.) in search terms are automatically escaped
+
 ### DATE/DATETIME Handling
 
 Redis does not have a native DATE field type. Dates are stored as **NUMERIC fields** with Unix timestamps.

From 6e4ec671771d41c999653945a03267da416a2bfb Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 17:55:09 -0400
Subject: [PATCH 13/28] fix: single-term ~ prefix, multi-word OR grouping;
 docs: IS NULL & exists()
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Preserve ~ optional-term prefix on single-word FULLTEXT (was escaped)
- Wrap multi-word OR operands in parentheses to prevent precedence issues
  (e.g. 'gaming laptop OR tablet' → (gaming laptop)|tablet)
- Add IS NULL / IS NOT NULL (ismissing) section to README
- Add exists() function section to README
- Add to What's Implemented checklist
- Add 3 new tests (368 total)
---
 README.md                   | 41 +++++++++++++++++++++++++++++++++++++
 sql_redis/query_builder.py  | 26 +++++++++++++++--------
 tests/test_query_builder.py | 22 ++++++++++++++++++++
 3 files changed, 81 insertions(+), 8 deletions(-)

diff --git a/README.md b/README.md
index 3650498..cf3c743 100644
--- a/README.md
+++ b/README.md
@@ -157,6 +157,8 @@ The layered approach emerged from TDD — writing tests first revealed natural b
 - [x] Full-text search: exact phrase, fuzzy, proximity, OR/union, LIKE patterns, BM25 scoring (see below)
 - [x] GEO field queries with full operator support (see below)
 - [x] Date functions: `YEAR()`, `MONTH()`, `DAY()`, `DATE_FORMAT()`, etc. (see below)
+- [x] `IS NULL` / `IS NOT NULL` via `ismissing()` (requires Redis 7.4+, see below)
+- [x] `exists()` function for field presence checks (see below)
 
 ## What's Not Implemented (Yet...)
 
@@ -219,6 +221,45 @@ SELECT * FROM products WHERE fulltext(title, 'laptop') OR fulltext(description,
 - OR is case-insensitive: `'laptop OR tablet'`, `'laptop or tablet'`, and `'laptop Or tablet'` all work
 - Special characters (`@`, `|`, `-`, `*`, `+`, etc.) in search terms are automatically escaped
 
+### IS NULL / IS NOT NULL (ismissing)
+
+Check for missing (absent) fields using standard SQL `IS NULL` / `IS NOT NULL` syntax. Requires **Redis 7.4+** (RediSearch 2.10+) with `INDEXMISSING` declared on the field.
+
+| SQL | RediSearch Output |
+|-----|-------------------|
+| `WHERE email IS NULL` | `ismissing(@email)` |
+| `WHERE email IS NOT NULL` | `-ismissing(@email)` |
+
+```sql
+-- Find users without an email
+SELECT * FROM users WHERE email IS NULL
+
+-- Find users with an email
+SELECT * FROM users WHERE email IS NOT NULL
+
+-- Combine with other filters
+SELECT * FROM users WHERE category = 'eng' AND email IS NULL
+```
+
+**Note:** The field must be declared with `INDEXMISSING` in the index schema. A warning is emitted at translation time as a reminder.
+
+### exists() — Field Presence Check
+
+Check whether a field has a value using `exists()` in SELECT or HAVING. This uses `FT.AGGREGATE` with `APPLY exists(@field)`.
+
+```sql
+-- Check if fields exist (returns 1 or 0)
+SELECT name, exists(email) AS has_email FROM users
+
+-- Filter to only rows where a field exists
+SELECT name FROM users HAVING exists(email) = 1
+
+-- Combine with other computed fields
+SELECT name, exists(email) AS has_email, exists(phone) AS has_phone FROM users
+```
+
+**Note:** `exists()` is different from `IS NOT NULL` — it works via `FT.AGGREGATE APPLY` and doesn't require `INDEXMISSING` on the field, but returns `1`/`0` rather than filtering rows directly.
+
 ### DATE/DATETIME Handling
 
 Redis does not have a native DATE field type. Dates are stored as **NUMERIC fields** with Unix timestamps.
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index fc2e317..b67681d 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -142,12 +142,18 @@ def build_text_condition(
             search_value = f'"{escaped}"'
         elif re.search(r"\s+[Oo][Rr]\s+", value):
             # OR union within text field: split on case-insensitive OR with
-            # flexible whitespace, escape each term, join with |
-            or_terms = [
-                self._escape_fulltext_term(t.strip())
-                for t in re.split(r"\s+[Oo][Rr]\s+", value)
-            ]
-            search_value = f"({'|'.join(or_terms)})"
+            # flexible whitespace, escape each term, join with |.
+            # Multi-word operands (e.g. "gaming laptop OR tablet") are wrapped
+            # in parentheses so each side is an atomic subexpression.
+            or_parts: list[str] = []
+            for part in re.split(r"\s+[Oo][Rr]\s+", value):
+                words = part.strip().split()
+                if len(words) > 1:
+                    escaped = " ".join(self._escape_fulltext_term(w) for w in words)
+                    or_parts.append(f"({escaped})")
+                else:
+                    or_parts.append(self._escape_fulltext_term(words[0]))
+            search_value = f"({'|'.join(or_parts)})"
         elif " " in value:
             # FULLTEXT/MATCH with multi-word: tokenized search with stopword filtering.
             # Each term is escaped to prevent accidental operator injection, but a
@@ -182,8 +188,12 @@ def build_text_condition(
             terms = " ".join(escaped_words)
             search_value = f"({terms})"
         else:
-            # Single-word FULLTEXT — escape to prevent accidental operator injection
-            search_value = self._escape_fulltext_term(value)
+            # Single-word FULLTEXT — escape to prevent accidental operator injection.
+            # Preserve ~ optional-term prefix (same as multi-word branch).
+            if value.startswith("~"):
+                search_value = "~" + self._escape_fulltext_term(value[1:])
+            else:
+                search_value = self._escape_fulltext_term(value)
 
         # Handle multi-field search — use computed search_value with multi-field syntax
         if isinstance(field, list):
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index 5a301ac..9ef0d8f 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -656,3 +656,25 @@ def test_escape_plus_in_fulltext(self):
         builder = QueryBuilder()
         result = builder.build_text_condition("title", "FULLTEXT", "C++")
         assert result == r"@title:C\+\+"
+
+    def test_single_term_optional_prefix_preserved(self):
+        """Single-term FULLTEXT with ~ prefix preserves optional semantics."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "~gaming")
+        assert result == "@title:~gaming"
+
+    def test_or_multiword_operand_grouped(self):
+        """OR with multi-word operand wraps it in parentheses."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "title", "FULLTEXT", "gaming laptop OR tablet"
+        )
+        assert result == "@title:((gaming laptop)|tablet)"
+
+    def test_or_both_multiword_operands_grouped(self):
+        """OR with multi-word operands on both sides wraps each."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition(
+            "title", "FULLTEXT", "gaming laptop OR android tablet"
+        )
+        assert result == "@title:((gaming laptop)|(android tablet))"

From 09286e680fbd30b7102c566ab1b065954d80393e Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 18:17:30 -0400
Subject: [PATCH 14/28] fix: empty OR operand guard, LIKE error message, README
 negation typo

- Raise ValueError for empty OR operands ('laptop OR ', ' OR tablet')
  instead of crashing with IndexError
- LIKE error message now says 'LIKE can only be used...' instead of
  'like() can only be used...' since LIKE is not a function
- Fix README table: negation of single-term FULLTEXT doesn't have parens
- Add 2 new tests (370 total)
---
 README.md                   |  2 +-
 sql_redis/query_builder.py  |  5 +++++
 sql_redis/translator.py     |  7 ++++++-
 tests/test_query_builder.py | 12 ++++++++++++
 4 files changed, 24 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index cf3c743..0fdd86d 100644
--- a/README.md
+++ b/README.md
@@ -187,7 +187,7 @@ Full-text search on TEXT fields with multiple search modes:
 | Proximity + order | `fulltext(title, 'gaming laptop', 2, true)` | `@title:(gaming laptop) => { $slop: 2; $inorder: true; }` |
 | Optional term | `fulltext(title, 'laptop ~gaming')` | `@title:(laptop ~gaming)` |
 | BM25 score | `SELECT score() AS relevance FROM idx` | `FT.SEARCH ... WITHSCORES` |
-| Negation | `NOT fulltext(title, 'refurbished')` | `-@title:(refurbished)` |
+| Negation | `NOT fulltext(title, 'refurbished')` | `-@title:refurbished` |
 
 **Examples:**
 
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index b67681d..b7c1257 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -148,6 +148,11 @@ def build_text_condition(
             or_parts: list[str] = []
             for part in re.split(r"\s+[Oo][Rr]\s+", value):
                 words = part.strip().split()
+                if not words:
+                    raise ValueError(
+                        "Empty operand in OR expression — each side of OR "
+                        "must contain at least one search term."
+                    )
                 if len(words) > 1:
                     escaped = " ".join(self._escape_fulltext_term(w) for w in words)
                     or_parts.append(f"({escaped})")
diff --git a/sql_redis/translator.py b/sql_redis/translator.py
index a7346f4..a524851 100644
--- a/sql_redis/translator.py
+++ b/sql_redis/translator.py
@@ -230,8 +230,13 @@ def _build_condition(self, condition: Condition, field_type: str | None) -> str:
         # only make sense for TEXT fields; silently falling through to TAG/NUMERIC
         # would produce incorrect queries.
         if condition.operator in ("FUZZY", "FULLTEXT", "LIKE") and field_type != "TEXT":
+            op_display = (
+                "LIKE"
+                if condition.operator == "LIKE"
+                else f"{condition.operator.lower()}()"
+            )
             raise ValueError(
-                f"{condition.operator.lower()}() can only be used on TEXT fields, "
+                f"{op_display} can only be used on TEXT fields, "
                 f"but '{condition.field}' is {field_type or 'unknown'}."
             )
 
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index 9ef0d8f..e61fe99 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -678,3 +678,15 @@ def test_or_both_multiword_operands_grouped(self):
             "title", "FULLTEXT", "gaming laptop OR android tablet"
         )
         assert result == "@title:((gaming laptop)|(android tablet))"
+
+    def test_or_trailing_empty_operand_raises(self):
+        """Trailing OR with empty operand raises ValueError."""
+        builder = QueryBuilder()
+        with pytest.raises(ValueError, match="Empty operand in OR expression"):
+            builder.build_text_condition("title", "FULLTEXT", "laptop OR ")
+
+    def test_or_leading_empty_operand_raises(self):
+        """Leading OR with empty operand raises ValueError."""
+        builder = QueryBuilder()
+        with pytest.raises(ValueError, match="Empty operand in OR expression"):
+            builder.build_text_condition("title", "FULLTEXT", " OR tablet")

From 055337f40cf7e942784473f69bfdcd05ef987961 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 18:31:31 -0400
Subject: [PATCH 15/28] fix: scorer case preservation, duplicate score guard,
 OR ~ prefix, stopword warning

- Preserve caller-provided scorer casing (score('MyScorer') no longer
  uppercased to MYSCORER)
- Raise ValueError when multiple score() expressions in same query
- Preserve ~ optional-term prefix in OR operands
- Fix misleading stopword warning when all tokens are stopwords
- Remove redundant inner pytest import in test_translator.py
- Add 3 new tests (373 total)
---
 sql_redis/parser.py         |  6 +++++-
 sql_redis/query_builder.py  | 23 +++++++++++++++++++----
 tests/test_query_builder.py |  6 ++++++
 tests/test_translator.py    | 21 +++++++++++++++++++--
 4 files changed, 49 insertions(+), 7 deletions(-)

diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index f5c9890..7e27774 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -462,7 +462,11 @@ def _process_select_expression_inner(
                 if expression.expressions:
                     scorer_val = self._extract_literal_value(expression.expressions[0])
                     if scorer_val is not None:
-                        scorer = str(scorer_val).upper()
+                        scorer = str(scorer_val)
+                if result.scoring is not None:
+                    raise ValueError(
+                        "Only one score() expression is allowed per query."
+                    )
                 result.scoring = ScoringSpec(
                     alias=alias or "score",
                     scorer=scorer,
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index b7c1257..f9be1c4 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -154,10 +154,21 @@ def build_text_condition(
                         "must contain at least one search term."
                     )
                 if len(words) > 1:
-                    escaped = " ".join(self._escape_fulltext_term(w) for w in words)
-                    or_parts.append(f"({escaped})")
+                    escaped_tokens = []
+                    for w in words:
+                        if w.startswith("~"):
+                            escaped_tokens.append(
+                                "~" + self._escape_fulltext_term(w[1:])
+                            )
+                        else:
+                            escaped_tokens.append(self._escape_fulltext_term(w))
+                    or_parts.append(f"({' '.join(escaped_tokens)})")
                 else:
-                    or_parts.append(self._escape_fulltext_term(words[0]))
+                    token = words[0]
+                    if token.startswith("~"):
+                        or_parts.append("~" + self._escape_fulltext_term(token[1:]))
+                    else:
+                        or_parts.append(self._escape_fulltext_term(token))
             search_value = f"({'|'.join(or_parts)})"
         elif " " in value:
             # FULLTEXT/MATCH with multi-word: tokenized search with stopword filtering.
@@ -173,8 +184,12 @@ def build_text_condition(
             ]
 
             if removed_stopwords:
+                if filtered_words:
+                    sw_action = f"Stopwords {removed_stopwords} were removed from"
+                else:
+                    sw_action = f"All tokens in '{value}' are stopwords and may not be indexed by"
                 warnings.warn(
-                    f"Stopwords {removed_stopwords} were removed from text search '{value}'. "
+                    f"{sw_action} text search '{value}'. "
                     "By default, Redis does not index stopwords. "
                     "To include stopwords in your index, create it with STOPWORDS 0. "
                     "Use = operator for exact phrase matching that preserves stopwords.",
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index e61fe99..3a685c7 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -690,3 +690,9 @@ def test_or_leading_empty_operand_raises(self):
         builder = QueryBuilder()
         with pytest.raises(ValueError, match="Empty operand in OR expression"):
             builder.build_text_condition("title", "FULLTEXT", " OR tablet")
+
+    def test_or_preserves_optional_prefix(self):
+        """OR operand with ~ prefix preserves optional-term semantics."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "FULLTEXT", "laptop OR ~gaming")
+        assert result == "@title:(laptop|~gaming)"
diff --git a/tests/test_translator.py b/tests/test_translator.py
index 8cf75f8..926ee24 100644
--- a/tests/test_translator.py
+++ b/tests/test_translator.py
@@ -785,6 +785,25 @@ def test_score_custom_scorer(self, translator: Translator, basic_index: str):
         scorer_idx = result.args.index("SCORER")
         assert result.args[scorer_idx + 1] == "TFIDF"
 
+    def test_score_custom_scorer_preserves_case(
+        self, translator: Translator, basic_index: str
+    ):
+        """score('MyScorer') preserves caller-provided casing."""
+        result = translator.translate(
+            f"SELECT title, score('MyScorer') AS relevance FROM {basic_index} "
+            "WHERE fulltext(title, 'laptop')"
+        )
+        scorer_idx = result.args.index("SCORER")
+        assert result.args[scorer_idx + 1] == "MyScorer"
+
+    def test_duplicate_score_raises(self, translator: Translator, basic_index: str):
+        """Multiple score() expressions in the same query raise ValueError."""
+        with pytest.raises(ValueError, match="Only one score"):
+            translator.translate(
+                f"SELECT score() AS s1, score('TFIDF') AS s2 FROM {basic_index} "
+                "WHERE fulltext(title, 'laptop')"
+            )
+
     def test_no_score_no_withscores(self, translator: Translator, basic_index: str):
         """Without score() → no WITHSCORES flag."""
         result = translator.translate(
@@ -808,8 +827,6 @@ def test_score_with_aggregate_raises(
         self, translator: Translator, basic_index: str
     ):
         """score() combined with GROUP BY (forces FT.AGGREGATE) raises ValueError."""
-        import pytest
-
         with pytest.raises(ValueError, match="score.*not supported.*FT.AGGREGATE"):
             translator.translate(
                 f"SELECT COUNT(*), score() AS relevance FROM {basic_index} "

From 8a69d067d3f7db508b3886e3c5595936f347f4e2 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 18:44:20 -0400
Subject: [PATCH 16/28] fix: score() arg count validation, slop validation in
 QueryBuilder, stopword warning grammar

- Raise ValueError when score() receives more than one argument
- Validate slop is a non-negative int at QueryBuilder level (not just parser)
- Fix stopword warning grammar for all-stopword inputs
- Add 3 new tests (376 total)
---
 sql_redis/parser.py         |  5 +++++
 sql_redis/query_builder.py  |  4 +++-
 tests/test_query_builder.py | 18 ++++++++++++++++++
 tests/test_translator.py    |  8 ++++++++
 4 files changed, 34 insertions(+), 1 deletion(-)

diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index 7e27774..5aef23c 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -459,6 +459,11 @@ def _process_select_expression_inner(
             elif func_name_lower == "score":
                 # score() or score('BM25') — triggers WITHSCORES + SCORER
                 scorer = "BM25"
+                if len(expression.expressions) > 1:
+                    raise ValueError(
+                        f"score() expects at most one argument, "
+                        f"got {len(expression.expressions)}."
+                    )
                 if expression.expressions:
                     scorer_val = self._extract_literal_value(expression.expressions[0])
                     if scorer_val is not None:
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index f9be1c4..71f8343 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -187,7 +187,7 @@ def build_text_condition(
                 if filtered_words:
                     sw_action = f"Stopwords {removed_stopwords} were removed from"
                 else:
-                    sw_action = f"All tokens in '{value}' are stopwords and may not be indexed by"
+                    sw_action = f"All tokens in '{value}' are stopwords and may not be indexed in"
                 warnings.warn(
                     f"{sw_action} text search '{value}'. "
                     "By default, Redis does not index stopwords. "
@@ -224,6 +224,8 @@ def build_text_condition(
 
         # Append query attributes (slop, inorder) if specified
         if slop is not None:
+            if not isinstance(slop, int) or isinstance(slop, bool) or slop < 0:
+                raise ValueError(f"slop must be a non-negative integer (got {slop!r})")
             attrs = f"$slop: {slop};"
             if inorder:
                 attrs += " $inorder: true;"
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index 3a685c7..9567620 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -696,3 +696,21 @@ def test_or_preserves_optional_prefix(self):
         builder = QueryBuilder()
         result = builder.build_text_condition("title", "FULLTEXT", "laptop OR ~gaming")
         assert result == "@title:(laptop|~gaming)"
+
+
+class TestQueryBuilderSlopValidation:
+    """Tests for slop validation at the QueryBuilder level."""
+
+    def test_slop_negative_raises(self):
+        """Negative slop raises ValueError."""
+        builder = QueryBuilder()
+        with pytest.raises(ValueError, match="non-negative integer"):
+            builder.build_text_condition("title", "FULLTEXT", "gaming laptop", slop=-1)
+
+    def test_slop_boolean_raises(self):
+        """Boolean slop raises ValueError."""
+        builder = QueryBuilder()
+        with pytest.raises(ValueError, match="non-negative integer"):
+            builder.build_text_condition(
+                "title", "FULLTEXT", "gaming laptop", slop=True
+            )
diff --git a/tests/test_translator.py b/tests/test_translator.py
index 926ee24..555c636 100644
--- a/tests/test_translator.py
+++ b/tests/test_translator.py
@@ -832,3 +832,11 @@ def test_score_with_aggregate_raises(
                 f"SELECT COUNT(*), score() AS relevance FROM {basic_index} "
                 "WHERE fulltext(title, 'laptop') GROUP BY category"
             )
+
+    def test_score_too_many_args_raises(self, translator: Translator, basic_index: str):
+        """score() with more than one argument raises ValueError."""
+        with pytest.raises(ValueError, match="at most one argument"):
+            translator.translate(
+                f"SELECT score('BM25', 'extra') AS relevance FROM {basic_index} "
+                "WHERE fulltext(title, 'laptop')"
+            )

From 3d3485c6c18c7efb5b8a8d38585761ad92bf30e8 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 18:54:11 -0400
Subject: [PATCH 17/28] fix: parenthesize multi-word LIKE patterns, raise on
 invalid fulltext/fuzzy signatures

- LIKE '%gaming laptop%' now generates @title:(*gaming laptop*) to prevent
  token leaking across fields in Dialect 2
- fulltext(title) and fuzzy(title) with < 2 args now raise ValueError
  instead of silently dropping the predicate
- Update existing test expectation for insufficient args
- Add 3 new tests (379 total)
---
 sql_redis/parser.py         |  6 ++++++
 sql_redis/query_builder.py  |  6 ++++++
 tests/test_query_builder.py |  6 ++++++
 tests/test_sql_parser.py    | 20 +++++++++++++++-----
 4 files changed, 33 insertions(+), 5 deletions(-)

diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index 5aef23c..349284e 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -980,6 +980,12 @@ def _add_function_condition(
         func_name = expression.name.upper()
         args = expression.expressions
 
+        if func_name in ("FULLTEXT", "FUZZY") and len(args) < 2:
+            raise ValueError(
+                f"{func_name.lower()}() requires at least 2 arguments: "
+                f"{func_name.lower()}(field, value), got {len(args)}."
+            )
+
         if func_name == "FULLTEXT" and len(args) >= 2:
             field_name = args[0].name if isinstance(args[0], exp.Column) else None
             value = self._extract_literal_value(args[1])
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 71f8343..a52d6c7 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -125,6 +125,12 @@ def build_text_condition(
             parts = value.split("%")
             escaped_parts = [self._escape_fulltext_term(p) for p in parts]
             search_value = "*".join(escaped_parts)
+            # If the non-wildcard portion contains spaces, wrap in parens
+            # so all tokens stay scoped to the field (e.g. '%gaming laptop%'
+            # → *gaming laptop* needs grouping to avoid token leaking).
+            non_wildcard = value.strip("%")
+            if " " in non_wildcard:
+                search_value = f"({search_value})"
         elif operator == "FUZZY":
             # Escape special chars before wrapping with % markers
             escaped = self._escape_fulltext_term(value)
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index 9567620..68ea28e 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -427,6 +427,12 @@ def test_suffix_negated(self):
         result = builder.build_text_condition("title", "LIKE", "%phone", negated=True)
         assert result == "-@title:*phone"
 
+    def test_infix_multiword_grouped(self):
+        """LIKE '%multi word%' groups tokens in parentheses."""
+        builder = QueryBuilder()
+        result = builder.build_text_condition("title", "LIKE", "%gaming laptop%")
+        assert result == "@title:(*gaming laptop*)"
+
 
 class TestQueryBuilderORInText:
     """Tests for OR/union within text field searches."""
diff --git a/tests/test_sql_parser.py b/tests/test_sql_parser.py
index 4d4f7f0..be312f5 100644
--- a/tests/test_sql_parser.py
+++ b/tests/test_sql_parser.py
@@ -622,12 +622,10 @@ def test_parse_fulltext_non_column_first_arg(self):
         assert len(result.conditions) == 0
 
     def test_parse_fulltext_insufficient_args(self):
-        """Parse fulltext with insufficient arguments."""
+        """Parse fulltext with insufficient arguments raises ValueError."""
         parser = SQLParser()
-        result = parser.parse("SELECT * FROM products WHERE fulltext(title)")
-
-        # Only 1 arg, needs >= 2 - condition skipped
-        assert len(result.conditions) == 0
+        with pytest.raises(ValueError, match="requires at least 2 arguments"):
+            parser.parse("SELECT * FROM products WHERE fulltext(title)")
 
     def test_parse_geo_distance_no_args(self):
         """Parse geo_distance with no arguments in comparison."""
@@ -897,3 +895,15 @@ def test_fulltext_invalid_inorder_raises(self):
             parser.parse(
                 "SELECT * FROM idx WHERE fulltext(title, 'hello world', 0, 'yes')"
             )
+
+    def test_fulltext_no_value_raises(self):
+        """fulltext() with only field arg raises ValueError."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="requires at least 2 arguments"):
+            parser.parse("SELECT * FROM idx WHERE fulltext(title)")
+
+    def test_fuzzy_no_value_raises(self):
+        """fuzzy() with only field arg raises ValueError."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="requires at least 2 arguments"):
+            parser.parse("SELECT * FROM idx WHERE fuzzy(title)")

From 581041711e40d8bcf5f468225198c0c599f1dea3 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 19:01:00 -0400
Subject: [PATCH 18/28] =?UTF-8?q?fix:=204=20review=20issues=20=E2=80=94=20?=
 =?UTF-8?q?case-sensitive=20OR,=20score=20ORDER=20BY,=20per-row=20alias=20?=
 =?UTF-8?q?collision,=20extra=20arg=20validation?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

P1 fixes:
- Lowercase 'or' no longer parsed as boolean OR in FULLTEXT; only uppercase
  'OR' triggers union semantics ('bank or america' stays as AND search)
- ORDER BY score() alias DESC omits invalid SORTBY (RediSearch sorts by
  relevance by default); ORDER BY score ASC raises ValueError

P2 fixes:
- Score alias collision detection now checks per-row instead of first-row-only,
  preventing field overwrite when later rows have different field sets
- fulltext() rejects >4 args, fuzzy() rejects >3 args (was silently ignoring)
- Applied to both sync and async executor paths

Add 8 new tests (384 total)
---
 sql_redis/executor.py       | 32 +++++++++++++++++---------------
 sql_redis/parser.py         | 10 ++++++++++
 sql_redis/query_builder.py  |  9 ++++++---
 sql_redis/translator.py     | 19 +++++++++++++++++--
 tests/test_query_builder.py | 22 ++++++++++++++++------
 tests/test_sql_parser.py    | 14 ++++++++++++++
 tests/test_translator.py    | 31 +++++++++++++++++++++++++++++++
 7 files changed, 111 insertions(+), 26 deletions(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index f7078dc..bc71cbb 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -228,18 +228,20 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
             elif with_scores:
                 # WITHSCORES format: [count, key1, score1, [fields1], key2, score2, [fields2], ...]
                 # Stride of 3: key, score, field_list
-                # Resolve alias using first row's fields for SELECT * (no RETURN)
+                # Resolve alias per-row: FT.SEARCH may omit missing attributes,
+                # so different rows can have different field sets.  We must
+                # check each row individually to avoid overwriting a real field
+                # with the score value.
                 for i in range(1, len(raw_result) - 2, 3):
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    if score_alias is None:
-                        score_alias = self._resolve_score_alias(
-                            translated.score_alias,
-                            translated.args,
-                            first_row_fields=set(row.keys()),
-                        )
-                    row[score_alias] = score
+                    row_score_alias = self._resolve_score_alias(
+                        translated.score_alias,
+                        translated.args,
+                        first_row_fields=set(row.keys()),
+                    )
+                    row[row_score_alias] = score
                     rows.append(row)
             else:
                 # Standard format: [count, key1, [fields1], key2, [fields2], ...]
@@ -349,17 +351,17 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
                     rows.append(row)
             elif with_scores:
                 # WITHSCORES format: [count, key1, score1, [fields1], ...]
+                # Resolve alias per-row to avoid field collision on later rows.
                 for i in range(1, len(raw_result) - 2, 3):
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    if score_alias is None:
-                        score_alias = self._resolve_score_alias(
-                            translated.score_alias,
-                            translated.args,
-                            first_row_fields=set(row.keys()),
-                        )
-                    row[score_alias] = score
+                    row_score_alias = self._resolve_score_alias(
+                        translated.score_alias,
+                        translated.args,
+                        first_row_fields=set(row.keys()),
+                    )
+                    row[row_score_alias] = score
                     rows.append(row)
             else:
                 # Standard format: [count, key1, [fields1], key2, [fields2], ...]
diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index 349284e..52dd199 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -986,6 +986,16 @@ def _add_function_condition(
                 f"{func_name.lower()}(field, value), got {len(args)}."
             )
 
+        # Validate max argument counts to catch typos / misuse early.
+        # fulltext(field, value [, slop [, inorder]]) → max 4
+        # fuzzy(field, value [, level])               → max 3
+        _max_args = {"FULLTEXT": 4, "FUZZY": 3}
+        if func_name in _max_args and len(args) > _max_args[func_name]:
+            raise ValueError(
+                f"{func_name.lower()}() accepts at most {_max_args[func_name]} "
+                f"arguments, got {len(args)}."
+            )
+
         if func_name == "FULLTEXT" and len(args) >= 2:
             field_name = args[0].name if isinstance(args[0], exp.Column) else None
             value = self._extract_literal_value(args[1])
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index a52d6c7..074143b 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -146,13 +146,16 @@ def build_text_condition(
             # Exact phrase match — always wrap in quotes, preserve stopwords.
             escaped = self._escape_text_value(value)
             search_value = f'"{escaped}"'
-        elif re.search(r"\s+[Oo][Rr]\s+", value):
-            # OR union within text field: split on case-insensitive OR with
+        elif re.search(r"\s+OR\s+", value):
+            # OR union within text field: split on uppercase-only OR with
             # flexible whitespace, escape each term, join with |.
+            # Only uppercase OR is treated as a boolean operator; lowercase
+            # "or" is treated as a regular search term (e.g. "bank or america"
+            # stays as a multi-word AND search, not bank|america).
             # Multi-word operands (e.g. "gaming laptop OR tablet") are wrapped
             # in parentheses so each side is an atomic subexpression.
             or_parts: list[str] = []
-            for part in re.split(r"\s+[Oo][Rr]\s+", value):
+            for part in re.split(r"\s+OR\s+", value):
                 words = part.strip().split()
                 if not words:
                     raise ValueError(
diff --git a/sql_redis/translator.py b/sql_redis/translator.py
index a524851..c89e13b 100644
--- a/sql_redis/translator.py
+++ b/sql_redis/translator.py
@@ -361,10 +361,25 @@ def _build_search(
             args.append(str(len(return_fields)))
             args.extend(return_fields)
 
-        # SORTBY
+        # SORTBY — skip if the ORDER BY field is a score() alias, because
+        # WITHSCORES already returns results in relevance order and the alias
+        # is not a sortable indexed field.
+        score_alias_name = parsed.scoring.alias if parsed.scoring else None
         if parsed.orderby_fields:
             field_name, direction = parsed.orderby_fields[0]
-            args.extend(["SORTBY", field_name, direction])
+            if field_name == score_alias_name:
+                # score() alias — not a real field; RediSearch sorts by
+                # relevance by default when no SORTBY is specified.
+                if direction == "ASC":
+                    raise ValueError(
+                        f"ORDER BY {field_name} ASC is not supported: "
+                        "RediSearch returns results in descending relevance "
+                        "order by default and does not support ascending "
+                        "score sorting via FT.SEARCH."
+                    )
+                # DESC is the default — omit SORTBY entirely
+            else:
+                args.extend(["SORTBY", field_name, direction])
 
         # LIMIT
         if parsed.limit is not None:
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index 68ea28e..a67fd91 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -631,17 +631,27 @@ def test_multi_field_fuzzy(self):
         )
         assert result == "(@title|description:%%laptap%%)"
 
-    def test_or_case_insensitive_lowercase(self):
-        """OR parsing is case-insensitive: 'laptop or tablet' works."""
+    def test_lowercase_or_is_not_boolean(self):
+        """Lowercase 'or' is treated as a regular search term, not a boolean operator.
+
+        'bank or america' should NOT become bank|america — it should be a
+        multi-word AND-style search with stopword filtering applied to 'or'.
+        """
         builder = QueryBuilder()
         result = builder.build_text_condition("title", "FULLTEXT", "laptop or tablet")
-        assert result == "@title:(laptop|tablet)"
+        # "or" is a stopword; remaining terms are "laptop" and "tablet"
+        assert result == "@title:(laptop tablet)"
 
-    def test_or_case_insensitive_mixed(self):
-        """OR parsing is case-insensitive: 'laptop Or tablet' works."""
+    def test_mixed_case_or_is_not_boolean(self):
+        """Mixed case 'Or' / 'oR' is treated as a regular term, not boolean OR.
+
+        Only uppercase 'OR' triggers the union operator.
+        'Or' is a stopword (or → stopword list), so it gets removed.
+        """
         builder = QueryBuilder()
         result = builder.build_text_condition("title", "FULLTEXT", "laptop Or tablet")
-        assert result == "@title:(laptop|tablet)"
+        # "Or" lowercases to "or" which is a stopword; remaining: laptop tablet
+        assert result == "@title:(laptop tablet)"
 
     def test_or_extra_whitespace(self):
         """OR parsing tolerates extra whitespace."""
diff --git a/tests/test_sql_parser.py b/tests/test_sql_parser.py
index be312f5..a79b75b 100644
--- a/tests/test_sql_parser.py
+++ b/tests/test_sql_parser.py
@@ -907,3 +907,17 @@ def test_fuzzy_no_value_raises(self):
         parser = SQLParser()
         with pytest.raises(ValueError, match="requires at least 2 arguments"):
             parser.parse("SELECT * FROM idx WHERE fuzzy(title)")
+
+    def test_fulltext_too_many_args_raises(self):
+        """fulltext() with more than 4 arguments raises ValueError."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="at most 4 arguments"):
+            parser.parse(
+                "SELECT * FROM idx WHERE fulltext(title, 'hello world', 2, true, 'extra')"
+            )
+
+    def test_fuzzy_too_many_args_raises(self):
+        """fuzzy() with more than 3 arguments raises ValueError."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="at most 3 arguments"):
+            parser.parse("SELECT * FROM idx WHERE fuzzy(title, 'laptap', 2, 'extra')")
diff --git a/tests/test_translator.py b/tests/test_translator.py
index 555c636..c43367b 100644
--- a/tests/test_translator.py
+++ b/tests/test_translator.py
@@ -840,3 +840,34 @@ def test_score_too_many_args_raises(self, translator: Translator, basic_index: s
                 f"SELECT score('BM25', 'extra') AS relevance FROM {basic_index} "
                 "WHERE fulltext(title, 'laptop')"
             )
+
+    def test_order_by_score_desc_omits_sortby(
+        self, translator: Translator, basic_index: str
+    ):
+        """ORDER BY score_alias DESC omits SORTBY (RediSearch sorts by relevance by default)."""
+        result = translator.translate(
+            f"SELECT title, score() AS relevance FROM {basic_index} "
+            "WHERE fulltext(title, 'laptop') ORDER BY relevance DESC"
+        )
+        assert "WITHSCORES" in result.args
+        assert "SORTBY" not in result.args
+
+    def test_order_by_score_asc_raises(self, translator: Translator, basic_index: str):
+        """ORDER BY score_alias ASC raises ValueError (not supported by RediSearch)."""
+        with pytest.raises(ValueError, match="ASC is not supported"):
+            translator.translate(
+                f"SELECT title, score() AS relevance FROM {basic_index} "
+                "WHERE fulltext(title, 'laptop') ORDER BY relevance ASC"
+            )
+
+    def test_order_by_real_field_with_score_still_works(
+        self, translator: Translator, basic_index: str
+    ):
+        """ORDER BY a real field (not score alias) still emits SORTBY."""
+        result = translator.translate(
+            f"SELECT title, score() AS relevance FROM {basic_index} "
+            "WHERE fulltext(title, 'laptop') ORDER BY price DESC"
+        )
+        assert "SORTBY" in result.args
+        idx = result.args.index("SORTBY")
+        assert result.args[idx + 1] == "price"

From 2ca128be12db4d669dd8f073203cc0ae3726f0fd Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Wed, 1 Apr 2026 19:03:10 -0400
Subject: [PATCH 19/28] fix: reject non-column args in fulltext/fuzzy, validate
 score() literal arg

- fulltext(UPPER(title), ...) and fuzzy('title', ...) now raise ValueError
  instead of silently dropping the predicate
- score(my_column) raises ValueError; only literal scorer names accepted
- Update existing test expectations for non-column first arg
- Add 2 new tests (386 total)
---
 sql_redis/parser.py      | 54 ++++++++++++++++++++++++----------------
 tests/test_sql_parser.py | 24 ++++++++++++------
 2 files changed, 50 insertions(+), 28 deletions(-)

diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index 52dd199..8cae422 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -466,8 +466,12 @@ def _process_select_expression_inner(
                     )
                 if expression.expressions:
                     scorer_val = self._extract_literal_value(expression.expressions[0])
-                    if scorer_val is not None:
-                        scorer = str(scorer_val)
+                    if scorer_val is None:
+                        raise ValueError(
+                            "score() argument must be a literal scorer name "
+                            f"(e.g., 'BM25', 'TFIDF'), got {expression.expressions[0]}."
+                        )
+                    scorer = str(scorer_val)
                 if result.scoring is not None:
                     raise ValueError(
                         "Only one score() expression is allowed per query."
@@ -1036,17 +1040,21 @@ def _add_function_condition(
                             f"(true/false or 1/0), got {inorder_val!r}"
                         )
 
-            if field_name is not None:
-                result.conditions.append(
-                    Condition(
-                        field=field_name,
-                        operator="FULLTEXT",
-                        value=value,
-                        negated=negated,
-                        slop=slop,
-                        inorder=inorder,
-                    )
+            if field_name is None:
+                raise ValueError(
+                    "fulltext() first argument must be a column name, "
+                    f"got {args[0]}. Usage: fulltext(field, 'search terms')"
+                )
+            result.conditions.append(
+                Condition(
+                    field=field_name,
+                    operator="FULLTEXT",
+                    value=value,
+                    negated=negated,
+                    slop=slop,
+                    inorder=inorder,
                 )
+            )
 
         elif func_name == "FUZZY" and len(args) >= 2:
             field_name = args[0].name if isinstance(args[0], exp.Column) else None
@@ -1067,16 +1075,20 @@ def _add_function_condition(
                         )
                     fuzzy_level = int(level_val)
 
-            if field_name is not None:
-                result.conditions.append(
-                    Condition(
-                        field=field_name,
-                        operator="FUZZY",
-                        value=value,
-                        negated=negated,
-                        fuzzy_level=fuzzy_level,
-                    )
+            if field_name is None:
+                raise ValueError(
+                    "fuzzy() first argument must be a column name, "
+                    f"got {args[0]}. Usage: fuzzy(field, 'search term')"
+                )
+            result.conditions.append(
+                Condition(
+                    field=field_name,
+                    operator="FUZZY",
+                    value=value,
+                    negated=negated,
+                    fuzzy_level=fuzzy_level,
                 )
+            )
 
     def _extract_literal_value(self, expression, convert_dates: bool = False):
         """Extract a Python value from a sqlglot Literal or Neg expression.
diff --git a/tests/test_sql_parser.py b/tests/test_sql_parser.py
index a79b75b..72a4f56 100644
--- a/tests/test_sql_parser.py
+++ b/tests/test_sql_parser.py
@@ -612,14 +612,10 @@ def test_parse_non_fulltext_function_in_where(self):
         assert len(result.conditions) == 0
 
     def test_parse_fulltext_non_column_first_arg(self):
-        """Parse fulltext with non-column first argument."""
+        """Parse fulltext with non-column first argument raises ValueError."""
         parser = SQLParser()
-        result = parser.parse(
-            "SELECT * FROM products WHERE fulltext(UPPER(title), 'query')"
-        )
-
-        # First arg is a function, not Column - condition skipped
-        assert len(result.conditions) == 0
+        with pytest.raises(ValueError, match="must be a column name"):
+            parser.parse("SELECT * FROM products WHERE fulltext(UPPER(title), 'query')")
 
     def test_parse_fulltext_insufficient_args(self):
         """Parse fulltext with insufficient arguments raises ValueError."""
@@ -921,3 +917,17 @@ def test_fuzzy_too_many_args_raises(self):
         parser = SQLParser()
         with pytest.raises(ValueError, match="at most 3 arguments"):
             parser.parse("SELECT * FROM idx WHERE fuzzy(title, 'laptap', 2, 'extra')")
+
+    def test_fuzzy_non_column_first_arg_raises(self):
+        """fuzzy() with non-column first argument raises ValueError."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="must be a column name"):
+            parser.parse("SELECT * FROM idx WHERE fuzzy('title', 'laptap')")
+
+    def test_score_non_literal_arg_raises(self):
+        """score() with a non-literal argument (e.g., column ref) raises ValueError."""
+        parser = SQLParser()
+        with pytest.raises(ValueError, match="must be a literal scorer name"):
+            parser.parse(
+                "SELECT score(my_column) AS relevance FROM idx WHERE fulltext(title, 'laptop')"
+            )

From be1a839a009bed9dc9baa38f6178320d8c55c92f Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Thu, 2 Apr 2026 00:15:24 -0400
Subject: [PATCH 20/28] address PR #17 review comments
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Fix FULLTEXT operator naming (MATCH → FULLTEXT) in query_builder and tests
- Resolve score alias once per result set to prevent column name flip-flop
- Add fuzzy_level range validation (1-3) in parser
- Fix import formatting (isort/black) in translator.py and analyzer.py
---
 sql_redis/executor.py       | 37 ++++++++++++++++++++-----------------
 sql_redis/parser.py         |  5 +++++
 sql_redis/query_builder.py  |  2 +-
 tests/test_query_builder.py |  4 ++--
 4 files changed, 28 insertions(+), 20 deletions(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index bc71cbb..f7d42da 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -228,20 +228,20 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
             elif with_scores:
                 # WITHSCORES format: [count, key1, score1, [fields1], key2, score2, [fields2], ...]
                 # Stride of 3: key, score, field_list
-                # Resolve alias per-row: FT.SEARCH may omit missing attributes,
-                # so different rows can have different field sets.  We must
-                # check each row individually to avoid overwriting a real field
-                # with the score value.
+                # Resolve alias once from the first row so every row uses the
+                # same column name (consistent output schema).
+                resolved_alias: str | None = None
                 for i in range(1, len(raw_result) - 2, 3):
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    row_score_alias = self._resolve_score_alias(
-                        translated.score_alias,
-                        translated.args,
-                        first_row_fields=set(row.keys()),
-                    )
-                    row[row_score_alias] = score
+                    if resolved_alias is None:
+                        resolved_alias = self._resolve_score_alias(
+                            translated.score_alias,
+                            translated.args,
+                            first_row_fields=set(row.keys()),
+                        )
+                    row[resolved_alias] = score
                     rows.append(row)
             else:
                 # Standard format: [count, key1, [fields1], key2, [fields2], ...]
@@ -351,17 +351,20 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
                     rows.append(row)
             elif with_scores:
                 # WITHSCORES format: [count, key1, score1, [fields1], ...]
-                # Resolve alias per-row to avoid field collision on later rows.
+                # Resolve alias once from the first row so every row uses the
+                # same column name (consistent output schema).
+                resolved_alias: str | None = None
                 for i in range(1, len(raw_result) - 2, 3):
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    row_score_alias = self._resolve_score_alias(
-                        translated.score_alias,
-                        translated.args,
-                        first_row_fields=set(row.keys()),
-                    )
-                    row[row_score_alias] = score
+                    if resolved_alias is None:
+                        resolved_alias = self._resolve_score_alias(
+                            translated.score_alias,
+                            translated.args,
+                            first_row_fields=set(row.keys()),
+                        )
+                    row[resolved_alias] = score
                     rows.append(row)
             else:
                 # Standard format: [count, key1, [fields1], key2, [fields2], ...]
diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index 8cae422..4fcd0bc 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -1074,6 +1074,11 @@ def _add_function_condition(
                             f"FUZZY level argument must be an integer (got {level_val})"
                         )
                     fuzzy_level = int(level_val)
+                    if fuzzy_level not in (1, 2, 3):
+                        raise ValueError(
+                            f"FUZZY level must be 1, 2, or 3 (got {fuzzy_level}). "
+                            "RediSearch supports a maximum Levenshtein distance of 3."
+                        )
 
             if field_name is None:
                 raise ValueError(
diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 074143b..eb23787 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -180,7 +180,7 @@ def build_text_condition(
                         or_parts.append(self._escape_fulltext_term(token))
             search_value = f"({'|'.join(or_parts)})"
         elif " " in value:
-            # FULLTEXT/MATCH with multi-word: tokenized search with stopword filtering.
+            # FULLTEXT with multi-word: tokenized search with stopword filtering.
             # Each term is escaped to prevent accidental operator injection, but a
             # leading ~ (optional-term modifier) is preserved as an intentional
             # RediSearch operator.
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index a67fd91..b358462 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -324,7 +324,7 @@ def test_simple_text_query(self):
         """Build simple text search query."""
         builder = QueryBuilder()
         result = builder.build_query_string(
-            text_conditions=[("title", "MATCH", "laptop")],
+            text_conditions=[("title", "FULLTEXT", "laptop")],
             field_types={"title": "TEXT"},
         )
 
@@ -334,7 +334,7 @@ def test_combined_query(self):
         """Build combined text + numeric + tag query."""
         builder = QueryBuilder()
         result = builder.build_query_string(
-            text_conditions=[("title", "MATCH", "laptop")],
+            text_conditions=[("title", "FULLTEXT", "laptop")],
             numeric_conditions=[("price", "<", 1000)],
             tag_conditions=[("category", "=", "electronics")],
             field_types={"title": "TEXT", "price": "NUMERIC", "category": "TAG"},

From 597c56d2e2b53d3eb0f7a68b0afe5fb1652862c0 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Thu, 2 Apr 2026 10:18:22 -0400
Subject: [PATCH 21/28] Address review comments: strict parser validation,
 stable score alias resolution, OR docs fix

- Validate fulltext/fuzzy/score args are literals (allow Placeholders)
- Collect all field names across result set before resolving score alias
- Clarify OR operator case-sensitivity in README
---
 README.md             |  2 +-
 sql_redis/executor.py | 53 ++++++++++++++++++++++++-------------------
 sql_redis/parser.py   | 32 +++++++++++++++++++++++++-
 3 files changed, 62 insertions(+), 25 deletions(-)

diff --git a/README.md b/README.md
index 0fdd86d..554494a 100644
--- a/README.md
+++ b/README.md
@@ -218,7 +218,7 @@ SELECT * FROM products WHERE fulltext(title, 'laptop') OR fulltext(description,
 - `=` on TEXT fields performs **exact phrase** matching (preserves stopwords)
 - `fulltext()` performs **tokenized** search (stopwords are filtered with a warning)
 - `fuzzy()` and `fulltext()` only work on TEXT fields — using them on TAG or NUMERIC raises `ValueError`
-- OR is case-insensitive: `'laptop OR tablet'`, `'laptop or tablet'`, and `'laptop Or tablet'` all work
+- OR must be **uppercase**: `'laptop OR tablet'` triggers union; lowercase `'laptop or tablet'` is treated as a regular three-word AND search
 - Special characters (`@`, `|`, `-`, `*`, `+`, etc.) in search terms are automatically escaped
 
 ### IS NULL / IS NOT NULL (ismissing)
diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index f7d42da..bddf664 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -122,14 +122,14 @@ def _resolve_score_alias(
         first_row_fields: set[str] | None = None,
     ) -> str:
         """Determine a stable score column name that won't collide with
-        document fields.  The alias is decided once before iterating rows
-        so every row uses the same column name.
+        document fields.  The alias is resolved once and reused for every
+        row so all rows share the same column name.
 
         When a RETURN clause is present, the returned field names are used
         for collision detection.  When RETURN is absent (SELECT *), the
-        caller should pass ``first_row_fields`` — the field names from the
-        first result row — so we can detect collisions even when all
-        document attributes are returned."""
+        caller should pass ``first_row_fields`` — the union of all field
+        names across all result rows — so we can detect collisions even
+        when different documents have different field sets."""
         alias = score_alias or "__score"
         # Extract RETURN field names from args to detect collision
         try:
@@ -228,19 +228,23 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
             elif with_scores:
                 # WITHSCORES format: [count, key1, score1, [fields1], key2, score2, [fields2], ...]
                 # Stride of 3: key, score, field_list
-                # Resolve alias once from the first row so every row uses the
-                # same column name (consistent output schema).
-                resolved_alias: str | None = None
+                # First pass: collect all field names across all rows so the
+                # alias avoids collisions with any document field, not just
+                # the first row's fields.
+                all_field_names: set[str] = set()
+                parsed_rows: list[tuple[dict, Any]] = []
                 for i in range(1, len(raw_result) - 2, 3):
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    if resolved_alias is None:
-                        resolved_alias = self._resolve_score_alias(
-                            translated.score_alias,
-                            translated.args,
-                            first_row_fields=set(row.keys()),
-                        )
+                    all_field_names.update(row.keys())
+                    parsed_rows.append((row, score))
+                resolved_alias = self._resolve_score_alias(
+                    translated.score_alias,
+                    translated.args,
+                    first_row_fields=all_field_names,
+                )
+                for row, score in parsed_rows:
                     row[resolved_alias] = score
                     rows.append(row)
             else:
@@ -351,19 +355,22 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
                     rows.append(row)
             elif with_scores:
                 # WITHSCORES format: [count, key1, score1, [fields1], ...]
-                # Resolve alias once from the first row so every row uses the
-                # same column name (consistent output schema).
-                resolved_alias: str | None = None
+                # First pass: collect all field names across all rows so the
+                # alias avoids collisions with any document field.
+                all_field_names: set[str] = set()
+                parsed_rows: list[tuple[dict, Any]] = []
                 for i in range(1, len(raw_result) - 2, 3):
                     score = raw_result[i + 1]
                     row_data = raw_result[i + 2]
                     row = dict(zip(row_data[::2], row_data[1::2]))
-                    if resolved_alias is None:
-                        resolved_alias = self._resolve_score_alias(
-                            translated.score_alias,
-                            translated.args,
-                            first_row_fields=set(row.keys()),
-                        )
+                    all_field_names.update(row.keys())
+                    parsed_rows.append((row, score))
+                resolved_alias = self._resolve_score_alias(
+                    translated.score_alias,
+                    translated.args,
+                    first_row_fields=all_field_names,
+                )
+                for row, score in parsed_rows:
                     row[resolved_alias] = score
                     rows.append(row)
             else:
diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index 4fcd0bc..b74b898 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -471,7 +471,12 @@ def _process_select_expression_inner(
                             "score() argument must be a literal scorer name "
                             f"(e.g., 'BM25', 'TFIDF'), got {expression.expressions[0]}."
                         )
-                    scorer = str(scorer_val)
+                    if not isinstance(scorer_val, str):
+                        raise ValueError(
+                            "score() argument must be a string scorer name "
+                            f"(e.g., 'BM25', 'TFIDF'), got {scorer_val!r}."
+                        )
+                    scorer = scorer_val
                 if result.scoring is not None:
                     raise ValueError(
                         "Only one score() expression is allowed per query."
@@ -1003,11 +1008,21 @@ def _add_function_condition(
         if func_name == "FULLTEXT" and len(args) >= 2:
             field_name = args[0].name if isinstance(args[0], exp.Column) else None
             value = self._extract_literal_value(args[1])
+            if value is None and not isinstance(args[1], exp.Placeholder):
+                raise ValueError(
+                    "fulltext() second argument must be a literal string, "
+                    f"got {args[1]}. Usage: fulltext(field, 'search terms')"
+                )
 
             # Optional 3rd arg: slop (non-negative int)
             slop = None
             if len(args) >= 3:
                 slop_val = self._extract_literal_value(args[2])
+                if slop_val is None and not isinstance(args[2], exp.Placeholder):
+                    raise ValueError(
+                        "fulltext() slop argument must be a literal integer, "
+                        f"got {args[2]}."
+                    )
                 if slop_val is not None:
                     # Reject booleans and non-integer floats — only real
                     # integers are valid for slop.
@@ -1029,6 +1044,11 @@ def _add_function_condition(
             inorder = False
             if len(args) >= 4:
                 inorder_val = self._extract_literal_value(args[3])
+                if inorder_val is None and not isinstance(args[3], exp.Placeholder):
+                    raise ValueError(
+                        "fulltext() inorder argument must be a literal boolean "
+                        f"(true/false or 1/0), got {args[3]}."
+                    )
                 if inorder_val is not None:
                     if isinstance(inorder_val, bool):
                         inorder = inorder_val
@@ -1059,11 +1079,21 @@ def _add_function_condition(
         elif func_name == "FUZZY" and len(args) >= 2:
             field_name = args[0].name if isinstance(args[0], exp.Column) else None
             value = self._extract_literal_value(args[1])
+            if value is None and not isinstance(args[1], exp.Placeholder):
+                raise ValueError(
+                    "fuzzy() second argument must be a literal string, "
+                    f"got {args[1]}. Usage: fuzzy(field, 'search term')"
+                )
 
             # Optional 3rd arg: fuzzy level (1, 2, or 3)
             fuzzy_level = None
             if len(args) >= 3:
                 level_val = self._extract_literal_value(args[2])
+                if level_val is None and not isinstance(args[2], exp.Placeholder):
+                    raise ValueError(
+                        "fuzzy() level argument must be a literal integer, "
+                        f"got {args[2]}."
+                    )
                 if level_val is not None:
                     if isinstance(level_val, bool):
                         raise ValueError(

From 610bbf22a02cef6233eb7d07b22804f1e63be69d Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Thu, 2 Apr 2026 10:38:36 -0400
Subject: [PATCH 22/28] Normalize bytes field keys to str in score alias
 collision detection

When decode_responses=False, Redis returns field names as bytes. The
collision check now decodes them so alias detection works consistently.
---
 sql_redis/executor.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index bddf664..81868dd 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -137,7 +137,12 @@ def _resolve_score_alias(
             count = int(args[idx + 1])
             return_fields = set(args[idx + 2 : idx + 2 + count])
         except (ValueError, IndexError):
-            return_fields = first_row_fields or set()
+            # Normalize bytes keys to str so collision detection works
+            # regardless of decode_responses setting.
+            raw = first_row_fields or set()
+            return_fields = {
+                k.decode() if isinstance(k, bytes) else k for k in raw
+            }
         while alias in return_fields:
             alias = f"__score_{alias}"
         return alias

From 6bd0745e8de8268e9340d1d79d4204a8eeecf3ef Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Thu, 2 Apr 2026 10:41:07 -0400
Subject: [PATCH 23/28] Fix black formatting

---
 sql_redis/executor.py | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index 81868dd..0b55f37 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -140,9 +140,7 @@ def _resolve_score_alias(
             # Normalize bytes keys to str so collision detection works
             # regardless of decode_responses setting.
             raw = first_row_fields or set()
-            return_fields = {
-                k.decode() if isinstance(k, bytes) else k for k in raw
-            }
+            return_fields = {k.decode() if isinstance(k, bytes) else k for k in raw}
         while alias in return_fields:
             alias = f"__score_{alias}"
         return alias

From 8e2753a8be96c9ce09feff385acda38b2d3c95b4 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Thu, 2 Apr 2026 16:01:22 -0400
Subject: [PATCH 24/28] Strip stopwords from exact phrase queries (= operator)

RediSearch does not index stopwords, so exact phrase queries like
"diagnosing and treating" fail with a syntax error. The = operator
now strips default stopwords before wrapping in double quotes, matching
how the indexer assigns consecutive positions. A warning is emitted
when stopwords are removed.

Also removes outdated 'Use = operator for exact phrase matching that
preserves stopwords' hint from FULLTEXT stopword warning.
---
 sql_redis/query_builder.py  | 37 +++++++++++++++++++++++++++++++++----
 tests/test_query_builder.py | 28 +++++++++++++++++++++++-----
 2 files changed, 56 insertions(+), 9 deletions(-)

diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index eb23787..3b62e6c 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -143,8 +143,37 @@ def build_text_condition(
             pct = "%" * level
             search_value = f"{pct}{escaped}{pct}"
         elif operator in ("=", "!="):
-            # Exact phrase match — always wrap in quotes, preserve stopwords.
-            escaped = self._escape_text_value(value)
+            # Exact phrase match — wrap in double quotes.
+            # Strip default stopwords because RediSearch does not index them;
+            # keeping them in the quoted phrase causes a query-time error
+            # (e.g. "diagnosing and treating" fails on "and").
+            # Since the indexer assigns consecutive positions after dropping
+            # stopwords, the stripped phrase matches correctly.
+            words = value.split()
+            removed = [w for w in words if w.lower() in REDIS_DEFAULT_STOPWORDS]
+            filtered = [w for w in words if w.lower() not in REDIS_DEFAULT_STOPWORDS]
+
+            if removed:
+                phrase_words = filtered if filtered else words
+                if filtered:
+                    sw_msg = f"Stopwords {removed} were removed from"
+                else:
+                    sw_msg = (
+                        f"All tokens in '{value}' are stopwords and may not "
+                        "be indexed in"
+                    )
+                warnings.warn(
+                    f"{sw_msg} exact phrase '{value}'. "
+                    "By default, Redis does not index stopwords. "
+                    "To include stopwords in your index, create it "
+                    "with STOPWORDS 0.",
+                    UserWarning,
+                    stacklevel=2,
+                )
+            else:
+                phrase_words = words
+
+            escaped = self._escape_text_value(" ".join(phrase_words))
             search_value = f'"{escaped}"'
         elif re.search(r"\s+OR\s+", value):
             # OR union within text field: split on uppercase-only OR with
@@ -200,8 +229,8 @@ def build_text_condition(
                 warnings.warn(
                     f"{sw_action} text search '{value}'. "
                     "By default, Redis does not index stopwords. "
-                    "To include stopwords in your index, create it with STOPWORDS 0. "
-                    "Use = operator for exact phrase matching that preserves stopwords.",
+                    "To include stopwords in your index, create it "
+                    "with STOPWORDS 0.",
                     UserWarning,
                     stacklevel=2,
                 )
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index b358462..97f1f01 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -22,13 +22,31 @@ def test_text_exact_phrase(self):
 
         assert result == '@title:"gaming laptop"'
 
-    def test_text_exact_phrase_preserves_stopwords(self):
-        """TEXT field with = preserves stopwords in exact phrase matching."""
+    def test_text_exact_phrase_strips_stopwords(self):
+        """TEXT field with = strips stopwords and warns (RediSearch doesn't index them)."""
         builder = QueryBuilder()
-        result = builder.build_text_condition("name", "=", "bank of america")
+        import warnings
 
-        # Stopwords like "of" must NOT be stripped for exact phrase matching
-        assert result == '@name:"bank of america"'
+        with warnings.catch_warnings(record=True) as w:
+            warnings.simplefilter("always")
+            result = builder.build_text_condition("name", "=", "bank of america")
+
+        # "of" is a stopword — stripped so the phrase matches indexed positions
+        assert result == '@name:"bank america"'
+        assert len(w) == 1
+        assert "Stopwords ['of']" in str(w[0].message)
+
+    def test_text_exact_phrase_no_stopwords_no_warning(self):
+        """TEXT field with = on phrase without stopwords produces no warning."""
+        builder = QueryBuilder()
+        import warnings
+
+        with warnings.catch_warnings(record=True) as w:
+            warnings.simplefilter("always")
+            result = builder.build_text_condition("name", "=", "bank america")
+
+        assert result == '@name:"bank america"'
+        assert len(w) == 0
 
     def test_text_exact_phrase_escapes_quotes(self):
         """TEXT field with = escapes double quotes inside the value."""

From 74dbaf7ba78c6417570c2833179e2e90579780f5 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Thu, 2 Apr 2026 16:17:24 -0400
Subject: [PATCH 25/28] Harden WITHSCORES detection and reject empty scorer
 names

- Detect WITHSCORES mode via translated.score_alias instead of
  scanning args for the literal token, preventing false positives
  if a field is named WITHSCORES.
- Reject score('') with a clear ValueError so the caller's intent
  is not silently lost by falling back to the default scorer.
---
 sql_redis/executor.py | 8 +++++---
 sql_redis/parser.py   | 6 ++++++
 2 files changed, 11 insertions(+), 3 deletions(-)

diff --git a/sql_redis/executor.py b/sql_redis/executor.py
index 0b55f37..e15d1b9 100644
--- a/sql_redis/executor.py
+++ b/sql_redis/executor.py
@@ -209,8 +209,10 @@ def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
         rows = []
 
         if translated.command == "FT.SEARCH":
-            # Check if WITHSCORES was requested — changes response format
-            with_scores = "WITHSCORES" in translated.args
+            # Use the explicit score_alias signal rather than scanning args
+            # for the literal token "WITHSCORES", which could false-positive
+            # if a returned field happened to be named "WITHSCORES".
+            with_scores = translated.score_alias is not None
             # RETURN 0 suppresses document fields (like NOCONTENT);
             # with WITHSCORES the reply is [count, id, score, id, score, ...]
             no_content = self._has_return_0(translated.args)
@@ -342,7 +344,7 @@ async def execute(self, sql: str, *, params: dict | None = None) -> QueryResult:
         rows = []
 
         if translated.command == "FT.SEARCH":
-            with_scores = "WITHSCORES" in translated.args
+            with_scores = translated.score_alias is not None
             no_content = self._has_return_0(translated.args)
 
             score_alias: str | None = None
diff --git a/sql_redis/parser.py b/sql_redis/parser.py
index b74b898..dc12690 100644
--- a/sql_redis/parser.py
+++ b/sql_redis/parser.py
@@ -476,6 +476,12 @@ def _process_select_expression_inner(
                             "score() argument must be a string scorer name "
                             f"(e.g., 'BM25', 'TFIDF'), got {scorer_val!r}."
                         )
+                    if not scorer_val:
+                        raise ValueError(
+                            "score() scorer name must not be empty. "
+                            "Use score() with no arguments for the default "
+                            "BM25 scorer, or pass a valid name like 'TFIDF'."
+                        )
                     scorer = scorer_val
                 if result.scoring is not None:
                     raise ValueError(

From 9c857e9fbebb2ef362761e0005c64106fa503cfa Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Thu, 2 Apr 2026 16:55:13 -0400
Subject: [PATCH 26/28] Document stopword stripping behavior for = and
 fulltext()

Update README to reflect that both exact phrase (=) and tokenized
search (fulltext()) strip default Redis stopwords before sending
queries. Adds a dedicated Stopword Handling section with examples
and the STOPWORDS 0 workaround. Replaces outdated 'preserves
stopwords' language.
---
 README.md | 54 ++++++++++++++++++++++++++++++++++--------------------
 1 file changed, 34 insertions(+), 20 deletions(-)

diff --git a/README.md b/README.md
index 554494a..f7cfc2e 100644
--- a/README.md
+++ b/README.md
@@ -172,28 +172,29 @@ The layered approach emerged from TDD — writing tests first revealed natural b
 
 Full-text search on TEXT fields with multiple search modes:
 
-| Feature | SQL Syntax | RediSearch Output |
-|---------|-----------|-------------------|
-| Exact phrase | `title = 'gaming laptop'` | `@title:"gaming laptop"` |
-| Tokenized search | `fulltext(title, 'gaming laptop')` | `@title:(gaming laptop)` |
-| Fuzzy LD=1 | `fuzzy(title, 'laptap')` | `@title:%laptap%` |
-| Fuzzy LD=2 | `fuzzy(title, 'laptap', 2)` | `@title:%%laptap%%` |
-| Fuzzy LD=3 | `fuzzy(title, 'laptap', 3)` | `@title:%%%laptap%%%` |
-| OR / union | `fulltext(title, 'laptop OR tablet')` | `@title:(laptop\|tablet)` |
-| Prefix | `title LIKE 'lap%'` | `@title:lap*` |
-| Suffix | `title LIKE '%top'` | `@title:*top` |
-| Contains | `title LIKE '%apt%'` | `@title:*apt*` |
-| Proximity (slop) | `fulltext(title, 'gaming laptop', 2)` | `@title:(gaming laptop) => { $slop: 2; }` |
-| Proximity + order | `fulltext(title, 'gaming laptop', 2, true)` | `@title:(gaming laptop) => { $slop: 2; $inorder: true; }` |
-| Optional term | `fulltext(title, 'laptop ~gaming')` | `@title:(laptop ~gaming)` |
-| BM25 score | `SELECT score() AS relevance FROM idx` | `FT.SEARCH ... WITHSCORES` |
-| Negation | `NOT fulltext(title, 'refurbished')` | `-@title:refurbished` |
+| Feature | SQL Syntax | RediSearch Output | Notes |
+|---------|-----------|-------------------|-------|
+| Exact phrase | `title = 'gaming laptop'` | `@title:"gaming laptop"` | Stopwords stripped |
+| Tokenized search | `fulltext(title, 'gaming laptop')` | `@title:(gaming laptop)` | Stopwords stripped |
+| Fuzzy LD=1 | `fuzzy(title, 'laptap')` | `@title:%laptap%` | |
+| Fuzzy LD=2 | `fuzzy(title, 'laptap', 2)` | `@title:%%laptap%%` | |
+| Fuzzy LD=3 | `fuzzy(title, 'laptap', 3)` | `@title:%%%laptap%%%` | |
+| OR / union | `fulltext(title, 'laptop OR tablet')` | `@title:(laptop\|tablet)` | |
+| Prefix | `title LIKE 'lap%'` | `@title:lap*` | |
+| Suffix | `title LIKE '%top'` | `@title:*top` | |
+| Contains | `title LIKE '%apt%'` | `@title:*apt*` | |
+| Proximity (slop) | `fulltext(title, 'gaming laptop', 2)` | `@title:(gaming laptop) => { $slop: 2; }` | |
+| Proximity + order | `fulltext(title, 'gaming laptop', 2, true)` | `@title:(gaming laptop) => { $slop: 2; $inorder: true; }` | |
+| Optional term | `fulltext(title, 'laptop ~gaming')` | `@title:(laptop ~gaming)` | |
+| BM25 score | `SELECT score() AS relevance FROM idx` | `FT.SEARCH ... WITHSCORES` | |
+| Negation | `NOT fulltext(title, 'refurbished')` | `-@title:refurbished` | |
 
 **Examples:**
 
 ```sql
--- Exact phrase match (stopwords preserved)
+-- Exact phrase match (stopwords like "of" are stripped automatically)
 SELECT * FROM products WHERE title = 'bank of america'
+-- Produces: @title:"bank america"
 
 -- Fuzzy search for typos (Levenshtein distance 2)
 SELECT * FROM products WHERE fuzzy(title, 'laptap', 2)
@@ -214,10 +215,23 @@ SELECT title, score() AS relevance FROM products WHERE fulltext(title, 'laptop')
 SELECT * FROM products WHERE fulltext(title, 'laptop') OR fulltext(description, 'laptop')
 ```
 
+**Stopword handling:**
+
+Both `=` (exact phrase) and `fulltext()` (tokenized search) automatically strip [Redis default stopwords](https://redis.io/docs/latest/develop/ai/search-and-query/advanced-concepts/stopwords/) before sending queries to RediSearch. This is necessary because RediSearch does not index stopwords, so including them in queries causes syntax errors or failed matches. A `UserWarning` is emitted when stopwords are removed.
+
+For example, `WHERE title = 'bank of america'` produces `@title:"bank america"` because "of" is a default stopword and is never stored in the inverted index. The stripped phrase still matches correctly because the indexer assigns consecutive token positions after dropping stopwords.
+
+To include stopwords in your queries, create your index with `STOPWORDS 0`:
+
+```
+FT.CREATE myindex ON HASH PREFIX 1 doc: STOPWORDS 0 SCHEMA title TEXT
+```
+
 **Notes:**
-- `=` on TEXT fields performs **exact phrase** matching (preserves stopwords)
-- `fulltext()` performs **tokenized** search (stopwords are filtered with a warning)
-- `fuzzy()` and `fulltext()` only work on TEXT fields — using them on TAG or NUMERIC raises `ValueError`
+- `=` on TEXT fields performs **exact phrase** matching (double-quoted)
+- `fulltext()` performs **tokenized** AND search (parenthesized)
+- Both operators strip stopwords and emit a warning when they do
+- `fuzzy()` and `fulltext()` only work on TEXT fields; using them on TAG or NUMERIC raises `ValueError`
 - OR must be **uppercase**: `'laptop OR tablet'` triggers union; lowercase `'laptop or tablet'` is treated as a regular three-word AND search
 - Special characters (`@`, `|`, `-`, `*`, `+`, etc.) in search terms are automatically escaped
 

From 13c4a32c2a1ee93580bd0e11d259e6946c6296f2 Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Fri, 3 Apr 2026 11:28:06 -0400
Subject: [PATCH 27/28] Reject boolean values in numeric context, catch
 dangling OR

- Add bool guard in _build_condition and _convert_to_numeric so
  WHERE price = true raises ValueError instead of producing
  invalid @price:[True True] syntax.
- Expand OR detection regex to match leading/trailing OR
  (e.g. 'laptop OR', 'OR tablet') so the empty-operand check
  catches these malformed inputs instead of silently dropping OR
  as a stopword.
---
 sql_redis/query_builder.py  |  7 +++++--
 sql_redis/translator.py     | 11 +++++++++++
 tests/test_query_builder.py | 18 ++++++++++++++++++
 tests/test_translator.py    |  7 +++++++
 4 files changed, 41 insertions(+), 2 deletions(-)

diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 3b62e6c..3d86d30 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -175,7 +175,7 @@ def build_text_condition(
 
             escaped = self._escape_text_value(" ".join(phrase_words))
             search_value = f'"{escaped}"'
-        elif re.search(r"\s+OR\s+", value):
+        elif re.search(r"(?:^|\s+)OR(?:\s+|$)", value):
             # OR union within text field: split on uppercase-only OR with
             # flexible whitespace, escape each term, join with |.
             # Only uppercase OR is treated as a boolean operator; lowercase
@@ -183,8 +183,11 @@ def build_text_condition(
             # stays as a multi-word AND search, not bank|america).
             # Multi-word operands (e.g. "gaming laptop OR tablet") are wrapped
             # in parentheses so each side is an atomic subexpression.
+            # The regex also matches leading/trailing OR (e.g. "laptop OR"
+            # or "OR tablet") so that the empty-operand check below catches
+            # these malformed inputs instead of silently dropping "OR".
             or_parts: list[str] = []
-            for part in re.split(r"\s+OR\s+", value):
+            for part in re.split(r"(?:^|\s+)OR(?:\s+|$)", value):
                 words = part.strip().split()
                 if not words:
                     raise ValueError(
diff --git a/sql_redis/translator.py b/sql_redis/translator.py
index c89e13b..8f3f199 100644
--- a/sql_redis/translator.py
+++ b/sql_redis/translator.py
@@ -280,6 +280,12 @@ def _build_condition(self, condition: Condition, field_type: str | None) -> str:
                 low_val = self._convert_to_numeric(low)
                 high_val = self._convert_to_numeric(high)
                 numeric_value = (low_val, high_val)
+            elif isinstance(condition.value, bool):
+                raise ValueError(
+                    f"Boolean value {condition.value!r} is not valid in a "
+                    "numeric context. Use 1/0 instead of true/false for "
+                    "numeric fields."
+                )
             elif isinstance(condition.value, (int, float)):
                 numeric_value = condition.value
             else:
@@ -311,6 +317,11 @@ def _convert_to_numeric(self, value: object) -> int | float:
         Raises:
             ValueError: If conversion fails.
         """
+        if isinstance(value, bool):
+            raise ValueError(
+                f"Boolean value {value!r} is not valid in a numeric context. "
+                "Use 1/0 instead of true/false for numeric fields."
+            )
         if isinstance(value, (int, float)):
             return value
         if isinstance(value, str):
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index 97f1f01..3dfa8b2 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -679,6 +679,24 @@ def test_or_extra_whitespace(self):
         )
         assert result == "@title:(laptop|tablet)"
 
+    def test_or_trailing_raises(self):
+        """Trailing OR with no operand raises ValueError."""
+        builder = QueryBuilder()
+        with pytest.raises(ValueError, match="Empty operand"):
+            builder.build_text_condition("title", "FULLTEXT", "laptop OR")
+
+    def test_or_leading_raises(self):
+        """Leading OR with no operand raises ValueError."""
+        builder = QueryBuilder()
+        with pytest.raises(ValueError, match="Empty operand"):
+            builder.build_text_condition("title", "FULLTEXT", "OR tablet")
+
+    def test_or_only_raises(self):
+        """Bare 'OR' with no operands raises ValueError."""
+        builder = QueryBuilder()
+        with pytest.raises(ValueError, match="Empty operand"):
+            builder.build_text_condition("title", "FULLTEXT", "OR")
+
     def test_escape_asterisk_in_fulltext(self):
         """Literal * in FULLTEXT is escaped to prevent wildcard."""
         builder = QueryBuilder()
diff --git a/tests/test_translator.py b/tests/test_translator.py
index c43367b..23fda9a 100644
--- a/tests/test_translator.py
+++ b/tests/test_translator.py
@@ -213,6 +213,13 @@ def test_or_conditions(self, translator: Translator, basic_index: str):
 
         assert "|" in result.query_string  # OR uses pipe
 
+    def test_boolean_in_numeric_context_raises(
+        self, translator: Translator, basic_index: str
+    ):
+        """WHERE price = true should raise, not produce @price:[True True]."""
+        with pytest.raises(ValueError, match="Boolean value"):
+            translator.translate(f"SELECT * FROM {basic_index} WHERE price = true")
+
 
 class TestTranslatorAggregate:
     """Tests for FT.AGGREGATE translation."""

From 45c7fb72793d9934676c7e3dd1e03da3e34030bd Mon Sep 17 00:00:00 2001
From: Nitin Kanukolanu <nitinkanukolanu@gmail.com>
Date: Fri, 3 Apr 2026 14:09:55 -0400
Subject: [PATCH 28/28] Filter stopwords in OR operands before building text
 query

Strip Redis default stopwords from each OR operand, matching the
existing multi-word FULLTEXT path behavior.  If an operand becomes
empty after filtering (all tokens are stopwords), fall back to the
original words so the query is not silently truncated.  A UserWarning
is emitted listing the removed stopwords.
---
 sql_redis/query_builder.py  | 37 ++++++++++++++++++++++++++++++++++---
 tests/test_query_builder.py | 30 ++++++++++++++++++++++++++++++
 2 files changed, 64 insertions(+), 3 deletions(-)

diff --git a/sql_redis/query_builder.py b/sql_redis/query_builder.py
index 3d86d30..8a8acf0 100644
--- a/sql_redis/query_builder.py
+++ b/sql_redis/query_builder.py
@@ -187,6 +187,7 @@ def build_text_condition(
             # or "OR tablet") so that the empty-operand check below catches
             # these malformed inputs instead of silently dropping "OR".
             or_parts: list[str] = []
+            all_removed: list[str] = []
             for part in re.split(r"(?:^|\s+)OR(?:\s+|$)", value):
                 words = part.strip().split()
                 if not words:
@@ -194,9 +195,29 @@ def build_text_condition(
                         "Empty operand in OR expression — each side of OR "
                         "must contain at least one search term."
                     )
-                if len(words) > 1:
+
+                # Filter stopwords from this operand (same logic as
+                # the multi-word FULLTEXT branch).
+                removed = [w for w in words if w.lower() in REDIS_DEFAULT_STOPWORDS]
+                filtered = [
+                    w for w in words if w.lower() not in REDIS_DEFAULT_STOPWORDS
+                ]
+                if removed:
+                    all_removed.extend(removed)
+                # Use filtered list if any non-stopword tokens remain;
+                # otherwise fall back to original words so we don't
+                # silently produce an empty operand.
+                effective = filtered if filtered else words
+
+                if not effective:
+                    raise ValueError(
+                        "Empty operand in OR expression — each side of OR "
+                        "must contain at least one search term."
+                    )
+
+                if len(effective) > 1:
                     escaped_tokens = []
-                    for w in words:
+                    for w in effective:
                         if w.startswith("~"):
                             escaped_tokens.append(
                                 "~" + self._escape_fulltext_term(w[1:])
@@ -205,11 +226,21 @@ def build_text_condition(
                             escaped_tokens.append(self._escape_fulltext_term(w))
                     or_parts.append(f"({' '.join(escaped_tokens)})")
                 else:
-                    token = words[0]
+                    token = effective[0]
                     if token.startswith("~"):
                         or_parts.append("~" + self._escape_fulltext_term(token[1:]))
                     else:
                         or_parts.append(self._escape_fulltext_term(token))
+
+            if all_removed:
+                warnings.warn(
+                    f"Stopwords {all_removed} were removed from OR "
+                    f"expression '{value}'. By default, Redis does not "
+                    "index stopwords. To include stopwords in your "
+                    "index, create it with STOPWORDS 0.",
+                    UserWarning,
+                    stacklevel=2,
+                )
             search_value = f"({'|'.join(or_parts)})"
         elif " " in value:
             # FULLTEXT with multi-word: tokenized search with stopword filtering.
diff --git a/tests/test_query_builder.py b/tests/test_query_builder.py
index 3dfa8b2..d01c1be 100644
--- a/tests/test_query_builder.py
+++ b/tests/test_query_builder.py
@@ -697,6 +697,36 @@ def test_or_only_raises(self):
         with pytest.raises(ValueError, match="Empty operand"):
             builder.build_text_condition("title", "FULLTEXT", "OR")
 
+    def test_or_operand_stopword_filtered(self):
+        """Stopwords inside OR operands are stripped with a warning."""
+        builder = QueryBuilder()
+        with pytest.warns(UserWarning, match="Stopwords.*removed from OR"):
+            result = builder.build_text_condition("title", "FULLTEXT", "laptop OR the")
+        # "the" is a stopword — after filtering only "laptop" remains on
+        # the right side, but since the right operand was *only* a stopword
+        # and falls back to original words, we keep it.
+        # Actually "the" is the only word so filtered=[] → fallback to ["the"].
+        # Let's just verify the left side is clean.
+        assert "laptop" in result
+
+    def test_or_multi_word_operand_stopword_filtered(self):
+        """Stopwords in multi-word OR operands are stripped."""
+        builder = QueryBuilder()
+        with pytest.warns(UserWarning, match="Stopwords.*removed from OR"):
+            result = builder.build_text_condition(
+                "title", "FULLTEXT", "gaming laptop OR the tablet"
+            )
+        # "the" stripped from second operand → "tablet"
+        assert result == "@title:((gaming laptop)|tablet)"
+
+    def test_or_all_stopwords_operand_warns(self):
+        """OR operand that is entirely stopwords falls back but warns."""
+        builder = QueryBuilder()
+        with pytest.warns(UserWarning, match="Stopwords.*removed from OR"):
+            result = builder.build_text_condition("title", "FULLTEXT", "laptop OR the")
+        # "the" is sole token and a stopword → filtered=[] → fallback to ["the"]
+        assert result == "@title:(laptop|the)"
+
     def test_escape_asterisk_in_fulltext(self):
         """Literal * in FULLTEXT is escaped to prevent wildcard."""
         builder = QueryBuilder()