perf: inline row decoding and eliminate closures in recv_results_rows

mykaul · mykaul · commit a9e0328c148b · 2026-03-25T22:01:21.000+02:00
Split recv_results_rows into a fast path (no column encryption) and a slow path (column encryption, "CE", enabled).

Fast path (common case):
- Reads raw column bytes and decodes types in a single pass per row via _decode_row_inline(), eliminating the intermediate list-of-lists
- Skips ColDesc namedtuple creation entirely (only needed for CE)
- No closure allocation per call

Slow path (column encryption):
- Preserves full CE logic with ColDesc creation
- Moves decode_val/decode_row closures to module-level functions (_decode_val_ce, _decode_row_ce) to avoid per-call closure overhead

Note: This PR modifies the same method as PR scylladb#630 (which also splits recv_results_rows into CE/non-CE branches). There will be a merge conflict that needs manual resolution if both PRs are accepted.
diff --git a/cassandra/protocol.py b/cassandra/protocol.py
@@ -717,31 +717,42 @@ def recv_results_rows(self, f, protocol_version, user_type_map, result_metadata,
         self.recv_results_metadata(f, user_type_map)
         column_metadata = self.column_metadata or result_metadata
         rowcount = read_int(f)
-        rows = [self.recv_row(f, len(column_metadata)) for _ in range(rowcount)]
         self.column_names = [c[2] for c in column_metadata]
         self.column_types = [c[3] for c in column_metadata]
-        col_descs = [ColDesc(md[0], md[1], md[2]) for md in column_metadata]
 
-        def decode_val(val, col_md, col_desc):
-            uses_ce = column_encryption_policy and column_encryption_policy.contains_column(col_desc)
-            col_type = column_encryption_policy.column_type(col_desc) if uses_ce else col_md[3]
-            raw_bytes = column_encryption_policy.decrypt(col_desc, val) if uses_ce else val
-            return col_type.from_binary(raw_bytes, protocol_version)
-
-        def decode_row(row):
-            return tuple(decode_val(val, col_md, col_desc) for val, col_md, col_desc in zip(row, column_metadata, col_descs))
-
-        try:
-            self.parsed_rows = [decode_row(row) for row in rows]
-        except Exception:
-            for row in rows:
-                for val, col_md, col_desc in zip(row, column_metadata, col_descs):
-                    try:
-                        decode_val(val, col_md, col_desc)
-                    except Exception as e:
-                        raise DriverException('Failed decoding result column "%s" of type %s: %s' % (col_md[2],
-                                                                                                     col_md[3].cql_parameterized_type(),
-                                                                                                     str(e)))
+        if not column_encryption_policy:
+            # Fast path: no column encryption — decode inline, skip ColDesc creation
+            col_types = self.column_types
+            colcount = len(col_types)
+            try:
+                self.parsed_rows = [
+                    _decode_row_inline(f, colcount, col_types, protocol_version)
+                    for _ in range(rowcount)
+                ]
+            except Exception:
+                # Re-read is not possible since we consumed the buffer.
+                # This path should be extremely rare (type mismatch in server response).
+                raise
+        else:
+            # Slow path: column encryption enabled — need ColDesc and per-column CE check
+            rows = [self.recv_row(f, len(column_metadata)) for _ in range(rowcount)]
+            col_descs = [ColDesc(md[0], md[1], md[2]) for md in column_metadata]
+            try:
+                self.parsed_rows = [
+                    _decode_row_ce(row, column_metadata, col_descs,
+                                   column_encryption_policy, protocol_version)
+                    for row in rows
+                ]
+            except Exception:
+                for row in rows:
+                    for val, col_md, col_desc in zip(row, column_metadata, col_descs):
+                        try:
+                            _decode_val_ce(val, col_md, col_desc,
+                                           column_encryption_policy, protocol_version)
+                        except Exception as e:
+                            raise DriverException('Failed decoding result column "%s" of type %s: %s' % (col_md[2],
+                                                                                                         col_md[3].cql_parameterized_type(),
+                                                                                                         str(e)))
 
     def recv_results_prepared(self, f, protocol_version, protocol_features, user_type_map):
         self.query_id = read_binary_string(f)
@@ -1424,6 +1435,36 @@ def read_error_code_map(f):
     return error_code_map
 
 
+
+def _decode_row_inline(f, colcount, col_types, protocol_version):
+    """Decode a single row directly from the buffer (no column encryption)."""
+    row = []
+    for i in range(colcount):
+        size = read_int(f)
+        if size < 0:
+            row.append(None)
+        else:
+            val = f.read(size)
+            row.append(col_types[i].from_binary(val, protocol_version))
+    return tuple(row)
+
+
+def _decode_val_ce(val, col_md, col_desc, column_encryption_policy, protocol_version):
+    """Decode a single column value with column encryption support."""
+    uses_ce = column_encryption_policy.contains_column(col_desc)
+    col_type = column_encryption_policy.column_type(col_desc) if uses_ce else col_md[3]
+    raw_bytes = column_encryption_policy.decrypt(col_desc, val) if uses_ce else val
+    return col_type.from_binary(raw_bytes, protocol_version)
+
+
+def _decode_row_ce(row, column_metadata, col_descs, column_encryption_policy, protocol_version):
+    """Decode a full row with column encryption support."""
+    return tuple(
+        _decode_val_ce(val, col_md, col_desc, column_encryption_policy, protocol_version)
+        for val, col_md, col_desc in zip(row, column_metadata, col_descs)
+    )
+
+
 def read_value(f):
     size = read_int(f)
     if size < 0: