cipherflow-fhe
diff --git a/‎backends/HEonGPU‎ b/‎backends/HEonGPU‎
diff --git a/‎examples/CMakeLists.txt‎
Lines changed: 1 addition & 0 deletions b/‎examples/CMakeLists.txt‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎examples/ckks_sparse_bootstrap_cpu/CMakeLists.txt‎
Lines changed: 10 additions & 0 deletions b/‎examples/ckks_sparse_bootstrap_cpu/CMakeLists.txt‎
Lines changed: 10 additions & 0 deletions
diff --git a/‎examples/ckks_sparse_bootstrap_cpu/ckks_sparse_bootstrap_cpu.cpp‎
Lines changed: 67 additions & 0 deletions b/‎examples/ckks_sparse_bootstrap_cpu/ckks_sparse_bootstrap_cpu.cpp‎
Lines changed: 67 additions & 0 deletions
diff --git a/‎examples/ckks_sparse_bootstrap_cpu/ckks_sparse_bootstrap_cpu.py‎
Lines changed: 43 additions & 0 deletions b/‎examples/ckks_sparse_bootstrap_cpu/ckks_sparse_bootstrap_cpu.py‎
Lines changed: 43 additions & 0 deletions
diff --git a/‎fhe_ops_lib/fhe_lib_v2.cpp‎
Lines changed: 12 additions & 0 deletions b/‎fhe_ops_lib/fhe_lib_v2.cpp‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎fhe_ops_lib/fhe_lib_v2.h‎
Lines changed: 8 additions & 0 deletions b/‎fhe_ops_lib/fhe_lib_v2.h‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎fhe_ops_lib/lattigo‎ b/‎fhe_ops_lib/lattigo‎
diff --git a/‎frontend/bootstrap_params.py‎
Lines changed: 9 additions & 4 deletions b/‎frontend/bootstrap_params.py‎
Lines changed: 9 additions & 4 deletions
diff --git a/‎frontend/custom_task.py‎
Lines changed: 33 additions & 6 deletions b/‎frontend/custom_task.py‎
Lines changed: 33 additions & 6 deletions
@@ -10,6 +10,7 @@ add_subdirectory(ckks_mult_cpu)
 add_subdirectory(ckks_mult_serialization_cpu)
 add_subdirectory(ckks_euclidean_distance_cpu)
 add_subdirectory(ckks_logistic_regression_cpu)
+add_subdirectory(ckks_sparse_bootstrap_cpu)
 add_subdirectory(benchmark_cpu)
 add_subdirectory(benchmark_convolution)
 if(LATTISENSE_ENABLE_GPU)
 
@@ -0,0 +1,10 @@
+# Build the ckks_sparse_bootstrap_cpu example from its single source file and
+# link it against the lattisense target.
+add_executable(ckks_sparse_bootstrap_cpu ckks_sparse_bootstrap_cpu.cpp)
+target_link_libraries(ckks_sparse_bootstrap_cpu PRIVATE lattisense)
+
+# INSTALL_RPATH is only applied at install time: with
+# BUILD_WITH_INSTALL_RPATH OFF the build-tree binary keeps its build RPATH.
+set_target_properties(ckks_sparse_bootstrap_cpu PROPERTIES
+    INSTALL_RPATH "$ORIGIN/../../../lib"
+    BUILD_WITH_INSTALL_RPATH OFF
+)
+
+# Copy the companion Python script into this example's build directory.
+# COPYONLY means no variable substitution is performed on the file.
+configure_file(${CMAKE_CURRENT_SOURCE_DIR}/ckks_sparse_bootstrap_cpu.py
+               ${CMAKE_CURRENT_BINARY_DIR}/ckks_sparse_bootstrap_cpu.py COPYONLY)
@@ -0,0 +1,67 @@
+/*
+ * Copyright (c) 2025-2026 CipherFlow (Shenzhen) Co., Ltd.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ *
+ * SPDX-License-Identifier: Apache-2.0
+ */
+
+#include <cxx_sdk_v2/cxx_fhe_task.h>
+#include <fhe_ops_lib/fhe_lib_v2.h>
+
+#include <cmath>
+#include <cstdio>
+#include <vector>
+
+using namespace lattisense;
+using namespace std;
+
+// Encrypts a cosine test vector into 2^log_slots sparse slots, runs the
+// pre-generated task stored under "project" on the CPU runner, then decrypts
+// the result and prints the maximum absolute slot error against the input.
+void ckks_sparse_bootstrap_cpu() {
+    // Must match the log_slots passed to create_toy_sparse_param() in
+    // ckks_sparse_bootstrap_cpu.py.
+    constexpr int log_slots = 8;
+    constexpr int sparse_slots = 1 << log_slots;
+    // Level of the pre-allocated output ciphertext.
+    // NOTE(review): presumably the toy preset's bootstrap output level -- confirm.
+    constexpr int output_level = 9;
+    // M_PI is a POSIX extension rather than ISO C++; derive pi portably.
+    const double two_pi = 2.0 * std::acos(-1.0);
+
+    CkksBtpParameter btp_param = CkksBtpParameter::create_toy_sparse_parameter(log_slots);
+    CkksBtpContext btp_ctx = CkksBtpContext::create_random_context(btp_param);
+    btp_ctx.create_bootstrapper();
+
+    const double scale = btp_param.get_ckks_parameter().get_default_scale();
+    vector<double> x_mg(sparse_slots);
+    for (int i = 0; i < sparse_slots; i++)
+        x_mg[i] = 0.5 * std::cos(two_pi * i / sparse_slots);
+
+    // The input is encoded at level 0 so that the task has to bootstrap it.
+    CkksCiphertext x_ct = btp_ctx.encrypt_asymmetric(btp_ctx.encode(x_mg, 0, scale));
+    CkksCiphertext y_ct = btp_ctx.new_ciphertext(output_level, scale);
+
+    FheTaskCpu cpu_project("project");
+    vector<CxxVectorArgument> cxx_args = {
+        {"x", &x_ct},
+        {"y", &y_ct},
+    };
+    cpu_project.run(&btp_ctx, cxx_args);
+
+    vector<double> y_mg = btp_ctx.decode(btp_ctx.decrypt(y_ct));
+
+    // Refuse to index past the decoded vector if it is shorter than expected.
+    if (y_mg.size() < static_cast<std::size_t>(sparse_slots)) {
+        fprintf(stderr, "decode returned %zu slots, expected at least %d\n", y_mg.size(), sparse_slots);
+        return;
+    }
+
+    // Manual running maximum: avoids std::max, whose header <algorithm> is not
+    // included by this file.
+    double max_err = 0.0;
+    for (int i = 0; i < sparse_slots; i++) {
+        const double err = std::abs(y_mg[i] - x_mg[i]);
+        if (err > max_err)
+            max_err = err;
+    }
+
+    printf("CKKS sparse bootstrap (log_slots=%d, n=%d), CPU\n", log_slots, btp_param.get_ckks_parameter().get_n());
+    print_double_message(x_mg.data(), "x_mg (input, first 4 slots)", 4);
+    print_double_message(y_mg.data(), "y_mg (bootstrapped, first 4 slots)", 4);
+    printf("max abs error over active %d slots: %.3e\n", sparse_slots, max_err);
+}
+
+// Program entry point: runs the sparse-bootstrap demo once.
+// Falling off the end of main is equivalent to returning 0.
+int main() {
+    ckks_sparse_bootstrap_cpu();
+}
@@ -0,0 +1,43 @@
+# Copyright (c) 2025-2026 CipherFlow (Shenzhen) Co., Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# SPDX-License-Identifier: Apache-2.0
+
+import os
+import sys
+
+sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))))
+
+from frontend.custom_task import *
+
+
+def ckks_sparse_bootstrap():
+    # Sparse bootstrap keeps only 2^log_slots active slots, shrinking the
+    # CtS/StC matrices and cutting wall time vs full packing.
+    param = CkksBtpParam.create_toy_sparse_param(log_slots=8)
+    set_fhe_param(param)
+
+    x = CkksCiphertextNode('x', level=0)
+    y = bootstrap(x, 'y')
+
+    process_custom_task(
+        input_args=[Argument('x', x)],
+        output_args=[Argument('y', y)],
+        output_instruction_path='project',
+        fpga_acc=False,
+    )
+
+
+if __name__ == '__main__':
+    ckks_sparse_bootstrap()
@@ -617,6 +617,18 @@ CkksBtpParameter CkksBtpParameter::create_toy_parameter() {
     return CkksBtpParameter(CreateCkksToyBtpParameter());
 }
 
+// Starts from the parameter set returned by CreateCkksBtpParameter() and applies
+// log_slots to it through SetCkksParameterLogSlots. log_slots is forwarded
+// without any range check in this function.
+CkksBtpParameter CkksBtpParameter::create_sparse_parameter(int32_t log_slots) {
+    CkksBtpParameter sparse_param(CreateCkksBtpParameter());
+    CkksParameter& ckks_param = sparse_param.get_ckks_parameter();
+    SetCkksParameterLogSlots(ckks_param.get(), log_slots);
+    return sparse_param;
+}
+
+// Toy counterpart of create_sparse_parameter: starts from the parameter set
+// returned by CreateCkksToyBtpParameter() and applies log_slots to it through
+// SetCkksParameterLogSlots. log_slots is forwarded without any range check here.
+CkksBtpParameter CkksBtpParameter::create_toy_sparse_parameter(int32_t log_slots) {
+    CkksBtpParameter toy_sparse_param(CreateCkksToyBtpParameter());
+    CkksParameter& ckks_param = toy_sparse_param.get_ckks_parameter();
+    SetCkksParameterLogSlots(ckks_param.get(), log_slots);
+    return toy_sparse_param;
+}
+
 // CkksParameter
 CkksParameter CkksParameter::create_parameter(uint64_t N) {
     return CkksParameter(CreateCkksParameter(N));
 
@@ -287,6 +287,14 @@ class CkksBtpParameter : public CkksParameter {
 
     static CkksBtpParameter create_toy_parameter();
 
+    // Sparse-packing CKKS bootstrap (LogSlots < LogN-1). The CPU runner
+    // (lattigo) handles any log_slots in [4, LogN-2]. The GPU runner
+    // (HEonGPU) currently only supports N=2^16 sparse, so create_toy_sparse_*
+    // is CPU-only and will error if routed to GPU; use the production-N
+    // create_sparse_parameter for end-to-end CPU+GPU sparse runs.
+    static CkksBtpParameter create_sparse_parameter(int32_t log_slots);
+    static CkksBtpParameter create_toy_sparse_parameter(int32_t log_slots);
+
     CkksParameter& get_ckks_parameter();
 
 protected:
 
@@ -198,10 +198,15 @@ def _find_best_bsgs_split(diag_matrix: Dict[int, bool], max_n: int, max_ratio: f
         _, rot_n1, rot_n2 = _bsgs_index(diag_matrix, max_n, n1)
         nb_n1, nb_n2 = len(rot_n1) - 1, len(rot_n2) - 1
 
-        if nb_n2 / nb_n1 == max_ratio:
-            return n1
-        if nb_n2 / nb_n1 > max_ratio:
-            return n1 // 2
+        # At small n1 (or sparse matrices), one of the partitions can collapse
+        # to a single element (nb_n1 == 0). Skip the ratio check in that case
+        # and double n1 to broaden the partition; only stop once nb_n1 > 0 and
+        # the ratio threshold is crossed.
+        if nb_n1 > 0:
+            if nb_n2 / nb_n1 == max_ratio:
+                return n1
+            if nb_n2 / nb_n1 > max_ratio:
+                return n1 // 2
 
         n1 <<= 1
 
 
@@ -280,11 +280,9 @@ def create_fpga_param(cls):
 
 
 class CkksBtpParam(CkksParam):
-    """
-    @class CkksBtpParam
-    @brief CKKS Bootstrap parameter class.
-
-    Contains additional parameters required for CKKS bootstrapping.
+    """CKKS bootstrap parameter class. Enable sparse packing via create_sparse_param()
+    or by calling the inherited CkksParam.set_slots(); trace compensation is handled by
+    the bootstrap op via rotations_for_bootstrapping().
     """
 
     def __init__(self, n: int = 1 << 16):
@@ -293,6 +291,12 @@ def __init__(self, n: int = 1 << 16):
         self.stc_params: EncodingMatrixParams = None
         self.eval_mod_params: EvalModParams = None
         self.btp_output_level: int = -1
+        self.btp_cts_start_level: int = -1
+        self.btp_eval_mod_start_level: int = -1
+        self.btp_stc_start_level: int = -1
+
+    def is_sparse(self) -> bool:
+        return self.slots < (self.n // 2)
 
     @classmethod
     def create_toy_param(cls):
@@ -464,6 +468,24 @@ def create_default_param(cls):
 
         return instance
 
+    # Lattigo's genWfftIndexMap panics below this (CTS/STC depth exceeds slots).
+    _MIN_LOG_SLOTS = 4
+
+    @classmethod
+    def create_sparse_param(cls, log_slots: int, n: int = 1 << 16):
+        """Create sparse CKKS bootstrap params: 2^log_slots active slots."""
+        max_log_slots = int(math.log2(n)) - 2
+        if log_slots < cls._MIN_LOG_SLOTS or log_slots > max_log_slots:
+            raise ValueError(f'log_slots must be in [{cls._MIN_LOG_SLOTS}, {max_log_slots}] for n={n}, got {log_slots}')
+        instance = cls.create_default_param() if n == (1 << 16) else cls.create_toy_param()
+        instance.set_slots(1 << log_slots)
+        return instance
+
+    @classmethod
+    def create_toy_sparse_param(cls, log_slots: int):
+        """Sparse toy params (n=8192). Insecure; for development only."""
+        return cls.create_sparse_param(log_slots, n=1 << 13)
+
     def rotations_for_bootstrapping(self) -> list[int]:
         log_n = int(math.log2(self.n))
         log_slots = int(math.log2(self.slots))
@@ -1969,6 +1991,7 @@ def bootstrap(x: CkksCiphertextNode, output_id: Optional[str] = None) -> CkksCip
         g_swk_node_dict[rlk].level = g_param.max_level
     g_dag.add_edge(g_swk_node_dict[rlk], op)
 
+    assert isinstance(g_param, CkksBtpParam)
     rots = g_param.rotations_for_bootstrapping()
     for rot in rots:
         gal_elem = get_galois_element_for_column_rotation_by(rot, g_param.n)
@@ -2260,6 +2283,8 @@ def process_data_args(args: list[Argument] | None, phase: str) -> tuple[list[Dat
 
     used_id = []
 
+    slots_for_task: Optional[int] = g_param.slots if isinstance(g_param, CkksParam) else None
+
     all_input_list, input_sigdata_list = process_data_args(input_args, 'in')
     all_output_list, output_sigdata_list = process_data_args(output_args, 'out')
     all_offline_list, offline_sigdata_list = process_data_args(offline_input_args, 'offline')
@@ -2308,7 +2333,9 @@ def process_data_args(args: list[Argument] | None, phase: str) -> tuple[list[Dat
     if g_param.algo == Algo.BFV:
         parameter['t'] = g_param.t
     if isinstance(g_param, CkksParam):
-        parameter['slots'] = g_param.slots
+        # slots_for_task was copied from g_param.slots earlier in this function.
+        assert slots_for_task is not None
+        parameter['slots'] = slots_for_task
         parameter['scale'] = g_param.scale
     if isinstance(g_param, CkksBtpParam):
         parameter['btp_cts_start_level'] = g_param.cts_params.level_start