Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
62 commits
Select commit Hold shift + click to select a range
4d083b4
initialize layerwise worker
zhuofan1123 Dec 17, 2025
9085d52
add layerwise transfer op
zhuofan1123 Dec 17, 2025
645a22c
clear op callback if layerwise
zhuofan1123 Dec 18, 2025
be7cc02
layerwise worker naive impl
zhuofan1123 Dec 18, 2025
52a19f3
check layerwise condition
zhuofan1123 Dec 18, 2025
fb6ce12
add default value
zhuofan1123 Dec 18, 2025
4dc9fb4
fix bug and benchmark
zhuofan1123 Dec 18, 2025
80c2077
add layerwise param
zhuofan1123 Dec 18, 2025
f64b9c0
fix bugs
zhuofan1123 Dec 18, 2025
d86335b
disable layerwise in benchmark
zhuofan1123 Dec 19, 2025
7a74665
pin memory of block ids
zhuofan1123 Dec 19, 2025
7641dcc
make ssd optional
Jan 9, 2026
0835555
initial layerwise cpp impl
zhuofan1123 Jan 9, 2026
6881413
add callback && fix some bugs
zhuofan1123 Jan 9, 2026
7c7ab27
fix
zhuofan1123 Jan 9, 2026
ed4187d
some fix
zhuofan1123 Jan 12, 2026
79dc6ce
add sglang support using eventfd
Jan 15, 2026
b7c86bf
print bandwidth for layerwise transfer
Jan 21, 2026
d635935
add nvtx for layerwise
Jan 28, 2026
af4c1d5
update kernel
zhuofan1123 Jan 29, 2026
a159da9
remove print
zhuofan1123 Jan 30, 2026
417b59b
fix cuda device set
zhuofan1123 Jan 30, 2026
ffbcecd
fix
zhuofan1123 Feb 2, 2026
fd8ce04
fix mempool
zhuofan1123 Feb 3, 2026
2463aa4
refactor transfer config, set num of cta instead of sm
zhuofan1123 Feb 3, 2026
586dbc6
fix
Mar 23, 2026
bc1a18c
fix unit test
zhuofan1123 Mar 23, 2026
d3cc1d9
update
zhuofan1123 Mar 23, 2026
12be2cc
merge h2d and disk2h to layerwiseop
zhuofan1123 Mar 23, 2026
ee4c5c0
Bug Fix: illegal memory (#133)
jianyingzhu Apr 1, 2026
72c5187
feat: add DSA cache and PP support
Apr 5, 2026
9b27128
fix page align bug
Apr 7, 2026
c5b292d
feat: distributed KV cache improvements - RedisMeta refactor, benchma…
Apr 8, 2026
1c14efd
fix cpu layout problems in tp + blockwise cpu layout
linhu-nv Apr 9, 2026
cc835f1
split cpu stride for ssd and for gpu
linhu-nv Apr 9, 2026
c63ffee
fix: comprehensive TP/PP/DP dimension fixes and observability improve…
Apr 9, 2026
a5eb20f
fix ssd read when blockwise + tp + layerwise
linhu-nv Apr 9, 2026
5a706b1
dont sync prefetch
zhuofan1123 Apr 10, 2026
9e72cf1
support cpuonly match for prefetch
zhuofan1123 Apr 10, 2026
d3ebb4b
fix: preload shared libraries via ctypes.CDLL in __init__.py
Apr 10, 2026
5a5f7da
add kv_cache_dtype to sglang
peaceforeverCN Apr 11, 2026
ba6c000
add some log to info the malloc
peaceforeverCN Apr 11, 2026
7806055
support cp+layerwise
Apr 14, 2026
d56c404
fix empty token mask
zhuofan1123 Apr 15, 2026
930c2a9
fix: make eventfd accept loop resilient to per-connection failures
Apr 15, 2026
b427e7e
fix: add ACK handshake for layerwise eventfd transfer to prevent race…
Apr 15, 2026
d91bed1
fix: correct variable name and config reference in MoonCakeTransferEn…
staryxchen Apr 15, 2026
dfe21d4
fix(mooncakeEngineWrapper): change unregist_buffer return type from N…
staryxchen Apr 15, 2026
3a36508
fix(mooncakeEngineWrapper): add return type annotation to
staryxchen Apr 15, 2026
7148c7e
fix d2h issue for glm5+cp8
zhuofan1123 Apr 15, 2026
d54f930
fix sglang config issue
zhuofan1123 Apr 15, 2026
7ec580f
fix(layerwise): fuse indexer DISK2H/H2D into layerwise worker (#149)
zhjc1124 Apr 17, 2026
1bf5eca
fix server_args kv cache dtype (#151)
zhjc1124 Apr 17, 2026
b9e29ac
fix: support cross-node TP - add _node suffix to eventfd socket path …
Apr 22, 2026
7ece123
refactor: align multi-node TP topology with framework (nnodes/node_ra…
Apr 24, 2026
ba8fccf
Merge pull request #156 from zhjc1124/feat/layerwise_rebase
peaceforeverCN Apr 27, 2026
50e702e
feat(hugepage): add HugePage support (#158)
staryxchen Apr 30, 2026
2508b11
feat: add PP support with centralized data plane and WorkerKey abstra…
Apr 30, 2026
7a2a8af
Merge pull request #159 from zhjc1124/support_pp
peaceforeverCN Apr 30, 2026
2f572d8
fix: improve transfer manager and engine robustness for PP
Apr 30, 2026
7ef3715
Merge pull request #160 from zhjc1124/support_pp
peaceforeverCN Apr 30, 2026
16fa450
refactor(DistributedRadixTree): enforce single-node matching constraint
Apr 29, 2026
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
55 changes: 51 additions & 4 deletions CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -1,5 +1,42 @@
cmake_minimum_required(VERSION 3.10)
project(MainProject VERSION 1.0)

# ---------------------------------------------------------------------------
# Project version, derived from the nearest "v*" git tag.
#
#   DETECTED_VERSION  X.Y.Z when HEAD sits exactly on the tag, otherwise
#                     X.Y.Z+git<abbrev-hash>; "0.0.0" if nothing was detected.
#   NUMERIC_VERSION   the leading X.Y.Z of DETECTED_VERSION, which is what
#                     project(VERSION ...) accepts.
# ---------------------------------------------------------------------------
find_package(Git QUIET)

if(GIT_FOUND)
  # --long forces the "<tag>-<distance>-g<hash>" form even when HEAD is on the
  # tag itself, so one regex covers both cases. Errors (no repository, no
  # matching tag) are silenced and simply leave the output empty.
  execute_process(
    COMMAND ${GIT_EXECUTABLE} describe --tags --long --match "v*"
    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}
    OUTPUT_VARIABLE GIT_DESCRIBE_OUTPUT
    ERROR_QUIET
    OUTPUT_STRIP_TRAILING_WHITESPACE
  )

  if("${GIT_DESCRIBE_OUTPUT}" MATCHES "^v([0-9]+\\.[0-9]+\\.[0-9]+)-([0-9]+)-g([0-9a-f]+)$")
    set(GIT_VERSION "${CMAKE_MATCH_1}")
    set(GIT_DISTANCE "${CMAKE_MATCH_2}")
    set(GIT_HASH "${CMAKE_MATCH_3}")

    # Start from the bare tag version; append the commit hash only when HEAD
    # is at least one commit past the tag.
    set(DETECTED_VERSION "${GIT_VERSION}")
    if(NOT "${GIT_DISTANCE}" STREQUAL "0")
      string(APPEND DETECTED_VERSION "+git${GIT_HASH}")
    endif()

    message(STATUS "Version from git tag: ${DETECTED_VERSION}")
  endif()
endif()

# An undefined variable expands to the empty string, so this single comparison
# covers both "never set" and "set but empty".
if("${DETECTED_VERSION}" STREQUAL "")
  set(DETECTED_VERSION "0.0.0")
  message(WARNING "Could not detect version from git tag, using fallback: ${DETECTED_VERSION}")
endif()

# project(VERSION ...) only takes a numeric version, so keep just the leading
# X.Y.Z and drop any +gitXXXXXXX suffix.
set(NUMERIC_VERSION "0.0.0")
if("${DETECTED_VERSION}" MATCHES "^([0-9]+\\.[0-9]+\\.[0-9]+)")
  set(NUMERIC_VERSION "${CMAKE_MATCH_1}")
endif()

project(MainProject VERSION ${NUMERIC_VERSION})
message(STATUS "Project version: ${PROJECT_VERSION} (full: ${DETECTED_VERSION})")

# Default every target created after this point to C++17. REQUIRED makes the
# standard a hard requirement instead of letting CMake fall back to an older one.
set(CMAKE_CXX_STANDARD 17)
set(CMAKE_CXX_STANDARD_REQUIRED ON)
Expand Down Expand Up @@ -30,10 +67,20 @@ target_include_directories(xxhash PUBLIC
# Install the files listed in XXHASH_HEADERS into <install-prefix>/include.
install(FILES ${XXHASH_HEADERS} DESTINATION include)

# ==================== prometheus-cpp Library ====================
# Option to enable/disable monitoring (env FLEXKV_ENABLE_METRICS=0 or -DFLEXKV_ENABLE_MONITORING=OFF)
set(_FLEXKV_MONITORING_DEFAULT ON)
# Step 1: Pick the monitoring default from the source tree: ON only when the
# third_party/prometheus-cpp directory is actually present.
if(NOT IS_DIRECTORY "${CMAKE_CURRENT_SOURCE_DIR}/third_party/prometheus-cpp")
  set(_FLEXKV_MONITORING_DEFAULT OFF)
  message(STATUS "third_party/prometheus-cpp not found, Prometheus monitoring defaults to OFF")
else()
  set(_FLEXKV_MONITORING_DEFAULT ON)
endif()

# Step 2: Environment variable override (FLEXKV_ENABLE_METRICS=1/0)
if(DEFINED ENV{FLEXKV_ENABLE_METRICS})
if("$ENV{FLEXKV_ENABLE_METRICS}" STREQUAL "0" OR "$ENV{FLEXKV_ENABLE_METRICS}" STREQUAL "OFF"
if("$ENV{FLEXKV_ENABLE_METRICS}" STREQUAL "1" OR "$ENV{FLEXKV_ENABLE_METRICS}" STREQUAL "ON"
OR "$ENV{FLEXKV_ENABLE_METRICS}" STREQUAL "YES" OR "$ENV{FLEXKV_ENABLE_METRICS}" STREQUAL "TRUE")
set(_FLEXKV_MONITORING_DEFAULT ON)
elseif("$ENV{FLEXKV_ENABLE_METRICS}" STREQUAL "0" OR "$ENV{FLEXKV_ENABLE_METRICS}" STREQUAL "OFF"
OR "$ENV{FLEXKV_ENABLE_METRICS}" STREQUAL "NO" OR "$ENV{FLEXKV_ENABLE_METRICS}" STREQUAL "FALSE")
set(_FLEXKV_MONITORING_DEFAULT OFF)
endif()
Expand Down
1 change: 0 additions & 1 deletion VERSION

This file was deleted.

Loading