Skip to content

Commit 7e589a2

Browse files
authored
Merge branch 'release/online/20260415' into cp/47a3cff6-add-values-check
2 parents e698271 + 5babb00 commit 7e589a2

9 files changed

Lines changed: 13 additions & 12 deletions

File tree

.github/workflows/Codestyle-Check.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@ on:
44
pull_request:
55
branches:
66
- develop
7-
- 'release/*'
7+
- 'release/**'
88

99
jobs:
1010
pre-commit:

.github/workflows/check-bypass.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@ jobs:
2222
permissions:
2323
contents: read
2424
env:
25-
CI_TEAM_MEMBERS: '["yuanlehome","YuanRisheng","Jiang-Jia-Jun","DDDivano","XieYunshen","EmmonsCurse","CSWYF3634076","plusNew001"]'
25+
CI_TEAM_MEMBERS: '["yuanlehome","YuanRisheng","Jiang-Jia-Jun","DDDivano","XieYunshen","EmmonsCurse","CSWYF3634076","plusNew001","freeliuzc"]'
2626
outputs:
2727
can-skip: ${{ steps.final-output.outputs.can-skip }}
2828
can-skip-docs: ${{ steps.final-output.outputs.can-skip-docs }}

.github/workflows/ci_iluvatar.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@ name: ILUVATAR-CI
22
on:
33
pull_request:
44
types: [opened, synchronize]
5-
branches: [develop, release/**]
5+
branches: [develop, release/*]
66
permissions: read-all
77

88
concurrency:

.github/workflows/ci_metax.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,7 @@ on:
77
- synchronize
88
branches:
99
- develop
10-
- release/**
10+
- release/*
1111

1212
permissions:
1313
contents: read

.github/workflows/ci_xpu.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@ name: CI_XPU
33
on:
44
pull_request:
55
types: [opened, synchronize]
6-
branches: [develop, release/**]
6+
branches: [develop, release/*]
77
permissions: read-all
88

99
concurrency:

fastdeploy/model_executor/layers/moe/fused_moe_cutlass_backend.py

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -175,7 +175,7 @@ def apply_ep_prefill(
175175
if fastdeploy.envs.FD_MOE_PROB_IN_ADVANCE:
176176
out = paddlefleet_ops.fused_swiglu_scale(out, dst_weights)
177177
else:
178-
out = paddle.incubate.nn.functional.swiglu(out)
178+
out = paddle.nn.functional.swiglu(out)
179179
ffn_out = paddle.incubate.nn.functional.batched_gemm(
180180
out,
181181
getattr(layer, self.added_weight_attrs[1]),
@@ -335,7 +335,6 @@ def apply_tp(
335335
layer.routed_scaling_factor,
336336
layer.gate_correction_bias,
337337
getattr(layer, "renormalize", True),
338-
use_fused_cast=use_fused,
339338
)
340339
else:
341340
gate_out = gate_out.cast("float32")
@@ -406,7 +405,6 @@ def apply_tp(
406405
layer.gate_correction_bias,
407406
getattr(layer, "renormalize", True),
408407
topk_reduce_func=getattr(layer, "topk_reduce_func", None),
409-
use_fused_cast=use_fused,
410408
)
411409

412410
(

tests/input/test_process_stop_token_ids.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -12,9 +12,9 @@
1212
# See the License for the specific language governing permissions and
1313
# limitations under the License.
1414

15-
"""Tests for process_stop_token_ids in fastdeploy.input.utils.common."""
15+
"""Tests for process_stop_token_ids in fastdeploy.input.utils."""
1616

17-
from fastdeploy.input.utils.common import process_stop_token_ids
17+
from fastdeploy.input.utils import process_stop_token_ids
1818

1919

2020
def _mock_update_stop_seq_fn(stop_sequences):
@@ -115,4 +115,4 @@ def test_stop_token_ids_empty_list():
115115
test_empty_request()
116116
test_stop_token_ids_none()
117117
test_stop_token_ids_empty_list()
118-
print("All tests passed.")
118+
print("All tests passed.")

tests/layers/test_speculative_sampler.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -78,7 +78,7 @@ def _create_default_sampling_metadata(
7878
fake_sampling_metadata = SamplingMetadata(
7979
temperature=paddle.full(shape=[batch_size, 1], fill_value=0.9, dtype="float32"),
8080
top_p=paddle.full(shape=[batch_size, 1], fill_value=0.7, dtype="float32"),
81-
top_k=paddle.full(shape=[batch_size, 1], fill_value=0, dtype="int32"),
81+
top_k=paddle.full(shape=[batch_size, 1], fill_value=0, dtype="int64"),
8282
prompt_lens=paddle.full(shape=[batch_size, 1], fill_value=0, dtype="int64"),
8383
step_idx=paddle.full(shape=[batch_size, 1], fill_value=0, dtype="int64"),
8484
token_ids_all=_create_tokens_tensor(batch_size, max_seq_len),

tests/model_executor/test_ep.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -419,6 +419,9 @@ def fake_get_moe_scores(*_args, **_kwargs):
419419
routed_scaling_factor=1.0,
420420
gate_correction_bias=None,
421421
renormalize=False,
422+
fd_config=SimpleNamespace(
423+
scheduler_config=SimpleNamespace(enable_moe_scores_elementwise_fuse=False),
424+
),
422425
)
423426
gate_out = paddle.randn([1, 4], dtype="float32")
424427

0 commit comments

Comments
 (0)