Skip to content

Commit f73e18b

Browse files
authored
Merge pull request #298 from InfiniTensor/issue/297
issue/297 - compile all paged batch sizes up to 64
2 parents dec52b1 + 6adee77 commit f73e18b

File tree

1 file changed

+1
-4
lines changed

1 file changed

+1
-4
lines changed

csrc/engine/compiler/paged_compiler.cpp

Lines changed: 1 addition & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -18,10 +18,7 @@ inline void set_minus_one(infinicore::Tensor &tensor) {
1818
namespace infinilm::engine {
1919
PagedCompiler::PagedCompiler(const std::shared_ptr<InfinilmModel> &model, RankBarrier *barrier)
2020
: GraphCompiler(model, barrier) {
21-
for (size_t b = 1; b < 32; b++) {
22-
decode_batch_sizes_.push_back(b);
23-
}
24-
for (size_t b = 32; b < 64; b += 8) {
21+
for (size_t b = 1; b < 64; ++b) {
2522
decode_batch_sizes_.push_back(b);
2623
}
2724
for (size_t b = 64; b < 128; b += 16) {

0 commit comments

Comments (0)