We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
2 parents dec52b1 + 6adee77; commit f73e18b (Copy full SHA for f73e18b)
csrc/engine/compiler/paged_compiler.cpp
@@ -18,10 +18,7 @@ inline void set_minus_one(infinicore::Tensor &tensor) {
18
namespace infinilm::engine {
19
PagedCompiler::PagedCompiler(const std::shared_ptr<InfinilmModel> &model, RankBarrier *barrier)
20
: GraphCompiler(model, barrier) {
21
- for (size_t b = 1; b < 32; b++) {
22
- decode_batch_sizes_.push_back(b);
23
- }
24
- for (size_t b = 32; b < 64; b += 8) {
+ for (size_t b = 1; b < 64; ++b) {
25
decode_batch_sizes_.push_back(b);
26
}
27
for (size_t b = 64; b < 128; b += 16) {
0 commit comments