Skip to content

Commit 559240b

Browse files
authored
feat: modify the default values of the parameters max_seqs_per_batch and communication_backend. (#431)
1 parent e6b0b3d commit 559240b

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

xllm/core/common/global_flags.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -135,7 +135,7 @@ DEFINE_double(max_memory_utilization,
 
 DEFINE_int32(max_tokens_per_batch, 20480, "Max number of tokens per batch.");
 
-DEFINE_int32(max_seqs_per_batch, 256, "Max number of sequences per batch.");
+DEFINE_int32(max_seqs_per_batch, 1024, "Max number of sequences per batch.");
 
 DEFINE_bool(enable_schedule_overlap,
 true,
@@ -172,7 +172,7 @@ DEFINE_int32(ep_size, 1, "Expert parallel size for MoE model.");
 
 DEFINE_string(
 communication_backend,
-"lccl",
+"hccl",
 "NPU communication backend.(e.g. lccl, hccl). When enable dp, use hccl.");
 
 // --- ep load balance config ---

0 commit comments

Comments
 (0)