Skip to content

Commit be19157

Browse files
Merge pull request #3977 from CIeNET-International:maxtext/user/dora/v5e_config_oom
PiperOrigin-RevId: 921524627
2 parents: 4110d13 + 80fdc09 · commit be19157

1 file changed

Lines changed: 10 additions & 1 deletion

File tree

benchmarks/maxtext_v5e_model_configs.py

Lines changed: 10 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -40,6 +40,7 @@
40 40
"reuse_example_batch": 1,
41 41
"enable_checkpointing": False,
42 42
"profiler": "xplane",
43 +
"use_qwix_quantization": True,
43 44
},
44 45
xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER),
45 46
),
@@ -63,6 +64,7 @@
63 64
"reuse_example_batch": 1,
64 65
"enable_checkpointing": False,
65 66
"profiler": "xplane",
67 +
"use_qwix_quantization": True,
66 68
},
67 69
xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER),
68 70
),
@@ -86,6 +88,7 @@
86 88
"reuse_example_batch": 1,
87 89
"enable_checkpointing": False,
88 90
"profiler": "xplane",
91 +
"use_qwix_quantization": True,
89 92
},
90 93
xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER),
91 94
),
@@ -112,6 +115,7 @@
112 115
"reuse_example_batch": 1,
113 116
"enable_checkpointing": False,
114 117
"profiler": "xplane",
118 +
"use_qwix_quantization": True,
115 119
},
116 120
xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER),
117 121
),
@@ -133,6 +137,7 @@
133 137
"reuse_example_batch": 1,
134 138
"enable_checkpointing": False,
135 139
"profiler": "xplane",
140 +
"use_qwix_quantization": True,
136 141
},
137 142
xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER),
138 143
),
@@ -155,6 +160,7 @@
155 160
"reuse_example_batch": 1,
156 161
"enable_checkpointing": False,
157 162
"profiler": "xplane",
163 +
"use_qwix_quantization": True,
158 164
},
159 165
xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER),
160 166
),
@@ -167,7 +173,7 @@
167 173
model_type="llama2-13b",
168 174
tuning_params={
169 175
"ici_fsdp_parallelism": -1,
170 -
"per_device_batch_size": 8,
176 +
"per_device_batch_size": 6,
171 177
"remat_policy": "qkv_proj_offloaded",
172 178
"max_target_length": 2048,
173 179
"use_iota_embed": True,
@@ -177,6 +183,7 @@
177 183
"reuse_example_batch": 1,
178 184
"enable_checkpointing": False,
179 185
"profiler": "xplane",
186 +
"use_qwix_quantization": True,
180 187
},
181 188
xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER),
182 189
),
@@ -198,6 +205,7 @@
198 205
"reuse_example_batch": 1,
199 206
"enable_checkpointing": False,
200 207
"profiler": "xplane",
208 +
"use_qwix_quantization": True,
201 209
},
202 210
xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER),
203 211
),
@@ -236,6 +244,7 @@
236 244
"profiler": "xplane",
237 245
"skip_first_n_steps_for_profiler": 10,
238 246
"profiler_steps": 5,
247 +
"use_qwix_quantization": True,
239 248
},
240 249
xla_flags=(
241 250
xla_flags_library.DENSE_VMEM_LIMIT_FLAG

0 commit comments

Comments
 (0)