|
40 | 40 | "reuse_example_batch": 1, |
41 | 41 | "enable_checkpointing": False, |
42 | 42 | "profiler": "xplane", |
| 43 | + "use_qwix_quantization": True, |
43 | 44 | }, |
44 | 45 | xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER), |
45 | 46 | ), |
|
63 | 64 | "reuse_example_batch": 1, |
64 | 65 | "enable_checkpointing": False, |
65 | 66 | "profiler": "xplane", |
| 67 | + "use_qwix_quantization": True, |
66 | 68 | }, |
67 | 69 | xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER), |
68 | 70 | ), |
|
86 | 88 | "reuse_example_batch": 1, |
87 | 89 | "enable_checkpointing": False, |
88 | 90 | "profiler": "xplane", |
| 91 | + "use_qwix_quantization": True, |
89 | 92 | }, |
90 | 93 | xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER), |
91 | 94 | ), |
|
112 | 115 | "reuse_example_batch": 1, |
113 | 116 | "enable_checkpointing": False, |
114 | 117 | "profiler": "xplane", |
| 118 | + "use_qwix_quantization": True, |
115 | 119 | }, |
116 | 120 | xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER), |
117 | 121 | ), |
|
133 | 137 | "reuse_example_batch": 1, |
134 | 138 | "enable_checkpointing": False, |
135 | 139 | "profiler": "xplane", |
| 140 | + "use_qwix_quantization": True, |
136 | 141 | }, |
137 | 142 | xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER), |
138 | 143 | ), |
|
155 | 160 | "reuse_example_batch": 1, |
156 | 161 | "enable_checkpointing": False, |
157 | 162 | "profiler": "xplane", |
| 163 | + "use_qwix_quantization": True, |
158 | 164 | }, |
159 | 165 | xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER), |
160 | 166 | ), |
|
167 | 173 | model_type="llama2-13b", |
168 | 174 | tuning_params={ |
169 | 175 | "ici_fsdp_parallelism": -1, |
170 | | - "per_device_batch_size": 8, |
| 176 | + "per_device_batch_size": 6, |
171 | 177 | "remat_policy": "qkv_proj_offloaded", |
172 | 178 | "max_target_length": 2048, |
173 | 179 | "use_iota_embed": True, |
|
177 | 183 | "reuse_example_batch": 1, |
178 | 184 | "enable_checkpointing": False, |
179 | 185 | "profiler": "xplane", |
| 186 | + "use_qwix_quantization": True, |
180 | 187 | }, |
181 | 188 | xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER), |
182 | 189 | ), |
|
198 | 205 | "reuse_example_batch": 1, |
199 | 206 | "enable_checkpointing": False, |
200 | 207 | "profiler": "xplane", |
| 208 | + "use_qwix_quantization": True, |
201 | 209 | }, |
202 | 210 | xla_flags=(xla_flags_library.DATA_PARALLEL_OVERLAP + xla_flags_library.CF_FOR_ALL_GATHER), |
203 | 211 | ), |
|
236 | 244 | "profiler": "xplane", |
237 | 245 | "skip_first_n_steps_for_profiler": 10, |
238 | 246 | "profiler_steps": 5, |
| 247 | + "use_qwix_quantization": True, |
239 | 248 | }, |
240 | 249 | xla_flags=( |
241 | 250 | xla_flags_library.DENSE_VMEM_LIMIT_FLAG |
|
0 commit comments