We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 838d14d commit f8cf40cCopy full SHA for f8cf40c
1 file changed
aiu_fms_testing_utils/scripts/drive_paged_programs.py
@@ -426,6 +426,18 @@ def __load_validation_info(
426
**extra_kwargs,
427
)
428
429
+# do an extra inference call to work around the issue on z/OS where the first inference
430
+# result is always incorrect during multi-AIU runs (issue 173)
431
+extract_validation_information(
432
+ model,
433
+ input_ids,
434
+ max_new_tokens,
435
+ post_iteration_hook=None,
436
+ last_n_tokens=64,
437
+ prefill_chunk_size=args.prefill_chunk_size,
438
+ **extra_kwargs,
439
+)
440
+
441
if USE_DISTRIBUTED:
442
# wait for rank0 to be finished as it is the only one generating the criteria json
443
# this is needed since otherwise we may run into a race condition
0 commit comments