# Microbenchmark sweep configuration for three collective operations:
# all_gather, psum and all_to_all.
#
# Each entry under `benchmarks` has:
#   benchmark_name          - name of the benchmark to run.
#   benchmark_sweep_params  - list of parameter sets; every set is run for
#                             that benchmark.
#   trace_dir / csv_path / xlml_metrics_dir / xla_dump_dir
#                           - output locations, all relative paths under
#                             ../microbenchmarks/<benchmark>_tpu7x_4x4x4.
#
# Notes on the sweep parameters (identical across the three benchmarks):
#   - matrix_dim_range: start 64, end 16384, multiplier 2. Presumably a
#     geometric sweep 64, 128, ..., 16384; whether `end` is inclusive is
#     decided by the runner. TODO confirm.
#   - mesh_shape "16x4x2" multiplies out to 128, which matches
#     ici_size_range: 128. NOTE(review): presumably the device count of the
#     4x4x4 slice named in the output paths; confirm.
#   - The two sets per benchmark differ only in sharding_strategy
#     ("16x4x1" vs "16x4x2"); the trailing comments carry the original labels.
benchmarks:
  - benchmark_name: all_gather
    benchmark_sweep_params:
      - {matrix_dim_range: {start: 64, end: 16384, multiplier: 2}, dtype: "float32", mesh_shape: "16x4x2", ici_size_range: 128, sharding_strategy: "16x4x1", op_dimension: 1, num_runs: 5}  # Parallel Replica
      - {matrix_dim_range: {start: 64, end: 16384, multiplier: 2}, dtype: "float32", mesh_shape: "16x4x2", ici_size_range: 128, sharding_strategy: "16x4x2", op_dimension: 1, num_runs: 5}  # Non-Parallel Replica
    # Quoted paths must not start with a space: quoted scalars keep it verbatim.
    trace_dir: "../microbenchmarks/all_gather_tpu7x_4x4x4"
    csv_path: "../microbenchmarks/all_gather_tpu7x_4x4x4"
    xlml_metrics_dir: "../microbenchmarks/all_gather_tpu7x_4x4x4"
    xla_dump_dir: "../microbenchmarks/all_gather_tpu7x_4x4x4/hlo_graphs"

  - benchmark_name: psum
    benchmark_sweep_params:
      - {matrix_dim_range: {start: 64, end: 16384, multiplier: 2}, dtype: "float32", mesh_shape: "16x4x2", ici_size_range: 128, sharding_strategy: "16x4x1", op_dimension: 1, num_runs: 5}  # Parallel Replica
      - {matrix_dim_range: {start: 64, end: 16384, multiplier: 2}, dtype: "float32", mesh_shape: "16x4x2", ici_size_range: 128, sharding_strategy: "16x4x2", op_dimension: 1, num_runs: 5}  # Non-Parallel Replica
    trace_dir: "../microbenchmarks/psum_tpu7x_4x4x4"
    csv_path: "../microbenchmarks/psum_tpu7x_4x4x4"
    xlml_metrics_dir: "../microbenchmarks/psum_tpu7x_4x4x4"
    xla_dump_dir: "../microbenchmarks/psum_tpu7x_4x4x4/hlo_graphs"

  - benchmark_name: all_to_all
    benchmark_sweep_params:
      - {matrix_dim_range: {start: 64, end: 16384, multiplier: 2}, dtype: "float32", mesh_shape: "16x4x2", ici_size_range: 128, sharding_strategy: "16x4x1", op_dimension: 1, num_runs: 5}  # Parallel Replica
      - {matrix_dim_range: {start: 64, end: 16384, multiplier: 2}, dtype: "float32", mesh_shape: "16x4x2", ici_size_range: 128, sharding_strategy: "16x4x2", op_dimension: 1, num_runs: 5}  # Non-Parallel Replica
    trace_dir: "../microbenchmarks/all_to_all_tpu7x_4x4x4"
    csv_path: "../microbenchmarks/all_to_all_tpu7x_4x4x4"
    xlml_metrics_dir: "../microbenchmarks/all_to_all_tpu7x_4x4x4"
    xla_dump_dir: "../microbenchmarks/all_to_all_tpu7x_4x4x4/hlo_graphs"
0 commit comments