Skip to content

Commit bca93db

Browse files
committed
unblock splash kernel error using cp and explicit sharding
1 parent 7fb6d25 commit bca93db

5 files changed

Lines changed: 72 additions & 0 deletions

File tree

tests/utils/sharding_info/deepseek2-16b/tpu7x-16/slice_1/rule_default/input_shardings.json

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -96,6 +96,18 @@
9696
"PartitionSpec": "P('fsdp', None, None, None)"
9797
}
9898
},
99+
{
100+
"attention_op/arr: int8[1,4,4]": {
101+
"logic_axes": "Unknown",
102+
"PartitionSpec": "P(None, None)"
103+
}
104+
},
105+
{
106+
"attention_op/arr: int32[2048]": {
107+
"logic_axes": "Unknown",
108+
"PartitionSpec": "P(None,)"
109+
}
110+
},
99111
{
100112
"attention_mla/out: bfloat16[192,2048,16,128]": {
101113
"logic_axes": "('activation_batch', 'activation_length', 'activation_heads', 'activation_kv')",

tests/utils/sharding_info/deepseek2-16b/tpu7x-16/slice_1/rule_pure-fsdp/input_shardings.json

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -96,6 +96,18 @@
9696
"PartitionSpec": "P('fsdp', None, None, None)"
9797
}
9898
},
99+
{
100+
"attention_op/arr: int8[1,4,4]": {
101+
"logic_axes": "Unknown",
102+
"PartitionSpec": "P(None, None)"
103+
}
104+
},
105+
{
106+
"attention_op/arr: int32[2048]": {
107+
"logic_axes": "Unknown",
108+
"PartitionSpec": "P(None,)"
109+
}
110+
},
99111
{
100112
"attention_mla/out: bfloat16[192,2048,16,128]": {
101113
"logic_axes": "('activation_batch', 'activation_length', 'activation_heads', 'activation_kv')",

tests/utils/sharding_info/gpt-oss-20b/tpu7x-16/slice_1/rule_default/input_shardings.json

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -66,6 +66,24 @@
6666
"PartitionSpec": "P('fsdp', None, None, None)"
6767
}
6868
},
69+
{
70+
"attention_op/arr: int8[1,4,2]": {
71+
"logic_axes": "Unknown",
72+
"PartitionSpec": "P(None, None)"
73+
}
74+
},
75+
{
76+
"attention_op/arr: bool[2,512,512]": {
77+
"logic_axes": "Unknown",
78+
"PartitionSpec": "P()"
79+
}
80+
},
81+
{
82+
"attention_op/arr: int8[1,2,4]": {
83+
"logic_axes": "Unknown",
84+
"PartitionSpec": "P(None, None)"
85+
}
86+
},
6987
{
7088
"attentions/out: bfloat16[192,2048,64,64]": {
7189
"logic_axes": "('activation_batch', 'activation_attn_length', 'activation_heads', 'activation_kv')",

tests/utils/sharding_info/gpt-oss-20b/tpu7x-16/slice_1/rule_default_ici_fsdp_parallelism=-1_ici_expert_parallelism=2/input_shardings.json

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -66,6 +66,24 @@
6666
"PartitionSpec": "P(('fsdp', 'expert'), None, None, None)"
6767
}
6868
},
69+
{
70+
"attention_op/arr: int8[1,4,2]": {
71+
"logic_axes": "Unknown",
72+
"PartitionSpec": "P(None, None)"
73+
}
74+
},
75+
{
76+
"attention_op/arr: bool[2,512,512]": {
77+
"logic_axes": "Unknown",
78+
"PartitionSpec": "P()"
79+
}
80+
},
81+
{
82+
"attention_op/arr: int8[1,2,4]": {
83+
"logic_axes": "Unknown",
84+
"PartitionSpec": "P(None, None)"
85+
}
86+
},
6987
{
7088
"attentions/out: bfloat16[192,2048,64,64]": {
7189
"logic_axes": "('activation_batch', 'activation_attn_length', 'activation_heads', 'activation_kv')",

tests/utils/sharding_info/qwen3-0.6b/tpu7x-16/slice_1/rule_default/input_shardings.json

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -60,6 +60,18 @@
6060
"PartitionSpec": "P('fsdp', None, None, None)"
6161
}
6262
},
63+
{
64+
"attention_op/arr: int8[1,4,4]": {
65+
"logic_axes": "Unknown",
66+
"PartitionSpec": "P(None, None)"
67+
}
68+
},
69+
{
70+
"attention_op/arr: int32[2048]": {
71+
"logic_axes": "Unknown",
72+
"PartitionSpec": "P(None,)"
73+
}
74+
},
6375
{
6476
"attentions/out: bfloat16[192,2048,16,128]": {
6577
"logic_axes": "('activation_batch', 'activation_attn_length', 'activation_heads', 'activation_kv')",

0 commit comments

Comments
 (0)