Commit 7c90850
authored
ggml-webgpu: improve MTP inference by using mat-vec path for small batches (ggml-org#24811)
* ggml-webgpu: improve small batches decoding
* Add barrier to the NUM_COLS loop in mul-mat-vec1
parent 035cd8f commit 7c90850
8 files changed
Lines changed: 687 additions & 596 deletions
File tree
- ggml/src/ggml-webgpu
- wgsl-shaders
- tests
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
905 | 905 | | |
906 | 906 | | |
907 | 907 | | |
| 908 | + | |
908 | 909 | | |
909 | 910 | | |
910 | 911 | | |
911 | 912 | | |
912 | | - | |
| 913 | + | |
913 | 914 | | |
914 | 915 | | |
915 | 916 | | |
| |||
919 | 920 | | |
920 | 921 | | |
921 | 922 | | |
| 923 | + | |
922 | 924 | | |
923 | 925 | | |
924 | 926 | | |
| |||
993 | 995 | | |
994 | 996 | | |
995 | 997 | | |
| 998 | + | |
996 | 999 | | |
997 | 1000 | | |
998 | 1001 | | |
999 | 1002 | | |
1000 | | - | |
| 1003 | + | |
1001 | 1004 | | |
1002 | 1005 | | |
1003 | 1006 | | |
| |||
1007 | 1010 | | |
1008 | 1011 | | |
1009 | 1012 | | |
| 1013 | + | |
1010 | 1014 | | |
1011 | 1015 | | |
1012 | 1016 | | |
| |||
1107 | 1111 | | |
1108 | 1112 | | |
1109 | 1113 | | |
1110 | | - | |
| 1114 | + | |
1111 | 1115 | | |
1112 | 1116 | | |
1113 | 1117 | | |
| |||
1889 | 1893 | | |
1890 | 1894 | | |
1891 | 1895 | | |
| 1896 | + | |
1892 | 1897 | | |
1893 | 1898 | | |
1894 | 1899 | | |
| |||
2004 | 2009 | | |
2005 | 2010 | | |
2006 | 2011 | | |
| 2012 | + | |
2007 | 2013 | | |
2008 | 2014 | | |
2009 | 2015 | | |
| |||
2421 | 2427 | | |
2422 | 2428 | | |
2423 | 2429 | | |
| 2430 | + | |
2424 | 2431 | | |
2425 | 2432 | | |
2426 | 2433 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
1418 | 1418 | | |
1419 | 1419 | | |
1420 | 1420 | | |
1421 | | - | |
1422 | | - | |
1423 | | - | |
| 1421 | + | |
| 1422 | + | |
| 1423 | + | |
1424 | 1424 | | |
1425 | 1425 | | |
1426 | 1426 | | |
| 1427 | + | |
1427 | 1428 | | |
1428 | 1429 | | |
1429 | 1430 | | |
| 1431 | + | |
1430 | 1432 | | |
1431 | 1433 | | |
1432 | 1434 | | |
| |||
1442 | 1444 | | |
1443 | 1445 | | |
1444 | 1446 | | |
1445 | | - | |
| 1447 | + | |
1446 | 1448 | | |
1447 | 1449 | | |
1448 | 1450 | | |
| |||
1456 | 1458 | | |
1457 | 1459 | | |
1458 | 1460 | | |
1459 | | - | |
| 1461 | + | |
1460 | 1462 | | |
1461 | 1463 | | |
1462 | 1464 | | |
| |||
1482 | 1484 | | |
1483 | 1485 | | |
1484 | 1486 | | |
1485 | | - | |
| 1487 | + | |
1486 | 1488 | | |
1487 | 1489 | | |
1488 | 1490 | | |
| |||
1529 | 1531 | | |
1530 | 1532 | | |
1531 | 1533 | | |
1532 | | - | |
| 1534 | + | |
1533 | 1535 | | |
1534 | 1536 | | |
1535 | 1537 | | |
| |||
3691 | 3693 | | |
3692 | 3694 | | |
3693 | 3695 | | |
3694 | | - | |
3695 | | - | |
| 3696 | + | |
| 3697 | + | |
3696 | 3698 | | |
3697 | 3699 | | |
3698 | 3700 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
103 | 103 | | |
104 | 104 | | |
105 | 105 | | |
106 | | - | |
| 106 | + | |
107 | 107 | | |
108 | 108 | | |
109 | 109 | | |
| |||
126 | 126 | | |
127 | 127 | | |
128 | 128 | | |
129 | | - | |
| 129 | + | |
130 | 130 | | |
131 | 131 | | |
132 | 132 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
91 | 91 | | |
92 | 92 | | |
93 | 93 | | |
94 | | - | |
| 94 | + | |
95 | 95 | | |
96 | 96 | | |
97 | 97 | | |
98 | 98 | | |
99 | 99 | | |
100 | 100 | | |
101 | | - | |
102 | | - | |
103 | | - | |
104 | | - | |
105 | | - | |
106 | | - | |
107 | | - | |
| 101 | + | |
108 | 102 | | |
109 | | - | |
| 103 | + | |
| 104 | + | |
| 105 | + | |
| 106 | + | |
| 107 | + | |
| 108 | + | |
| 109 | + | |
110 | 110 | | |
111 | | - | |
112 | | - | |
113 | | - | |
114 | | - | |
115 | | - | |
116 | | - | |
117 | | - | |
118 | | - | |
119 | | - | |
120 | | - | |
121 | | - | |
| 111 | + | |
| 112 | + | |
| 113 | + | |
| 114 | + | |
| 115 | + | |
| 116 | + | |
| 117 | + | |
| 118 | + | |
| 119 | + | |
| 120 | + | |
| 121 | + | |
| 122 | + | |
| 123 | + | |
122 | 124 | | |
123 | 125 | | |
124 | 126 | | |
125 | | - | |
126 | | - | |
127 | | - | |
| 127 | + | |
| 128 | + | |
| 129 | + | |
128 | 130 | | |
129 | | - | |
| 131 | + | |
130 | 132 | | |
131 | | - | |
| 133 | + | |
132 | 134 | | |
133 | | - | |
134 | | - | |
135 | | - | |
136 | | - | |
| 135 | + | |
| 136 | + | |
| 137 | + | |
| 138 | + | |
| 139 | + | |
| 140 | + | |
| 141 | + | |
| 142 | + | |
| 143 | + | |
137 | 144 | | |
138 | | - | |
139 | 145 | | |
140 | | - | |
141 | | - | |
142 | | - | |
| 146 | + | |
| 147 | + | |
| 148 | + | |
| 149 | + | |
| 150 | + | |
| 151 | + | |
| 152 | + | |
| 153 | + | |
| 154 | + | |
143 | 155 | | |
144 | | - | |
145 | | - | |
146 | | - | |
147 | | - | |
148 | | - | |
149 | 156 | | |
150 | | - | |
151 | 157 | | |
0 commit comments