Skip to content

Commit 033a72f

Browse files
committed
Limit to gen-12lp
1 parent 89201c3 commit 033a72f

File tree

2 files changed

+6
-2
lines changed

2 files changed

+6
-2
lines changed

js/web/lib/wasm/jsep/webgpu/ops/matmulnbits.ts

+5-1
Original file line numberDiff line numberDiff line change
@@ -436,7 +436,11 @@ export const createMatMulNBitsBlockSize32ProgramInfo = (
436436

437437
export const matMulNBits = (context: ComputeContext, attributes: MatMulNBitsAttributes): void => {
438438
validateInputs(context.inputs, attributes);
439-
if (attributes.blockSize === 32 && context.adapterInfo.isVendor('intel')) {
439+
if (
440+
attributes.blockSize === 32 &&
441+
context.adapterInfo.isVendor('intel') &&
442+
context.adapterInfo.isArchitecture('gen-12lp')
443+
) {
440444
context.compute(createMatMulNBitsBlockSize32ProgramInfo(context.inputs, attributes));
441445
} else {
442446
context.compute(createMatMulNBitsProgramInfo(context.inputs, attributes));

js/web/lib/wasm/jsep/webgpu/types.ts

+1-1
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ export enum GpuDataType {
1515
}
1616
export type GpuDataId = number;
1717

18-
export type GpuArchitecture = 'ampere';
18+
export type GpuArchitecture = 'ampere' | 'gen-12lp';
1919
export type GpuVendor = 'amd' | 'intel' | 'nvidia';
2020
export interface AdapterInfo {
2121
isArchitecture: (architecture: GpuArchitecture) => boolean;

0 commit comments

Comments
 (0)