// Copyright (c) Microsoft Corporation. All rights reserved. // Licensed under the MIT License. import {DataType} from '../../../wasm-common'; import {ShapeUtil} from '../../util'; import {ProgramUniform, ProgramUniformVariableInfo} from '../types'; /** * constant value for a workgroup size. * * We definitely can do further optimization in future, but for now we use 64. * * rule of thumb: Use [a workgroup size of] 64 unless you know what GPU you are targeting or that your workload * needs something different. * * from: https://surma.dev/things/webgpu/ **/ export const WORKGROUP_SIZE = 64; interface IndicesHelperTypes { /** * WGSL type of indices expression */ readonly indices: string; /** * WGSL type of a value */ readonly value: string; /** * WGSL type of storage type representing a value * * This is usually the same to `value`, but for some type (eg. bool), we need to use `u32` as storage type for * value type `vec4` */ readonly storage: string; /** * tensor type as represented in TensorView */ readonly tensor: number; } /** * A helper class for generating WGSL code for manipulating indices and data for a shader's input or output. * * This class is designed to offer a unified way to generate WGSL code for manipulating indices and data for a shader's * input or output. * * The following is a list of terminologies used in this class: * - `offset`: a uint32 value representing the offset of an element in the data buffer. * - `indices`: an abstraction of a multi-dimensional array's indices representing the data's index on each dimension. * - `value`: a value of a data element. * * Users are expected to create an instance of this class for each shader's input or output, and use the instance to * generate WGSL code for manipulating indices and data. The following 2 exported functions are for users to call to * create an instance of an indices helper: * - `inputVariable()`: create an indices helper instance for an input. * - `outputVariable()`: create an indices helper instance for an output. * - `internalVariable()`: create an indices helper instance for an internal variable. * * An indices helper instance contains helper functions for the following operations: * - access readonly basic information, including: `name`(the name of the input or output), `usage`(whether it's an * input, an output or an internal variable) and `shape`(the passed in shape). * - `type`: access readonly type information, including: `indices`(the type of indices), `value`(the type of value at * runtime), `storage`(the type of value at storage) and `tensor`(the tensor type as represented in TensorView). * - generate WGSL code for getting indices from offset. Use `offsetToIndices()` for WGSL code snippet to calculate * indices from offset, and use `indicesToOffset()` for WGSL code snippet to calculate offset from indices. * - to manipulate an instance of indices, use `setIndices()` and `getIndices()` to set and get the indices on an * indices variable. * - to manipulate data, use `set()`/`get()` to access data at the given indices from parameter list, use * `setByIndices()`/`getByIndices()` to access data at the given indices from an indices variable, and use * `setByOffset()`/`getByOffset()` to access data at the given offset. * - `impl`: get WGSL code of function implementation for the util functions mentioned above. */ export interface IndicesHelper { /** * get WGSL code of function implementation for the util functions. * */ readonly impl: () => string; /** * get type info */ readonly type: IndicesHelperTypes; /** * WGSL code of a expression for getting indices from offset. * * @param varOffset - a u32 expression representing the offset. * * @returns an `type.indices` expression */ readonly offsetToIndices: (varOffset: string) => string; /** * WGSL code of an `u32` expression for getting offset from indices. * * @param varIndices - a `type.indices` expression representing the indices. * * @returns an `u32` expression */ readonly indicesToOffset: (varIndices: string) => string; /** * WGSL code of an `u32` expression for getting original offset from broadcasted indices. * * @param varIndices - a `type.indices` expression representing the output indices. * @param output - output IndicesHelper. * * @returns an `u32` expression */ readonly broadcastedIndicesToOffset: (varIndices: string, output: IndicesHelper) => string; /** * WGSL code of generating an indices literal * * @param init - initial value. */ readonly indices: (...init: ReadonlyArray) => string; /** * WGSL code of a statement for setting indices. * * @param varIndices - a variable name for the indices. * @param idx - the index of the indices to set. can be a number or a string (WGSL `u32` expression). * @param value - the value to set. can be a number or a string (WGSL `u32` expression). * * @returns a WGSL statement */ readonly indicesSet: (varIndices: string, idx: number|string, value: number|string) => void; /** * WGSL code of an `u32` expression for getting indices. * * @param varIndices - a variable name for the indices. * @param idx - the index of the indices to get. can be a number or a string (WGSL `u32` expression). * * @returns an `u32` expression */ readonly indicesGet: (varIndices: string, idx: number|string) => string; /** * WGSL code for a statement for setting data at the given indices. * * @param indicesAndValue - an array of numbers or strings (WGSL `u32` expression) representing the indices, followed * by the value to set. This array should have exactly `shape.length + 1` elements. */ readonly set: (...indicesAndValue: ReadonlyArray) => string; /** * WGSL code for a statement for setting data at the given indices variable. * * @param varIndices - a variable name for the indices. * @param value - the value to set. should be a WGSL expression. */ readonly setByIndices: (varIndices: string, value: string) => string; /** * WGSL code for a statement for setting data at the given offset. * * @param offset - a number or a string (WGSL `u32` expression) representing the offset. * @param value - the value to set. should be a WGSL expression. */ readonly setByOffset: (offset: number|string, value: string) => string; /** * WGSL code for an expression for getting data at the given indices. * * @param indices - an array of numbers or strings (WGSL `u32` expression) representing the indices. */ readonly get: (...indices: ReadonlyArray) => string; /** * WGSL code for an expression for getting data at the given indices variable. * * @param varIndices - a variable name for the indices. */ readonly getByIndices: (varIndices: string) => string; /** * WGSL code for an expression for getting data at the given offset. * * @param offset - a number or a string (WGSL `u32` expression) representing the offset. */ readonly getByOffset: (offset: number|string) => string; /** * name of the data variable */ readonly name: string; /** * whether the helper is for an input, an output or an internal variable. */ readonly usage: 'input'|'output'|'internal'; /** * the rank of the input or output. */ readonly rank: number; /** * a string representing the variable name for the shape of the input or output. */ readonly shape: string; /** * a string representing the variable name for the strides of the input or output. */ readonly strides: string; } const getWgslMappedType = (type: number, components: 1|2|3|4): string|[string, string] => { if (components === 3) { throw new Error('vec3 has same alignment as vec4, use vec4 instead'); } // return type is [ storage type, runtime type ] or a single string for both switch (type) { case DataType.float16: return components > 1 ? `vec${components}` : 'f16'; case DataType.float: return components > 1 ? `vec${components}` : 'f32'; case DataType.int32: return components > 1 ? `vec${components}` : 'i32'; case DataType.uint32: return components > 1 ? `vec${components}` : 'u32'; case DataType.int64: if (components > 1) { throw new Error('currently not supported vecX of uint64 yet'); } return ['vec2', 'i32']; case DataType.uint64: if (components > 1) { throw new Error('currently not supported vecX of uint64 yet'); } return ['vec2', 'u32']; case DataType.bool: if (components !== 4) { throw new Error('bool must be vec4'); } return ['u32', 'vec4']; default: throw new Error(`Unknown data type: ${type}`); } }; export const tensorTypeToWsglStorageType = (type: DataType, components: 1|2|3|4 = 1) => { const mappedType = getWgslMappedType(type, components); return typeof mappedType === 'string' ? mappedType : mappedType[0]; }; export const tensorTypeToWsglValueType = (type: DataType, components: 1|2|3|4 = 1) => { const mappedType = getWgslMappedType(type, components); return typeof mappedType === 'string' ? mappedType : mappedType[1]; }; export const createTensorShapeVariables = (...dims: ReadonlyArray): ProgramUniform[] => { const programUniforms: ProgramUniform[] = []; dims.forEach(dim => { if (dim.length !== 0) { programUniforms.push( {type: DataType.uint32, data: dim}, {type: DataType.uint32, data: ShapeUtil.computeStrides(dim)}); } }); return programUniforms; }; /** * A helper function to get maximum vector size for specified data length * @param size */ export const getMaxComponents = (size: number) => { // we cannot use vec3 type since it has alignment of 16 bytes if (size % 4 === 0) { return 4; } else if (size % 2 === 0) { return 2; } return 1; }; /** * A helper function that initializes variable as a scalar or vector. e.g. f32(0) or vec4f(0,0,0,0) * @param dataType * @param components * @param value */ export const fillVector = (dataType = 'f32', components?: number, value = '0') => { if (!components || components === 1) { return `${dataType}(${value})`; } return `vec${components}<${dataType}>(${value})`; }; /** * A helper function that casts value or vector to f32 * @param dataType * @param components * @param value */ export const castToF32 = (dataType: string, components: number, value: string) => { if (dataType === 'f32') { return value; } if (components === 1) { return `f32(${value})`; } return `vec${components}(${value})`; }; /** * A helper function that returns scalar or sums all components of a vector * @param name * @param components */ export const sumVector = (name: string, components: number) => { if (components === 4) { return `(${name}.x + ${name}.y + ${name}.z + ${name}.w)`; } else if (components === 2) { return `(${name}.x + ${name}.y)`; } else if (components === 3) { return `(${name}.x + ${name}.y + ${name}.z)`; } return name; }; /** * A helper function that returns variable element at index. * @param name - the name of variable. * @param index - the index of variable element. * @param length - the length of variable. * @param type - the type of variable, optional. */ export const getElementAt = (name: string, index: number|string, length: number, type?: UniformDataElementType): string => { if (name.startsWith('uniforms.') && length > 4) { if (typeof (index) === 'string') { if (type === 'f16') { return `${name}[(${index}) / 8][(${index}) % 8 / 4][(${index}) % 8 % 4]`; } else { return `${name}[(${index}) / 4][(${index}) % 4]`; } } else { if (type === 'f16') { return `${name}[${Math.floor(index / 8)}][${Math.floor(index % 8 / 4)}][${index % 8 % 4}]`; } else { return `${name}[${Math.floor(index / 4)}][${index % 4}]`; } } } else { return length > 1 ? `${name}[${index}]` : name; } }; /** * A helper function to get a IndicesHelper for a given input or output. * * @param name - the name of the input or output. * @param tensorType - the tensor type of the input or output. * @param shapeOrRank - the tensor shape or the rank of the input or output. * @param usage - the usage of the indices helper. * @param components - indicates the number of components of each element. 1 for scalar, 2 for vec2, 3 for vec3, 4 for * vec4. */ const createIndicesHelper = (name: string, tensorType: number, shapeOrRank: number|readonly number[], usage: IndicesHelper['usage'], components: 1|2|3|4): IndicesHelper => { const useUniform = typeof shapeOrRank === 'number'; const rank = useUniform ? shapeOrRank : shapeOrRank.length; const rankIdentity = [...new Array(rank).keys()]; const indicesType = rank < 2 ? 'u32' : rank <= 4 ? `vec${rank}` : `array`; const mappedType = getWgslMappedType(tensorType, components); const valueType = typeof mappedType === 'string' ? mappedType : mappedType[1]; const storageType = typeof mappedType === 'string' ? mappedType : mappedType[0]; const type = {indices: indicesType, value: valueType, storage: storageType, tensor: tensorType}; const normalizeDim = (dim: number|string): string => typeof dim === 'string' ? dim : `${dim}u`; const implementationUsed = { offsetToIndices: false, indicesToOffset: false, broadcastedIndicesToOffset: false, set: false, setByIndices: false, get: false, getByIndices: false, }; const uniformPrefix = useUniform ? 'uniforms.' : ''; const shape = `${uniformPrefix}${name}_shape`; const strides = `${uniformPrefix}${name}_strides`; let o2iSnippet = ''; for (let i = 0; i < rank - 1; i++) { o2iSnippet += ` let dim${i} = current / ${getElementAt(strides, i, rank)}; let rest${i} = current % ${getElementAt(strides, i, rank)}; indices[${i}] = dim${i}; current = rest${i}; `; } o2iSnippet += `indices[${rank - 1}] = current;`; const offsetToIndicesImplementation = rank < 2 ? '' : ` fn o2i_${name}(offset: u32) -> ${type.indices} { var indices: ${type.indices}; var current = offset; ${o2iSnippet} return indices; }`; const offsetToIndices = (varOffset: string) => { implementationUsed.offsetToIndices = true; return rank < 2 ? varOffset : `o2i_${name}(${varOffset})`; }; const offsets: string[] = []; if (rank >= 2) { for (let i = rank - 1; i >= 0; i--) { offsets.push(`${getElementAt(strides, i, rank)} * (indices[${i}])`); } } const indicesToOffsetImplementation = rank < 2 ? '' : ` fn i2o_${name}(indices: ${type.indices}) -> u32 { return ${offsets.join('+')}; }`; const indicesToOffset = (varIndices: string) => { implementationUsed.indicesToOffset = true; return rank < 2 ? varIndices : `i2o_${name}(${varIndices})`; }; const indices = (...init: ReadonlyArray) => rank === 0 ? '0u' : `${type.indices}(${init.map(normalizeDim).join(',')})`; const indicesGet = (varIndices: string, idx: number|string) => { if (rank < 2) { return `${varIndices}`; } else { return `${getElementAt(varIndices, idx, rank)}`; } }; const indicesSet = (varIndices: string, idx: number|string, value: string) => { if (rank < 2) { return `${varIndices}=${value};`; } else { return `${getElementAt(varIndices, idx, rank)}=${value};`; } }; const broadcastedIndicesToOffsetImplementation: {[key: string]: string} = {}; const broadcastedIndicesToOffset = (varIndices: string, output: IndicesHelper) => { implementationUsed.broadcastedIndicesToOffset = true; const implKey = `${output.name}broadcastedIndicesTo${name}Offset`; if (implKey in broadcastedIndicesToOffsetImplementation) { return `${implKey}(${varIndices})`; } const offsets = []; for (let i = rank - 1; i >= 0; i--) { const idx = output.indicesGet('outputIndices', i + output.rank - rank); offsets.push(`${indicesGet(strides, i)} * (${idx} % ${indicesGet(shape, i)})`); } broadcastedIndicesToOffsetImplementation[implKey] = `fn ${implKey}(outputIndices: ${output.type.indices}) -> u32 { return ${offsets.length > 0 ? offsets.join('+') : '0u'}; }`; return `${implKey}(${varIndices})`; }; const setByOffset = (offset: number|string, value: string) => (() => { if (type.storage === type.value) { return `${name}[${offset}]=${value};`; } else if (type.storage === 'vec2' && type.value === 'i32') { // int64, components === 1 return `${name}[${offset}]=vec2(u32(${value}), select(0u, 0xFFFFFFFFu, ${value} < 0));`; } else if (type.storage === 'vec2' && type.value === 'u32') { // uint64, components === 1 return `${name}[${offset}]=vec2(u32(${value}), 0u);`; } else if (type.storage === 'u32' && type.value === 'vec4') { // bool, components === 4 return `${name}[${offset}]=dot(vec4(0x1, 0x100, 0x10000, 0x1000000), vec4(${value}));`; } else { throw new Error(`not supported combination of storage type ${type.storage} and value type ${type.value} yet`); } })(); const getByOffset = (offset: number|string) => (() => { if (type.storage === type.value) { return `${name}[${offset}]`; } else if (type.storage === 'vec2' && type.value === 'i32') { // int64, components === 1 return `i32(${name}[${offset}].x)`; } else if (type.storage === 'vec2' && type.value === 'u32') { // uint64, components === 1 return `u32(${name}[${offset}].x)`; } else if (type.storage === 'u32' && type.value === 'vec4') { // bool, components === 4 return `vec4(bool(${name}[${offset}] & 0xFFu), bool(${name}[${offset}] & 0xFF00u), bool(${name}[${ offset}] & 0xFF0000u), bool(${name}[${offset}] & 0xFF000000u))`; } else { throw new Error(`not supported combination of storage type ${type.storage} and value type ${type.value} yet`); } })(); const getByIndicesImplementation = rank < 2 ? '' : ` fn get_${name}ByIndices(indices: ${type.indices}) -> ${valueType} { return ${getByOffset(`i2o_${name}(indices)`)}; }`; const getImplementation = rank < 2 ? '' : (() => { const functionParams = rankIdentity.map(i => `d${i}: u32`).join(', '); const dimsParams = rankIdentity.map(i => `d${i}`).join(', '); return ` fn get_${name}(${functionParams}) -> ${valueType} { return get_${name}ByIndices(${indices(dimsParams)}); }`; })(); const get = (...indices: ReadonlyArray) => { if (indices.length !== rank) { throw new Error(`indices length must be ${rank}`); } const normalizedIndices = indices.map(normalizeDim).join(','); if (rank === 0) { return getByOffset('0u'); } else if (rank === 1) { return getByOffset(normalizedIndices[0]); } else { implementationUsed.get = true; implementationUsed.getByIndices = true; implementationUsed.indicesToOffset = true; return `get_${name}(${normalizedIndices})`; } }; const getByIndices = (varIndices: string) => { if (rank < 2) { return getByOffset(varIndices); } else { implementationUsed.getByIndices = true; implementationUsed.indicesToOffset = true; return `get_${name}ByIndices(${varIndices})`; } }; const setByIndicesImplementation = rank < 2 ? '' : ` fn set_${name}ByIndices(indices: ${type.indices}, value: ${valueType}) { ${setByOffset(`i2o_${name}(indices)`, 'value')} }`; const setImplementation = rank < 2 ? '' : (() => { const functionParams = rankIdentity.map(i => `d${i}: u32`).join(', '); const dimsParams = rankIdentity.map(i => `d${i}`).join(', '); return ` fn set_${name}(${functionParams}, value: ${valueType}) { set_${name}ByIndices(${indices(dimsParams)}, value); }`; })(); const set = (...indicesAndValue: ReadonlyArray) => { if (indicesAndValue.length !== rank + 1) { throw new Error(`indices length must be ${rank}`); } const value = indicesAndValue[rank]; if (typeof value !== 'string') { throw new Error('value must be string'); } const normalizedIndices = indicesAndValue.slice(0, rank).map(normalizeDim).join(','); if (rank === 0) { return setByOffset('0u', value); } else if (rank === 1) { return setByOffset(normalizedIndices[0], value); } else { implementationUsed.set = true; implementationUsed.setByIndices = true; implementationUsed.indicesToOffset = true; return `set_${name}(${normalizedIndices}, ${value})`; } }; const setByIndices = (varIndices: string, value: string) => { if (rank < 2) { return setByOffset(varIndices, value); } else { implementationUsed.setByIndices = true; implementationUsed.indicesToOffset = true; return `set_${name}ByIndices(${varIndices}, ${value});`; } }; const impl = () => { const impls = []; let needShapeStrides = false; if (implementationUsed.offsetToIndices) { impls.push(offsetToIndicesImplementation); needShapeStrides = true; } if (implementationUsed.indicesToOffset) { impls.push(indicesToOffsetImplementation); needShapeStrides = true; } if (implementationUsed.broadcastedIndicesToOffset) { Object.values(broadcastedIndicesToOffsetImplementation).forEach(impl => impls.push(impl)); needShapeStrides = true; } if (implementationUsed.set) { impls.push(setImplementation); needShapeStrides = true; } if (implementationUsed.setByIndices) { impls.push(setByIndicesImplementation); needShapeStrides = true; } if (implementationUsed.get) { impls.push(getImplementation); needShapeStrides = true; } if (implementationUsed.getByIndices) { impls.push(getByIndicesImplementation); needShapeStrides = true; } if (!useUniform && needShapeStrides) { impls.unshift( `const ${shape} = ${type.indices}(${shapeOrRank.join(',')});`, `const ${strides} = ${type.indices}(${ShapeUtil.computeStrides(shapeOrRank).join(',')});`); } return impls.join('\n'); }; return { impl, type, offsetToIndices, indicesToOffset, broadcastedIndicesToOffset, indices, indicesGet, indicesSet, set, setByOffset, setByIndices, get, getByOffset, getByIndices, // isVec4, usage, name, strides, shape, rank }; }; /** * Create a IndicesHelper for an input. * * @param name - the name of the input. * @param type - the tensor type of the input. * @param shapeOrRank - the tensor shape or the rank of the input. * @param components - the number of components of the input. available values are 1, 2, 3, 4. default is 1. * @returns an IndicesHelper for the input. */ export const inputVariable = (name: string, type: number, shapeOrRank: number|readonly number[], components: 1|2|3|4 = 1): IndicesHelper => createIndicesHelper(name, type, shapeOrRank, 'input', components); /** * Create a IndicesHelper for an output. * * @param name - the name of the output. * @param type - the tensor type of the output. * @param shapeOrRank - the tensor shape or the rank of the output. * @param components - the number of components of the output. available values are 1, 2, 3, 4. default is 1. * @returns an IndicesHelper for the output. */ export const outputVariable = (name: string, type: number, shapeOrRank: number|readonly number[], components: 1|2|3|4 = 1): IndicesHelper => createIndicesHelper(name, type, shapeOrRank, 'output', components); /** * Create a IndicesHelper for an internal variable. * * @param name - the name of the variable. * @param type - the tensor type of the variable. * @param shapeOrRank - the tensor shape or the rank of the variable. * @param components - the number of components of the variable. available values are 1, 2, 3, 4. default is 1. * @returns an IndicesHelper for the variable. */ export const internalVariable = (name: string, type: number, shapeOrRank: number|readonly number[], components: 1|2|3|4 = 1): IndicesHelper => createIndicesHelper(name, type, shapeOrRank, 'internal', components); export type UniformDataElementType = 'u32'|'f16'|'f32'|'i32'; export type UniformsArrayType = Array<{name: string; type: UniformDataElementType; length?: number}>; /** * A ShaderHelper is a helper class for generating WGSL code. */ export interface ShaderHelper { /** * A helper function to generate the start of main function in WGSL source code. * * @example * const getShaderSource = (shaderHelper: ShaderHelper) => ` * ... * * ${shaderHelper.mainStart()} * // your code here inside main() function * ... * } * `; * * @param workgroupSize - an optional workgroup size. default is WORKGROUP_SIZE. */ mainStart(workgroupSize?: number|[number, number, number]): string; /** * A helper function to generate the code snippet for guarding against out-of-bounds size. * * @example * const getShaderSource = (shaderHelper: ShaderHelper) => ` * ... * * ${shaderHelper.mainStart()} * ${shaderHelper.guardAgainstOutOfBoundsWorkgroupSizes(outputSize)} * * // your code here inside main() function * ... * } * `; * * @param size - the size of the data to guard against. can be a number or a string (WGSL `u32` expression). */ guardAgainstOutOfBoundsWorkgroupSizes(size: unknown): string; /** * A helper function to generate the code snippet for declaring multiple inputs or outputs. * * @param variables - an array of IndicesHelper for the variables. */ declareVariables(...variables: IndicesHelper[]): string; /** * A helper function to register one uniform. Can be called multiple times to register multiple uniforms. * * @param name - the name of the uniform. * @param type - the type of the uniform. * @param length - the length of the uniform, default to 1 when it is not provided. */ registerUniform(name: string, type: string, length?: number): ShaderHelper; /** * A helper function to register multiple uniforms. Can be called multiple times to register multiple uniforms. * * @param uniforms - an array of uniforms. Each element of the array is an object with 2 properties: `name` and * `type`. */ registerUniforms(uniforms: UniformsArrayType): ShaderHelper; /** * A helper function to register multiple internal variables. Can be called multiple times to register multiple * internal variables. * * @param variables - an array of IndicesHelper for the variables. */ registerInternalVariables(...variables: IndicesHelper[]): ShaderHelper; } class ShaderHelperImpl implements ShaderHelper { constructor(private normalizedDispatchGroup: [number, number, number], private limits: GPUSupportedLimits) {} guardAgainstOutOfBoundsWorkgroupSizes(size: number|string): string { // Guard against out-of-bounds work group sizes const sizeInCode = typeof size === 'number' ? `${size}u` : size; return `if (global_idx >= ${sizeInCode}) { return; }`; } mainStart(workgroupSize: number|[number, number, number] = WORKGROUP_SIZE) { const workgroupSizeX = typeof workgroupSize === 'number' ? workgroupSize : workgroupSize[0]; const workgroupSizeY = typeof workgroupSize === 'number' ? 1 : workgroupSize[1]; const workgroupSizeZ = typeof workgroupSize === 'number' ? 1 : workgroupSize[2]; if (workgroupSizeX > this.limits.maxComputeWorkgroupSizeX || workgroupSizeY > this.limits.maxComputeWorkgroupSizeY || workgroupSizeZ > this.limits.maxComputeWorkgroupSizeZ) { throw new Error(`workgroup size [${workgroupSizeX}, ${workgroupSizeY}, ${ workgroupSizeZ}] exceeds the maximum workgroup size [${this.limits.maxComputeWorkgroupSizeX}, ${ this.limits.maxComputeWorkgroupSizeY}, ${this.limits.maxComputeWorkgroupSizeZ}].`); } if (workgroupSizeX * workgroupSizeY * workgroupSizeZ > this.limits.maxComputeInvocationsPerWorkgroup) { throw new Error(`workgroup size [${workgroupSizeX}, ${workgroupSizeY}, ${ workgroupSizeZ}] exceeds the maximum workgroup invocations ${ this.limits.maxComputeInvocationsPerWorkgroup}.`); } const is1DimensionDispatch = this.normalizedDispatchGroup[1] === 1 && this.normalizedDispatchGroup[2] === 1; const paramList = is1DimensionDispatch ? `@builtin(global_invocation_id) global_id : vec3, @builtin(workgroup_id) workgroup_id : vec3, @builtin(local_invocation_id) local_id : vec3` : `@builtin(global_invocation_id) global_id : vec3, @builtin(local_invocation_id) local_id : vec3, @builtin(local_invocation_index) local_idx : u32, @builtin(workgroup_id) workgroup_id : vec3, @builtin(num_workgroups) num_workgroups : vec3`; const globalIdxDefinition = is1DimensionDispatch ? 'let global_idx = global_id.x; let local_idx = local_id.x;' : `let global_idx = (workgroup_id.z * num_workgroups[0] * num_workgroups[1] + workgroup_id.y * num_workgroups[0] + workgroup_id.x) * ${ workgroupSizeX * workgroupSizeY * workgroupSizeZ}u + local_idx;`; return `@compute @workgroup_size(${workgroupSizeX}, ${workgroupSizeY}, ${workgroupSizeZ}) fn main(${paramList}) { ${globalIdxDefinition} `; } private appendVariableUniforms(variable: IndicesHelper): void { if (variable.rank !== 0) { if (variable.shape.startsWith('uniforms.')) { this.uniforms.push({name: variable.shape.replace('uniforms.', ''), type: 'u32', length: variable.rank}); } if (variable.strides.startsWith('uniforms.')) { this.uniforms.push({name: variable.strides.replace('uniforms.', ''), type: 'u32', length: variable.rank}); } } } private declareVariable(variable: IndicesHelper, bindingIndex: number): string { if (variable.usage === 'internal') { throw new Error('cannot use internal variable with declareVariable(). use registerInternalVariables() instead.'); } this.variables.push(variable); this.appendVariableUniforms(variable); const access = variable.usage === 'input' ? 'read' : 'read_write'; const storageType = variable.type.storage; return `@group(0) @binding(${bindingIndex}) var ${variable.name}: array<${storageType}>;`; } declareVariables(...variables: IndicesHelper[]): string { return variables.map(v => this.declareVariable(v, this.variableIndex++)).join('\n'); } private registerInternalVariable(variable: IndicesHelper): void { if (variable.usage !== 'internal') { throw new Error( 'cannot use input or output variable with registerInternalVariable(). use declareVariables() instead.'); } this.internalVariables.push(variable); this.appendVariableUniforms(variable); } registerInternalVariables(...variables: IndicesHelper[]): ShaderHelper { variables.forEach(v => this.registerInternalVariable(v)); return this; } registerUniform(name: string, type: UniformDataElementType, length = 1): ShaderHelper { this.uniforms.push({name, type, length}); return this; } registerUniforms(additionalUniforms: UniformsArrayType): ShaderHelper { this.uniforms = this.uniforms.concat(additionalUniforms); return this; } private internalVariables: IndicesHelper[] = []; private variables: IndicesHelper[] = []; private uniforms: UniformsArrayType = []; private uniformDeclaration(): string { if (this.uniforms.length === 0) { return ''; } const uniformSnippets: string[] = []; for (const {name, type, length} of this.uniforms) { if (length && length > 4) { if (type === 'f16') { uniformSnippets.push(`@align(16) ${name}:array, ${Math.ceil(length / 8)}>`); } else { uniformSnippets.push(`${name}:array, ${Math.ceil(length / 4)}>`); } } else { const typeTemp = length == null || length === 1 ? type : `vec${length}<${type}>`; uniformSnippets.push(`${name}:${typeTemp}`); } } return ` struct Uniforms { ${uniformSnippets.join(', ')} }; @group(0) @binding(${this.variableIndex}) var uniforms: Uniforms;`; } private variableIndex = 0; /** * Get additional implementation that needs to be added to the shader source. */ get additionalImplementations(): string { return this.uniformDeclaration() + this.variables.map(i => i.impl()).join('\n') + this.internalVariables.map(i => i.impl()).join('\n'); } /** * Get the variable info of the shader program. */ get variablesInfo(): ProgramUniformVariableInfo[]|undefined { if (this.uniforms.length === 0) { return undefined; } const uniformWgslTypeToDataType = (type: UniformDataElementType) => ([DataType.uint32, DataType.float16, DataType.float, DataType.int32][['u32', 'f16', 'f32', 'i32'].indexOf(type)]); return this.uniforms.map(u => ([uniformWgslTypeToDataType(u.type), u.length ?? 1])); } } export const createShaderHelper = (dispatchGroup: [number, number, number], limits: GPUSupportedLimits) => new ShaderHelperImpl(dispatchGroup, limits); /** * This function comes from https://github.com/tensorflow/tfjs/blob/master/tfjs-core/src/ops/broadcast_util.ts#L18-L40 * Returns the dimensions in the input shape that are broadcasted to * produce the provided output shape. * * The returned dimensions are 0-indexed and sorted. An example: * inShape = [4, 1, 3] * outShape = [5, 4, 3, 3] * result = [1]. Dimension 1 (2nd dimension of input) gets broadcasted 1 => 3. */ export const getBroadcastDims = (inShape: readonly number[], outShape: readonly number[]): number[] => { const inRank = inShape.length; const dims: number[] = []; for (let i = 0; i < inRank; i++) { const dim = inRank - 1 - i; const a = inShape[dim] || 1; const b = outShape[outShape.length - 1 - i] || 1; if (b > 1 && a === 1) { dims.unshift(dim); } } return dims; };