-
Notifications
You must be signed in to change notification settings - Fork 2k
/
Copy pathtile_gpu.ts
62 lines (55 loc) · 1.91 KB
/
tile_gpu.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
/**
* @license
* Copyright 2017 Google LLC. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
import {GPGPUProgram} from './gpgpu_math';
import {getCoordsDataType} from './shader_compiler';
/**
 * GPGPU program that repeats ("tiles") the input `A` along each of its axes.
 *
 * Output dimension `i` is `aShape[i] * reps[i]`. The generated shader snippet
 * reads the output coordinates and samples `A` at the coordinates produced by
 * `getSourceCoords`, which wraps every output coordinate with `imod` against
 * the matching input dimension (`imod`, `getA`, `setOutput` and
 * `getOutputCoords` are defined outside this file -- presumably supplied by
 * the shader compiler).
 */
export class TileProgram implements GPGPUProgram {
  variableNames = ['A'];
  outputShape: number[];
  userCode: string;
  rank: number;

  /**
   * @param aShape Shape of the input `A`.
   * @param reps Repetition count per axis, indexed in parallel with `aShape`
   *     (presumably the same length; this is not checked here).
   * @throws Error when `aShape` has more than 5 dimensions (raised by
   *     `getSourceCoords`).
   */
  constructor(aShape: number[], reps: number[]) {
    // Each output dimension is the input dimension scaled by its repeat count.
    const tiledShape: number[] =
        Array.from(aShape, (dim, axis) => dim * reps[axis]);
    this.outputShape = tiledShape;
    this.rank = tiledShape.length;

    // Coordinate type is resolved before the source coordinates are built,
    // so an unsupported rank fails in the same order as before.
    const dtype = getCoordsDataType(this.rank);
    const sourceCoords = getSourceCoords(aShape);

    // The shader text stays flush-left so the emitted string is unchanged.
    this.userCode = `
void main() {
${dtype} resRC = getOutputCoords();
setOutput(getA(${sourceCoords}));
}
`;
  }
}
/**
 * Builds the argument list used to sample the input inside the tile shader.
 *
 * Each output coordinate is wrapped as `imod(<coord>, <input dim>)`; the
 * pieces are joined with commas. A rank-1 input uses the bare `resRC`
 * variable, higher ranks use its `.x/.y/.z/.w/.u` components, and an empty
 * shape yields an empty string.
 *
 * @param aShape Shape of the input being tiled.
 * @returns Comma-separated coordinate expressions, one per input dimension.
 * @throws Error when `aShape` has more than 5 dimensions.
 */
function getSourceCoords(aShape: number[]): string {
  const rank = aShape.length;
  if (rank > 5) {
    throw Error(`Tile for rank ${rank} is not yet supported`);
  }

  // A rank-1 coordinate is addressed directly, with no component suffix.
  if (rank === 1) {
    return `imod(resRC, ${aShape[0]})`;
  }

  // One component name per supported axis, in axis order.
  const components: string[] = ['x', 'y', 'z', 'w', 'u'];
  const wrapped: string[] =
      components.slice(0, rank).map(
          (component, axis) => `imod(resRC.${component}, ${aShape[axis]})`);
  return wrapped.join(',');
}