Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Sign up
Appearance settings
This repository was archived by the owner on Aug 15, 2019. It is now read-only.

Commit 5cc5267

Browse files
Fuse prelu activation. (#1867)
FEATURE PERF
1 parent 5aa35a3 commit 5cc5267

File tree

8 files changed

+454
-108
lines changed

8 files changed

+454
-108
lines changed

‎src/backends/backend.ts‎

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,7 @@
1616
*/
1717

1818
import {Conv2DInfo, Conv3DInfo} from '../ops/conv_util';
19-
import {Activation} from '../ops/fused_util';
19+
import {Activation, FusedBatchMatMulConfig} from '../ops/fused_util';
2020
import {Backend, DataId, Scalar, Tensor, Tensor1D, Tensor2D, Tensor3D, Tensor4D, Tensor5D} from '../tensor';
2121
import {BackendValues, DataType, PixelData, Rank, ShapeMap} from '../types';
2222

@@ -132,8 +132,8 @@ export class KernelBackend implements TensorStorage, Backend, BackendTimer {
132132
}
133133

134134
fusedBatchMatMul(
135-
a: Tensor3D, b: Tensor3D, transposeA: boolean, transposeB: boolean,
136-
bias?: Tensor, activation?: Activation): Tensor3D {
135+
{a, b, transposeA, transposeB, bias, activation, preluActivationWeights}:
136+
FusedBatchMatMulConfig): Tensor3D {
137137
throw new Error('Not yet implemented');
138138
}
139139

@@ -413,7 +413,7 @@ export class KernelBackend implements TensorStorage, Backend, BackendTimer {
413413

414414
fusedConv2d(
415415
x: Tensor4D, filter: Tensor4D, convInfo: Conv2DInfo, bias?: Tensor4D,
416-
activation?: Activation): Tensor4D {
416+
activation?: Activation, preluActivationWeights?: Tensor): Tensor4D {
417417
throw new Error('Not yet implemented');
418418
}
419419

‎src/backends/cpu/backend_cpu.ts‎

Lines changed: 14 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@ import * as broadcast_util from '../../ops/broadcast_util';
2626
import * as concat_util from '../../ops/concat_util';
2727
import {Conv2DInfo, Conv3DInfo} from '../../ops/conv_util';
2828
import * as erf_util from '../../ops/erf_util';
29-
import {Activation} from '../../ops/fused_util';
29+
import {Activation, FusedBatchMatMulConfig} from '../../ops/fused_util';
3030
import * as gather_nd_util from '../../ops/gather_nd_util';
3131
import * as ops from '../../ops/ops';
3232
import {buffer, scalar, tensor, tensor3d, tensor4d} from '../../ops/ops';
@@ -47,11 +47,14 @@ import {topkImpl} from '../topk_impl';
4747
import {whereImpl} from '../where_impl';
4848

4949
function mapActivation(
50-
backend: MathBackendCPU, activation: Activation, x: Tensor): Tensor {
50+
backend: MathBackendCPU, x: Tensor, activation: Activation,
51+
preluActivationWeights?: Tensor): Tensor {
5152
if (activation === 'linear') {
5253
return backend.linear(x);
5354
} else if (activation === 'relu') {
5455
return backend.relu(x);
56+
} else if (activation === 'prelu') {
57+
return backend.prelu(x, preluActivationWeights);
5558
}
5659
throw new Error(
5760
`Activation ${activation} has not been implemented for the CPU backend.`);
@@ -522,14 +525,16 @@ export class MathBackendCPU implements KernelBackend {
522525
}
523526

524527
fusedBatchMatMul(
525-
a: Tensor3D, b: Tensor3D, transposeA: boolean, transposeB: boolean,
526-
bias?: Tensor, activation?: Activation): Tensor3D {
528+
{a, b, transposeA, transposeB, bias, activation, preluActivationWeights}:
529+
FusedBatchMatMulConfig): Tensor3D {
527530
let result = this.batchMatMul(a, b, transposeA, transposeB);
528531
if (bias) {
529532
result = this.add(result, bias) as Tensor3D;
530533
}
531534
if (activation) {
532-
result = mapActivation(this, activation, result) as Tensor3D;
535+
result =
536+
mapActivation(this, result, activation, preluActivationWeights) as
537+
Tensor3D;
533538
}
534539
return result;
535540
}
@@ -1515,14 +1520,16 @@ export class MathBackendCPU implements KernelBackend {
15151520

15161521
fusedConv2d(
15171522
x: Tensor4D, filter: Tensor4D, convInfo: Conv2DInfo, bias?: Tensor4D,
1518-
activation?: Activation): Tensor4D {
1523+
activation?: Activation, preluActivationWeights?: Tensor): Tensor4D {
15191524
let result = this.conv2d(x, filter, convInfo);
15201525

15211526
if (bias) {
15221527
result = this.add(result, bias) as Tensor4D;
15231528
}
15241529
if (activation) {
1525-
result = mapActivation(this, activation, result) as Tensor4D;
1530+
result =
1531+
mapActivation(this, result, activation, preluActivationWeights) as
1532+
Tensor4D;
15261533
}
15271534
return result;
15281535
}

‎src/backends/webgl/backend_webgl.ts‎

Lines changed: 49 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ import * as array_ops_util from '../../ops/array_ops_util';
2828
import * as axis_util from '../../ops/axis_util';
2929
import {computeOutShape} from '../../ops/concat_util';
3030
import {Conv2DInfo, Conv3DInfo} from '../../ops/conv_util';
31-
import {Activation} from '../../ops/fused_util';
31+
import {Activation, FusedBatchMatMulConfig} from '../../ops/fused_util';
3232
import * as gather_nd_util from '../../ops/gather_nd_util';
3333
import * as reduce_util from '../../ops/reduce_util';
3434
import * as scatter_nd_util from '../../ops/scatter_nd_util';
@@ -174,6 +174,11 @@ function mapActivationToShaderProgram(
174174
return unary_packed_op.RELU;
175175
}
176176
return unary_op.RELU;
177+
} else if (activation === 'prelu') {
178+
if (packed) {
179+
return binaryop_packed_gpu.PRELU;
180+
}
181+
return binaryop_gpu.PRELU;
177182
}
178183
throw new Error(`Activation ${
179184
activation} has not been implemented for the WebGL backend.`);
@@ -865,26 +870,30 @@ export class MathBackendWebGL implements KernelBackend {
865870
}
866871

867872
fusedBatchMatMul(
868-
a: Tensor3D, b: Tensor3D, transposeA: boolean, transposeB: boolean,
869-
bias?: Tensor,activation?: Activation): Tensor3D {
873+
{a, b, transposeA, transposeB, bias, activation, preluActivationWeights}:
874+
FusedBatchMatMulConfig): Tensor3D {
870875
const outerShapeA = transposeA ? a.shape[2] : a.shape[1];
871876
const outerShapeB = transposeB ? b.shape[1] : b.shape[2];
872877
const [batch, , ] = a.shape;
873878

874879
const dtype = upcastType(a.dtype, b.dtype);
875880

876881
const hasBias = bias != null;
882+
const hasPreluActivationWeights = preluActivationWeights != null;
877883
const fusedActivation =
878884
activation ? mapActivationToShaderProgram(activation, true) : null;
879885
const program = new MatMulPackedProgram(
880886
a.shape, [batch, outerShapeA, outerShapeB], transposeA, transposeB,
881-
hasBias, fusedActivation);
887+
hasBias, fusedActivation, hasPreluActivationWeights);
882888
const output =
883889
this.makePackedTensor(program.outputShape, dtype) as Tensor3D;
884890
const inputs: TensorHandle[] = [a, b];
885891
if (bias) {
886892
inputs.push(bias);
887893
}
894+
if (preluActivationWeights) {
895+
inputs.push(preluActivationWeights);
896+
}
888897
return this.compileAndRun<Tensor3D>(program, inputs, output);
889898
}
890899

@@ -1819,7 +1828,7 @@ export class MathBackendWebGL implements KernelBackend {
18191828

18201829
private conv2dByMatMul(
18211830
x: Tensor4D, filter: Tensor4D, convInfo: Conv2DInfo, bias?: Tensor4D,
1822-
activation?: Activation): Tensor4D {
1831+
activation?: Activation, preluActivationWeights?: Tensor): Tensor4D {
18231832
// Reshapes conv2D input to 2D tensors, uses matMul and then reshape the
18241833
// result from 2D to 4D.
18251834
const xShape = x.shape;
@@ -1850,9 +1859,15 @@ export class MathBackendWebGL implements KernelBackend {
18501859
Tensor3D;
18511860

18521861
return this.reshape<Rank.R4>(
1853-
this.fusedBatchMatMul(
1854-
xReshaped, filterReshaped, transposeA, transposeB, bias,
1855-
activation),
1862+
this.fusedBatchMatMul({
1863+
a: xReshaped,
1864+
b: filterReshaped,
1865+
transposeA,
1866+
transposeB,
1867+
bias,
1868+
activation,
1869+
preluActivationWeights
1870+
}),
18561871
convInfo.outShape);
18571872
}
18581873

@@ -1888,8 +1903,15 @@ export class MathBackendWebGL implements KernelBackend {
18881903
this.reshape(filter, [1, convInfo.inChannels, convInfo.outChannels]) as
18891904
Tensor3D;
18901905

1891-
const pointwiseConv = this.fusedBatchMatMul(
1892-
xReshaped, filterReshaped, transposeA, transposeB, bias, activation);
1906+
const pointwiseConv = this.fusedBatchMatMul({
1907+
a: xReshaped,
1908+
b: filterReshaped,
1909+
transposeA,
1910+
transposeB,
1911+
bias,
1912+
activation,
1913+
preluActivationWeights
1914+
});
18931915
const pointwiseConvTexData = this.texData.get(pointwiseConv.dataId);
18941916
util.assert(
18951917
pointwiseConvTexData.isPacked,
@@ -1906,7 +1928,7 @@ export class MathBackendWebGL implements KernelBackend {
19061928

19071929
private conv2dWithIm2Row(
19081930
x: Tensor4D, filter: Tensor4D, convInfo: Conv2DInfo, bias?: Tensor4D,
1909-
activation?: Activation): Tensor4D {
1931+
activation?: Activation, preluActivationWeights?: Tensor): Tensor4D {
19101932
// Rearranges conv2d input so each block to be convolved over forms the
19111933
// column of a new matrix with shape [filterWidth * filterHeight *
19121934
// inChannels, outHeight * outWidth]. The filter is also rearranged so each
@@ -1938,42 +1960,53 @@ export class MathBackendWebGL implements KernelBackend {
19381960
]) as Tensor3D;
19391961

19401962
const hasBias = bias != null;
1963+
const hasPreluActivationWeights = preluActivationWeights != null;
19411964
const fusedActivation =
19421965
activation ? mapActivationToShaderProgram(activation, true) : null;
19431966
const matmulProgram = new MatMulPackedProgram(
19441967
im2Col.shape, [1, numCols, convInfo.outChannels], transposeA,
1945-
transposeB, hasBias, fusedActivation);
1968+
transposeB, hasBias, fusedActivation, hasPreluActivationWeights);
19461969
const inputs: TensorHandle[] = [im2Col, w2Row];
19471970
if (bias) {
19481971
inputs.push(bias);
19491972
}
1973+
if (hasPreluActivationWeights) {
1974+
inputs.push(preluActivationWeights);
1975+
}
19501976
const product = this.compileAndRun<Tensor4D>(matmulProgram, inputs);
19511977

19521978
return product.reshape([1, outHeight, outWidth, convInfo.outChannels]);
19531979
}
19541980

19551981
fusedConv2d(
19561982
x: Tensor4D, filter: Tensor4D, convInfo: Conv2DInfo, bias?: Tensor4D,
1957-
activation?: Activation): Tensor4D {
1983+
activation?: Activation, preluActivationWeights?: Tensor): Tensor4D {
19581984
if (convInfo.filterHeight === 1 && convInfo.filterWidth === 1 &&
19591985
convInfo.dilationHeight === 1 && convInfo.dilationWidth === 1 &&
19601986
convInfo.strideHeight === 1 && convInfo.strideWidth === 1 &&
19611987
(convInfo.padInfo.type === 'SAME' ||
19621988
convInfo.padInfo.type === 'VALID')) {
1963-
return this.conv2dByMatMul(x, filter, convInfo, bias, activation);
1989+
return this.conv2dByMatMul(
1990+
x, filter, convInfo, bias, activation, preluActivationWeights);
19641991
}
19651992
if (ENV.getBool('WEBGL_CONV_IM2COL') && x.shape[0] === 1) {
1966-
return this.conv2dWithIm2Row(x, filter, convInfo, bias, activation);
1993+
return this.conv2dWithIm2Row(
1994+
x, filter, convInfo, bias, activation, preluActivationWeights);
19671995
}
19681996

19691997
const hasBias = bias != null;
1998+
const hasPreluActivationWeights = preluActivationWeights != null;
19701999
const fusedActivation =
19712000
activation ? mapActivationToShaderProgram(activation, false) : null;
1972-
const program = new Conv2DProgram(convInfo, hasBias, fusedActivation);
2001+
const program = new Conv2DProgram(
2002+
convInfo, hasBias, fusedActivation, hasPreluActivationWeights);
19732003
const inputs: TensorHandle[] = [x, filter];
19742004
if (bias) {
19752005
inputs.push(bias);
19762006
}
2007+
if (preluActivationWeights) {
2008+
inputs.push(preluActivationWeights);
2009+
}
19772010
return this.compileAndRun(program, inputs);
19782011
}
19792012

‎src/backends/webgl/conv_gpu.ts‎

Lines changed: 17 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,8 @@ export class Conv2DProgram implements GPGPUProgram {
2424
userCode: string;
2525

2626
constructor(
27-
convInfo: Conv2DInfo, addBias = false, activation: string = null) {
27+
convInfo: Conv2DInfo, addBias = false, activation: string = null,
28+
hasPreluActivationWeights = false) {
2829
this.outputShape = convInfo.outShape;
2930
const padTop = convInfo.padInfo.top;
3031
const padLeft = convInfo.padInfo.left;
@@ -40,11 +41,18 @@ export class Conv2DProgram implements GPGPUProgram {
4041

4142
let activationSnippet = '', applyActivationSnippet = '';
4243
if (activation) {
43-
activationSnippet = `
44-
float activation(float x) {
44+
if (hasPreluActivationWeights) {
45+
activationSnippet = `float activation(float a) {
46+
float b = getPreluActivationWeightsAtOutCoords();
4547
${activation}
46-
}
47-
`;
48+
}`;
49+
} else {
50+
activationSnippet = `
51+
float activation(float x) {
52+
${activation}
53+
}
54+
`;
55+
}
4856

4957
applyActivationSnippet = `result = activation(result);`;
5058
}
@@ -54,6 +62,10 @@ export class Conv2DProgram implements GPGPUProgram {
5462
this.variableNames.push('bias');
5563
}
5664

65+
if (hasPreluActivationWeights) {
66+
this.variableNames.push('preluActivationWeights');
67+
}
68+
5769
this.userCode = `
5870
${activationSnippet}
5971

‎src/backends/webgl/mulmat_packed_gpu.ts‎

Lines changed: 16 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@ export class MatMulPackedProgram implements GPGPUProgram {
2626
constructor(
2727
aShape: [number, number, number], outputShape: [number, number, number],
2828
transposeA = false, transposeB = false, addBias = false,
29-
activation: string = null) {
29+
activation: string = null, hasPreluActivation = false) {
3030
this.outputShape = outputShape;
3131

3232
const sharedDim = transposeA ? aShape[1] : aShape[2];
@@ -39,9 +39,16 @@ export class MatMulPackedProgram implements GPGPUProgram {
3939

4040
let activationSnippet = '', applyActivationSnippet = '';
4141
if (activation) {
42-
activationSnippet = `vec4 activation(vec4 x) {
43-
${activation}
44-
}`;
42+
if (hasPreluActivation) {
43+
activationSnippet = `vec4 activation(vec4 a) {
44+
vec4 b = getPreluActivationWeightsAtOutCoords();
45+
${activation}
46+
}`;
47+
} else {
48+
activationSnippet = `vec4 activation(vec4 x) {
49+
${activation}
50+
}`;
51+
}
4552

4653
applyActivationSnippet = `result = activation(result);`;
4754
}
@@ -51,6 +58,10 @@ export class MatMulPackedProgram implements GPGPUProgram {
5158
this.variableNames.push('bias');
5259
}
5360

61+
if (hasPreluActivation) {
62+
this.variableNames.push('preluActivationWeights');
63+
}
64+
5465
this.userCode = `
5566
${activationSnippet}
5667
@@ -82,4 +93,4 @@ export class MatMulPackedProgram implements GPGPUProgram {
8293
}
8394
`;
8495
}
85-
}
96+
}

0 commit comments

Comments
(0)

AltStyle によって変換されたページ (->オリジナル) /