piercus
diff --git a/‎src/kernels/backend_webgl.ts
Lines changed: 78 additions & 29 deletions b/‎src/kernels/backend_webgl.ts
Lines changed: 78 additions & 29 deletions
@@ -51,7 +51,8 @@ import * as binaryop_complex_gpu from './webgl/binaryop_complex_gpu';
 import {BinaryOpComplexProgram} from './webgl/binaryop_complex_gpu';
 import * as binaryop_gpu from './webgl/binaryop_gpu';
 import {BinaryOpProgram} from './webgl/binaryop_gpu';
-import {BinaryOpPackedProgram, PACKED_DIV, PACKED_INT_DIV, PACKED_POW} from './webgl/binaryop_packed_gpu';
+import * as binaryop_packed_gpu from './webgl/binaryop_packed_gpu';
+import {BinaryOpPackedProgram} from './webgl/binaryop_packed_gpu';
 import {ClipProgram} from './webgl/clip_gpu';
 import {ClipPackedProgram} from './webgl/clip_packed_gpu';
 import {ComplexAbsProgram} from './webgl/complex_abs_gpu';
@@ -768,8 +769,8 @@ export class MathBackendWebGL implements KernelBackend {
 
     const dtype = upcastType(a.dtype, b.dtype);
 
-    const program = new MatMulPackedProgram(a.shape,
-        [batch, outerShapeA, outerShapeB], transposeA, transposeB);
+    const program = new MatMulPackedProgram(
+        a.shape, [batch, outerShapeA, outerShapeB], transposeA, transposeB);
     const output =
         this.makePackedTensor(program.outputShape, dtype) as Tensor3D;
     return this.compileAndRun<Tensor3D>(program, [a, b], output);
@@ -784,8 +785,9 @@ export class MathBackendWebGL implements KernelBackend {
 
     const dtype = upcastType(a.dtype, b.dtype);
 
-    const program = new MatMulPackedProgram(a.shape,
-        [batch, outerShapeA, outerShapeB], transposeA, transposeB, !!bias,
+    const program = new MatMulPackedProgram(
+        a.shape, [batch, outerShapeA, outerShapeB], transposeA, transposeB,
+        !!bias,
         activation ? mapActivationToShaderProgram(activation, true) : null);
     const output =
         this.makePackedTensor(program.outputShape, dtype) as Tensor3D;
@@ -1099,12 +1101,18 @@ export class MathBackendWebGL implements KernelBackend {
   }
 
   equal(a: Tensor, b: Tensor): Tensor {
+    if (ENV.get('WEBGL_PACK_BINARY_OPERATIONS')) {
+      return this.packedBinaryOp(a, b, binaryop_packed_gpu.EQUAL, 'bool');
+    }
     const program = new BinaryOpProgram(binaryop_gpu.EQUAL, a.shape, b.shape);
     const output = this.makeOutputArray(program.outputShape, 'bool');
     return this.compileAndRun(program, [a, b], output);
   }
 
   notEqual(a: Tensor, b: Tensor): Tensor {
+    if (ENV.get('WEBGL_PACK_BINARY_OPERATIONS')) {
+      return this.packedBinaryOp(a, b, binaryop_packed_gpu.NOT_EQUAL, 'bool');
+    }
     const program =
         new BinaryOpProgram(binaryop_gpu.NOT_EQUAL, a.shape, b.shape);
     const output = this.makeOutputArray(program.outputShape, 'bool');
@@ -1116,12 +1124,19 @@ export class MathBackendWebGL implements KernelBackend {
       return this.cpuBackend.less(a, b);
     }
 
+    if (ENV.get('WEBGL_PACK_BINARY_OPERATIONS')) {
+      return this.packedBinaryOp(a, b, binaryop_packed_gpu.LESS, 'bool');
+    }
+
     const program = new BinaryOpProgram(binaryop_gpu.LESS, a.shape, b.shape);
     const output = this.makeOutputArray(program.outputShape, 'bool');
     return this.compileAndRun(program, [a, b], output);
   }
 
   lessEqual(a: Tensor, b: Tensor): Tensor {
+    if (ENV.get('WEBGL_PACK_BINARY_OPERATIONS')) {
+      return this.packedBinaryOp(a, b, binaryop_packed_gpu.LESS_EQUAL, 'bool');
+    }
     const program =
         new BinaryOpProgram(binaryop_gpu.LESS_EQUAL, a.shape, b.shape);
     const output = this.makeOutputArray(program.outputShape, 'bool');
@@ -1133,12 +1148,20 @@ export class MathBackendWebGL implements KernelBackend {
       return this.cpuBackend.greater(a, b);
     }
 
+    if (ENV.get('WEBGL_PACK_BINARY_OPERATIONS')) {
+      return this.packedBinaryOp(a, b, binaryop_packed_gpu.GREATER, 'bool');
+    }
+
     const program = new BinaryOpProgram(binaryop_gpu.GREATER, a.shape, b.shape);
     const output = this.makeOutputArray(program.outputShape, 'bool');
     return this.compileAndRun(program, [a, b], output);
   }
 
   greaterEqual(a: Tensor, b: Tensor): Tensor {
+    if (ENV.get('WEBGL_PACK_BINARY_OPERATIONS')) {
+      return this.packedBinaryOp(
+          a, b, binaryop_packed_gpu.GREATER_EQUAL, 'bool');
+    }
     const program =
         new BinaryOpProgram(binaryop_gpu.GREATER_EQUAL, a.shape, b.shape);
     const output = this.makeOutputArray(program.outputShape, 'bool');
@@ -1151,13 +1174,19 @@ export class MathBackendWebGL implements KernelBackend {
   }
 
   logicalAnd(a: Tensor, b: Tensor): Tensor {
+    if (ENV.get('WEBGL_PACK_BINARY_OPERATIONS')) {
+      return this.packedBinaryOp(a, b, binaryop_packed_gpu.LOGICAL_AND, 'bool');
+    }
     const program =
         new BinaryOpProgram(binaryop_gpu.LOGICAL_AND, a.shape, b.shape);
     const output = this.makeOutputArray(program.outputShape, 'bool');
     return this.compileAndRun(program, [a, b], output);
   }
 
   logicalOr(a: Tensor, b: Tensor): Tensor {
+    if (ENV.get('WEBGL_PACK_BINARY_OPERATIONS')) {
+      return this.packedBinaryOp(a, b, binaryop_packed_gpu.LOGICAL_OR, 'bool');
+    }
     const program =
         new BinaryOpProgram(binaryop_gpu.LOGICAL_OR, a.shape, b.shape);
     const output = this.makeOutputArray(program.outputShape, 'bool');
@@ -1198,12 +1227,17 @@ export class MathBackendWebGL implements KernelBackend {
       return this.cpuBackend.minimum(a, b);
     }
 
-    const program = new BinaryOpProgram(binaryop_gpu.MIN, a.shape, b.shape);
-    return this.compileAndRun(program, [a, b]);
+    const program = ENV.get('WEBGL_PACK_BINARY_OPERATIONS') ?
+        new BinaryOpPackedProgram(binaryop_packed_gpu.MIN, a.shape, b.shape) :
+        new BinaryOpProgram(binaryop_gpu.MIN, a.shape, b.shape);
+    const customSetup = program.getCustomSetupFunc();
+    return this.compileAndRun(program, [a, b], null, customSetup);
   }
 
   mod(a: Tensor, b: Tensor): Tensor {
-    const program = new BinaryOpProgram(binaryop_gpu.MOD, a.shape, b.shape);
+    const program = ENV.get('WEBGL_PACK_BINARY_OPERATIONS') ?
+        new BinaryOpPackedProgram(binaryop_packed_gpu.MOD, a.shape, b.shape) :
+        new BinaryOpProgram(binaryop_gpu.MOD, a.shape, b.shape);
     const customSetup = program.getCustomSetupFunc();
     return this.compileAndRun(program, [a, b], null, customSetup);
   }
@@ -1222,8 +1256,11 @@ export class MathBackendWebGL implements KernelBackend {
       return this.cpuBackend.maximum(a, b);
     }
 
-    const program = new BinaryOpProgram(binaryop_gpu.MAX, a.shape, b.shape);
-    return this.compileAndRun(program, [a, b]);
+    const program = ENV.get('WEBGL_PACK_BINARY_OPERATIONS') ?
+        new BinaryOpPackedProgram(binaryop_packed_gpu.MAX, a.shape, b.shape) :
+        new BinaryOpProgram(binaryop_gpu.MAX, a.shape, b.shape);
+    const customSetup = program.getCustomSetupFunc();
+    return this.compileAndRun(program, [a, b], null, customSetup);
   }
 
   all(x: Tensor, axes: number[]): Tensor {
@@ -1245,7 +1282,9 @@ export class MathBackendWebGL implements KernelBackend {
   }
 
   squaredDifference(a: Tensor, b: Tensor): Tensor {
-    const program =
+    const program = ENV.get('WEBGL_PACK_BINARY_OPERATIONS') ?
+        new BinaryOpPackedProgram(
+            binaryop_gpu.SQUARED_DIFFERENCE, a.shape, b.shape) :
         new BinaryOpProgram(binaryop_gpu.SQUARED_DIFFERENCE, a.shape, b.shape);
     return this.compileAndRun(program, [a, b]);
   }
@@ -1254,7 +1293,7 @@ export class MathBackendWebGL implements KernelBackend {
     const op = binaryop_gpu.DIV;
     const outputDtype = 'float32';
     if (ENV.get('WEBGL_PACK_BINARY_OPERATIONS')) {
-      return this.packedBinaryOp(a, b, PACKED_DIV, outputDtype);
+      return this.packedBinaryOp(a, b, binaryop_packed_gpu.DIV, outputDtype);
     }
     const program = new BinaryOpProgram(op, a.shape, b.shape);
     const output = this.makeOutputArray(program.outputShape, outputDtype);
@@ -1265,7 +1304,8 @@ export class MathBackendWebGL implements KernelBackend {
     const op = binaryop_gpu.INT_DIV;
     const outputDtype = 'int32';
     if (ENV.get('WEBGL_PACK_BINARY_OPERATIONS')) {
-      return this.packedBinaryOp(a, b, PACKED_INT_DIV, outputDtype);
+      return this.packedBinaryOp(
+          a, b, binaryop_packed_gpu.INT_DIV, outputDtype);
     }
     const program = new BinaryOpProgram(op, a.shape, b.shape);
     const output = this.makeOutputArray(program.outputShape, outputDtype);
@@ -1285,7 +1325,8 @@ export class MathBackendWebGL implements KernelBackend {
     return this.compileAndRun<Tensor>(program, [a, b], output);
   }
 
-  private packedBinaryOp(a: Tensor, b: Tensor, op: string, dtype: DataType) {
+  private packedBinaryOp(
+      a: TensorHandle, b: TensorHandle, op: string, dtype: DataType) {
     const program = new BinaryOpPackedProgram(op, a.shape, b.shape);
     const output = this.makePackedTensor(program.outputShape, dtype) as Tensor;
     return this.compileAndRun<Tensor>(program, [a, b], output);
@@ -1305,14 +1346,14 @@ export class MathBackendWebGL implements KernelBackend {
     ].map(complexParts => {
       const [aPart, bPart] = complexParts;
 
+      const aHandle = this.makeComplexComponentTensorHandle(a, aPart);
+      const bHandle = this.makeComplexComponentTensorHandle(b, bPart);
+
       const program = new BinaryOpProgram(op, a.shape, b.shape);
       const output = this.makeOutputArray(
                          program.outputShape,
                          upcastType(aPart.dtype, bPart.dtype)) as Tensor;
 
-      const aHandle = this.makeComplexComponentTensorHandle(a, aPart);
-      const bHandle = this.makeComplexComponentTensorHandle(b, bPart);
-
       return this.compileAndRun<Tensor>(program, [aHandle, bHandle], output);
     });
 
@@ -1362,7 +1403,7 @@ export class MathBackendWebGL implements KernelBackend {
   pow<T extends Tensor>(a: T, b: Tensor): T {
     const usePackedOp = ENV.get('WEBGL_PACK_BINARY_OPERATIONS');
     const program = usePackedOp ?
-        new BinaryOpPackedProgram(PACKED_POW, a.shape, b.shape) :
+        new BinaryOpPackedProgram(binaryop_packed_gpu.POW, a.shape, b.shape) :
         new BinaryOpProgram(binaryop_gpu.POW, a.shape, b.shape);
     const dtype = upcastType(a.dtype, b.dtype);
     const output = usePackedOp ?
@@ -1454,7 +1495,9 @@ export class MathBackendWebGL implements KernelBackend {
   }
 
   prelu<T extends Tensor>(x: T, alpha: T): T {
-    const program =
+    const program = ENV.get('WEBGL_PACK_BINARY_OPERATIONS') ?
+        new BinaryOpPackedProgram(
+            binaryop_packed_gpu.PRELU, x.shape, alpha.shape) :
         new BinaryOpProgram(binaryop_gpu.PRELU, x.shape, alpha.shape);
     return this.compileAndRun(program, [x, alpha]) as T;
   }
@@ -1465,7 +1508,9 @@ export class MathBackendWebGL implements KernelBackend {
   }
 
   eluDer<T extends Tensor>(dy: T, y: T): T {
-    const program =
+    const program = ENV.get('WEBGL_PACK_BINARY_OPERATIONS') ?
+        new BinaryOpPackedProgram(
+            binaryop_packed_gpu.ELU_DER, dy.shape, y.shape) :
         new BinaryOpProgram(binaryop_gpu.ELU_DER, dy.shape, y.shape);
     return this.compileAndRun(program, [dy, y]) as T;
   }
@@ -1550,8 +1595,11 @@ export class MathBackendWebGL implements KernelBackend {
   }
 
   atan2<T extends Tensor>(a: T, b: T): T {
-    const program = new BinaryOpProgram(binaryop_gpu.ATAN2, a.shape, b.shape);
-    return this.compileAndRun(program, [a, b]) as T;
+    const program = ENV.get('WEBGL_PACK_BINARY_OPERATIONS') ?
+        new BinaryOpPackedProgram(binaryop_packed_gpu.ATAN2, a.shape, b.shape) :
+        new BinaryOpProgram(binaryop_gpu.ATAN2, a.shape, b.shape);
+    const customSetup = program.getCustomSetupFunc();
+    return this.compileAndRun(program, [a, b], null, customSetup) as T;
   }
 
   sinh<T extends Tensor>(x: T): T {
@@ -1680,12 +1728,13 @@ export class MathBackendWebGL implements KernelBackend {
 
     const im2ColProgram =
         new Im2ColProgram(x2ColShape, xSqueezed.shape, convInfo);
-    const im2Col = this.compileAndRun<Tensor2D>(im2ColProgram, [xSqueezed]).
-        reshape([1, x2ColShape[0], x2ColShape[1]]) as Tensor3D;
+    const im2Col =
+        this.compileAndRun<Tensor2D>(im2ColProgram, [xSqueezed]).reshape([
+          1, x2ColShape[0], x2ColShape[1]
+        ]) as Tensor3D;
 
     const matmulProgram = new MatMulPackedProgram(
-        im2Col.shape, [1, numCols, convInfo.outChannels], true,
-        false);
+        im2Col.shape, [1, numCols, convInfo.outChannels], true, false);
     const product =
         this.compileAndRun<Tensor4D>(matmulProgram, [im2Col, w2Row]);
 
@@ -1825,9 +1874,9 @@ export class MathBackendWebGL implements KernelBackend {
 
   reshape<R extends Rank>(x: Tensor, shape: ShapeMap[R]): Tensor<R> {
     const texData = this.texData.get(x.dataId);
-    if (texData.isPacked && !webgl_util.isReshapeFree(x.shape, shape)
-        && !(texData.texture !== null &&
-             webgl_util.isReshapeFree(texData.shape, shape))) {
+    if (texData.isPacked && !webgl_util.isReshapeFree(x.shape, shape) &&
+        !(texData.texture !== null &&
+          webgl_util.isReshapeFree(texData.shape, shape))) {
       return this.packedReshape(x, shape);
     }
     return backend_util.reshapeTensor(x, shape);