JavaScriptPlugins
diff --git a/‎package.json‎
Lines changed: 1 addition & 1 deletion b/‎package.json‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎tfjs-backend-wasm/package.json‎
Lines changed: 5 additions & 5 deletions b/‎tfjs-backend-wasm/package.json‎
Lines changed: 5 additions & 5 deletions
diff --git a/‎tfjs-backend-wasm/scripts/test-bundle-size.js‎
Lines changed: 2 additions & 2 deletions b/‎tfjs-backend-wasm/scripts/test-bundle-size.js‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎tfjs-backend-wasm/src/cc/BUILD‎
Lines changed: 30 additions & 3 deletions b/‎tfjs-backend-wasm/src/cc/BUILD‎
Lines changed: 30 additions & 3 deletions
diff --git a/‎tfjs-backend-wasm/src/cc/conv2d_impl.cc‎
Lines changed: 201 additions & 0 deletions b/‎tfjs-backend-wasm/src/cc/conv2d_impl.cc‎
Lines changed: 201 additions & 0 deletions
diff --git a/‎tfjs-backend-wasm/src/cc/conv2d_impl.h‎
Lines changed: 32 additions & 0 deletions b/‎tfjs-backend-wasm/src/cc/conv2d_impl.h‎
Lines changed: 32 additions & 0 deletions
@@ -7,7 +7,7 @@
     "shelljs": "~0.8.3",
     "ts-node": "~4.1.0",
     "tslint": "~5.20.0",
-    "typescript": "3.5.3"
+    "typescript": "3.6.3"
   },
   "scripts": {
     "diff": "./scripts/diff.js",
 
@@ -36,14 +36,14 @@
     "karma-jasmine": "~1.1.1",
     "karma-typescript": "~4.0.0",
     "rimraf": "~2.6.2",
-    "rollup": "^1.17.0",
-    "rollup-plugin-commonjs": "^10.0.1",
-    "rollup-plugin-node-resolve": "^5.2.0",
+    "rollup": "~1.26.3",
+    "rollup-plugin-commonjs": "~10.1.0",
+    "rollup-plugin-node-resolve": "~5.2.0",
     "rollup-plugin-terser": "^5.1.1",
-    "rollup-plugin-typescript2": "^0.22.1",
+    "rollup-plugin-typescript2": "~0.25.2",
     "tslint": "^5.20.0",
     "tslint-no-circular-imports": "^0.7.0",
-    "typescript": "3.5.3",
+    "typescript": "3.6.3",
     "yalc": "~1.0.0-pre.21"
   },
   "license": "Apache-2.0"
 
@@ -19,7 +19,7 @@ const {exec} = require('../../scripts/test-util');
 const {showDiff, getFileSizeBytes} = require('../../scripts/bundle-size-util');
 
 // Get the bundle sizes from this change.
-exec(`yarn rollup -c`, {silent: true});
+exec(`yarn rollup -c`, {silent: false});
 
 const bundleFilename = 'dist/tf-backend-wasm.min.js';
 const minBundleSize = getFileSizeBytes(bundleFilename);
@@ -36,7 +36,7 @@ exec(
 
 shell.cd(dirName);
 shell.cd(wasmDirName);
-exec(`yarn && ./scripts/build-ci.sh && yarn rollup -c`, {silent: true});
+exec(`yarn && ./scripts/build-ci.sh && yarn rollup -c`, {silent: false});
 
 const masterMinBundleSize = getFileSizeBytes(bundleFilename);
 const masterWasmSize = getFileSizeBytes(wasmFileName);
 
@@ -62,6 +62,17 @@ tfjs_cc_library(
   deps = [":util"],
 )
 
+tfjs_cc_library(
+  name = "conv2d_impl",
+  hdrs = ["conv2d_impl.h"],
+  srcs = ["conv2d_impl.cc"],
+  deps = [
+    ":backend",
+    ":transpose_impl",
+    ":util",
+  ],
+)
+
 tfjs_cc_library(
   name = "all_kernels",
   deps = [
@@ -70,6 +81,7 @@ tfjs_cc_library(
     ":BatchMatMul",
     ":CropAndResize",
     ":Conv2D",
+    ":FusedConv2D",
     ":Div",
     ":Mul",
     ":Prelu",
@@ -151,9 +163,16 @@ tfjs_cc_library(
   srcs = ["kernels/Conv2D.cc"],
   hdrs = ["kernels/Conv2D.h"],
   deps = [
-    ":backend",
-    ":transpose_impl",
-    ":util",
+    ":conv2d_impl",
+  ],
+)
+
+tfjs_cc_library(
+  name = "FusedConv2D",
+  srcs = ["kernels/FusedConv2D.cc"],
+  hdrs = ["kernels/FusedConv2D.h"],
+  deps = [
+    ":conv2d_impl",
   ],
 )
 
@@ -260,3 +279,11 @@ tfjs_unit_test(
     ":Conv2D",
   ]
 )
+
+tfjs_unit_test(
+  name = "FusedConv2D_test",
+  srcs = ["kernels/FusedConv2D_test.cc"],
+  deps = [
+    ":FusedConv2D",
+  ]
+)
@@ -0,0 +1,201 @@
+/* Copyright 2019 Google Inc. All Rights Reserved.
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ * ===========================================================================*/
+
+#ifdef __EMSCRIPTEN__
+#include <emscripten.h>
+#endif
+
+#include "src/cc/conv2d_impl.h"
+
+#include <xnnpack.h>
+#include <array>
+#include <cmath>
+#include <limits>
+#include <map>
+#include <memory>
+#include <unordered_map>
+#include <utility>
+#include <vector>
+
+#include "src/cc/backend.h"
+#include "src/cc/transpose_impl.h"
+#include "src/cc/util.h"
+
+namespace {
+// These integer values are keys to creating the conv2d operator. We use
+// std::array instead of a vanilla array as it implements the compare operator
+// needed for std::map.
+typedef std::array<int, 16> OperatorCacheKey;
+
+// The operator cache maps the cache key to the xnn_operator_t instantiated for
+// this set of arguments to the xnn_operator.
+std::map<OperatorCacheKey, xnn_operator_t> operator_cache;
+
+// Maps a filter id to the list of operator cache keys that this filter belongs
+// to.
+std::unordered_map<int, std::vector<OperatorCacheKey>>
+    filter_operator_cache_key_map;
+
+// Maps a bias id to the list of operator cache keys that this bias belongs
+// to.
+std::unordered_map<int, std::vector<OperatorCacheKey>>
+    bias_operator_cache_key_map;
+
+// Deletes every cached XNN operator whose cache key is associated with
+// `tensor_id` in `operator_cache_key_map`, then drops the tensor's entry from
+// that map. Does nothing when the tensor has no entry.
+void erase_from_cache(const int tensor_id,
+                      std::unordered_map<int, std::vector<OperatorCacheKey>>&
+                          operator_cache_key_map) {
+  auto keys_it = operator_cache_key_map.find(tensor_id);
+  if (keys_it == operator_cache_key_map.end()) {
+    return;
+  }
+
+  // Iterate over the stored keys in place. Only `operator_cache` is modified
+  // inside the loop, so there is no need to copy the vector first.
+  for (const OperatorCacheKey& cache_key : keys_it->second) {
+    auto op_it = operator_cache.find(cache_key);
+    if (op_it == operator_cache.end()) {
+      // The operator was already released, e.g. through the other tensor
+      // (filter vs. bias) that shares this cache key.
+      continue;
+    }
+
+    xnn_delete_operator(op_it->second);
+    tfjs::backend::xnn_operator_count--;
+
+    operator_cache.erase(op_it);
+  }
+  operator_cache_key_map.erase(keys_it);
+}
+
+// Disposal callback: releases all operators that were built from `tensor_id`,
+// whether it was used as a filter or as a bias.
+void delete_xnn_operators(int tensor_id) {
+  erase_from_cache(tensor_id, filter_operator_cache_key_map);
+  erase_from_cache(tensor_id, bias_operator_cache_key_map);
+}
+
+// Records that the operator stored under `cache_key` depends on `tensor_id`.
+// The first time a tensor is seen in `operator_cache_key_map`, a disposal
+// callback is registered for it so its operators are freed with the tensor.
+void associate_tensor_with_key(
+    const int tensor_id, const OperatorCacheKey& cache_key,
+    std::unordered_map<int, std::vector<OperatorCacheKey>>&
+        operator_cache_key_map) {
+  auto cache_keys_it = operator_cache_key_map.find(tensor_id);
+  if (cache_keys_it != operator_cache_key_map.end()) {
+    // Known tensor: append to the list we already located.
+    cache_keys_it->second.emplace_back(cache_key);
+    return;
+  }
+
+  operator_cache_key_map.emplace(tensor_id,
+                                 std::vector<OperatorCacheKey>{cache_key});
+  tfjs::backend::register_disposal_callback(tensor_id, *delete_xnn_operators);
+}
+
+}  // namespace
+
+namespace tfjs {
+namespace wasm {
+
+// Runs a 2D NHWC float32 convolution through XNNPACK, writing into the tensor
+// registered under `out_id`.
+//
+// - `bias_id` of -1 means "no bias"; any other value is looked up as a tensor.
+// - When `is_same_pad` is non-zero the explicit pad_* values are ignored and
+//   XNNPACK is asked to apply TensorFlow SAME padding instead.
+// - XNN operators are cached per unique argument set (including filter and
+//   bias ids) and released when the filter or bias tensor is disposed.
+//
+// If the operator cannot be created or set up, a warning is emitted and the
+// function returns without touching the output buffer.
+void conv2d(const int x_id, const int batch_size, const int input_height,
+            const int input_width, const int filter_id, const int filter_height,
+            const int filter_width, const int bias_id, int pad_top,
+            int pad_right, int pad_bottom, int pad_left, const int is_same_pad,
+            const int dilation_height, const int dilation_width,
+            const int stride_height, const int stride_width,
+            const int input_channels, const int output_channels,
+            const int out_id) {
+  auto& x_info = backend::get_tensor_info(x_id);
+  auto& filter_info = backend::get_tensor_info(filter_id);
+  auto& out_info = backend::get_tensor_info_out(out_id);
+
+  const float* x_buf = x_info.f32();
+  const float* filter_buf = filter_info.f32();
+  const float* bias_buf = nullptr;
+  if (bias_id != -1) {
+    // NOTE(review): bias is only read here, yet it is fetched with the "_out"
+    // accessor unlike x and filter - confirm whether that is intentional.
+    bias_buf = backend::get_tensor_info_out(bias_id).f32();
+  }
+  float* out_buf = out_info.f32_write();
+
+  xnn_operator_t conv2d_op = nullptr;
+
+  int flags = 0;
+  if (is_same_pad) {
+    // With SAME padding XNNPACK computes the padding itself, so the explicit
+    // values must be zero (and must not fragment the operator cache).
+    pad_top = 0;
+    pad_right = 0;
+    pad_bottom = 0;
+    pad_left = 0;
+    flags = XNN_FLAG_TENSORFLOW_SAME_PADDING;
+  }
+
+  const int groups = 1;
+
+  OperatorCacheKey cache_key = {
+      pad_top,         pad_right,      pad_bottom,    pad_left,
+      filter_height,   filter_width,   stride_height, stride_width,
+      dilation_height, dilation_width, groups,        input_channels,
+      output_channels, filter_id,      bias_id,       flags};
+
+  auto operator_cache_idx = operator_cache.find(cache_key);
+  if (operator_cache_idx == operator_cache.end()) {
+    // No clamping of the output.
+    float output_min = -std::numeric_limits<float>::infinity();
+    float output_max = std::numeric_limits<float>::infinity();
+
+    // xnn pack expects weights laid out like:
+    //   [output_channels, filter_height, filter_width, input_channels]
+    // TensorFlow has weights laid out like:
+    //   [filter_height, filter_width, input_channels, output_channels]
+    // This can be transposed with a 2d transpose to move output_channels to the
+    // outer most dimension.
+    std::vector<float> transposed_filter(filter_info.size);
+
+    const std::vector<int> filter_shape = {
+        filter_height * filter_width * input_channels, output_channels};
+    const std::vector<int> perm = {1, 0};
+    tfjs::wasm::transpose(filter_buf, filter_shape, perm,
+                          transposed_filter.data());
+
+    xnn_status status = xnn_create_convolution2d_nhwc_f32(
+        pad_top, pad_right, pad_bottom, pad_left, filter_height, filter_width,
+        stride_height, stride_width, dilation_height, dilation_width, groups,
+        input_channels /* group_input_channels */,
+        output_channels /* group_output_channels */,
+        input_channels /* input_pixel_stride */,
+        output_channels /* output_pixel_stride */, transposed_filter.data(),
+        bias_buf, output_min, output_max, flags, &conv2d_op);
+    if (status != xnn_status_success) {
+      util::warn(
+          "XNN status for xnn_create_convolution2d_nhwc_f32 is not successful. "
+          "Got status %d. Use -c dbg to see XNN logs.",
+          status);
+      // Do not cache, count, or run an operator that was never created;
+      // otherwise every later call with this key would reuse a null handle.
+      return;
+    }
+
+    operator_cache.emplace(cache_key, conv2d_op);
+
+    associate_tensor_with_key(filter_id, cache_key,
+                              filter_operator_cache_key_map);
+    if (bias_id != -1) {
+      associate_tensor_with_key(bias_id, cache_key,
+                                bias_operator_cache_key_map);
+    }
+
+    tfjs::backend::xnn_operator_count++;
+  } else {
+    conv2d_op = operator_cache_idx->second;
+  }
+
+  xnn_status status = xnn_setup_convolution2d_nhwc_f32(
+      conv2d_op, batch_size, input_height, input_width, x_buf, out_buf,
+      nullptr /* thread pool */);
+  if (status != xnn_status_success) {
+    util::warn(
+        "XNN status for xnn_setup_convolution2d_nhwc_f32 is not successful. "
+        "Got status %d. Use -c dbg to see XNN logs.",
+        status);
+    // Running an operator whose setup failed cannot produce a valid result.
+    return;
+  }
+
+  status = xnn_run_operator(conv2d_op, nullptr /* thread pool */);
+  if (status != xnn_status_success) {
+    util::warn(
+        "XNN status for xnn_run_operator is not successful. "
+        "Got status %d. Use -c dbg to see XNN logs.",
+        status);
+  }
+}
+
+}  // namespace wasm
+}  // namespace tfjs
@@ -0,0 +1,32 @@
+/* Copyright 2019 Google Inc. All Rights Reserved.
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ * ===========================================================================*/
+
+#ifndef CONV2D_IMPL_H_
+#define CONV2D_IMPL_H_
+
+namespace tfjs {
+namespace wasm {
+
+// Shared implementation of a 2D NHWC float32 convolution, used by the Conv2D
+// and FusedConv2D kernels.
+//
+// `x_id`, `filter_id`, `bias_id` and `out_id` are backend tensor ids. Pass -1
+// as `bias_id` when there is no bias. The pad_* arguments are taken by value
+// and non-const because a non-zero `is_same_pad` causes them to be reset to 0
+// in favor of TensorFlow SAME padding.
+void conv2d(const int x_id, const int batch_size, const int input_height,
+            const int input_width, const int filter_id, const int filter_height,
+            const int filter_width, const int bias_id, int pad_top,
+            int pad_right, int pad_bottom, int pad_left, const int is_same_pad,
+            const int dilation_height, const int dilation_width,
+            const int stride_height, const int stride_width,
+            const int input_channels, const int output_channels,
+            const int out_id);
+}  // namespace wasm
+}  // namespace tfjs
+
+#endif  // CONV2D_IMPL_H_