@@ -315,11 +315,11 @@ def test_conv1dtranspose():
 def test_batchnormalization():
     """
     batch normalization is calculated as follows,
-    1. (2 ops * |var|) inv = rsqrt(var + eps)
+    1. (3 ops * |var|) inv = rsqrt(var + eps)
     2. (1 ops * |var|) inv *= gamma (scale)
-    3. (|x| + |mean| + |var| ops) x' = inv * x + beta (shift) - mean * inv
+    3. (2 * |x| + |mean| + |var| ops) x' = inv * x + beta (shift) - mean * inv
     , where |var| = |mean| = channel size by default
-    Thus, tot FLOPs = 5 * channel size + input element size.
+    Thus, tot FLOPs = 6 * channel size + 2 * input element size.
     """
     in_w = 32
     in_h = 32
@@ -334,7 +334,7 @@ def test_batchnormalization():
     )
     flops = get_flops(model, batch_size=1)
     assert (
-        flops == 5 * in_ch + in_w * in_ch
+        flops == 6 * in_ch + 2 * in_w * in_ch
     ), "fused is False. see nn_impl.batch_normalization"

     model = Sequential(
@@ -346,7 +346,7 @@ def test_batchnormalization():
     )
     flops = get_flops(model, batch_size=1)
     assert (
-        flops == 5 * in_ch + in_w * in_h * in_ch
+        flops == 6 * in_ch + 2 * in_w * in_h * in_ch
     ), "fused is True, see gen_nn.fused_batch_norm_v3"


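As a quick cross-check of the updated batch-normalization totals, the per-channel and per-element counts from the docstring above can be tallied by hand. The sketch below is illustrative only; in_ch is a hypothetical channel count, since the model construction is not visible in these hunks.

# Hand tally of the BatchNormalization FLOPs formula from the docstring above.
# in_ch is hypothetical; the test's real channel count is defined outside these hunks.
in_w, in_h, in_ch = 32, 32, 4

per_channel = 3 + 1 + 2  # step 1 (rsqrt(var + eps)) + step 2 (scale) + step 3 (|mean| and |var| terms)
per_element = 2          # step 3: one multiply and one add per input element

unfused_1d = per_channel * in_ch + per_element * in_w * in_ch       # 1D input, fused=False
fused_2d = per_channel * in_ch + per_element * in_w * in_h * in_ch  # 2D input, fused=True

assert unfused_1d == 6 * in_ch + 2 * in_w * in_ch
assert fused_2d == 6 * in_ch + 2 * in_w * in_h * in_ch
print(unfused_1d, fused_2d)  # 280 8216 with the hypothetical in_ch = 4
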
@@ -355,7 +355,7 @@ def test_additive_attention():
     Bahdanau-style attention. query (batch, Tq, dim), key (batch, Tv, dim) and value (batch, Tv, dim) are inputs.
     following computations are processed.
     1. reshape query as shape [batch, Tq, 1, dim] and value as shape [batch, 1, Tv, dim]
-    2. broadcasting multiply between both of above as output shape [batch, Tq, Tv, dim]
+    2. broadcasting add between both of above, then multiply by scale, as output shape [batch, Tq, Tv, dim]
     3. reduce_sum above with dim axis as output shape [batch, Tq, Tv]
     4. softmax of above
     5. MatMul between 4. and value as output shape [batch, Tq, dim]
@@ -375,6 +375,7 @@ def test_additive_attention():
     assert (
         flops
         == Tq * Tv * dim  # No.2 (multiply)
+        + Tq * Tv * dim  # No.2 (add)
         + Tq * Tv * (dim - 1)  # No.3 (reduce_sum)
         + 5 * Tq * Tv  # No.4 (softmax)
         + 2 * Tv * Tq * dim  # No.5 (MatMul)
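
The new Tq * Tv * dim term accounts for the broadcast add inside the score computation (AdditiveAttention reduces scale * tanh(query + key) over the feature axis; tanh does not appear in the asserted count). As a rough sanity check, the expected total can be tallied with hypothetical Tq, Tv and dim values, since the test's actual sizes are defined outside this hunk.

# Hand tally of the AdditiveAttention FLOPs expected by the updated assertion.
# Tq, Tv, dim are hypothetical; the test's real values are defined outside this hunk.
Tq, Tv, dim = 10, 12, 16

expected = (
    Tq * Tv * dim          # No.2: scale multiply over [Tq, Tv, dim]
    + Tq * Tv * dim        # No.2: broadcast add of query and key
    + Tq * Tv * (dim - 1)  # No.3: reduce_sum over the dim axis
    + 5 * Tq * Tv          # No.4: softmax of the [Tq, Tv] scores
    + 2 * Tv * Tq * dim    # No.5: matmul of the attention weights with value
)
print(expected)  # 10080 with these hypothetical sizes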