11import jinja2
2+ from enum import Enum
23from pathlib import Path
34import numpy as np
5+ from abc import ABCMeta , abstractmethod
6+ from .quantization_util import get_quantization_params , quantize
7+
48
59_template_dir = Path (__file__ ).parent / "templates"
610_template2_dir = Path (__file__ ).parent / "templates_v2"
4145 np .int32 : "int32_t" ,
4246 np .uint32 : "uint32_t" ,
4347 np .float : "float" ,
48+ np .dtype ('int8' ): "int8_t" ,
49+ np .dtype ('uint8' ): "uint8_t" ,
50+ np .dtype ('int16' ): "int16_t" ,
51+ np .dtype ('uint16' ): "uint16_t" ,
52+ np .dtype ('int32' ): "int32_t" ,
53+ np .dtype ('uint32' ): "uint32_t" ,
4454 np .dtype ('float32' ): "float" ,
4555 }
4656env2 = jinja2 .Environment (
5363 NUMPY_2_CMAP = NUMPY_2_CMAP ,
5464 )
5565
class QuantizationType(Enum):
    """Supported quantization schemes for a Tensor.

    NONE disables quantization entirely. The remaining members choose
    per-tensor vs. per-channel parameters and asymmetric vs. symmetric
    quantization ranges.
    """
    NONE = 0
    PER_TENSOR_ASYMMETRIC = 1
    PER_CHANNEL_ASYMMETRIC = 2
    PER_TENSOR_SYMMETRIC = 3
    PER_CHANNEL_SYMMETRIC = 4
72+
class UnknownQuantizationTypeError(Exception):
    """Raised when quantization parameters are queried before being computed."""
75+
class QuantizationParams(object):
    """Zero-point / scale storage for one Tensor's quantization.

    ``zp`` and ``scale`` are parallel lists with one entry per quantized
    channel; a single entry means per-tensor quantization, an empty list
    means the parameters have not been computed yet.
    """

    def __init__(self, tensor):
        self.tensor = tensor  # Store ref to parent Tensor
        self.ref_name = tensor.ref_name
        self.zp = []      # zero points, one per channel
        self.scale = []   # scales, one per channel

    @property
    def ref_zp(self):
        """C identifier used for the zero-point constant in generated code."""
        if not self.ref_name:
            print("WARNING: No reference name set for Quantization Param")
        return "%s_zp" % self.ref_name

    @property
    def ref_scale(self):
        """C identifier used for the scale constant in generated code."""
        if not self.ref_name:
            print("WARNING: No reference name set for Quantization Param")
        return "%s_scale" % self.ref_name

    def render_set_quantization_params(self):
        """Render the snippet installing these params, or "" if none are set."""
        if not self.zp:
            return ""
        return env2.get_template('set_quantization_params.cpp').render(qp=self)

    @property
    def num_channels(self):
        # len([]) is already 0, so no branch (and no stray semicolon) needed.
        return len(self.zp)

    @property
    def quantization_type(self):
        """C++ parameter-type name matching the channel count.

        Raises:
            UnknownQuantizationTypeError: if no params have been computed yet.
        """
        if self.num_channels == 1:
            return "PerTensorQuantizationParams"
        if self.num_channels > 1:
            return "PerChannelQuantizationParams"
        raise UnknownQuantizationTypeError
116+
56117
57118class Tensor :
    def __init__(self, name, np_array, ref_name=None, quantization_type=QuantizationType.NONE, quantize_dim=None, narrow_range=False, num_quant_bits=8):
        """Wrap a numpy array destined for code generation.

        Args:
            name: identifier for this tensor in the generated code.
            np_array: backing numpy data.
            ref_name: if set, the tensor is rendered as a ROM constant under
                this reference name; otherwise as a RAM tensor (see
                render_declaration).
            quantization_type: QuantizationType member; NONE disables
                quantization entirely.
            quantize_dim: axis holding channels for per-channel quantization.
            narrow_range: forwarded to the quantizer in quantization_util —
                presumably restricts the signed range; TODO confirm there.
            num_quant_bits: target bit width; quantize() handles 8 directly
                and falls back to 32-bit containers otherwise.
        """
        self.name = name
        self.np_array = np_array
        self.ref_name = ref_name
        self.quantize_params = QuantizationParams(self)  # filled lazily
        self.quantization_type = quantization_type
        self.quantize_dim = quantize_dim
        self.narrow_range = narrow_range
        self.quantized = False  # guards against double quantization
        self.num_quant_bits = num_quant_bits
63129
64130 @property
65131 def shape (self ):
@@ -68,6 +134,8 @@ def shape(self):
68134 @property
69135 def dtype (self ):
70136 return NUMPY_2_CMAP [self .np_array .dtype ]
    def get_dtype(self):
        # Plain-method accessor for the dtype property, so it can be passed
        # around as a zero-arg callable (Operator's dtypes list expects
        # bound get_dtype methods — see Operator.__init__ docstring).
        return self.dtype
71139
72140 @property
73141 def utype (self ):
@@ -77,28 +145,108 @@ def flatten(self):
77145 return self .np_array .flatten ()
78146
79147 def render_constant (self ):
80- if self .ref_name :
81- return env2 .get_template ('def_constant.hpp' ).render (tensor = self )
82- else :
83- return ""
148+ return env2 .get_template ('def_constant.hpp' ).render (tensor = self )
84149 def render_declaration (self ):
85150 if self .ref_name :
86151 return env2 .get_template ('declare_rom_tensor.cpp' ).render (tensor = self )
87152 else :
88153 return env2 .get_template ('declare_ram_tensor.cpp' ).render (tensor = self )
154+
155+ def is_quantized (self ):
156+ return self .quantized and self .is_quantizable ()
157+
158+ def is_quantizable (self ):
159+ return self .quantization_type != QuantizationType .NONE
89160
161+ @property
162+ def symmetric (self ):
163+ if self .is_quantizable () and (self .quantization_type == QuantizationType .PER_TENSOR_SYMMETRIC or self .quantization_type == QuantizationType .PER_CHANNEL_SYMMETRIC ):
164+ return True
165+ else :
166+ return False
167+
168+ @property
169+ def per_tensor_quantization (self ):
170+ return self .is_quantizable () and (self .quantization_type == QuantizationType .PER_TENSOR_ASYMMETRIC or self .quantization_type == QuantizationType .PER_TENSOR_SYMMETRIC )
171+
172+ @property
173+ def per_channel_quantization (self ):
174+ return self .is_quantizable () and self .quantize_dim != None and (self .quantization_type == QuantizationType .PER_CHANNEL_ASYMMETRIC or self .quantization_type == QuantizationType .PER_CHANNEL_SYMMETRIC )
175+
176+ def get_quantization_params (self ):
177+ if not self .is_quantizable ():
178+ return (None , None )
179+ if not self .quantize_params .zp and not self .quantize_params .scale :
180+ # Else compute them
181+ if self .per_channel_quantization :
182+ num_dims = len (self .np_array .shape )
183+ num_channels = self .np_array .shape [self .quantize_dim ]
184+ for i in range (num_channels ):
185+ c = tuple ([ i if j == self .quantize_dim else slice (None ) for j in range (num_dims )])
186+ zp , scale = get_quantization_params (self .np_array [c ], symmetric = self .symmetric , narrow_range = self .narrow_range , num_quant_bits = self .num_quant_bits )
187+ self .quantize_params .zp .append (zp )
188+ self .quantize_params .scale .append (scale )
189+ else :
190+ zp , scale = get_quantization_params (self .np_array , symmetric = self .symmetric , narrow_range = self .narrow_range , num_quant_bits = self .num_quant_bits )
191+ self .quantize_params .zp .append (zp )
192+ self .quantize_params .scale .append (scale )
193+ return (self .quantize_params .zp , self .quantize_params .scale )
194+
    def quantize(self):
        """Quantize self.np_array in place using the configured scheme.

        Idempotent: if already quantized this is a no-op. Returns None for
        non-quantizable tensors (and implicitly otherwise).
        """
        if self.quantized:
            return
        if not self.is_quantizable():
            return None
        zp, scale = self.get_quantization_params()
        if self.per_channel_quantization:
            # Container dtype: signed for symmetric schemes, unsigned for
            # asymmetric; any width other than 8 falls back to 32 bits.
            if self.symmetric:
                if self.num_quant_bits == 8:
                    dtype = np.int8
                else:
                    dtype = np.int32
            else:
                if self.num_quant_bits == 8:
                    dtype = np.uint8
                else:
                    dtype = np.uint32

            num_dims = len(self.np_array.shape)
            num_channels = self.np_array.shape[self.quantize_dim]
            q_array = np.zeros(self.np_array.shape, dtype=dtype)
            for i in range(num_channels):
                # Index tuple selecting channel i along quantize_dim with
                # full slices on every other axis.
                c = tuple([i if j == self.quantize_dim else slice(None) for j in range(num_dims)])
                slc = self.np_array[c]
                if isinstance(slc, np.float32):
                    # A 1-D array indexes down to a scalar here; re-wrap it
                    # so quantize() always receives an ndarray.
                    # NOTE(review): this only catches float32 scalars —
                    # other dtypes would pass a bare scalar through; confirm
                    # against quantization_util.quantize.
                    tmp = np.ndarray((1), dtype=self.np_array.dtype)
                    tmp[0] = slc
                else:
                    tmp = slc
                q = quantize(tmp, zp[i], scale[i], self.symmetric, self.narrow_range, self.num_quant_bits)
                q_array[c] = q
            self.np_array = q_array
        else:
            # Per-tensor: single zp/scale pair quantizes the whole array.
            q = quantize(self.np_array, zp[0], scale[0], self.symmetric, self.narrow_range, self.num_quant_bits)
            self.np_array = q
        self.quantized = True
90231
91232class Operator :
92233 def __init__ (self , op_type , name , dtypes = [], param_str = None ):
234+ """
235+ dtypes should be bound to get_dtype methods on a tensor
236+ """
93237 self .op_type = op_type
94238 self .name = name
95- self .dtypes = dtypes
239+ self ._dtypes = dtypes
96240 self .param_str = param_str
97241 self .array_template = env2 .get_template ('array_template.cpp' )
98242 self .input_map = {}
99243 self .output_map = {}
100244 self .type_signature = env2 .get_template ('op_type_signature.cpp' ).render (op = self )
101245
246+ @property
247+ def dtype (self ):
248+ return [dt () for dt in self ._dtypes ]
249+
102250 def set_inputs (self , input_map ):
103251 self .input_map = input_map
104252 return self
@@ -112,6 +260,11 @@ def render_declaration(self):
112260
113261 def render_eval (self ):
114262 return env2 .get_template ('eval_operator.cpp' ).render (op = self )
263+ def quantize (self ):
264+ for thing in self .input_map :
265+ self .input_map [thing ].quantize ()
266+ for thing in self .output_map :
267+ self .output_map [thing ].quantize ()
115268
116269class SingleOpTest :
117270 def __init__ (self , test_group , test_name , target_op ):
@@ -133,6 +286,15 @@ def add_tensor_comparison(self, a, b):
133286 self .tensor_set .add (a )
134287 self .tensor_set .add (b )
135288
289+ def quantize (self ):
290+ self .target_op .quantize ()
291+ # Duplicate quantization because we can
292+ for (a , b ) in self .compare_tensors :
293+ a .quantize ()
294+ b .quantize ()
295+ for thing in tensor_set :
296+ thing .quantize ()
297+
136298 def render (self ):
137299 const_snippets = []
138300 tensor_decls = []
0 commit comments