ai-edge-quantizer-nightly 0.0.1.dev20250115__py3-none-any.whl
This diff shows the content of publicly available package versions released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
- ai_edge_quantizer/__init__.py +19 -0
- ai_edge_quantizer/algorithm_manager.py +167 -0
- ai_edge_quantizer/algorithm_manager_api.py +271 -0
- ai_edge_quantizer/algorithm_manager_api_test.py +210 -0
- ai_edge_quantizer/algorithms/__init__.py +15 -0
- ai_edge_quantizer/algorithms/nonlinear_quantize/__init__.py +15 -0
- ai_edge_quantizer/algorithms/nonlinear_quantize/float_casting.py +273 -0
- ai_edge_quantizer/algorithms/nonlinear_quantize/float_casting_test.py +664 -0
- ai_edge_quantizer/algorithms/uniform_quantize/__init__.py +15 -0
- ai_edge_quantizer/algorithms/uniform_quantize/naive_min_max_quantize.py +666 -0
- ai_edge_quantizer/algorithms/uniform_quantize/naive_min_max_quantize_test.py +184 -0
- ai_edge_quantizer/algorithms/uniform_quantize/uniform_quantize_tensor.py +371 -0
- ai_edge_quantizer/algorithms/uniform_quantize/uniform_quantize_tensor_test.py +357 -0
- ai_edge_quantizer/algorithms/utils/__init__.py +15 -0
- ai_edge_quantizer/algorithms/utils/min_max_quantize_utils.py +1067 -0
- ai_edge_quantizer/algorithms/utils/min_max_quantize_utils_test.py +512 -0
- ai_edge_quantizer/calibrator.py +288 -0
- ai_edge_quantizer/calibrator_test.py +297 -0
- ai_edge_quantizer/conftest.py +22 -0
- ai_edge_quantizer/default_policy.py +310 -0
- ai_edge_quantizer/model_modifier.py +176 -0
- ai_edge_quantizer/model_modifier_test.py +130 -0
- ai_edge_quantizer/model_validator.py +357 -0
- ai_edge_quantizer/model_validator_test.py +354 -0
- ai_edge_quantizer/params_generator.py +361 -0
- ai_edge_quantizer/params_generator_test.py +1041 -0
- ai_edge_quantizer/qtyping.py +483 -0
- ai_edge_quantizer/quantizer.py +372 -0
- ai_edge_quantizer/quantizer_test.py +532 -0
- ai_edge_quantizer/recipe.py +67 -0
- ai_edge_quantizer/recipe_manager.py +245 -0
- ai_edge_quantizer/recipe_manager_test.py +815 -0
- ai_edge_quantizer/recipe_test.py +97 -0
- ai_edge_quantizer/transformation_instruction_generator.py +584 -0
- ai_edge_quantizer/transformation_instruction_generator_test.py +1082 -0
- ai_edge_quantizer/transformation_performer.py +278 -0
- ai_edge_quantizer/transformation_performer_test.py +344 -0
- ai_edge_quantizer/transformations/__init__.py +15 -0
- ai_edge_quantizer/transformations/dequant_insert.py +87 -0
- ai_edge_quantizer/transformations/dequant_insert_test.py +304 -0
- ai_edge_quantizer/transformations/emulated_subchannel.py +363 -0
- ai_edge_quantizer/transformations/emulated_subchannel_test.py +212 -0
- ai_edge_quantizer/transformations/quant_insert.py +100 -0
- ai_edge_quantizer/transformations/quant_insert_test.py +284 -0
- ai_edge_quantizer/transformations/quantize_tensor.py +156 -0
- ai_edge_quantizer/transformations/quantize_tensor_test.py +227 -0
- ai_edge_quantizer/transformations/transformation_utils.py +132 -0
- ai_edge_quantizer/transformations/transformation_utils_test.py +162 -0
- ai_edge_quantizer/utils/__init__.py +15 -0
- ai_edge_quantizer/utils/calibration_utils.py +86 -0
- ai_edge_quantizer/utils/calibration_utils_test.py +77 -0
- ai_edge_quantizer/utils/test_utils.py +107 -0
- ai_edge_quantizer/utils/tfl_flatbuffer_utils.py +317 -0
- ai_edge_quantizer/utils/tfl_flatbuffer_utils_test.py +200 -0
- ai_edge_quantizer/utils/tfl_interpreter_utils.py +312 -0
- ai_edge_quantizer/utils/tfl_interpreter_utils_test.py +332 -0
- ai_edge_quantizer/utils/validation_utils.py +125 -0
- ai_edge_quantizer/utils/validation_utils_test.py +87 -0
- ai_edge_quantizer_nightly-0.0.1.dev20250115.dist-info/LICENSE +201 -0
- ai_edge_quantizer_nightly-0.0.1.dev20250115.dist-info/METADATA +32 -0
- ai_edge_quantizer_nightly-0.0.1.dev20250115.dist-info/RECORD +63 -0
- ai_edge_quantizer_nightly-0.0.1.dev20250115.dist-info/WHEEL +5 -0
- ai_edge_quantizer_nightly-0.0.1.dev20250115.dist-info/top_level.txt +1 -0
ai_edge_quantizer/utils/tfl_flatbuffer_utils.py
@@ -0,0 +1,317 @@
+# Copyright 2024 The AI Edge Quantizer Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+"""flatbuffer utils for the Quantizer."""
+
+from typing import Any, Optional, Union
+
+import immutabledict
+import numpy as np
+
+from ai_edge_quantizer import qtyping
+from ai_edge_litert import schema_py_generated  # pylint:disable=g-direct-tensorflow-import
+from tensorflow.lite.tools import flatbuffer_utils  # pylint: disable=g-direct-tensorflow-import
+from tensorflow.python.platform import gfile  # pylint: disable=g-direct-tensorflow-import
+
+_TFLOpName = qtyping.TFLOperationName
+
+TFL_OP_NAME_TO_CODE = immutabledict.immutabledict({
+    _TFLOpName.FULLY_CONNECTED: (
+        schema_py_generated.BuiltinOperator.FULLY_CONNECTED
+    ),
+    _TFLOpName.BATCH_MATMUL: schema_py_generated.BuiltinOperator.BATCH_MATMUL,
+    _TFLOpName.CONV_2D: schema_py_generated.BuiltinOperator.CONV_2D,
+    _TFLOpName.DEPTHWISE_CONV_2D: (
+        schema_py_generated.BuiltinOperator.DEPTHWISE_CONV_2D
+    ),
+    _TFLOpName.CONV_2D_TRANSPOSE: (
+        schema_py_generated.BuiltinOperator.TRANSPOSE_CONV
+    ),
+    _TFLOpName.EMBEDDING_LOOKUP: (
+        schema_py_generated.BuiltinOperator.EMBEDDING_LOOKUP
+    ),
+    _TFLOpName.SOFTMAX: schema_py_generated.BuiltinOperator.SOFTMAX,
+    _TFLOpName.AVERAGE_POOL_2D: (
+        schema_py_generated.BuiltinOperator.AVERAGE_POOL_2D
+    ),
+    _TFLOpName.RESHAPE: schema_py_generated.BuiltinOperator.RESHAPE,
+    _TFLOpName.TANH: schema_py_generated.BuiltinOperator.TANH,
+    _TFLOpName.TRANSPOSE: schema_py_generated.BuiltinOperator.TRANSPOSE,
+    _TFLOpName.GELU: schema_py_generated.BuiltinOperator.GELU,
+    _TFLOpName.ADD: schema_py_generated.BuiltinOperator.ADD,
+    _TFLOpName.SUB: schema_py_generated.BuiltinOperator.SUB,
+    _TFLOpName.MUL: schema_py_generated.BuiltinOperator.MUL,
+    _TFLOpName.MEAN: schema_py_generated.BuiltinOperator.MEAN,
+    _TFLOpName.RSQRT: schema_py_generated.BuiltinOperator.RSQRT,
+    _TFLOpName.CONCATENATION: schema_py_generated.BuiltinOperator.CONCATENATION,
+    _TFLOpName.STRIDED_SLICE: schema_py_generated.BuiltinOperator.STRIDED_SLICE,
+    _TFLOpName.SPLIT: schema_py_generated.BuiltinOperator.SPLIT,
+    _TFLOpName.LOGISTIC: schema_py_generated.BuiltinOperator.LOGISTIC,
+    _TFLOpName.SLICE: schema_py_generated.BuiltinOperator.SLICE,
+    _TFLOpName.SUM: schema_py_generated.BuiltinOperator.SUM,
+    _TFLOpName.SELECT_V2: schema_py_generated.BuiltinOperator.SELECT_V2,
+})
+
+TFL_OP_CODE_TO_NAME = immutabledict.immutabledict(
+    dict((reversed(item) for item in TFL_OP_NAME_TO_CODE.items()))
+)
+
+# Quantized dimension for per-channel quantization.
+# See https://www.tensorflow.org/lite/performance/quantization_spec.
+TFL_OP_TO_WEIGHT_QUANTIZED_DIM = immutabledict.immutabledict({
+    _TFLOpName.FULLY_CONNECTED: 0,
+    _TFLOpName.DEPTHWISE_CONV_2D: 3,
+    _TFLOpName.CONV_2D: 0,
+    _TFLOpName.EMBEDDING_LOOKUP: 0,
+    _TFLOpName.CONV_2D_TRANSPOSE: 0,
+})
+
+NUM_TFL_DATATYPES = 18
+TENSOR_CODE_TO_TYPE = {}
+for dtype_code in range(NUM_TFL_DATATYPES):
+  TENSOR_CODE_TO_TYPE[dtype_code] = flatbuffer_utils.type_to_name(dtype_code)
+TENSOR_CODE_TO_TYPE = immutabledict.immutabledict(TENSOR_CODE_TO_TYPE)
+TENSOR_TYPE_TO_CODE = immutabledict.immutabledict(
+    (reversed(item) for item in TENSOR_CODE_TO_TYPE.items())
+)
+
+# Expose functions in tensorflow.lite.tools.flatbuffer_utils
+write_model = flatbuffer_utils.write_model
+
+
+def read_model(tflite_model: Union[str, bytearray]) -> Any:
+  """Read and convert the TFLite model into a flatbuffer object.
+
+  Args:
+    tflite_model: TFLite model path or bytearray.
+
+  Raises:
+    ValueError: Unsupported tflite_model type.
+
+  Returns:
+    flatbuffer_model: the flatbuffer_model.
+  """
+  if isinstance(tflite_model, str):
+    return flatbuffer_utils.read_model(tflite_model)
+  elif isinstance(tflite_model, bytes) or isinstance(tflite_model, bytearray):
+    return flatbuffer_utils.read_model_from_bytearray(tflite_model)
+  else:
+    raise ValueError(
+        "Unsupported tflite_model type: %s" % type(tflite_model).__name__
+    )
+
+
+def get_model_content(tflite_path: str) -> bytes:
+  """Get the model content (bytes) from the path.
+
+  Args:
+    tflite_path: Path to the .tflite.
+
+  Returns:
+    The model bytes.
+  """
+  with gfile.Open(tflite_path, "rb") as tflite_file:
+    return tflite_file.read()
+
+
+def get_model_buffer(tflite_path: str) -> bytearray:
+  """Get the model buffer from the path.
+
+  Args:
+    tflite_path: path to the .tflite.
+
+  Returns:
+    model_buffer: the model buffer.
+  """
+  with gfile.Open(tflite_path, "rb") as tflite_file:
+    return bytearray(tflite_file.read())
+
+
+def parse_op_tensors(op: Any, subgraph_tensors: list[Any]) -> list[Any]:
+  """Parse the op tensors.
+
+  Args:
+    op: the op that need to be parsed.
+    subgraph_tensors: list of tensors in the subgraph.
+
+  Returns:
+    tensors: list of tensors that are associated with the op.
+  """
+
+  tensors = []
+  for tensor_idx in list(op.outputs) + list(op.inputs):
+    if tensor_idx != -1:
+      tensors.append(subgraph_tensors[tensor_idx])
+  return tensors
+
+
+def parse_fc_bmm_conv_tensors(
+    op: Any,
+    subgraph_tensors: list[Any],
+    input_index: int = 0,
+    weight_index: int = 1,
+    bias_index: int = 2,
+    output_index: int = 0,
+) -> tuple[Any, Any, Any, Any]:
+  """Parse tensors in FullyConnected, BatchMatmul, and Convolutions.
+
+  Args:
+    op: the TFLite op, must be fully_connected, batch_matmul, or convolution.
+    subgraph_tensors: tensors in the subgraph.
+    input_index: index for the input tensor.
+    weight_index: index for the weight tensor.
+    bias_index: index for the bias tensor.
+    output_index: index for the output tensor.
+
+  Returns:
+    input_tensor, weight_tensor, bias_tensor, output_tensor
+  """
+
+  input_tensor = subgraph_tensors[op.inputs[input_index]]
+  weight_tensor = subgraph_tensors[op.inputs[weight_index]]
+  bias_tensor = None
+  if bias_index < len(op.inputs) and op.inputs[bias_index] != -1:
+    bias_tensor = subgraph_tensors[op.inputs[bias_index]]
+  output_tensor = subgraph_tensors[op.outputs[output_index]]
+  return input_tensor, weight_tensor, bias_tensor, output_tensor
+
+
+# flatbuffer_model has Any type since tensorflow.lite.tools.flatbuffer_utils
+# is not type annotated.
+def buffer_to_tensors(flatbuffer_model: Any) -> dict[int, list[Any]]:
+  """Get the buffer to tensor map for a tflite model.
+
+  Args:
+    flatbuffer_model: the flatbuffer_model.
+
+  Returns:
+    buffer_to_tensor_map: key as buffer index, value as list of tensors share
+      the buffer
+  """
+  buffer_to_tensor_map = {}
+  for subgraph in flatbuffer_model.subgraphs:
+    for op in subgraph.operators:
+      for tensor in parse_op_tensors(op, subgraph.tensors):
+        if tensor.buffer not in buffer_to_tensor_map:
+          buffer_to_tensor_map[tensor.buffer] = []
+        buffer_to_tensor_map[tensor.buffer].append(tensor)
+  return buffer_to_tensor_map
+
+
+def get_tensor_name(tensor: Any) -> str:
+  """Get the tensor name for a fb tensor.
+
+  Args:
+    tensor: tensor in flatbuffer.
+
+  Returns:
+    tensor_name: name of the buffer
+  """
+  return tensor.name.decode("utf-8")
+
+
+def get_tensor_data(tensor: Any, buffers: list[Any]) -> Optional[np.ndarray]:
+  """Get the tensor data.
+
+  Args:
+    tensor: tensor in flatbuffer.
+    buffers: list of buffers
+
+  Returns:
+    tensor_data: data inside the tensor
+  """
+  tensor_buffer = buffers[tensor.buffer]
+  buffer_data = tensor_buffer.data
+  if buffer_data is None:
+    return None
+  data = np.frombuffer(
+      buffer_data, dtype=TENSOR_CODE_TO_TYPE[tensor.type].lower()
+  )
+  data = np.reshape(data, tensor.shape)
+  return data
+
+
+def has_same_quantization(tensor1: Any, tensor2: Any) -> bool:
+  """Check if two tensors have the same quantization.
+
+  Args:
+    tensor1: tensor in flatbuffer.
+    tensor2: tensor in flatbuffer.
+
+  Returns:
+    True if two tensors have the same quantization.
+  """
+
+  def to_tuple(val):
+    if val is None:
+      val = []
+    return tuple(val)
+
+  same_type = tensor1.type == tensor2.type
+
+  # Return True if both tensors are not quantized.
+  if tensor1.quantization is None and tensor2.quantization is None:
+    return True
+  if tensor1.quantization.scale is None and tensor2.quantization.scale is None:
+    return True
+
+  same_scale = to_tuple(tensor1.quantization.scale) == to_tuple(
+      tensor2.quantization.scale
+  )
+  same_zero_point = to_tuple(tensor1.quantization.zeroPoint) == to_tuple(
+      tensor2.quantization.zeroPoint
+  )
+  same_quantized_dimension = (
+      tensor1.quantization.quantizedDimension
+      == tensor2.quantization.quantizedDimension
+  )
+  return (
+      same_type and same_scale and same_zero_point and same_quantized_dimension
+  )
+
+
+def is_float_model(flatbuffer_model: Any) -> bool:
+  """Checks that the model is float and not already quantized."""
+  for subgraph in flatbuffer_model.subgraphs:
+    for tensor in subgraph.tensors:
+      if tensor.quantization is None:
+        continue
+      if tensor.quantization.scale is not None:
+        return False
+  return True
+
+
+def get_subgraph_input_output_operators(
+    subgraph: Any,
+) -> list[qtyping.IOOperator]:
+  """Get the input/output operators for the subgraph.
+
+  Args:
+    subgraph: The subgraph object.
+
+  Returns:
+    Input and output operators for the subgraph.
+  """
+  input_op = qtyping.IOOperator(
+      inputs=[],
+      outputs=subgraph.inputs,
+      op_key=qtyping.TFLOperationName.INPUT,
+  )
+  output_op = qtyping.IOOperator(
+      inputs=subgraph.outputs,
+      outputs=[],
+      op_key=qtyping.TFLOperationName.OUTPUT,
+  )
+  return [input_op, output_op]
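Taken together, these helpers wrap tensorflow.lite.tools.flatbuffer_utils with quantizer-specific lookups: read a model from a path or raw bytes, check whether it is still float, and walk each op's tensors to pull names and constant data. The sketch below is a hypothetical usage example, not part of the package; the file name "model.tflite" is illustrative, and only functions defined in the diff above are called.

from ai_edge_quantizer.utils import tfl_flatbuffer_utils

# read_model accepts either a file path or raw bytes/bytearray.
model = tfl_flatbuffer_utils.read_model("model.tflite")

# A float (not-yet-quantized) model has no scale set on any tensor;
# this assumes the illustrative model has not been quantized.
assert tfl_flatbuffer_utils.is_float_model(model)

# Walk every op's tensors. Constant tensors come back as numpy arrays
# (dtype resolved through TENSOR_CODE_TO_TYPE); activation tensors have
# no backing buffer data and come back as None.
for subgraph in model.subgraphs:
  for op in subgraph.operators:
    for tensor in tfl_flatbuffer_utils.parse_op_tensors(op, subgraph.tensors):
      name = tfl_flatbuffer_utils.get_tensor_name(tensor)
      data = tfl_flatbuffer_utils.get_tensor_data(tensor, model.buffers)
      if data is not None:
        print(name, data.dtype, data.shape)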
ai_edge_quantizer/utils/tfl_flatbuffer_utils_test.py
@@ -0,0 +1,200 @@
+# Copyright 2024 The AI Edge Quantizer Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+"""Tests for tfl_flatbuffer_utils.py."""
+
+import os
+import numpy as np
+from tensorflow.python.platform import googletest
+from ai_edge_quantizer import qtyping
+from ai_edge_quantizer.utils import test_utils
+from ai_edge_quantizer.utils import tfl_flatbuffer_utils
+
+
+TEST_DATA_PREFIX_PATH = test_utils.get_path_to_datafile("../tests/models")
+
+
+# TODO: b/328830092 - Add test cases for model require buffer offset.
+class FlatbufferUtilsTest(googletest.TestCase):
+
+  def setUp(self):
+    super().setUp()
+    self._test_model_path = os.path.join(
+        TEST_DATA_PREFIX_PATH, "conv_fc_mnist.tflite"
+    )
+
+    self._test_model = tfl_flatbuffer_utils.read_model(self._test_model_path)
+
+  def test_get_model_buffer(self):
+    model_buffer = tfl_flatbuffer_utils.get_model_buffer(self._test_model_path)
+    file_stats = os.stat(self._test_model_path)
+    self.assertLen(model_buffer, file_stats.st_size)
+
+  def test_parse_op_tensors(self):
+    subgraph0 = self._test_model.subgraphs[0]
+    conv2d_op = subgraph0.operators[0]
+    op_tensors = tfl_flatbuffer_utils.parse_op_tensors(
+        conv2d_op, subgraph0.tensors
+    )
+    # conv2d have three inputs and one output
+    self.assertLen(op_tensors, 4)
+
+    average_pool_op = subgraph0.operators[1]
+    op_tensors = tfl_flatbuffer_utils.parse_op_tensors(
+        average_pool_op, subgraph0.tensors
+    )
+    # averagepool have one input and one output
+    self.assertLen(op_tensors, 2)
+
+  def test_parse_fc_bmm_conv_tensors(self):
+    subgraph0 = self._test_model.subgraphs[0]
+    conv2d_op = subgraph0.operators[0]
+    inputs, weight, bias, output = (
+        tfl_flatbuffer_utils.parse_fc_bmm_conv_tensors(
+            conv2d_op, subgraph0.tensors
+        )
+    )
+    self.assertEqual(tuple(inputs.shape), (1, 28, 28, 1))
+    self.assertEqual(tuple(weight.shape), (8, 3, 3, 1))
+    self.assertEqual(tuple(bias.shape), (8,))
+    self.assertEqual(tuple(output.shape), (1, 28, 28, 8))
+
+    fc_with_bias = subgraph0.operators[3]
+    inputs, weight, bias, output = (
+        tfl_flatbuffer_utils.parse_fc_bmm_conv_tensors(
+            fc_with_bias,
+            subgraph0.tensors,
+        )
+    )
+    self.assertEqual(tuple(inputs.shape), (1, 1568))
+    self.assertEqual(tuple(weight.shape), (32, 1568))
+    self.assertEqual(tuple(bias.shape), (32,))
+    self.assertEqual(tuple(output.shape), (1, 32))
+
+    fc_no_bias = subgraph0.operators[4]
+    inputs, weight, bias, output = (
+        tfl_flatbuffer_utils.parse_fc_bmm_conv_tensors(
+            fc_no_bias,
+            subgraph0.tensors,
+        )
+    )
+    self.assertEqual(tuple(inputs.shape), (1, 32))
+    self.assertEqual(tuple(weight.shape), (10, 32))
+    self.assertIsNone(bias)
+    self.assertEqual(tuple(output.shape), (1, 10))
+
+  def test_buffer_to_tensors(self):
+    buffer_to_tensor_map = tfl_flatbuffer_utils.buffer_to_tensors(
+        self._test_model
+    )
+    # Read from Netron/Model Explorer
+    tensors = buffer_to_tensor_map[6]
+    self.assertLen(tensors, 1)
+    conv2d_filter_tensor = tensors[0]
+    self.assertEqual(tuple(conv2d_filter_tensor.shape), (8, 3, 3, 1))
+
+  def test_get_tensor_name(self):
+    subgraph0 = self._test_model.subgraphs[0]
+    subgraph_tensors = subgraph0.tensors
+    conv2d_op = subgraph0.operators[0]
+    weight_tensor = subgraph_tensors[conv2d_op.inputs[1]]
+    weight_tensor_name = tfl_flatbuffer_utils.get_tensor_name(weight_tensor)
+    self.assertEqual(weight_tensor_name, "sequential/conv2d/Conv2D")
+
+  # TODO: b/325123193 - test tensor with data outside of flatbuffer.
+  def test_get_tensor_data(self):
+    subgraph0 = self._test_model.subgraphs[0]
+    subgraph_tensors = subgraph0.tensors
+    conv2d_op = subgraph0.operators[0]
+    # Check tensor with data
+    weight_tensor = subgraph_tensors[conv2d_op.inputs[1]]
+    weight_tensor_data = tfl_flatbuffer_utils.get_tensor_data(
+        weight_tensor, self._test_model.buffers
+    )
+    self.assertEqual(
+        tuple(weight_tensor.shape), tuple(weight_tensor_data.shape)  # pytype: disable=attribute-error
+    )
+    self.assertAlmostEqual(weight_tensor_data[0][0][0][0], -0.12941549718379974)
+
+    # Check tensor with no data
+    input_tensor = subgraph_tensors[conv2d_op.inputs[0]]
+    input_tensor_data = tfl_flatbuffer_utils.get_tensor_data(
+        input_tensor, self._test_model.buffers
+    )
+    self.assertIsNone(input_tensor_data)
+
+  def test_has_same_quantization_succeeds(self):
+    tensor0, tensor1 = self._test_model.subgraphs[0].tensors[:2]
+    tensor0.quantization.scale = np.array([1, 2, 3]).astype(np.float32)
+    tensor0.quantization.zeroPoint = np.array([3, 2, 1]).astype(np.int32)
+    tensor1.quantization.scale = np.array([1, 2, 3]).astype(np.float32)
+    tensor1.quantization.zeroPoint = np.array([3, 2, 1]).astype(np.int32)
+    self.assertTrue(
+        tfl_flatbuffer_utils.has_same_quantization(tensor0, tensor1)
+    )
+
+  def test_has_same_quantization_succeds_not_quantized(self):
+    tensor0, tensor1 = self._test_model.subgraphs[0].tensors[:2]
+    tensor0.type = 10
+    self.assertTrue(
+        tfl_flatbuffer_utils.has_same_quantization(tensor0, tensor1)
+    )
+
+  def test_has_same_quantization_fails_different_scale(self):
+    tensor0, tensor1 = self._test_model.subgraphs[0].tensors[:2]
+    tensor1.quantization.scale = np.array([1, 2, 3]).astype(np.float32)
+    self.assertFalse(
+        tfl_flatbuffer_utils.has_same_quantization(tensor0, tensor1)
+    )
+
+  def test_has_same_quantization_fails_different_zp(self):
+    tensor0, tensor1 = self._test_model.subgraphs[0].tensors[:2]
+    tensor0.quantization.scale = np.array([1, 2, 3]).astype(np.float32)
+    tensor0.quantization.zeroPoint = np.array([3, 2, 1]).astype(np.int32)
+    tensor1.quantization.scale = np.array([1, 2, 3]).astype(np.float32)
+    tensor1.quantization.zeroPoint = np.array([1, 2, 3]).astype(np.int32)
+    self.assertFalse(
+        tfl_flatbuffer_utils.has_same_quantization(tensor0, tensor1)
+    )
+
+  def test_check_is_float_model_true_when_model_is_float(self):
+    test_model_path = os.path.join(
+        TEST_DATA_PREFIX_PATH, "conv_fc_mnist.tflite"
+    )
+    model = tfl_flatbuffer_utils.read_model(test_model_path)
+    self.assertTrue(tfl_flatbuffer_utils.is_float_model(model))
+
+  def test_check_is_float_model_false_when_model_is_quantized(self):
+    test_model_path = os.path.join(
+        TEST_DATA_PREFIX_PATH, "mnist_quantized.tflite"
+    )
+    model = tfl_flatbuffer_utils.read_model(test_model_path)
+    self.assertFalse(tfl_flatbuffer_utils.is_float_model(model))
+
+  def test_get_subgraph_input_output_operators(self):
+    subgraph = self._test_model.subgraphs[0]
+    input_op, output_op = (
+        tfl_flatbuffer_utils.get_subgraph_input_output_operators(subgraph)
+    )
+    self.assertEqual(input_op.op_key, qtyping.TFLOperationName.INPUT)
+    self.assertEmpty(input_op.inputs)
+    self.assertListEqual(list(input_op.outputs), [0])
+    self.assertEqual(output_op.op_key, qtyping.TFLOperationName.OUTPUT)
+    self.assertListEqual(list(output_op.inputs), [12])
+    self.assertEmpty(output_op.outputs)
+
+
+if __name__ == "__main__":
+  googletest.main()
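One behavior worth noting, which test_has_same_quantization_succeds_not_quantized above depends on: has_same_quantization returns True before its type comparison whenever neither tensor carries a quantization scale, so two unquantized tensors compare equal even with different dtype codes. A minimal sketch of that semantics, assuming the same conv_fc_mnist.tflite float test model (the path here is illustrative):

from ai_edge_quantizer.utils import tfl_flatbuffer_utils

model = tfl_flatbuffer_utils.read_model("conv_fc_mnist.tflite")
tensor0, tensor1 = model.subgraphs[0].tensors[:2]

tensor0.type = 10  # change one tensor's dtype code, as the test does
# Still True: neither tensor has quantization.scale set, so the helper
# short-circuits before the dtype comparison is ever consulted.
assert tfl_flatbuffer_utils.has_same_quantization(tensor0, tensor1)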