ai-edge-quantizer-nightly 0.1.0.dev20250427__py3-none-any.whl → 0.1.0.dev20250429__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ai_edge_quantizer/model_modifier.py +2 -2
- ai_edge_quantizer/utils/tfl_interpreter_utils.py +30 -5
- ai_edge_quantizer/utils/tfl_interpreter_utils_test.py +19 -2
- {ai_edge_quantizer_nightly-0.1.0.dev20250427.dist-info → ai_edge_quantizer_nightly-0.1.0.dev20250429.dist-info}/METADATA +1 -1
- {ai_edge_quantizer_nightly-0.1.0.dev20250427.dist-info → ai_edge_quantizer_nightly-0.1.0.dev20250429.dist-info}/RECORD +8 -8
- {ai_edge_quantizer_nightly-0.1.0.dev20250427.dist-info → ai_edge_quantizer_nightly-0.1.0.dev20250429.dist-info}/LICENSE +0 -0
- {ai_edge_quantizer_nightly-0.1.0.dev20250427.dist-info → ai_edge_quantizer_nightly-0.1.0.dev20250429.dist-info}/WHEEL +0 -0
- {ai_edge_quantizer_nightly-0.1.0.dev20250427.dist-info → ai_edge_quantizer_nightly-0.1.0.dev20250429.dist-info}/top_level.txt +0 -0
@@ -104,8 +104,8 @@ class ModelModifier:
|
|
104
104
|
instructions, quantized_model, tensor_processing_order
|
105
105
|
)
|
106
106
|
constant_buffer_size = self._process_constant_map(quantized_model)
|
107
|
-
# we leave
|
108
|
-
if constant_buffer_size > 2**31 - 2**
|
107
|
+
# we leave 256MB for the model architecture.
|
108
|
+
if constant_buffer_size > 2**31 - 2**28:
|
109
109
|
return self._serialize_large_model(quantized_model)
|
110
110
|
else:
|
111
111
|
return self._serialize_small_model(quantized_model)
|
@@ -319,7 +319,27 @@ def get_signature_main_subgraph_index(
|
|
319
319
|
return signature_runner._subgraph_index # pylint:disable=protected-access
|
320
320
|
|
321
321
|
|
322
|
-
def create_random_normal_dataset(
|
322
|
+
def _create_random_normal(
|
323
|
+
rng: np.random.Generator,
|
324
|
+
shape: tuple[int, ...],
|
325
|
+
dtype: np.dtype,
|
326
|
+
) -> dict[str, Any]:
|
327
|
+
"""Creates a random normal dataset sample for given input details."""
|
328
|
+
return rng.normal(size=shape).astype(dtype)
|
329
|
+
|
330
|
+
|
331
|
+
def _create_random_integers(
|
332
|
+
rng: np.random.Generator,
|
333
|
+
shape: tuple[int, ...],
|
334
|
+
dtype: np.dtype,
|
335
|
+
min_value: int = 0,
|
336
|
+
max_value: int = 1024,
|
337
|
+
) -> dict[str, Any]:
|
338
|
+
"""Creates a random integer dataset sample for given input details."""
|
339
|
+
return rng.integers(min_value, max_value, size=shape, dtype=dtype)
|
340
|
+
|
341
|
+
|
342
|
+
def create_random_dataset(
|
323
343
|
input_details: dict[str, Any],
|
324
344
|
num_samples: int,
|
325
345
|
random_seed: Union[int, np._typing.ArrayLike],
|
@@ -340,9 +360,14 @@ def create_random_normal_dataset(
|
|
340
360
|
for _ in range(num_samples):
|
341
361
|
input_data = {}
|
342
362
|
for arg_name, input_tensor in input_details.items():
|
343
|
-
|
344
|
-
|
345
|
-
)
|
363
|
+
dtype = input_tensor["dtype"]
|
364
|
+
shape = input_tensor["shape"]
|
365
|
+
if dtype in (np.int32, np.int64):
|
366
|
+
new_data = _create_random_integers(rng, shape, dtype)
|
367
|
+
elif dtype == np.float32:
|
368
|
+
new_data = _create_random_normal(rng, shape, dtype)
|
369
|
+
else:
|
370
|
+
raise ValueError(f"Unsupported dtype: {input_tensor['dtype']}")
|
346
371
|
input_data[arg_name] = new_data
|
347
372
|
dataset.append(input_data)
|
348
373
|
return dataset
|
@@ -372,7 +397,7 @@ def create_random_normal_input_data(
|
|
372
397
|
for signature_key in signature_keys:
|
373
398
|
signature_runner = tfl_interpreter.get_signature_runner(signature_key)
|
374
399
|
input_details = signature_runner.get_input_details()
|
375
|
-
test_data[signature_key] = create_random_normal_dataset(
|
400
|
+
test_data[signature_key] = create_random_dataset(
|
376
401
|
input_details, num_samples, random_seed
|
377
402
|
)
|
378
403
|
return test_data
|
@@ -19,7 +19,6 @@ from tensorflow.python.platform import googletest
|
|
19
19
|
from ai_edge_quantizer.utils import test_utils
|
20
20
|
from ai_edge_quantizer.utils import tfl_interpreter_utils
|
21
21
|
|
22
|
-
|
23
22
|
TEST_DATA_PREFIX_PATH = test_utils.get_path_to_datafile("../tests/models")
|
24
23
|
|
25
24
|
|
@@ -159,7 +158,6 @@ class TflUtilsQuantizedModelTest(googletest.TestCase):
|
|
159
158
|
signature_output = tfl_interpreter_utils.invoke_interpreter_signature(
|
160
159
|
tfl_interpreter, self._signature_input_data
|
161
160
|
)
|
162
|
-
print(signature_output)
|
163
161
|
self.assertEqual(tuple(signature_output["dense_1"].shape), (1, 10))
|
164
162
|
|
165
163
|
# Assert the input data is not modified in-place b/353340272.
|
@@ -328,5 +326,24 @@ class TflUtilsMultiSignatureModelTest(googletest.TestCase):
|
|
328
326
|
self.assertEqual(multiply_output_content, [20.0])
|
329
327
|
|
330
328
|
|
329
|
+
class TflUtilsIntegerInputModelTest(googletest.TestCase):
|
330
|
+
|
331
|
+
def setUp(self):
|
332
|
+
super().setUp()
|
333
|
+
np.random.seed(0)
|
334
|
+
self._test_model_path = os.path.join(
|
335
|
+
TEST_DATA_PREFIX_PATH, "toy_model_with_kv_cache_multi_signature.tflite"
|
336
|
+
)
|
337
|
+
|
338
|
+
def test_random_integer_input_data(self):
|
339
|
+
test_data = tfl_interpreter_utils.create_random_normal_input_data(
|
340
|
+
self._test_model_path
|
341
|
+
)
|
342
|
+
self.assertEqual(test_data["signature_1"][0]["cache_0"].dtype, np.float32)
|
343
|
+
self.assertEqual(test_data["signature_1"][0]["cache_1"].dtype, np.float32)
|
344
|
+
self.assertEqual(test_data["signature_1"][0]["positions"].dtype, np.int32)
|
345
|
+
self.assertEqual(test_data["signature_1"][0]["tokens"].dtype, np.int32)
|
346
|
+
|
347
|
+
|
331
348
|
if __name__ == "__main__":
|
332
349
|
googletest.main()
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: ai-edge-quantizer-nightly
|
3
|
-
Version: 0.1.0.dev20250427
|
3
|
+
Version: 0.1.0.dev20250429
|
4
4
|
Summary: A quantizer for advanced developers to quantize converted AI Edge models.
|
5
5
|
Home-page: https://github.com/google-ai-edge/ai-edge-quantizer
|
6
6
|
Keywords: On-Device ML,AI,Google,TFLite,Quantization,LLMs,GenAI
|
@@ -6,7 +6,7 @@ ai_edge_quantizer/calibrator.py,sha256=n7AD9j7UScR-CieoI6DQRMeiG_fhLBfSLRiM4460x
|
|
6
6
|
ai_edge_quantizer/calibrator_test.py,sha256=C_oWOaRugPKYX74jF-eRFH-k6nGOdA8I9_uPiocaOuE,11900
|
7
7
|
ai_edge_quantizer/conftest.py,sha256=SxCz-5LlRD_lQm4hQc4c6IGG7DS8d7IyEWY9gnscPN0,794
|
8
8
|
ai_edge_quantizer/default_policy.py,sha256=81z4cruBK7mGFt8xFRZK5LKya65axuZwo2zpbcYSicc,11099
|
9
|
-
ai_edge_quantizer/model_modifier.py,sha256=
|
9
|
+
ai_edge_quantizer/model_modifier.py,sha256=teGa8I6kGvn6TQY6Xv53YFIc_pQEhNvM9Zb4bvhezyw,7110
|
10
10
|
ai_edge_quantizer/model_modifier_test.py,sha256=cJd04SLOG-fQZZNZPcisoBLx3cLtWEwGqUBbLb-pif4,4751
|
11
11
|
ai_edge_quantizer/model_validator.py,sha256=fRNz0jO54cthPTibsCuViUXUuFRHl_fbvEiCukIVy20,13030
|
12
12
|
ai_edge_quantizer/model_validator_test.py,sha256=EeqOP_mrZsnZ3rug756s0ryDDqd2KgIDld5Lm_gDuWY,13020
|
@@ -62,12 +62,12 @@ ai_edge_quantizer/utils/calibration_utils_test.py,sha256=Z-AcdTieesWFKyKBb08ZXm4
|
|
62
62
|
ai_edge_quantizer/utils/test_utils.py,sha256=HwZCIpO9fJRAhuN6t6voXKOYQtcioFtt_tpkAlDsAYk,6205
|
63
63
|
ai_edge_quantizer/utils/tfl_flatbuffer_utils.py,sha256=NKtw60BJAjIE6Yww8B1vJpxXwp4MSERmpKajXJWm5rI,10568
|
64
64
|
ai_edge_quantizer/utils/tfl_flatbuffer_utils_test.py,sha256=K1SbK8q92qYVtiVj0I0GtugsPTkpIpEKv9zakvFV_Sc,8555
|
65
|
-
ai_edge_quantizer/utils/tfl_interpreter_utils.py,sha256=
|
66
|
-
ai_edge_quantizer/utils/tfl_interpreter_utils_test.py,sha256=
|
65
|
+
ai_edge_quantizer/utils/tfl_interpreter_utils.py,sha256=WoewyiZpaua80oP0tpgyrw5Ws1v7f4vl88vdzS0UjDE,13490
|
66
|
+
ai_edge_quantizer/utils/tfl_interpreter_utils_test.py,sha256=6fjkM-rycZ95L4yfvlr0TN6RlrhfPzxNUYrZaYO_F0A,12013
|
67
67
|
ai_edge_quantizer/utils/validation_utils.py,sha256=oYw33Sg547AqtGw-choPUJmp9SAKkV46J_ddqSsum2Q,3950
|
68
68
|
ai_edge_quantizer/utils/validation_utils_test.py,sha256=V_qNDikPD4OPB-siOLQCWNVWTAu87h2IgNYt7teFd-o,2934
|
69
|
-
ai_edge_quantizer_nightly-0.1.0.dev20250427.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
70
|
-
ai_edge_quantizer_nightly-0.1.0.dev20250427.dist-info/METADATA,sha256=
|
71
|
-
ai_edge_quantizer_nightly-0.1.0.dev20250427.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
|
72
|
-
ai_edge_quantizer_nightly-0.1.0.dev20250427.dist-info/top_level.txt,sha256=8QTfPnFXNVUhScFLaa-NWZMFWMn72M50DVPubpwWB1g,18
|
73
|
-
ai_edge_quantizer_nightly-0.1.0.dev20250427.dist-info/RECORD,,
|
69
|
+
ai_edge_quantizer_nightly-0.1.0.dev20250429.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
70
|
+
ai_edge_quantizer_nightly-0.1.0.dev20250429.dist-info/METADATA,sha256=uL3RUBECU5YAPHCJ8tNR8CaVFIQN1Bq-Mc4now2cpJw,1527
|
71
|
+
ai_edge_quantizer_nightly-0.1.0.dev20250429.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
|
72
|
+
ai_edge_quantizer_nightly-0.1.0.dev20250429.dist-info/top_level.txt,sha256=8QTfPnFXNVUhScFLaa-NWZMFWMn72M50DVPubpwWB1g,18
|
73
|
+
ai_edge_quantizer_nightly-0.1.0.dev20250429.dist-info/RECORD,,
|
File without changes
|
File without changes
|