
Commit

Merge pull request PINTO0309#100 from PINTO0309/TFLite_ModelAnalyzer
TFLite ModelAnalyzer (Check if the model can be supported by GPU Delegate, 6D Transpose to xxxD Transpose)
PINTO0309 authored Jan 6, 2023
2 parents ed2c636 + 968e3e6 commit dd6d732
Showing 3 changed files with 154 additions and 2 deletions.
121 changes: 120 additions & 1 deletion README.md
@@ -89,7 +89,7 @@ Video speed is adjusted approximately 50 times slower than actual speed.
$ docker run --rm -it \
-v `pwd`:/workdir \
-w /workdir \
- ghcr.io/pinto0309/onnx2tf:1.3.19
+ ghcr.io/pinto0309/onnx2tf:1.4.0
or
@@ -197,6 +197,7 @@ usage: onnx2tf
[-rerf]
[-me]
[-prf PARAM_REPLACEMENT_FILE]
[-cgdc]
[-n]
optional arguments:
@@ -429,6 +430,64 @@ optional arguments:
-prf PARAM_REPLACEMENT_FILE, --param_replacement_file PARAM_REPLACEMENT_FILE
Parameter replacement file path. (.json)
-cgdc, --check_gpu_delegate_compatibility
Run TFLite ModelAnalyzer on the generated Float16 tflite model
to check if the model can be supported by GPU Delegate.
e.g.
"""
=== TFLite ModelAnalyzer ===
Your TFLite model has '1' subgraph(s). In the subgraph description below,
T# represents the Tensor numbers. For example, in Subgraph#0, the RESHAPE op takes
tensor #0 and tensor #6 as input and produces tensor #7 as output.
Subgraph#0 main(T#0) -> [T#17]
Op#0 RESHAPE(T#0, T#6[2, 8, 8, 3, 2, ...]) -> [T#7]
Op#1 SPLIT(T#5[0], T#7) -> [T#8, T#9]
Op#2 RESHAPE(T#8, T#1[8, 8, 3, 2, 2]) -> [T#10]
Op#3 TRANSPOSE(T#10, T#4[0, 3, 1, 4, 2]) -> [T#11]
Op#4 RESHAPE(T#11, T#2[1, 8, 2, 8, 2, ...]) -> [T#12]
Op#5 RESHAPE(T#9, T#1[8, 8, 3, 2, 2]) -> [T#13]
Op#6 TRANSPOSE(T#13, T#4[0, 3, 1, 4, 2]) -> [T#14]
Op#7 RESHAPE(T#14, T#2[1, 8, 2, 8, 2, ...]) -> [T#15]
Op#8 CONCATENATION(T#12, T#15) -> [T#16]
Op#9 RESHAPE(T#16, T#3[2, 16, 16, 3]) -> [T#17]
Tensors of Subgraph#0
T#0(inputs_0) shape:[2, 8, 8, 12], type:FLOAT32
T#1(model/tf.compat.v1.squeeze_2/Squeeze) shape:[5], type:INT32 RO 20 bytes, data:[8, 8, 3, 2, 2]
T#2(model/tf.expand_dims_1/ExpandDims) shape:[6], type:INT32 RO 24 bytes, data:[1, 8, 2, 8, 2, ...]
T#3(model/tf.reshape_1/Reshape/shape) shape:[4], type:INT32 RO 16 bytes, data:[2, 16, 16, 3]
T#4(model/tf.compat.v1.transpose/transpose/perm) shape:[5], type:INT32 RO 20 bytes, data:[0, 3, 1, 4, 2]
T#5(model/tf.concat/concat/axis) shape:[], type:INT32 RO 4 bytes, data:[0]
T#6(model/tf.reshape/Reshape/shape) shape:[6], type:INT32 RO 24 bytes, data:[2, 8, 8, 3, 2, ...]
T#7(model/tf.reshape/Reshape) shape:[2, 8, 8, 3, 2, 2], type:FLOAT32
T#8(model/tf.split/split) shape:[1, 8, 8, 3, 2, 2], type:FLOAT32
T#9(model/tf.split/split1) shape:[1, 8, 8, 3, 2, 2], type:FLOAT32
T#10(model/tf.compat.v1.squeeze_1/Squeeze) shape:[8, 8, 3, 2, 2], type:FLOAT32
T#11(model/tf.compat.v1.transpose/transpose) shape:[8, 2, 8, 2, 3], type:FLOAT32
T#12(model/tf.expand_dims/ExpandDims) shape:[1, 8, 2, 8, 2, 3], type:FLOAT32
T#13(model/tf.compat.v1.squeeze_2/Squeeze1) shape:[8, 8, 3, 2, 2], type:FLOAT32
T#14(model/tf.compat.v1.transpose_1/transpose) shape:[8, 2, 8, 2, 3], type:FLOAT32
T#15(model/tf.expand_dims_1/ExpandDims1) shape:[1, 8, 2, 8, 2, 3], type:FLOAT32
T#16(model/tf.concat/concat) shape:[2, 8, 2, 8, 2, 3], type:FLOAT32
T#17(Identity) shape:[2, 16, 16, 3], type:FLOAT32
Your model looks compatibile with GPU delegate with TFLite runtime version 2.10.0.
But it doesn't guarantee that your model works well with GPU delegate.
There could be some runtime incompatibililty happen.
---------------------------------------------------------------
Model size: 2988 bytes
Non-data buffer size: 2757 bytes (92.27 %)
Total data buffer size: 231 bytes (07.73 %)
(Zero value buffers): 4 bytes (00.13 %)
* Buffers of TFLite model are mostly used for constant tensors.
And zero value buffers are buffers filled with zeros.
Non-data buffers area are used to store operators, subgraphs and etc.
You can find more details from https://github.com/tensorflow/tensorflow/blob/master/tensorflow/lite/schema/schema.fbs
"""
-n, --non_verbose
Do not show all information logs. Only error logs are displayed.
```
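For reference, the same GPU Delegate compatibility report can be produced for an already-exported tflite file with TensorFlow's ModelAnalyzer. A minimal sketch, assuming the Float16 model was written to `saved_model/model_float16.tflite` (the path is illustrative):

```python
import tensorflow as tf

# Print the GPU Delegate compatibility report for an exported model.
# The file path below is an assumption; point it at your generated
# Float16 tflite model.
tf.lite.experimental.Analyzer.analyze(
    model_path='saved_model/model_float16.tflite',
    gpu_compatibility=True,
)
```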
@@ -478,6 +537,7 @@ convert(
replace_erf_to_pseudo_erf: Optional[bool] = False,
mvn_epsilon: Union[float, NoneType] = 0.0000000001,
param_replacement_file: Optional[str] = '',
check_gpu_delegate_compatibility: Optional[bool] = False,
non_verbose: Union[bool, NoneType] = False
) -> keras.engine.training.Model

@@ -717,6 +777,65 @@ convert(
param_replacement_file: Optional[str]
Parameter replacement file path. (.json)

check_gpu_delegate_compatibility: Optional[bool]
Run TFLite ModelAnalyzer on the generated Float16 tflite model
to check if the model can be supported by GPU Delegate.
e.g.
"""
=== TFLite ModelAnalyzer ===
Your TFLite model has '1' subgraph(s). In the subgraph description below,
T# represents the Tensor numbers. For example, in Subgraph#0, the RESHAPE op takes
tensor #0 and tensor #6 as input and produces tensor #7 as output.
Subgraph#0 main(T#0) -> [T#17]
Op#0 RESHAPE(T#0, T#6[2, 8, 8, 3, 2, ...]) -> [T#7]
Op#1 SPLIT(T#5[0], T#7) -> [T#8, T#9]
Op#2 RESHAPE(T#8, T#1[8, 8, 3, 2, 2]) -> [T#10]
Op#3 TRANSPOSE(T#10, T#4[0, 3, 1, 4, 2]) -> [T#11]
Op#4 RESHAPE(T#11, T#2[1, 8, 2, 8, 2, ...]) -> [T#12]
Op#5 RESHAPE(T#9, T#1[8, 8, 3, 2, 2]) -> [T#13]
Op#6 TRANSPOSE(T#13, T#4[0, 3, 1, 4, 2]) -> [T#14]
Op#7 RESHAPE(T#14, T#2[1, 8, 2, 8, 2, ...]) -> [T#15]
Op#8 CONCATENATION(T#12, T#15) -> [T#16]
Op#9 RESHAPE(T#16, T#3[2, 16, 16, 3]) -> [T#17]
Tensors of Subgraph#0
T#0(inputs_0) shape:[2, 8, 8, 12], type:FLOAT32
T#1(model/tf.compat.v1.squeeze_2/Squeeze) shape:[5], type:INT32 RO 20 bytes, data:[8, 8, 3, 2, 2]
T#2(model/tf.expand_dims_1/ExpandDims) shape:[6], type:INT32 RO 24 bytes, data:[1, 8, 2, 8, 2, ...]
T#3(model/tf.reshape_1/Reshape/shape) shape:[4], type:INT32 RO 16 bytes, data:[2, 16, 16, 3]
T#4(model/tf.compat.v1.transpose/transpose/perm) shape:[5], type:INT32 RO 20 bytes, data:[0, 3, 1, 4, 2]
T#5(model/tf.concat/concat/axis) shape:[], type:INT32 RO 4 bytes, data:[0]
T#6(model/tf.reshape/Reshape/shape) shape:[6], type:INT32 RO 24 bytes, data:[2, 8, 8, 3, 2, ...]
T#7(model/tf.reshape/Reshape) shape:[2, 8, 8, 3, 2, 2], type:FLOAT32
T#8(model/tf.split/split) shape:[1, 8, 8, 3, 2, 2], type:FLOAT32
T#9(model/tf.split/split1) shape:[1, 8, 8, 3, 2, 2], type:FLOAT32
T#10(model/tf.compat.v1.squeeze_1/Squeeze) shape:[8, 8, 3, 2, 2], type:FLOAT32
T#11(model/tf.compat.v1.transpose/transpose) shape:[8, 2, 8, 2, 3], type:FLOAT32
T#12(model/tf.expand_dims/ExpandDims) shape:[1, 8, 2, 8, 2, 3], type:FLOAT32
T#13(model/tf.compat.v1.squeeze_2/Squeeze1) shape:[8, 8, 3, 2, 2], type:FLOAT32
T#14(model/tf.compat.v1.transpose_1/transpose) shape:[8, 2, 8, 2, 3], type:FLOAT32
T#15(model/tf.expand_dims_1/ExpandDims1) shape:[1, 8, 2, 8, 2, 3], type:FLOAT32
T#16(model/tf.concat/concat) shape:[2, 8, 2, 8, 2, 3], type:FLOAT32
T#17(Identity) shape:[2, 16, 16, 3], type:FLOAT32
Your model looks compatibile with GPU delegate with TFLite runtime version 2.10.0.
But it doesn't guarantee that your model works well with GPU delegate.
There could be some runtime incompatibililty happen.
---------------------------------------------------------------
Model size: 2988 bytes
Non-data buffer size: 2757 bytes (92.27 %)
Total data buffer size: 231 bytes (07.73 %)
(Zero value buffers): 4 bytes (00.13 %)
* Buffers of TFLite model are mostly used for constant tensors.
And zero value buffers are buffers filled with zeros.
Non-data buffers area are used to store operators, subgraphs and etc.
You can find more details from https://github.com/tensorflow/tensorflow/blob/master/tensorflow/lite/schema/schema.fbs
"""


non_verbose: Optional[bool]
Do not show all information logs. Only error logs are displayed.
Default: False
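
A minimal sketch of driving the same check through the Python API, assuming a local `model.onnx` (the file name is illustrative):

```python
from onnx2tf import convert

# Convert an ONNX file and run TFLite ModelAnalyzer on the generated
# Float16 tflite model to check GPU Delegate compatibility.
model = convert(
    input_onnx_file_path='model.onnx',   # illustrative input path
    output_folder_path='saved_model',
    check_gpu_delegate_compatibility=True,
)
```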
2 changes: 1 addition & 1 deletion onnx2tf/__init__.py
@@ -1,3 +1,3 @@
from onnx2tf.onnx2tf import convert, main

-__version__ = '1.3.19'
+__version__ = '1.4.0'
33 changes: 33 additions & 0 deletions onnx2tf/onnx2tf.py
@@ -80,6 +80,7 @@ def convert(
replace_hardswish_to_pseudo_hardswish: Optional[bool] = False,
replace_erf_to_pseudo_erf: Optional[bool] = False,
param_replacement_file: Optional[str] = '',
check_gpu_delegate_compatibility: Optional[bool] = False,
mvn_epsilon: Optional[float] = 0.0000000001,
non_verbose: Optional[bool] = False,
) -> tf.keras.Model:
@@ -319,6 +320,10 @@ def convert(
param_replacement_file: Optional[str]
Parameter replacement file path. (.json)
check_gpu_delegate_compatibility: Optional[bool]
Run TFLite ModelAnalyzer on the generated Float16 tflite model\n
to check if the model can be supported by GPU Delegate.
non_verbose: Optional[bool]
Do not show all information logs. Only error logs are displayed.\n
Default: False
@@ -714,6 +719,24 @@ def convert(
if not non_verbose:
print(f'{Color.GREEN}Float16 tflite output complete!{Color.RESET}')

# Run TFLite ModelAnalyzer on the generated Float16 tflite model
# to check if the model can be supported by GPU Delegate.
if check_gpu_delegate_compatibility:
print('')
try:
tf.lite.experimental.Analyzer.analyze(
model_content=tflite_model,
gpu_compatibility=True,
)
except Exception as ex:
if not non_verbose:
import traceback
traceback.print_exc()
print(
f'{Color.YELLOW}WARNING:{Color.RESET} '+
'TFLite ModelAnalyzer failed.'
)

# Quantized TFLite
if output_integer_quantized_tflite:
# Dynamic Range Quantization
@@ -1275,6 +1298,15 @@ def main():
default='',
help='Parameter replacement file path. (.json)'
)
parser.add_argument(
'-cgdc',
'--check_gpu_delegate_compatibility',
action='store_true',
help=\
'Run TFLite ModelAnalyzer on the generated Float16 tflite model ' +
'to check if the model can be supported by GPU Delegate.'
)
parser.add_argument(
'-n',
'--non_verbose',
@@ -1344,6 +1376,7 @@ def main():
replace_hardswish_to_pseudo_hardswish=args.replace_hardswish_to_pseudo_hardswish,
replace_erf_to_pseudo_erf=args.replace_erf_to_pseudo_erf,
param_replacement_file=args.param_replacement_file,
check_gpu_delegate_compatibility=args.check_gpu_delegate_compatibility,
mvn_epsilon=args.mvn_epsilon,
non_verbose=args.non_verbose,
)
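
For completeness, a rough sketch of exercising the new flag through the CLI entry point from Python, assuming the converter's usual `-i` input option and a local `model.onnx` (both are assumptions here):

```python
import sys
from onnx2tf import main

# Roughly equivalent to running: onnx2tf -i model.onnx -cgdc
# main() parses sys.argv via argparse, so patch it before the call.
sys.argv = ['onnx2tf', '-i', 'model.onnx', '-cgdc']
main()
```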
