# TensorFlow2 转换为 ONNX 推理

参考：[migrating_checkpoints](https://www.tensorflow.org/guide/migrate/migrating_checkpoints)

下面以模型 [resnet_v2_50](http://download.tensorflow.org/models/resnet_v2_50_2017_04_14.tar.gz) 为例展示。

需要克隆项目 [models](https://github.com/tensorflow/models)，然后执行如下操作。

In [1]:
import tensorflow as tf
try:
    tf1 = tf.compat.v1
except (ImportError, AttributeError):
    tf1 = tf
tf.get_logger().setLevel('ERROR')

2023-06-16 17:32:16.513696: I tensorflow/tsl/cuda/cudart_stub.cc:28] Could not find cuda drivers on your machine, GPU will not be used.
2023-06-16 17:32:16.563629: I tensorflow/tsl/cuda/cudart_stub.cc:28] Could not find cuda drivers on your machine, GPU will not be used.
2023-06-16 17:32:16.564661: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


切换到 `models/research/slim` 目录下：

In [2]:
%cd /media/pc/data/lxw/ai/tasks/models/research/slim

/media/pc/data/lxw/ai/tasks/models/research/slim


将 TF1 升级为 TF2：

In [3]:
from nets import resnet_v2
import tf_slim as slim


class ResnetV2_50_block(tf.keras.layers.Layer):
    def __init__(self, trainable=False, 
                 name="resnet_v2_50", 
                 dtype=None, dynamic=False, **kwargs):
        super().__init__(trainable, name, dtype, dynamic, **kwargs)

    @tf1.keras.utils.track_tf1_style_variables
    def call(self, inputs):
        with slim.arg_scope(resnet_v2.resnet_arg_scope()):
            logits, end_points = resnet_v2.resnet_v2_50(
                inputs, 
                num_classes=1001,
                global_pool=True,
                is_training=self.trainable,
                scope=self.name
            )
        del end_points
        return tf.nn.softmax(logits)

class ResnetV2_50(tf.keras.Model):
    def __init__(self, trainable=False, 
                 name="resnet_v2_50", 
                 dtype=None, dynamic=False, **kwargs):
        super().__init__()
        self.block = ResnetV2_50_block(
            trainable=trainable, 
            name=name, dtype=dtype, 
            dynamic=dynamic, **kwargs
        )

    @tf.function(input_signature=[tf.TensorSpec([None, 224, 224, 3], 
                                                 tf.float32, name="data")])
    def call(self, inputs):
        x = self.block(inputs)
        return x

预处理：

In [4]:
from PIL import Image
import numpy as np
from nets import resnet_v2
from preprocessing.preprocessing_factory import get_preprocessing
import tf_slim as slim

preprocessing = get_preprocessing("resnet_v2_50")
image_size = 224
path = '/media/pc/data/board/arria10/lxw/data/test/cat.png' # 将要预测的图片路径
preprocessing = get_preprocessing("resnet_v2_50")


@tf.function
def preprocess_image(image, output_height, output_width):
    # image = tf.constant(image)
    processed_image = preprocessing(image, output_height, output_width)
    return processed_image/256
with Image.open(path) as im:
    if im.mode != "RGB":
        im.convert("RGB")
    image = np.asarray(im)
np_processed_image = preprocess_image(image, image_size, image_size)
np_processed_images = np.expand_dims(np_processed_image, axis=0)

2023-06-16 17:32:19.387439: W tensorflow/core/common_runtime/gpu/gpu_device.cc:1956] Cannot dlopen some GPU libraries. Please make sure the missing libraries mentioned above are installed properly if you would like to use GPU. Follow the guide at https://www.tensorflow.org/install/gpu for how to download and setup the required libraries for your platform.
Skipping registering GPU devices...


前向推理：

In [5]:
model = ResnetV2_50()
model(tf.ones(shape=(1, 224, 224, 3), dtype=tf.float32))
ckpt = tf.train.Checkpoint(model=model)
ckpt.restore("/tmp/checkpoints/resnet_v2_50.ckpt") # 更新模型参数
outputs = model(np_processed_images)
outputs = outputs.numpy()

  self.updates, tf.compat.v1.GraphKeys.UPDATE_OPS


打印标签信息：

In [6]:
from github import Github

g = Github(user_agent="xinetzone")
repo = g.get_repo("tensorflow/models")
label_content = repo.get_contents("research/slim/datasets/imagenet_lsvrc_2015_synsets.txt")
imagenet_labels = label_content.decoded_content.decode().split()
assert len(imagenet_labels) == 1000
metadata = repo.get_contents("research/slim/datasets/imagenet_metadata.txt")
imagenet_metadata = metadata.decoded_content.decode().splitlines()
synset_to_human = {}
for metadata in imagenet_metadata:
    name, value = metadata.split("\t")
    synset_to_human[name] = value
name2id = {name: k+1 for k, name in enumerate(imagenet_labels)}

topk = 5
sorted_inds = outputs[0].argsort()[::-1]
for sorted_ind in sorted_inds[:topk]:
    label = synset_to_human[imagenet_labels[sorted_ind-1]]
    print(f"{sorted_ind-1}: {label.ljust(20)}\t{outputs[0][sorted_ind-1]}")

282: tiger cat           	0.15822742879390717
285: Egyptian cat        	0.0009194915182888508
281: tabby, tabby cat    	9.054027759702876e-05
278: kit fox, Vulpes macrotis	0.0044543202966451645
277: red fox, Vulpes vulpes	2.409669548342208e-07


In [7]:
model.summary()

Model: "resnet_v2_50"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 resnet_v2_50 (ResnetV2_50_b  multiple                 25615849  
 lock)                                                           
                                                                 
Total params: 25,615,849
Trainable params: 0
Non-trainable params: 25,615,849
_________________________________________________________________


将其模型和参数与加载下来：

In [8]:
# # model = ResnetV2_50()
# inputs = tf.keras.Input(shape=(224, 224, 3), dtype=tf.float32, name="data")
# outputs = model(inputs)
# model2 = tf.keras.Model(inputs=inputs, outputs=outputs, name="resnet_v2_50_model")

# model2.save(module_with_signature_path)

In [9]:
module_with_signature_path = "temp/resnet_v2_50_keras"
model.save(module_with_signature_path)
imported_with_signatures = tf.saved_model.load(module_with_signature_path)
infer = imported_with_signatures.signatures['serving_default']
labeling = infer(tf.constant(np_processed_images))

  self.updates, tf.compat.v1.GraphKeys.UPDATE_OPS
  self.updates, tf.compat.v1.GraphKeys.UPDATE_OPS


## ONNX (TF2) 前端推理

[Keras 模型转换 ONNX](https://onnxruntime.ai/docs/tutorials/tf-get-started.html)：

In [12]:
import tf2onnx
import onnx

input_signature = [tf.TensorSpec([1, 224, 224, 3], tf.float32, name="data")]
# Use from_function for tf functions
onnx_model, _ = tf2onnx.convert.from_keras(model, input_signature, opset=13)
onnx.save(onnx_model, "temp/resnet_v2_50.onnx")

2023-06-16 17:35:47.187897: I tensorflow/core/grappler/devices.cc:66] Number of eligible GPUs (core count >= 8, compute capability >= 0.0): 2
2023-06-16 17:35:47.188039: I tensorflow/core/grappler/clusters/single_machine.cc:358] Starting new session
2023-06-16 17:35:47.188735: W tensorflow/core/common_runtime/gpu/gpu_device.cc:1956] Cannot dlopen some GPU libraries. Please make sure the missing libraries mentioned above are installed properly if you would like to use GPU. Follow the guide at https://www.tensorflow.org/install/gpu for how to download and setup the required libraries for your platform.
Skipping registering GPU devices...
2023-06-16 17:35:48.946008: I tensorflow/core/grappler/devices.cc:66] Number of eligible GPUs (core count >= 8, compute capability >= 0.0): 2
2023-06-16 17:35:48.946161: I tensorflow/core/grappler/clusters/single_machine.cc:358] Starting new session
2023-06-16 17:35:48.946861: W tensorflow/core/common_runtime/gpu/gpu_device.cc:1956] Cannot dlopen some GP

构建库：

In [16]:
import set_env
from tvm.relay.frontend import from_onnx

shape_dict = {
    "data": [1, 224, 224, 3],
}

graph_def = onnx.load("temp/resnet_v2_50.onnx")

mod, params = from_onnx(
    graph_def,
    shape_dict,
    opset=13,
    freeze_params=True
)

推理：

In [18]:
import tvm
from tvm import relay

with tvm.transform.PassContext(opt_level=3):
    lib = relay.build(mod, "llvm", params=params)
    
inputs_dict = {"data": np_processed_images}
mlib_proxy = tvm.contrib.graph_executor.GraphModule(lib["default"](tvm.cpu()))
mlib_proxy.run(**inputs_dict)

One or more operators have not been tuned. Please tune your model for better performance. Use DEBUG logging level to see more details.


验证一致性：

In [26]:
np.testing.assert_allclose(
    labeling['output_1'].numpy(), 
    mlib_proxy.get_output(0).numpy(),
    rtol=1e-07, atol=1e-5
)