Skip to content

Commit 092c027

Browse files
authored
[New Feature] Add paddle2onnx component (#1228)
* add paddle2onnx component * add comments * fix * supplement failure judgement * fix format * fix format
1 parent e368bb7 commit 092c027

File tree

3 files changed

+245
-102
lines changed

3 files changed

+245
-102
lines changed

requirements.txt

+2-1
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,8 @@ six >= 1.14.0
99
matplotlib
1010
pandas
1111
packaging
12-
x2paddle
12+
x2paddle >= 1.4.0
13+
paddle2onnx >= 1.0.5
1314
rarfile
1415
gradio
1516
tritonclient[all]

visualdl/component/inference/model_convert_server.py

+214-89
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,4 @@
1+
# flake8: noqa
12
# Copyright (c) 2022 VisualDL Authors. All Rights Reserve.
23
#
34
# Licensed under the Apache License, Version 2.0 (the "License");
@@ -13,20 +14,18 @@
1314
# limitations under the License.
1415
# =======================================================================
1516
import base64
16-
import glob
1717
import hashlib
1818
import json
1919
import os
2020
import shutil
2121
import tempfile
22-
from threading import Lock
2322

23+
import paddle2onnx
2424
from flask import request
25-
from x2paddle.convert import caffe2paddle
2625
from x2paddle.convert import onnx2paddle
2726

2827
from .xarfile import archive
29-
from .xarfile import unarchive
28+
from visualdl.io.bfile import BosFileSystem
3029
from visualdl.server.api import gen_result
3130
from visualdl.server.api import result
3231
from visualdl.utils.dir import X2PADDLE_CACHE_PATH
@@ -35,126 +34,252 @@
3534

3635

3736
class ModelConvertApi(object):
37+
'''!
38+
Integrate multiple model conversion tools, and provide conversion service for users.
39+
When user uploads a model to this server, convert model and upload the results to VDL Bos.
40+
When user downloads the model, we get the data from Bos and send it to client.
41+
Maybe users can download from bos directly if frontend can achieve it.
42+
'''
43+
3844
def __init__(self):
39-
self.supported_formats = {'onnx', 'caffe'}
40-
self.lock = Lock()
41-
self.server_count = 0 # we use this variable to count requests handled,
42-
# and check the number of files every 100 requests.
43-
# If more than _max_cache_numbers files in cache, we delete the last recent used 50 files.
45+
'''
46+
Initialize an object to provide service. Need a BosFileSystem client to write data.
47+
'''
48+
try:
49+
self.bos_client = BosFileSystem()
50+
self.bucket_name = os.getenv("BOS_BUCKET_NAME")
51+
except Exception:
52+
# When BOS_HOST, BOS_AK, BOS_SK, BOS_STS are not set in the environment variables.
53+
# We use VDL BOS by default
54+
self.bos_client = BosFileSystem(write_flag=False)
55+
self.bos_client.renew_bos_client_from_server()
56+
self.bucket_name = 'visualdl-server'
4457

4558
@result()
46-
def convert_model(self, format):
47-
file_handle = request.files['file']
48-
data = file_handle.stream.read()
49-
if format not in self.supported_formats:
50-
raise RuntimeError('Model format {} is not supported. "\
51-
"Only onnx and caffe models are supported now.'.format(format))
59+
def onnx2paddle_model_convert(self, convert_to_lite, lite_valid_places,
60+
lite_model_type): # noqa:C901
61+
'''
62+
Convert onnx model to paddle model.
63+
'''
64+
model_handle = request.files['model']
65+
data = model_handle.stream.read()
5266
result = {}
53-
result['from'] = format
54-
result['to'] = 'paddle'
67+
# Do a simple data verification
68+
if convert_to_lite in ['true', 'True', 'yes', 'Yes', 'y']:
69+
convert_to_lite = True
70+
else:
71+
convert_to_lite = False
72+
73+
if lite_valid_places not in [
74+
'arm', 'opencl', 'x86', 'metal', 'xpu', 'bm', 'mlu',
75+
'intel_fpga', 'huawei_ascend_npu', 'imagination_nna',
76+
'rockchip_npu', 'mediatek_apu', 'huawei_kirin_npu',
77+
'amlogic_npu'
78+
]:
79+
lite_valid_places = 'arm'
80+
if lite_model_type not in ['protobuf', 'naive_buffer']:
81+
lite_model_type = 'naive_buffer'
82+
5583
# call x2paddle to convert models
5684
hl = hashlib.md5()
5785
hl.update(data)
5886
identity = hl.hexdigest()
5987
result['request_id'] = identity
60-
target_path = os.path.join(X2PADDLE_CACHE_PATH, identity)
61-
if os.path.exists(target_path):
62-
if os.path.exists(
63-
os.path.join(target_path, 'inference_model',
64-
'model.pdmodel')): # if data in cache
65-
with open(
66-
os.path.join(target_path, 'inference_model',
67-
'model.pdmodel'), 'rb') as model_fp:
68-
model_encoded = base64.b64encode(
69-
model_fp.read()).decode('utf-8')
70-
result['pdmodel'] = model_encoded
88+
# check whether model has been transfromed before
89+
# if model has been transformed before, data is stored at bos
90+
pdmodel_filename = 'bos://{}/onnx2paddle/{}/model.pdmodel'.format(
91+
self.bucket_name, identity)
92+
if self.bos_client.exists(pdmodel_filename):
93+
remote_data = self.bos_client.read_file(pdmodel_filename)
94+
if remote_data: # we should check data is not empty,
95+
# in case conversion failed but empty data is still uploaded before due to unknown reasons
96+
model_encoded = base64.b64encode(remote_data).decode('utf-8')
97+
result['model'] = model_encoded
7198
return result
72-
else:
99+
target_path = os.path.join(X2PADDLE_CACHE_PATH, 'onnx2paddle',
100+
identity)
101+
if not os.path.exists(target_path):
73102
os.makedirs(target_path, exist_ok=True)
74103
with tempfile.NamedTemporaryFile() as fp:
75104
fp.write(data)
76105
fp.flush()
77106
try:
78-
if format == 'onnx':
79-
try:
80-
import onnx # noqa: F401
81-
except Exception:
82-
raise RuntimeError(
83-
"[ERROR] onnx is not installed, use \"pip install onnx>=1.6.0\"."
84-
)
85-
onnx2paddle(fp.name, target_path)
86-
elif format == 'caffe':
87-
with tempfile.TemporaryDirectory() as unarchivedir:
88-
unarchive(fp.name, unarchivedir)
89-
prototxt_path = None
90-
weight_path = None
91-
for dirname, subdirs, filenames in os.walk(
92-
unarchivedir):
93-
for filename in filenames:
94-
if '.prototxt' in filename:
95-
prototxt_path = os.path.join(
96-
dirname, filename)
97-
if '.caffemodel' in filename:
98-
weight_path = os.path.join(
99-
dirname, filename)
100-
if prototxt_path is None or weight_path is None:
101-
raise RuntimeError(
102-
".prototxt or .caffemodel file is missing in your archive file, "
103-
"please check files uploaded.")
104-
caffe2paddle(prototxt_path, weight_path, target_path,
105-
None)
107+
import onnx # noqa: F401
108+
except Exception:
109+
raise RuntimeError(
110+
"[ERROR] onnx is not installed, use \"pip install onnx>=1.6.0\"."
111+
)
112+
try:
113+
if convert_to_lite is False:
114+
onnx2paddle(
115+
fp.name, target_path, convert_to_lite=convert_to_lite)
116+
else:
117+
onnx2paddle(
118+
fp.name,
119+
target_path,
120+
convert_to_lite=convert_to_lite,
121+
lite_valid_places=lite_valid_places,
122+
lite_model_type=lite_model_type)
106123
except Exception as e:
107124
raise RuntimeError(
108125
"[Convertion error] {}.\n Please open an issue at "
109126
"https://github.com/PaddlePaddle/X2Paddle/issues to report your problem."
110127
.format(e))
111-
with self.lock: # we need to enter dirname(target_path) to archive,
112-
# in case unneccessary directory added in archive.
128+
113129
origin_dir = os.getcwd()
114130
os.chdir(os.path.dirname(target_path))
115131
archive(os.path.basename(target_path))
116132
os.chdir(origin_dir)
117-
self.server_count += 1
133+
with open(
134+
os.path.join(X2PADDLE_CACHE_PATH, 'onnx2paddle',
135+
'{}.tar'.format(identity)), 'rb') as f:
136+
# upload archived transformed model to vdl bos
137+
data = f.read()
138+
filename = 'bos://{}/onnx2paddle/{}.tar'.format(
139+
self.bucket_name, identity)
140+
try:
141+
self.bos_client.write(filename, data)
142+
except Exception as e:
143+
print(
144+
"Exception: Write file {}.tar to bos failed, due to {}"
145+
.format(identity, e))
118146
with open(
119147
os.path.join(target_path, 'inference_model', 'model.pdmodel'),
120148
'rb') as model_fp:
121-
model_encoded = base64.b64encode(model_fp.read()).decode('utf-8')
122-
result['pdmodel'] = model_encoded
149+
# upload pdmodel file to bos, if some model has been transformed before, we can directly download from bos
150+
filename = 'bos://{}/onnx2paddle/{}/model.pdmodel'.format(
151+
self.bucket_name, identity)
152+
data = model_fp.read()
153+
try:
154+
self.bos_client.write(filename, data)
155+
except Exception as e:
156+
print(
157+
"Exception: Write file {}/model.pdmodel to bos failed, due to {}"
158+
.format(identity, e))
159+
# return transformed pdmodel file to frontend to show model structure graph
160+
model_encoded = base64.b64encode(data).decode('utf-8')
161+
# delete target_path
162+
shutil.rmtree(target_path)
163+
result['model'] = model_encoded
123164
return result
124165

125166
@result('application/octet-stream')
126-
def download_model(self, request_id):
127-
if os.path.exists(
128-
os.path.join(X2PADDLE_CACHE_PATH,
129-
'{}.tar'.format(request_id))):
130-
with open(
131-
os.path.join(X2PADDLE_CACHE_PATH,
132-
'{}.tar'.format(request_id)), 'rb') as f:
133-
data = f.read()
134-
if self.server_count % 100 == 0: # we check number of files every 100 request
135-
file_paths = glob.glob(
136-
os.path.join(X2PADDLE_CACHE_PATH, '*.tar'))
137-
if len(file_paths) >= _max_cache_numbers:
138-
file_paths = sorted(
139-
file_paths, key=os.path.getctime, reverse=True)
140-
for file_path in file_paths:
141-
try:
142-
os.remove(file_path)
143-
shutil.rmtree(
144-
os.path.join(
145-
os.path.dirname(file_path),
146-
os.path.splitext(
147-
os.path.basename(file_path))[0]))
148-
except Exception:
149-
pass
150-
return data
167+
def onnx2paddle_model_download(self, request_id):
168+
'''
169+
Download converted paddle model from bos.
170+
'''
171+
filename = 'bos://{}/onnx2paddle/{}.tar'.format(
172+
self.bucket_name, request_id)
173+
data = None
174+
if self.bos_client.exists(filename):
175+
data = self.bos_client.read_file(filename)
176+
if not data:
177+
raise RuntimeError(
178+
"The requested model can not be downloaded due to not existing or convertion failed."
179+
)
180+
return data
181+
182+
@result()
183+
def paddle2onnx_convert(self, opset_version, deploy_backend):
184+
'''
185+
Convert paddle model to onnx model.
186+
'''
187+
model_handle = request.files['model']
188+
params_handle = request.files['param']
189+
model_data = model_handle.stream.read()
190+
param_data = params_handle.stream.read()
191+
result = {}
192+
# Do a simple data verification
193+
try:
194+
opset_version = int(opset_version)
195+
except Exception:
196+
opset_version = 11
197+
if deploy_backend not in ['onnxruntime', 'tensorrt', 'others']:
198+
deploy_backend = 'onnxruntime'
199+
200+
# call paddle2onnx to convert models
201+
hl = hashlib.md5()
202+
hl.update(model_data + param_data)
203+
identity = hl.hexdigest()
204+
result['request_id'] = identity
205+
# check whether model has been transformed before
206+
# if model has been transformed before, data is stored at bos
207+
model_filename = 'bos://{}/paddle2onnx/{}/model.onnx'.format(
208+
self.bucket_name, identity)
209+
if self.bos_client.exists(model_filename):
210+
remote_data = self.bos_client.read_file(model_filename)
211+
if remote_data: # we should check data is not empty,
212+
# in case conversion failed but empty data is still uploaded before due to unknown reasons
213+
model_encoded = base64.b64encode(remote_data).decode('utf-8')
214+
result['model'] = model_encoded
215+
return result
216+
217+
with tempfile.NamedTemporaryFile() as model_fp:
218+
with tempfile.NamedTemporaryFile() as param_fp:
219+
model_fp.write(model_data)
220+
param_fp.write(param_data)
221+
model_fp.flush()
222+
param_fp.flush()
223+
try:
224+
onnx_model = paddle2onnx.export(
225+
model_fp.name,
226+
param_fp.name,
227+
opset_version=opset_version,
228+
deploy_backend=deploy_backend)
229+
except Exception as e:
230+
raise RuntimeError(
231+
"[Convertion error] {}.\n Please open an issue at "
232+
"https://github.com/PaddlePaddle/Paddle2ONNX/issues to report your problem."
233+
.format(e))
234+
if not onnx_model:
235+
raise RuntimeError(
236+
"[Convertion error] Please check your input model and param files."
237+
)
238+
239+
# upload transformed model to vdl bos
240+
filename = 'bos://{}/paddle2onnx/{}/model.onnx'.format(
241+
self.bucket_name, identity)
242+
model_encoded = None
243+
if onnx_model:
244+
try:
245+
self.bos_client.write(filename, onnx_model)
246+
except Exception as e:
247+
print(
248+
"Exception: Write file {}/model.onnx to bos failed, due to {}"
249+
.format(identity, e))
250+
model_encoded = base64.b64encode(onnx_model).decode(
251+
'utf-8')
252+
result['model'] = model_encoded
253+
return result
254+
255+
@result('application/octet-stream')
256+
def paddle2onnx_download(self, request_id):
257+
'''
258+
Download converted onnx model from bos.
259+
'''
260+
filename = 'bos://{}/paddle2onnx/{}/model.onnx'.format(
261+
self.bucket_name, request_id)
262+
data = None
263+
if self.bos_client.exists(filename):
264+
data = self.bos_client.read_file(filename)
265+
if not data:
266+
raise RuntimeError(
267+
"The requested model can not be downloaded due to not existing or convertion failed."
268+
)
269+
return data
151270

152271

153272
def create_model_convert_api_call():
154273
api = ModelConvertApi()
155274
routes = {
156-
'convert': (api.convert_model, ['format']),
157-
'download': (api.download_model, ['request_id'])
275+
'paddle2onnx/convert': (api.paddle2onnx_convert,
276+
['opset_version', 'deploy_backend']),
277+
'paddle2onnx/download': (api.paddle2onnx_download, ['request_id']),
278+
'onnx2paddle/convert':
279+
(api.onnx2paddle_model_convert,
280+
['convert_to_lite', 'lite_valid_places', 'lite_model_type']),
281+
'onnx2paddle/download': (api.onnx2paddle_model_download,
282+
['request_id'])
158283
}
159284

160285
def call(path: str, args):

0 commit comments

Comments
 (0)