[tokenizer] Add support to convert huggingface model to onnx model #3093

Merged · 3 commits · Apr 16, 2024
Changes from all commits
5 changes: 5 additions & 0 deletions extensions/tokenizers/src/main/python/arg_parser.py
@@ -23,6 +23,11 @@ def converter_args():
                         default=1,
                         help="Max amount of models to convert")
     parser.add_argument("-o", "--output-dir", help="Model output directory")
+    parser.add_argument("-f",
+                        "--output-format",
+                        default="PyTorch",
+                        choices=["PyTorch", "OnnxRuntime"],
+                        help="Model output format")
     parser.add_argument("-r",
                         "--retry-failed",
                         action='store_true',
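A minimal sketch of how the new flag surfaces to callers, assuming converter_args() returns the parsed namespace and no other flag is required (the output directory value is illustrative):

    # Sketch: parse the new flag the way model_zoo_importer.py would.
    import sys
    from arg_parser import converter_args

    sys.argv = ["model_zoo_importer.py", "-o", "build/models", "-f", "OnnxRuntime"]
    args = converter_args()
    print(args.output_format)  # "OnnxRuntime"; defaults to "PyTorch" when -f is omitted
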
79 changes: 55 additions & 24 deletions extensions/tokenizers/src/main/python/huggingface_converter.py
@@ -12,6 +12,7 @@
 # the specific language governing permissions and limitations under the License.
 import logging
 import os.path
+import sys
 import shutil
 from argparse import Namespace

Expand All @@ -36,6 +37,42 @@ def __init__(self):
self.outputs = None

def save_model(self, model_info, args: Namespace, temp_dir: str):
if args.output_format == "OnnxRuntime":
self.save_onnx_model(model_info, args, temp_dir)
else:
self.save_pytorch_model(model_info, args, temp_dir)

def save_onnx_model(self, model_info, args: Namespace, temp_dir: str):
model_id = model_info.modelId
if not os.path.exists(temp_dir):
os.makedirs(temp_dir)

try:
hf_pipeline = self.load_model(model_id)
except Exception as e:
logging.warning(f"Failed to load model: {model_id}.")
logging.warning(e, exc_info=True)
return False, "Failed to load model", -1

model_name = model_id.split("/")[-1]
logging.info(f"Saving onnxruntime model: {model_name}.onnx ...")

from optimum.commands.optimum_cli import main

sys.argv = [
"model_zoo_importer.py", "export", "onnx", "-m", model_id, temp_dir
]
main()

model_input_names = hf_pipeline.tokenizer.model_input_names
include_types = "token_type_ids" in model_input_names
size = self.save_to_model_zoo(model_info, args.output_dir,
"OnnxRuntime", temp_dir, hf_pipeline,
include_types)

return True, None, size

def save_pytorch_model(self, model_info, args: Namespace, temp_dir: str):
model_id = model_info.modelId
if not os.path.exists(temp_dir):
os.makedirs(temp_dir)
@@ -59,8 +96,10 @@ def save_model(self, model_info, args: Namespace, temp_dir: str):
         config = hf_hub_download(repo_id=model_id, filename="config.json")
         shutil.copyfile(config, os.path.join(temp_dir, "config.json"))

+        model_input_names = hf_pipeline.tokenizer.model_input_names
+        include_types = "token_type_ids" in model_input_names
+
         # Save jit traced .pt file to temp dir
-        include_types = False
         model_file = self.jit_trace_model(hf_pipeline, model_id, temp_dir,
                                           include_types)
         if not model_file:
@@ -69,19 +108,10 @@ def save_model(self, model_info, args: Namespace, temp_dir: str):
         result, reason = self.verify_jit_model(hf_pipeline, model_file,
                                                include_types, args.cpu_only)
         if not result:
-            include_types = True
-            model_file = self.jit_trace_model(hf_pipeline, model_id, temp_dir,
-                                              include_types)
-            if not model_file:
-                return False, reason, -1
-
-            result, reason = self.verify_jit_model(hf_pipeline, model_file,
-                                                   include_types,
-                                                   args.cpu_only)
-            if not result:
-                return False, reason, -1
-
-        size = self.save_to_model_zoo(model_info, args.output_dir, temp_dir,
+            return False, reason, -1
+
+        size = self.save_to_model_zoo(model_info, args.output_dir,
+                                      args.output_format, temp_dir,
                                       hf_pipeline, include_types)

         return True, None, size
@@ -129,12 +159,12 @@ def jit_trace_model(self, hf_pipeline, model_id: str, temp_dir: str,

         return model_file

-    def save_to_model_zoo(self, model_info, output_dir: str, temp_dir: str,
-                          hf_pipeline, include_types: bool):
+    def save_to_model_zoo(self, model_info, output_dir: str, engine: str,
+                          temp_dir: str, hf_pipeline, include_types: bool):
         model_id = model_info.modelId
         model_name = model_id.split("/")[-1]

-        repo_dir = f"{output_dir}/model/{self.application}/ai/djl/huggingface/pytorch/{model_id}"
+        group_id = f"ai/djl/huggingface/{engine.lower()}"
+        repo_dir = f"{output_dir}/model/{self.application}/{group_id}/{model_id}"
         model_dir = f"{repo_dir}/0.0.1"
         if not os.path.exists(model_dir):
             os.makedirs(model_dir)
@@ -147,9 +177,10 @@ def save_to_model_zoo(self, model_info, output_dir: str, temp_dir: str,
         arguments["translatorFactory"] = self.translator

         with open(serving_file, 'w') as f:
-            f.write(f"engine=PyTorch\n"
-                    f"option.modelName={model_name}\n"
-                    f"option.mapLocation=true\n")
+            f.write(f"engine={engine}\n"
+                    f"option.modelName={model_name}\n")
+            if engine == "PyTorch":
+                f.write(f"option.mapLocation=true\n")

             for k, v in arguments.items():
                 f.write(f"{k}={v}\n")
@@ -160,11 +191,11 @@ def save_to_model_zoo(self, model_info, output_dir: str, temp_dir: str,
         zip_dir(temp_dir, zip_file)

         # Save metadata.json
-        arguments["engine"] = "PyTorch"
+        arguments["engine"] = engine
         sha1 = sha1_sum(zip_file)
         file_size = os.path.getsize(zip_file)
-        metadata = HuggingfaceMetadata(model_info, self.application, sha1,
-                                       file_size, arguments)
+        metadata = HuggingfaceMetadata(model_info, engine, self.application,
+                                       sha1, file_size, arguments)
        metadata_file = os.path.join(repo_dir, "metadata.json")
         metadata.save_metadata(metadata_file)
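Patching sys.argv to drive optimum-cli works but is fragile. A possible alternative, sketched under the assumption that the pinned optimum release exposes main_export (its programmatic export entry point; keyword names may vary across versions):

    # Sketch: programmatic ONNX export, avoiding the sys.argv patch.
    # Equivalent to: optimum-cli export onnx -m <model_id> <output_dir>
    from optimum.exporters.onnx import main_export

    def export_onnx(model_id: str, output_dir: str) -> None:
        main_export(model_id, output=output_dir)
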
14 changes: 8 additions & 6 deletions extensions/tokenizers/src/main/python/metadata.py
@@ -16,15 +16,19 @@

 class HuggingfaceMetadata:

-    def __init__(self, model_info, application: str, sha1: str, file_size: int,
-                 arguments: dict):
+    def __init__(self, model_info, engine: str, application: str, sha1: str,
+                 file_size: int, arguments: dict):
         self.model_info = model_info
+        self.group_id = f"ai.djl.huggingface.{engine.lower()}"
         self.artifact_id = model_info.modelId
         self.model_name = model_info.modelId.split("/")[-1]
         self.application = application
         self.sha1 = sha1
         self.file_size = file_size
         self.arguments = arguments
+        self.options = {}
+        if engine == "PyTorch":
+            self.options["mapLocation"] = True

     def save_metadata(self, metadata_file: str):
         properties = get_lang_tags(self.model_info)
@@ -37,7 +41,7 @@ def save_metadata(self, metadata_file: str):
             "application":
             self.application,
             "groupId":
-            "ai.djl.huggingface.pytorch",
+            self.group_id,
             "artifactId":
             self.artifact_id,
             "name":
@@ -58,9 +62,7 @@ def save_metadata(self, metadata_file: str):
                 "name": self.model_name,
                 "properties": properties,
                 "arguments": self.arguments,
-                "options": {
-                    "mapLocation": True
-                },
+                "options": self.options,
                 "files": {
                     "model": {
                         "uri": f"0.0.1/{self.model_name}.zip",
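For reference, a sketch of what the new constructor yields; the model id, application, sha1, and size values are placeholders:

    # Sketch: the engine argument now drives both group_id and options.
    from types import SimpleNamespace
    from metadata import HuggingfaceMetadata

    model_info = SimpleNamespace(modelId="sentence-transformers/all-MiniLM-L6-v2")
    meta = HuggingfaceMetadata(model_info, "OnnxRuntime", "text_embedding",
                               "0" * 40, 1234, {})
    assert meta.group_id == "ai.djl.huggingface.onnxruntime"
    assert meta.options == {}  # mapLocation is only set when engine == "PyTorch"
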
extensions/tokenizers/src/main/python/model_zoo_importer.py
@@ -11,6 +11,7 @@
 # BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, express or implied. See the License for
 # the specific language governing permissions and limitations under the License.
 import logging
+import os.path
 import shutil
 import sys
@@ -63,7 +64,8 @@ def main():

         huggingface_models.update_progress(model_info, converter.application,
                                            result, reason, size, args.cpu_only)
-        shutil.rmtree(temp_dir)
+        if os.path.exists(temp_dir):
+            shutil.rmtree(temp_dir)

     logging.info("finished.")
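The existence check avoids a FileNotFoundError when a model fails before its temp directory is created. shutil.rmtree can express the same intent in one line, at the cost of also swallowing other OS errors during cleanup:

    # Equivalent cleanup; ignore_errors also suppresses errors beyond a missing dir.
    shutil.rmtree(temp_dir, ignore_errors=True)
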
1 change: 1 addition & 0 deletions extensions/tokenizers/src/main/python/requirements.txt
@@ -2,3 +2,4 @@ huggingface_hub
 transformers
 torch
 protobuf==3.20.2
+optimum[exporters,onnxruntime]