Commit

initial RyzenAI support

IlyasMoutawwakil committed Mar 5, 2024
1 parent a3cd823 · commit ac508c2
Showing 7 changed files with 219 additions and 2 deletions.
36 changes: 36 additions & 0 deletions examples/ryzenai_resnet50.yaml
@@ -0,0 +1,36 @@
defaults:
  - backend: ryzenai
  - launcher: process
  - benchmark: inference
  - experiment # inheriting experiment schema
  - _self_ # for hydra 1.1 compatibility
  - override hydra/job_logging: colorlog # colorful logging
  - override hydra/hydra_logging: colorlog # colorful logging

experiment_name: ryzenai_resnet50

backend:
  device: ipu
  export: false
  model: amd/resnet50
  provider: CPUExecutionProvider

benchmark:
  input_shapes:
    batch_size: 1

# hydra/cli specific settings
hydra:
  run:
    # where to store run results
    dir: runs/${experiment_name}
  sweep:
    # where to store sweep results
    dir: sweeps/${experiment_name}
  job:
    # change working directory to the run directory
    chdir: true
    env_set:
      # set the environment variable OVERRIDE_BENCHMARKS to 1 so that
      # benchmarks that have already been run are not skipped
      OVERRIDE_BENCHMARKS: 1
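
For context: configs like this are consumed by the Hydra-based CLI (see `cli.py` below, where the backend is registered). Assuming the standard `optimum-benchmark` entry point, the example would be launched roughly as:

```
optimum-benchmark --config-dir examples --config-name ryzenai_resnet50
```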
6 changes: 4 additions & 2 deletions optimum_benchmark/backends/config.py
@@ -61,8 +61,10 @@ def __post_init__(self):
             self.device_ids = self.device.split(":")[1]
             LOGGER.warning(f"`device` and `device_ids` are now set to `{self.device}` and `{self.device_ids}`.")

-        if self.device not in ["cuda", "cpu", "mps", "xla"]:
-            raise ValueError(f"`device` must be either `cuda`, `cpu`, `mps` or `xla`, but got {self.device}")
+        if self.device not in ["cuda", "cpu", "mps", "xla", "ipu", "npu"]:
+            raise ValueError(
+                f"`device` must be either `cuda`, `cpu`, `mps`, `xla`, `ipu` or `npu`, but got {self.device}"
+            )

         if self.device == "cuda":
             if self.device_ids is None:
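
The surrounding `__post_init__` (only partly visible in the hunk) also splits device strings like `cuda:0` into a device kind and device ids. A self-contained sketch of that parsing combined with the widened validation, for illustration only (the helper name is hypothetical, not part of the commit):

```python
# Hypothetical helper mirroring the validation above; not part of the commit.
def parse_device(device: str):
    device_ids = None
    if ":" in device:
        device, device_ids = device.split(":")[0], device.split(":")[1]
    if device not in ["cuda", "cpu", "mps", "xla", "ipu", "npu"]:
        raise ValueError(f"unsupported device: {device}")
    return device, device_ids

assert parse_device("cuda:0") == ("cuda", "0")
assert parse_device("ipu") == ("ipu", None)  # new RyzenAI device kind
```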
133 changes: 133 additions & 0 deletions optimum_benchmark/backends/ryzenai/backend.py
@@ -0,0 +1,133 @@
import gc
import os
from collections import OrderedDict
from logging import getLogger
from tempfile import TemporaryDirectory
from typing import Any, Dict

import torch
from hydra.utils import get_class
from safetensors.torch import save_file
from transformers.utils.logging import set_verbosity_error

from ...task_utils import IMAGE_PROCESSING_TASKS, TEXT_GENERATION_TASKS
from ..base import Backend
from ..transformers_utils import random_init_weights
from .config import RyzenAIConfig
from .utils import TASKS_TO_RYZENAIMODEL

# disable transformers logging
set_verbosity_error()

LOGGER = getLogger("ryzenai")


class RyzenAIBackend(Backend[RyzenAIConfig]):
    NAME: str = "ryzenai"

    def __init__(self, config: RyzenAIConfig) -> None:
        super().__init__(config)
        self.validate_task()

        LOGGER.info("\t+ Creating backend temporary directory")
        self.tmpdir = TemporaryDirectory()

        if self.config.no_weights:
            LOGGER.info("\t+ Loading no weights RyzenAIModel")
            self.load_ryzenaimodel_with_no_weights()
        else:
            LOGGER.info("\t+ Loading pretrained RyzenAIModel")
            self.load_ryzenaimodel_from_pretrained()

        self.tmpdir.cleanup()

    def validate_task(self) -> None:
        if self.config.task not in TASKS_TO_RYZENAIMODEL:
            raise NotImplementedError(f"RyzenAIBackend does not support task {self.config.task}")

        self.ryzenaimodel_class = get_class(TASKS_TO_RYZENAIMODEL[self.config.task])
        LOGGER.info(f"\t+ Using RyzenAIModel class {self.ryzenaimodel_class.__name__}")

    def create_no_weights_model(self) -> None:
        self.no_weights_model = os.path.join(self.tmpdir.name, "no_weights_model")
        LOGGER.info("\t+ Creating no weights model directory")
        os.makedirs(self.no_weights_model, exist_ok=True)
        LOGGER.info("\t+ Creating no weights model state dict")
        state_dict = torch.nn.Linear(1, 1).state_dict()
        LOGGER.info("\t+ Saving no weights model safetensors")
        safetensors = os.path.join(self.no_weights_model, "model.safetensors")
        save_file(tensors=state_dict, filename=safetensors, metadata={"format": "pt"})

        if self.config.library == "transformers":
            LOGGER.info("\t+ Saving no weights model pretrained config")
            self.pretrained_config.save_pretrained(save_directory=self.no_weights_model)

    def load_automodel_with_no_weights(self) -> None:
        LOGGER.info("\t+ Creating no weights model")
        self.create_no_weights_model()

        with random_init_weights():
            original_model, self.config.model = self.config.model, self.no_weights_model
            LOGGER.info("\t+ Loading no weights AutoModel")
            self.load_automodel_from_pretrained()
            self.config.model = original_model

        LOGGER.info("\t+ Tying model weights")
        self.pretrained_model.tie_weights()

    def load_automodel_from_pretrained(self) -> None:
        self.pretrained_model = self.automodel_class.from_pretrained(self.config.model, **self.config.hub_kwargs)

    def load_ryzenaimodel_with_no_weights(self) -> None:
        LOGGER.info("\t+ Creating no weights model")
        self.create_no_weights_model()

        with random_init_weights():
            original_model, self.config.model = self.config.model, self.no_weights_model
            original_export, self.config.export = self.config.export, True
            LOGGER.info("\t+ Loading no weights RyzenAIModel")
            self.load_ryzenaimodel_from_pretrained()
            self.config.model = original_model
            self.config.export = original_export

    def load_ryzenaimodel_from_pretrained(self) -> None:
        self.pretrained_model = self.ryzenaimodel_class.from_pretrained(
            self.config.model,
            export=self.config.export,
            provider=self.config.provider,
            vaip_config=self.config.vaip_config,
            **self.config.hub_kwargs,
            **self.ryzenaimodel_kwargs,
        )

    @property
    def ryzenaimodel_kwargs(self) -> Dict[str, Any]:
        kwargs = {}

        if self.config.task in TEXT_GENERATION_TASKS:
            kwargs["use_cache"] = self.config.use_cache

        return kwargs

    def prepare_inputs(self, inputs: Dict[str, Any]) -> Dict[str, Any]:
        inputs = super().prepare_inputs(inputs)

        if self.config.task in IMAGE_PROCESSING_TASKS:
            # channels last
            inputs["pixel_values"] = inputs["pixel_values"].permute(0, 2, 3, 1)

        return inputs

    def forward(self, inputs: Dict[str, Any], kwargs: Dict[str, Any]) -> OrderedDict:
        return self.pretrained_model.forward(**inputs, **kwargs)

    def generate(self, inputs: Dict[str, Any], kwargs: Dict[str, Any]) -> OrderedDict:
        return self.pretrained_model.generate(**inputs, **kwargs)

    def clean(self) -> None:
        super().clean()

        if hasattr(self, "tmpdir"):
            self.tmpdir.cleanup()

        gc.collect()
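
A minimal sketch of the backend's lifecycle (assumed driver code; in practice the benchmark runner instantiates the backend from the composed Hydra config, and running it requires `optimum-amd` plus the RyzenAI runtime):

```python
import torch

from optimum_benchmark.backends.ryzenai.backend import RyzenAIBackend
from optimum_benchmark.backends.ryzenai.config import RyzenAIConfig

config = RyzenAIConfig(
    task="image-classification",  # must be a key of TASKS_TO_RYZENAIMODEL
    device="ipu",                 # enforced by RyzenAIConfig.__post_init__
    model="amd/resnet50",
    export=False,
    provider="CPUExecutionProvider",
)
backend = RyzenAIBackend(config)  # resolves the model class and loads it
inputs = backend.prepare_inputs({"pixel_values": torch.rand(1, 3, 224, 224)})
outputs = backend.forward(inputs, kwargs={})  # pixel_values is NHWC here
backend.clean()                               # tmpdir cleanup + gc
```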
31 changes: 31 additions & 0 deletions optimum_benchmark/backends/ryzenai/config.py
@@ -0,0 +1,31 @@
from dataclasses import dataclass, field
from typing import Any, Dict, Optional

from ..config import BackendConfig


@dataclass
class RyzenAIConfig(BackendConfig):
    name: str = "ryzenai"
    version: Optional[str] = None
    _target_: str = "optimum_benchmark.backends.ryzenai.backend.RyzenAIBackend"

    # optimum-benchmark options
    no_weights: bool = False

    # export/load options
    export: bool = True
    use_cache: bool = True

    # provider options
    provider: Optional[str] = None
    provider_options: Dict[str, Any] = field(default_factory=dict)

    # ryzenai config
    vaip_config: Optional[str] = None  # e.g. /usr/bin/vaip_config.json

    def __post_init__(self):
        super().__post_init__()

        if self.device not in ["ipu", "npu"]:
            raise ValueError(f"RyzenAIBackend only supports `ipu` and `npu` devices, but got {self.device}")
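
Because the check runs in `__post_init__` (after the base class's own validation), an unsupported device fails at config-construction time rather than at model-loading time. A sketch, assuming the remaining `BackendConfig` fields can take their defaults:

```python
from optimum_benchmark.backends.ryzenai.config import RyzenAIConfig

try:
    # "cpu" passes the base BackendConfig check but not the RyzenAI one
    RyzenAIConfig(device="cpu", model="amd/resnet50")
except ValueError as err:
    print(err)  # RyzenAIBackend only supports `ipu` and `npu` devices, ...
```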
4 changes: 4 additions & 0 deletions optimum_benchmark/backends/ryzenai/utils.py
@@ -0,0 +1,4 @@
TASKS_TO_RYZENAIMODEL = {
    "image-classification": "optimum.amd.ryzenai.RyzenAIModelForImageClassification",
    "object-detection": "optimum.amd.ryzenai.RyzenAIModelForObjectDetection",
}
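
This mapping is consumed in `validate_task` above, which resolves the dotted path to a class with `hydra.utils.get_class` (the import happens inside `get_class`, so `optimum-amd` must be installed):

```python
from hydra.utils import get_class

from optimum_benchmark.backends.ryzenai.utils import TASKS_TO_RYZENAIMODEL

# Resolves the dotted path to the actual class object.
model_class = get_class(TASKS_TO_RYZENAIMODEL["image-classification"])
print(model_class.__name__)  # RyzenAIModelForImageClassification
```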
2 changes: 2 additions & 0 deletions optimum_benchmark/cli.py
@@ -12,6 +12,7 @@
 from .backends.openvino.config import OVConfig
 from .backends.py_tgi.config import PyTGIConfig
 from .backends.pytorch.config import PyTorchConfig
+from .backends.ryzenai.config import RyzenAIConfig
 from .backends.tensorrt_llm.config import TRTLLMConfig
 from .backends.torch_ort.config import TorchORTConfig
 from .benchmarks.inference.config import InferenceConfig
@@ -36,6 +37,7 @@
 cs.store(group="backend", name=INCConfig.name, node=INCConfig)
 cs.store(group="backend", name=PyTGIConfig.name, node=PyTGIConfig)
 cs.store(group="backend", name=LLMSwarmConfig.name, node=LLMSwarmConfig)
+cs.store(group="backend", name=RyzenAIConfig.name, node=RyzenAIConfig)
 # benchmarks configurations
 cs.store(group="benchmark", name=TrainingConfig.name, node=TrainingConfig)
 cs.store(group="benchmark", name=InferenceConfig.name, node=InferenceConfig)
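
Registering `RyzenAIConfig` under the `backend` group in Hydra's `ConfigStore` is what lets the example YAML above select it with `- backend: ryzenai` in its `defaults` list; Hydra then composes the config and instantiates the backend through its `_target_` class, `RyzenAIBackend`.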
9 changes: 9 additions & 0 deletions optimum_benchmark/task_utils.py
@@ -99,6 +99,15 @@

 TEXT_GENERATION_TASKS = ["image-to-text", "text-generation", "text2text-generation", "automatic-speech-recognition"]

+IMAGE_PROCESSING_TASKS = [
+    "image-classification",
+    "image-segmentation",
+    "object-detection",
+    "semantic-segmentation",
+    "zero-shot-image-classification",
+    "zero-shot-object-detection",
+]
+

 def map_from_synonym(task: str) -> str:
     if task in _SYNONYM_TASK_MAP:
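
The new `IMAGE_PROCESSING_TASKS` list is what gates the channels-last conversion in `RyzenAIBackend.prepare_inputs` above; concretely:

```python
import torch

pixel_values = torch.rand(1, 3, 224, 224)  # NCHW, as produced by image processors
nhwc = pixel_values.permute(0, 2, 3, 1)    # channels last
print(nhwc.shape)                          # torch.Size([1, 224, 224, 3])
```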
