Commit: fix

IlyasMoutawwakil committed Nov 27, 2024
1 parent 712d851 commit 88b86fa

Showing 10 changed files with 214 additions and 174 deletions.
12 changes: 6 additions & 6 deletions optimum_benchmark/backends/base.py
@@ -13,14 +13,14 @@
 from .config import BackendConfigT
 from .diffusers_utils import (
     extract_diffusers_shapes_from_model,
-    get_diffusers_automodel_loader_for_task,
+    get_diffusers_auto_pipeline_class_for_task,
     get_diffusers_pretrained_config,
 )
-from .timm_utils import extract_timm_shapes_from_config, get_timm_automodel_loader, get_timm_pretrained_config
+from .timm_utils import extract_timm_shapes_from_config, get_timm_model_creator, get_timm_pretrained_config
 from .transformers_utils import (
     PretrainedProcessor,
     extract_transformers_shapes_from_artifacts,
-    get_transformers_automodel_loader_for_task,
+    get_transformers_auto_model_class_for_task,
     get_transformers_generation_config,
     get_transformers_pretrained_config,
     get_transformers_pretrained_processor,
@@ -56,15 +56,15 @@ def __init__(self, config: BackendConfigT):
             self.logger.info("\t+ Benchmarking a Diffusers pipeline")
             self.pretrained_config = get_diffusers_pretrained_config(self.config.model, **self.config.model_kwargs)
             self.model_shapes = extract_diffusers_shapes_from_model(self.config.model, **self.config.model_kwargs)
-            self.automodel_loader = get_diffusers_automodel_loader_for_task(self.config.task)
+            self.automodel_loader = get_diffusers_auto_pipeline_class_for_task(self.config.task)
             self.pretrained_processor = None
             self.generation_config = None
 
         elif self.config.library == "timm":
             self.logger.info("\t+ Benchmarking a Timm model")
             self.pretrained_config = get_timm_pretrained_config(self.config.model)
             self.model_shapes = extract_timm_shapes_from_config(self.pretrained_config)
-            self.automodel_loader = get_timm_automodel_loader()
+            self.automodel_loader = get_timm_model_creator()
             self.pretrained_processor = None
             self.generation_config = None
 
@@ -78,7 +78,7 @@ def __init__(self, config: BackendConfigT):
 
         else:
             self.logger.info("\t+ Benchmarking a Transformers model")
-            self.automodel_loader = get_transformers_automodel_loader_for_task(self.config.task, self.config.model_type)
+            self.automodel_loader = get_transformers_auto_model_class_for_task(self.config.task, self.config.model_type)
             self.generation_config = get_transformers_generation_config(self.config.model, **self.config.model_kwargs)
             self.pretrained_config = get_transformers_pretrained_config(self.config.model, **self.config.model_kwargs)
             self.pretrained_processor = get_transformers_pretrained_processor(
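Note: a minimal sketch of the library dispatch that base.py performs with the renamed helpers. The standalone function and its arguments are simplified stand-ins for the config fields used in the diff; the three helper names are the ones introduced above.

# Sketch only: mirrors the if/elif/else dispatch in Backend.__init__.
from optimum_benchmark.backends.diffusers_utils import get_diffusers_auto_pipeline_class_for_task
from optimum_benchmark.backends.timm_utils import get_timm_model_creator
from optimum_benchmark.backends.transformers_utils import get_transformers_auto_model_class_for_task

def resolve_automodel_loader(library: str, task: str, model_type=None):
    # One loader attribute, three possible backends.
    if library == "diffusers":
        return get_diffusers_auto_pipeline_class_for_task(task)
    elif library == "timm":
        return get_timm_model_creator()
    else:
        return get_transformers_auto_model_class_for_task(task, model_type)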
42 changes: 8 additions & 34 deletions optimum_benchmark/backends/diffusers_utils.py
@@ -9,33 +9,16 @@
     import diffusers
     from diffusers import DiffusionPipeline
 
-    if hasattr(diffusers, "pipelines") and hasattr(diffusers.pipelines, "auto_pipeline"):
-        from diffusers.pipelines.auto_pipeline import (
-            AUTO_IMAGE2IMAGE_PIPELINES_MAPPING,
-            AUTO_INPAINT_PIPELINES_MAPPING,
-            AUTO_TEXT2IMAGE_PIPELINES_MAPPING,
-        )
-
-        TASKS_TO_MODEL_TYPES_TO_MODEL_CLASSES = {
-            "inpainting": AUTO_INPAINT_PIPELINES_MAPPING.copy(),
-            "text-to-image": AUTO_TEXT2IMAGE_PIPELINES_MAPPING.copy(),
-            "image-to-image": AUTO_IMAGE2IMAGE_PIPELINES_MAPPING.copy(),
-        }
-
-        for task_name, model_mapping in TASKS_TO_MODEL_TYPES_TO_MODEL_CLASSES.items():
-            for model_type, model_class in model_mapping.items():
-                TASKS_TO_MODEL_TYPES_TO_MODEL_CLASSES[task_name][model_type] = model_class.__name__
-    else:
-        TASKS_TO_MODEL_TYPES_TO_MODEL_CLASSES = {}
-else:
-    TASKS_TO_MODEL_TYPES_TO_MODEL_CLASSES = {}
 
+def get_diffusers_auto_pipeline_class_for_task(task: str):
+    from ..task_utils import TASKS_TO_AUTO_PIPELINE_CLASS_NAMES
 
-TASKS_TO_MODEL_LOADERS = {
-    "inpainting": "AutoPipelineForInpainting",
-    "text-to-image": "AutoPipelineForText2Image",
-    "image-to-image": "AutoPipelineForImage2Image",
-}
+    if not is_diffusers_available():
+        raise ImportError("diffusers is not available. Please, pip install diffusers.")
 
+    model_loader_name = TASKS_TO_AUTO_PIPELINE_CLASS_NAMES.get(task, None)
+    model_loader_class = getattr(diffusers, model_loader_name)
+    return model_loader_class
 
 
 def get_diffusers_pretrained_config(model: str, **kwargs) -> Dict[str, int]:
@@ -85,12 +68,3 @@ def extract_diffusers_shapes_from_model(model: str, **kwargs) -> Dict[str, int]:
     shapes["width"] = -1
 
     return shapes
-
-
-def get_diffusers_automodel_loader_for_task(task: str):
-    if not is_diffusers_available():
-        raise ImportError("diffusers is not available. Please, pip install diffusers.")
-
-    model_loader_name = TASKS_TO_MODEL_LOADERS[task]
-    model_loader_class = getattr(diffusers, model_loader_name)
-    return model_loader_class
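Note: a hedged usage sketch of the new helper, assuming TASKS_TO_AUTO_PIPELINE_CLASS_NAMES in task_utils keeps the same task-to-class-name entries as the removed TASKS_TO_MODEL_LOADERS dict; the model id is illustrative.

# Sketch: "text-to-image" is expected to resolve to diffusers.AutoPipelineForText2Image.
from optimum_benchmark.backends.diffusers_utils import get_diffusers_auto_pipeline_class_for_task

pipeline_class = get_diffusers_auto_pipeline_class_for_task("text-to-image")
pipeline = pipeline_class.from_pretrained("stabilityai/stable-diffusion-2-1")  # illustrative checkpoint
image = pipeline("a photo of an astronaut riding a horse").images[0]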
14 changes: 7 additions & 7 deletions optimum_benchmark/backends/timm_utils.py
@@ -10,6 +10,13 @@
 from timm.models import get_pretrained_cfg, load_model_config_from_hf, parse_model_name
 
 
+def get_timm_model_creator():
+    if not is_timm_available():
+        raise ImportError("timm is not available. Please, pip install timm.")
+
+    return create_model
+
+
 def get_timm_pretrained_config(model_name: str) -> PretrainedConfig:
     if not is_timm_available():
         raise ImportError("timm is not available. Please, pip install timm.")
@@ -71,10 +78,3 @@ def extract_timm_shapes_from_config(config: PretrainedConfig) -> Dict[str, Any]:
         warnings.warn("Could not extract shapes [num_channels, height, width] from timm model config.")
 
     return shapes
-
-
-def get_timm_automodel_loader():
-    if not is_timm_available():
-        raise ImportError("timm is not available. Please, pip install timm.")
-
-    return create_model
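Note: the relocated helper simply returns timm's create_model factory, so usage is the standard timm entry point; a minimal sketch (the model name is illustrative).

from optimum_benchmark.backends.timm_utils import get_timm_model_creator

create = get_timm_model_creator()             # returns timm.create_model
model = create("resnet18", pretrained=False)  # standard timm factory call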
48 changes: 6 additions & 42 deletions optimum_benchmark/backends/transformers_utils.py
@@ -18,59 +18,23 @@
     SpecialTokensMixin,
 )
 
-TASKS_TO_AUTOMODEL_CLASS_NAMES = {
-    # text processing
-    "feature-extraction": "AutoModel",
-    "fill-mask": "AutoModelForMaskedLM",
-    "multiple-choice": "AutoModelForMultipleChoice",
-    "question-answering": "AutoModelForQuestionAnswering",
-    "token-classification": "AutoModelForTokenClassification",
-    "text-classification": "AutoModelForSequenceClassification",
-    # audio processing
-    "audio-xvector": "AutoModelForAudioXVector",
-    "text-to-audio": "AutoModelForTextToSpectrogram",
-    "audio-classification": "AutoModelForAudioClassification",
-    "audio-frame-classification": "AutoModelForAudioFrameClassification",
-    # image processing
-    "mask-generation": "AutoModel",
-    "image-to-image": "AutoModelForImageToImage",
-    "masked-im": "AutoModelForMaskedImageModeling",
-    "object-detection": "AutoModelForObjectDetection",
-    "depth-estimation": "AutoModelForDepthEstimation",
-    "image-segmentation": "AutoModelForImageSegmentation",
-    "image-classification": "AutoModelForImageClassification",
-    "semantic-segmentation": "AutoModelForSemanticSegmentation",
-    "zero-shot-object-detection": "AutoModelForZeroShotObjectDetection",
-    "zero-shot-image-classification": "AutoModelForZeroShotImageClassification",
-    # text generation
-    "image-to-text": "AutoModelForVision2Seq",
-    "text-generation": "AutoModelForCausalLM",
-    "text2text-generation": "AutoModelForSeq2SeqLM",
-    "image-text-to-text": "AutoModelForImageTextToText",
-    "visual-question-answering": "AutoModelForVisualQuestionAnswering",
-    "automatic-speech-recognition": ("AutoModelForSpeechSeq2Seq", "AutoModelForCTC"),
-}
-
-SYNONYM_TASKS = {
-    "summarization": "text2text-generation",
-    "sentence-similarity": "feature-extraction",
-}
-
+def get_transformers_auto_model_class_for_task(task: str, model_type: Optional[str] = None) -> Type["AutoModel"]:
+    from ..task_utils import SYNONYM_TASKS, TASKS_TO_AUTO_MODEL_CLASS_NAMES
 
-def get_transformers_automodel_class_for_task(task: str, model_type: Optional[str] = None) -> Type["AutoModel"]:
     if task in SYNONYM_TASKS:
         task = SYNONYM_TASKS[task]
 
-    if task not in TASKS_TO_AUTOMODEL_CLASS_NAMES:
+    if task not in TASKS_TO_AUTO_MODEL_CLASS_NAMES:
         raise ValueError(f"Task {task} not supported")
 
-    if isinstance(TASKS_TO_AUTOMODEL_CLASS_NAMES[task], str):
-        return getattr(transformers, TASKS_TO_AUTOMODEL_CLASS_NAMES[task])
+    if isinstance(TASKS_TO_AUTO_MODEL_CLASS_NAMES[task], str):
+        return getattr(transformers, TASKS_TO_AUTO_MODEL_CLASS_NAMES[task])
     else:
         if model_type is None:
             raise ValueError(f"Task {task} requires a model_type to be specified")
 
-        for automodel_class_name in TASKS_TO_AUTOMODEL_CLASS_NAMES[task]:
+        for automodel_class_name in TASKS_TO_AUTO_MODEL_CLASS_NAMES[task]:
             automodel_class = getattr(transformers, automodel_class_name)
             if model_type in automodel_class._model_mapping._model_mapping:
                 return automodel_class
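Note: a sketch of how the resolver behaves for single-class and tuple-valued tasks, assuming the mapping moved to task_utils preserves the removed entries (e.g. "automatic-speech-recognition" -> ("AutoModelForSpeechSeq2Seq", "AutoModelForCTC")).

from optimum_benchmark.backends.transformers_utils import get_transformers_auto_model_class_for_task

# Single-class task: resolves directly from the mapping.
cls = get_transformers_auto_model_class_for_task("text-generation")  # AutoModelForCausalLM

# Tuple-valued task: model_type disambiguates between the candidate classes;
# "whisper" lives in AutoModelForSpeechSeq2Seq's model mapping, "wav2vec2" in AutoModelForCTC's.
cls = get_transformers_auto_model_class_for_task("automatic-speech-recognition", model_type="whisper")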
26 changes: 16 additions & 10 deletions optimum_benchmark/scenarios/inference/scenario.py
@@ -66,15 +66,17 @@ def run(self, backend: Backend[BackendConfigT]) -> BenchmarkReport:
             self.logger.info("\t+ Updating Text Generation kwargs with default values")
             self.config.generate_kwargs = {**TEXT_GENERATION_DEFAULT_KWARGS, **self.config.generate_kwargs}
             self.logger.info("\t+ Initializing Text Generation report")
-            self.report = BenchmarkReport.from_list(targets=["load", "prefill", "decode", "per_token"])
+            self.report = BenchmarkReport.from_list(targets=["load_model", "prefill", "decode", "per_token"])
         elif self.backend.config.task in IMAGE_DIFFUSION_TASKS:
             self.logger.info("\t+ Updating Image Diffusion kwargs with default values")
             self.config.call_kwargs = {**IMAGE_DIFFUSION_DEFAULT_KWARGS, **self.config.call_kwargs}
             self.logger.info("\t+ Initializing Image Diffusion report")
-            self.report = BenchmarkReport.from_list(targets=["load_model", "call"])
+            self.report = BenchmarkReport.from_list(targets=["load_model", "call"])
         else:
             self.logger.info("\t+ Initializing Inference report")
-            self.report = BenchmarkReport.from_list(targets=["load", "forward"])
+            self.report = BenchmarkReport.from_list(targets=["load_model", "forward"])
+
+        self.run_model_loading_tracking(backend)
 
         self.logger.info("\t+ Creating input generator")
         self.input_generator = InputGenerator(
@@ -83,15 +85,11 @@ def run(self, backend: Backend[BackendConfigT]) -> BenchmarkReport:
             input_shapes=self.config.input_shapes,
             model_type=backend.config.model_type,
         )
-
         self.logger.info("\t+ Generating inputs")
         self.inputs = self.input_generator()
-
-        self.logger.info("\t+ Preparing inputs for Inference")
+        self.logger.info("\t+ Preparing inputs for backend")
         self.inputs = backend.prepare_inputs(inputs=self.inputs)
 
-        self.run_model_loading_tracking(backend)
-
         if self.config.latency or self.config.energy:
             # latency and energy are metrics that require some warmup
             if self.config.warmup_runs > 0:
@@ -159,8 +157,14 @@ def run_model_loading_tracking(self, backend: Backend[BackendConfigT]):
         )
         if self.config.latency:
             latency_tracker = LatencyTracker(backend=backend.config.name, device=backend.config.device)
+        if self.config.energy:
+            energy_tracker = EnergyTracker(
+                backend=backend.config.name, device=backend.config.device, device_ids=backend.config.device_ids
+            )
 
         with ExitStack() as context_stack:
+            if self.config.energy:
+                context_stack.enter_context(energy_tracker.track())
             if self.config.memory:
                 context_stack.enter_context(memory_tracker.track())
             if self.config.latency:
@@ -169,9 +173,11 @@
                 backend.load()
 
         if self.config.latency:
-            self.report.load.latency = latency_tracker.get_latency()
+            self.report.load_model.latency = latency_tracker.get_latency()
         if self.config.memory:
-            self.report.load.memory = memory_tracker.get_max_memory()
+            self.report.load_model.memory = memory_tracker.get_max_memory()
+        if self.config.energy:
+            self.report.load_model.energy = energy_tracker.get_energy()
 
     ## Memory tracking
     def run_text_generation_memory_tracking(self, backend: Backend[BackendConfigT]):
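Note: the conditional tracking above relies on contextlib.ExitStack to enter only the enabled trackers and unwind them together when the block exits. A self-contained sketch of the pattern with stand-in trackers (names are illustrative, not the project's tracker API):

from contextlib import ExitStack, contextmanager

@contextmanager
def tracker(name):
    # Stand-in for the LatencyTracker/MemoryTracker/EnergyTracker .track() contexts.
    print(f"start {name} tracking")
    try:
        yield
    finally:
        print(f"stop {name} tracking")

enabled = {"latency": True, "memory": False, "energy": True}

with ExitStack() as stack:
    for name, on in enabled.items():
        if on:
            stack.enter_context(tracker(name))
    print("backend.load() would run here, measured by every enabled tracker")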
