Commit 7a3ad2f

move the registration of the perplexity eval function where it belongs
1 parent d4cdd98 commit 7a3ad2f

File tree

src/deepsparse/evaluation/evaluator.py
src/deepsparse/evaluation/utils.py
tests/deepsparse/evaluation/test_evaluator.py

3 files changed: +13 -7


src/deepsparse/evaluation/evaluator.py (-3)

@@ -16,9 +16,6 @@
 from typing import List, Optional, Union
 
 from deepsparse import Pipeline
-from deepsparse.evaluation.integrations.perplexity import (  # noqa
-    integration_eval as integration_eval_perplexity,
-)
 from deepsparse.evaluation.registry import EvaluationRegistry
 from deepsparse.evaluation.results import Result
 from deepsparse.evaluation.utils import create_pipeline
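
The import removed above existed purely for its side effect (hence the # noqa): importing deepsparse.evaluation.integrations.perplexity is what registers integration_eval with EvaluationRegistry. Since the evaluator presumably resolves integrations by name through the registry rather than by importing them directly, the module-level import can go once registration is triggered elsewhere. A hypothetical sketch of that lookup side of the pattern; REGISTRY and run_integration are illustrative names, not deepsparse internals:

# Illustrative only: name-based lookup keeps an evaluator decoupled from the
# concrete integration modules. REGISTRY and run_integration are made-up
# names for this sketch, not deepsparse internals.
from typing import Any, Callable, Dict

REGISTRY: Dict[str, Callable[..., Any]] = {}


def run_integration(name: str, **kwargs) -> Any:
    # Whoever populated the registry (e.g. by importing an integration
    # module for its side effect) is irrelevant at lookup time.
    try:
        eval_fn = REGISTRY[name]
    except KeyError:
        raise ValueError(f"unknown integration: {name!r}") from None
    return eval_fn(**kwargs)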

src/deepsparse/evaluation/utils.py (+5 -1)

@@ -42,10 +42,14 @@ def potentially_check_dependency_import(integration_name: str) -> bool:
     :return: True if the dependency is installed, False otherwise
     """
 
-    if integration_name.replace("_", "-") == LM_EVALUATION_HARNESS:
+    if integration_name == LM_EVALUATION_HARNESS:
         from deepsparse.evaluation.integrations import try_import_lm_evaluation_harness
 
         try_import_lm_evaluation_harness()
+    if integration_name == PERPLEXITY:
+        from deepsparse.evaluation.integrations.perplexity import (  # noqa F401
+            integration_eval,
+        )
 
     return True
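
This is where the registration now lives: the noqa-marked import is never used directly; it exists so that importing deepsparse.evaluation.integrations.perplexity executes the module and thereby registers integration_eval, and it now runs only when the caller actually asks for the perplexity integration. A minimal sketch of decorator-based registration as an import side effect, assuming the registry exposes a register decorator; SimpleRegistry and eval_perplexity are illustrative names, not deepsparse code:

# Minimal sketch: registration happens when the defining module is imported.
# SimpleRegistry and eval_perplexity are illustrative, not deepsparse APIs.
from typing import Any, Callable, Dict


class SimpleRegistry:
    _registry: Dict[str, Callable[..., Any]] = {}

    @classmethod
    def register(cls, name: str) -> Callable:
        def decorator(fn: Callable) -> Callable:
            cls._registry[name] = fn  # runs at import time of the defining module
            return fn

        return decorator

    @classmethod
    def get(cls, name: str) -> Callable[..., Any]:
        return cls._registry[name]


# In the integration module: merely importing the module makes "perplexity"
# resolvable, which is why utils.py only needs the bare noqa-marked import.
@SimpleRegistry.register("perplexity")
def eval_perplexity(model, datasets, limit=None):
    ...

Deferring the import this way keeps evaluator.py free of integration-specific imports, which appears to be what the commit message means by moving the registration where it belongs.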

tests/deepsparse/evaluation/test_evaluator.py (+8 -3)

@@ -115,20 +115,25 @@ def test_evaluate_pipeline_without_kv_cache(
     not try_import_lm_evaluation_harness(raise_error=False),
     reason="lm_evaluation_harness not installed",
 )
-def test_evaluation_llm_evaluation_harness_integration_name(
+def test_evaluation_llm_evaluation_harness(
     model_path,
-    datasets,
 ):
     assert evaluate(
         model=model_path,
         # testing only on hellaswag dataset
         # to avoid long running time
-        datasets=datasets[0],
+        datasets="hellaswag",
         limit=1,
         integration="lm_evaluation_harness",
     )
 
 
+def test_evaluation_perplexity(model_path):
+    assert evaluate(
+        model=model_path, datasets="openai_humaneval", limit=1, integration="perplexity"
+    )
+
+
 @pytest.mark.parametrize("type_serialization", ["json", "yaml"])
 @pytest.mark.skipif(
     tuple(map(int, sys.version.split(".")[:2])) < (3, 10),
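
The new test exercises the lazy registration end to end by requesting the perplexity integration through evaluate. A usage sketch mirroring it; the model path below is a placeholder (the real test takes it from a model_path fixture), and evaluate is assumed to be importable from deepsparse.evaluation.evaluator, the module touched in the first hunk:

# Mirrors test_evaluation_perplexity above. "path/to/model" is a placeholder
# for whatever the model_path fixture supplies in the real test suite.
from deepsparse.evaluation.evaluator import evaluate  # assumed import path

result = evaluate(
    model="path/to/model",  # placeholder, not an actual checkpoint
    datasets="openai_humaneval",
    limit=1,
    integration="perplexity",
)
print(result)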
