Skip to content
This repository has been archived by the owner on Sep 24, 2024. It is now read-only.

Commit

Permalink
Merge pull request #95 from mozilla-ai/sfriedowitz/patch-prometheus
Browse files Browse the repository at this point in the history
Move client inside data generator because it's not serializable
  • Loading branch information
Sean Friedowitz authored Apr 9, 2024
2 parents 706ac29 + 2fb8a05 commit fa3a054
Show file tree
Hide file tree
Showing 2 changed files with 9 additions and 8 deletions.
2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"

[project]
name = "lm-buddy"
version = "0.10.0"
version = "0.10.1"
authors = [
{ name = "Sean Friedowitz", email = "[email protected]" },
{ name = "Aaron Gonzales", email = "[email protected]" },
Expand Down
15 changes: 8 additions & 7 deletions src/lm_buddy/jobs/evaluation/prometheus.py
Original file line number Diff line number Diff line change
Expand Up @@ -100,7 +100,7 @@ def get_response_with_retries(
feedback, score = parse_response(config, response)
break
except (OpenAIError, BadResponseError) as e:
logger.warn(
logger.warning(
f"{e.message}: "
f"Retrying ({current_retry_attempt}/{config.evaluation.max_retries})"
)
Expand All @@ -111,12 +111,8 @@ def get_response_with_retries(


def run_eval(config: PrometheusJobConfig) -> Path:
# Instantiate OpenAI client to speak with the vLLM endpoint
client = OpenAI(base_url=config.prometheus.inference.base_url)

hf_loader = HuggingFaceAssetLoader()

# Resolve the engine model
hf_loader = HuggingFaceAssetLoader()
engine_path = hf_loader.resolve_asset_path(config.prometheus.inference.engine)

# Load dataset from W&B artifact
Expand All @@ -135,6 +131,11 @@ def run_eval(config: PrometheusJobConfig) -> Path:

# Generator that iterates over samples and yields new rows with the prometheus outputs
def data_generator():
# Instantiate OpenAI client to speak with the vLLM endpoint
# Client is non-serializable so must be instantiated internal to this method
# Reference: https://huggingface.co/docs/datasets/en/troubleshoot#pickling-issues
client = OpenAI(base_url=config.prometheus.inference.base_url)

for sample in dataset_iterable:
# convert instructions from the dataset (`text_field` in a dict) to
# prompts that prometheus accepts
Expand All @@ -143,7 +144,7 @@ def data_generator():
# skip those examples which are too long
tokenized_prompt = tokenizer(prompt, truncation=False)
if len(tokenized_prompt["input_ids"]) > 3072:
logger.warn(f"Skipping row due to prompt exceeding token limit: {prompt=}")
logger.warning(f"Skipping row due to prompt exceeding token limit: {prompt=}")
continue

# prepare output
Expand Down

0 comments on commit fa3a054

Please sign in to comment.