Skip to content

Commit 6a86399

Browse files
committed Mar 14, 2025
Update base model to "meta-llama/Meta-Llama-3.1-8B-Instruct" across files
1 parent 42ac430 commit 6a86399

File tree

6 files changed

+268
-39
lines changed

6 files changed

+268
-39
lines changed
 

‎README.md

+1-1
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@ python run.py --openpipe-api-key=opk-your-api-key
4646
- `--openpipe-api-key`: Your OpenPipe API key (required if not set as environment variable)
4747
- `--dataset-name`: Name for the OpenPipe dataset (default: "zenml_dataset")
4848
- `--model-name`: Name for the fine-tuned model (default: "zenml_finetuned_model")
49-
- `--base-model`: Base model to fine-tune (default: "meta-llama/Meta-Llama-3-8B-Instruct")
49+
- `--base-model`: Base model to fine-tune (default: "meta-llama/Meta-Llama-3.1-8B-Instruct")
5050
- `--system-prompt`: System prompt to use for all examples (default: "You are a helpful assistant")
5151
- `--wait-for-completion/--no-wait-for-completion`: Whether to wait for the fine-tuning job to complete (default: wait)
5252
- `--no-cache`: Disable caching for the pipeline run

‎configs/openpipe_finetuning.yaml

+1-1
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@ metadata_columns: ["product"]
2222
# openPipe parameters
2323
dataset_name: "ultra_customer_service"
2424
model_name: "customer_service_assistant"
25-
base_model: "meta-llama/Meta-Llama-3-8B-Instruct"
25+
base_model: "meta-llama/Meta-Llama-3.1-8B-Instruct"
2626
enable_sft: true
2727
enable_preference_tuning: false
2828
learning_rate_multiplier: 1.0

‎pipelines/openpipe_finetuning.py

+48-21
Original file line numberDiff line numberDiff line change
@@ -25,6 +25,7 @@
2525
openpipe_data_converter,
2626
openpipe_dataset_creator,
2727
openpipe_finetuning_starter,
28+
openpipe_finetuning_starter_sdk,
2829
)
2930

3031
logger = get_logger(__name__)
@@ -49,7 +50,7 @@ def openpipe_finetuning(
4950

5051
# Fine-tuning parameters
5152
model_name: str = "zenml_finetuned_model",
52-
base_model: str = "meta-llama/Meta-Llama-3-8B-Instruct",
53+
base_model: str = "meta-llama/Meta-Llama-3.1-8B-Instruct",
5354
enable_sft: bool = True,
5455
enable_preference_tuning: bool = False,
5556
learning_rate_multiplier: float = 1.0,
@@ -61,6 +62,9 @@ def openpipe_finetuning(
6162
verbose_logs: bool = True,
6263
auto_rename: bool = True,
6364
force_overwrite: bool = False,
65+
66+
# Implementation options
67+
use_sdk: bool = False,
6468
):
6569
"""
6670
OpenPipe fine-tuning pipeline.
@@ -93,6 +97,7 @@ def openpipe_finetuning(
9397
verbose_logs: Whether to log detailed model information during polling
9498
auto_rename: If True, automatically append a timestamp to model name if it already exists
9599
force_overwrite: If True, delete existing model with the same name before creating new one
100+
use_sdk: If True, use the Python OpenPipe SDK instead of direct API calls
96101
97102
Returns:
98103
A dictionary with details about the fine-tuning job, including model information
@@ -122,24 +127,46 @@ def openpipe_finetuning(
122127
base_url=base_url,
123128
)
124129

125-
# Start fine-tuning and monitor progress
126-
finetuning_result = openpipe_finetuning_starter(
127-
dataset_id=dataset_id,
128-
model_name=model_name,
129-
base_model=base_model,
130-
openpipe_api_key=openpipe_api_key,
131-
base_url=base_url,
132-
enable_sft=enable_sft,
133-
enable_preference_tuning=enable_preference_tuning,
134-
learning_rate_multiplier=learning_rate_multiplier,
135-
num_epochs=num_epochs,
136-
batch_size=batch_size,
137-
default_temperature=default_temperature,
138-
wait_for_completion=wait_for_completion,
139-
timeout_minutes=timeout_minutes,
140-
verbose_logs=verbose_logs,
141-
auto_rename=auto_rename,
142-
force_overwrite=force_overwrite,
143-
)
130+
# Choose between SDK and direct API implementation
131+
if use_sdk:
132+
# Use the SDK implementation
133+
finetuning_result = openpipe_finetuning_starter_sdk(
134+
dataset_id=dataset_id,
135+
model_name=model_name,
136+
base_model=base_model,
137+
openpipe_api_key=openpipe_api_key,
138+
base_url=base_url,
139+
enable_sft=enable_sft,
140+
enable_preference_tuning=enable_preference_tuning,
141+
learning_rate_multiplier=learning_rate_multiplier,
142+
num_epochs=num_epochs,
143+
batch_size=batch_size,
144+
default_temperature=default_temperature,
145+
wait_for_completion=wait_for_completion,
146+
timeout_minutes=timeout_minutes,
147+
verbose_logs=verbose_logs,
148+
auto_rename=auto_rename,
149+
force_overwrite=force_overwrite,
150+
)
151+
else:
152+
# Use the original direct API implementation
153+
finetuning_result = openpipe_finetuning_starter(
154+
dataset_id=dataset_id,
155+
model_name=model_name,
156+
base_model=base_model,
157+
openpipe_api_key=openpipe_api_key,
158+
base_url=base_url,
159+
enable_sft=enable_sft,
160+
enable_preference_tuning=enable_preference_tuning,
161+
learning_rate_multiplier=learning_rate_multiplier,
162+
num_epochs=num_epochs,
163+
batch_size=batch_size,
164+
default_temperature=default_temperature,
165+
wait_for_completion=wait_for_completion,
166+
timeout_minutes=timeout_minutes,
167+
verbose_logs=verbose_logs,
168+
auto_rename=auto_rename,
169+
force_overwrite=force_overwrite,
170+
)
144171

145-
return finetuning_result
172+
return finetuning_result

‎run.py

+11-2
Original file line numberDiff line numberDiff line change
@@ -79,7 +79,7 @@
7979
)
8080
@click.option(
8181
"--base-model",
82-
default="meta-llama/Meta-Llama-3-8B-Instruct",
82+
default="meta-llama/Meta-Llama-3.1-8B-Instruct",
8383
type=click.STRING,
8484
help="Base model to fine-tune.",
8585
)
@@ -141,11 +141,17 @@
141141
default=False,
142142
help="Disable caching for the pipeline run.",
143143
)
144+
@click.option(
145+
"--use-sdk",
146+
is_flag=True,
147+
default=False,
148+
help="Use the Python OpenPipe SDK instead of direct API calls.",
149+
)
144150
def main(
145151
openpipe_api_key: Optional[str] = None,
146152
dataset_name: str = "ultra_customer_service",
147153
model_name: str = "customer_service_assistant",
148-
base_model: str = "meta-llama/Meta-Llama-3-8B-Instruct",
154+
base_model: str = "meta-llama/Meta-Llama-3.1-8B-Instruct",
149155
system_prompt: str = "You are a helpful customer service assistant for Ultra electronics products.",
150156
data_source: str = "toy",
151157
sample_size: int = 30,
@@ -156,6 +162,7 @@ def main(
156162
force_overwrite: bool = False,
157163
fetch_details_only: bool = False,
158164
no_cache: bool = False,
165+
use_sdk: bool = False,
159166
):
160167
"""Main entry point for the OpenPipe fine-tuning pipeline.
161168
@@ -176,6 +183,7 @@ def main(
176183
force_overwrite: If True, delete existing model with the same name before creating new one.
177184
fetch_details_only: Only fetch model details without running the fine-tuning pipeline.
178185
no_cache: If `True` cache will be disabled.
186+
use_sdk: If `True` use the Python OpenPipe SDK instead of direct API calls.
179187
"""
180188
client = Client()
181189

@@ -269,6 +277,7 @@ def main(
269277
"auto_rename": auto_rename,
270278
"force_overwrite": force_overwrite,
271279
"openpipe_api_key": openpipe_api_key,
280+
"use_sdk": use_sdk,
272281
}
273282

274283
# Run the pipeline

‎steps/__init__.py

+1
Original file line numberDiff line numberDiff line change
@@ -26,4 +26,5 @@
2626
)
2727
from .openpipe_finetuning_starter import (
2828
openpipe_finetuning_starter,
29+
openpipe_finetuning_starter_sdk,
2930
)

0 commit comments

Comments (0)