feat(components): Upgrade LLM evaluation classification and text generation pipelines to preview

KevinBNaughton · Google Cloud Pipeline Components maintainers · commit b350ac4ddc32 · 2023-08-10T10:08:00.000-07:00
PiperOrigin-RevId: 555540517
diff --git a/components/google-cloud/google_cloud_pipeline_components/preview/model_evaluation/evaluation_llm_classification_pipeline.py b/components/google-cloud/google_cloud_pipeline_components/preview/model_evaluation/evaluation_llm_classification_pipeline.py
@@ -15,16 +15,16 @@
 
 
 @dsl.pipeline(name=_PIPELINE_NAME)
-def llm_eval_classification_pipeline(  # pylint: disable=dangerous-default-value
+def evaluation_llm_classification_pipeline(  # pylint: disable=dangerous-default-value
     project: str,
     location: str,
     target_field_name: str,
+    batch_predict_gcs_source_uris: List[str],
     batch_predict_gcs_destination_output_uri: str,
     model_name: str = 'publishers/google/models/text-bison@001',
     evaluation_task: str = 'text-classification',
     evaluation_class_labels: List[str] = [],
     batch_predict_instances_format: str = 'jsonl',
-    batch_predict_gcs_source_uris: List[str] = [],
     batch_predict_predictions_format: str = 'jsonl',
     machine_type: str = 'e2-highmem-16',
     service_account: str = '',
@@ -49,6 +49,13 @@ def llm_eval_classification_pipeline(  # pylint: disable=dangerous-default-value
     target_field_name: The target field's name. Formatted to be able to find
       nested columns, delimited by ``.``. Prefixed with 'instance.' on the
       component for Vertex Batch Prediction.
+    batch_predict_gcs_source_uris: Google Cloud Storage URI(-s) to your
+      instances data to run batch prediction on. The instances data should also
+      contain the ground truth (target) data, used for evaluation. May contain
+      wildcards. For more information on wildcards, see
+      https://cloud.google.com/storage/docs/gsutil/addlhelp/WildcardNames. For
+      more details about this input config, see
+      https://cloud.google.com/vertex-ai/docs/reference/rest/v1/projects.locations.batchPredictionJobs#InputConfig.
     batch_predict_gcs_destination_output_uri: The Google Cloud Storage location
       of the directory where the output is to be written to.
     model_name: The Model name used to run evaluation. Must be a publisher Model
@@ -65,13 +72,6 @@ def llm_eval_classification_pipeline(  # pylint: disable=dangerous-default-value
       must be one of the Model's supportedInputStorageFormats. For more details
       about this input config, see
       https://cloud.google.com/vertex-ai/docs/reference/rest/v1/projects.locations.batchPredictionJobs#InputConfig.
-    batch_predict_gcs_source_uris: Google Cloud Storage URI(-s) to your
-      instances data to run batch prediction on. The instances data should also
-      contain the ground truth (target) data, used for evaluation. May contain
-      wildcards. For more information on wildcards, see
-      https://cloud.google.com/storage/docs/gsutil/addlhelp/WildcardNames. For
-        more details about this input config, see
-      https://cloud.google.com/vertex-ai/docs/reference/rest/v1/projects.locations.batchPredictionJobs#InputConfig.
     batch_predict_predictions_format: The format in which Vertex AI gives the
       predictions. Must be one of the Model's supportedOutputStorageFormats. For
       more details about this output config, see
@@ -113,19 +113,18 @@ def llm_eval_classification_pipeline(  # pylint: disable=dangerous-default-value
       created.
 
   Returns:
-    NamedTuple:
-      evaluation_metrics: ClassificationMetrics Artifact for LLM Text
-        Classification.
-      evaluation_resource_name: If run on an user's managed VertexModel, the
-        imported evaluation resource name. Empty if run on a publisher model.
+    evaluation_metrics: ClassificationMetrics Artifact for LLM Text
+      Classification.
+    evaluation_resource_name: If run on a user's managed VertexModel, the
+      imported evaluation resource name. Empty if run on a publisher model.
   """
   outputs = NamedTuple(
       'outputs',
       evaluation_metrics=ClassificationMetrics,
       evaluation_resource_name=str,
   )
 
-  get_vertex_model_task = dsl.importer_node.importer(
+  get_vertex_model_task = dsl.importer(
       artifact_uri=(
           f'https://{location}-aiplatform.googleapis.com/v1/{model_name}'
       ),
diff --git a/components/google-cloud/google_cloud_pipeline_components/preview/model_evaluation/evaluation_llm_text_generation_pipeline.py b/components/google-cloud/google_cloud_pipeline_components/preview/model_evaluation/evaluation_llm_text_generation_pipeline.py
@@ -14,14 +14,14 @@
 
 
 @dsl.pipeline(name=_PIPELINE_NAME)
-def llm_eval_text_generation_pipeline(  # pylint: disable=dangerous-default-value
+def evaluation_llm_text_generation_pipeline(  # pylint: disable=dangerous-default-value
     project: str,
     location: str,
+    batch_predict_gcs_source_uris: List[str],
     batch_predict_gcs_destination_output_uri: str,
     model_name: str = 'publishers/google/models/text-bison@001',
     evaluation_task: str = 'text-generation',
     batch_predict_instances_format: str = 'jsonl',
-    batch_predict_gcs_source_uris: List[str] = [],
     batch_predict_predictions_format: str = 'jsonl',
     machine_type: str = 'e2-highmem-16',
     service_account: str = '',
@@ -39,6 +39,13 @@ def llm_eval_text_generation_pipeline(  # pylint: disable=dangerous-default-valu
   Args:
     project: The GCP project that runs the pipeline components.
     location: The GCP region that runs the pipeline components.
+    batch_predict_gcs_source_uris: Google Cloud Storage URI(-s) to your
+      instances data to run batch prediction on. The instances data should also
+      contain the ground truth (target) data, used for evaluation. May contain
+      wildcards. For more information on wildcards, see
+      https://cloud.google.com/storage/docs/gsutil/addlhelp/WildcardNames. For
+      more details about this input config, see
+      https://cloud.google.com/vertex-ai/docs/reference/rest/v1/projects.locations.batchPredictionJobs#InputConfig.
     batch_predict_gcs_destination_output_uri: The Google Cloud Storage location
       of the directory where the output is to be written to.
     model_name: The Model name used to run evaluation. Must be a publisher Model
@@ -53,13 +60,6 @@ def llm_eval_text_generation_pipeline(  # pylint: disable=dangerous-default-valu
       must be one of the Model's supportedInputStorageFormats. Only "jsonl" is
       currently supported. For more details about this input config, see
       https://cloud.google.com/vertex-ai/docs/reference/rest/v1/projects.locations.batchPredictionJobs#InputConfig.
-    batch_predict_gcs_source_uris: Google Cloud Storage URI(-s) to your
-      instances data to run batch prediction on. The instances data should also
-      contain the ground truth (target) data, used for evaluation. May contain
-      wildcards. For more information on wildcards, see
-      https://cloud.google.com/storage/docs/gsutil/addlhelp/WildcardNames. For
-        more details about this input config, see
-      https://cloud.google.com/vertex-ai/docs/reference/rest/v1/projects.locations.batchPredictionJobs#InputConfig.
     batch_predict_predictions_format: The format in which Vertex AI gives the
       predictions. Must be one of the Model's supportedOutputStorageFormats.
       Only "jsonl" is currently supported. For more details about this output
@@ -91,18 +91,17 @@ def llm_eval_text_generation_pipeline(  # pylint: disable=dangerous-default-valu
       created.
 
   Returns:
-    NamedTuple:
-      evaluation_metrics: Metrics Artifact for LLM Text Generation.
-      evaluation_resource_name: If run on an user's managed VertexModel, the
-        imported evaluation resource name. Empty if run on a publisher model.
+    evaluation_metrics: Metrics Artifact for LLM Text Generation.
+    evaluation_resource_name: If run on a user's managed VertexModel, the
+      imported evaluation resource name. Empty if run on a publisher model.
   """
   outputs = NamedTuple(
       'outputs',
       evaluation_metrics=Metrics,
       evaluation_resource_name=str,
   )
 
-  get_vertex_model_task = dsl.importer_node.importer(
+  get_vertex_model_task = dsl.importer(
       artifact_uri=(
           f'https://{location}-aiplatform.googleapis.com/v1/{model_name}'
       ),