From b012283c08cf8abc2974dc73ff7c2d3b8112a16b Mon Sep 17 00:00:00 2001
From: Morgan Du
Date: Wed, 25 Nov 2020 11:51:00 -0800
Subject: [PATCH] feat: add
 create_training_pipeline_custom_training_managed_dataset sample (#75)

Co-authored-by: Yu-Han Liu
---
 ..._custom_training_managed_dataset_sample.py | 103 +++++++++++++++++
 ...om_training_managed_dataset_sample_test.py | 107 ++++++++++++++++++
 2 files changed, 210 insertions(+)
 create mode 100644 samples/snippets/create_training_pipeline_custom_training_managed_dataset_sample.py
 create mode 100644 samples/snippets/create_training_pipeline_custom_training_managed_dataset_sample_test.py

diff --git a/samples/snippets/create_training_pipeline_custom_training_managed_dataset_sample.py b/samples/snippets/create_training_pipeline_custom_training_managed_dataset_sample.py
new file mode 100644
index 0000000000..3638b53abc
--- /dev/null
+++ b/samples/snippets/create_training_pipeline_custom_training_managed_dataset_sample.py
@@ -0,0 +1,103 @@
+# Copyright 2020 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# [START aiplatform_create_training_pipeline_custom_training_managed_dataset_sample]
+from google.cloud import aiplatform
+from google.protobuf import json_format
+from google.protobuf.struct_pb2 import Value
+
+
+def create_training_pipeline_custom_training_managed_dataset_sample(
+    project: str,
+    display_name: str,
+    model_display_name: str,
+    dataset_id: str,
+    annotation_schema_uri: str,
+    training_container_spec_image_uri: str,
+    model_container_spec_image_uri: str,
+    base_output_uri_prefix: str,
+    location: str = "us-central1",
+    api_endpoint: str = "us-central1-aiplatform.googleapis.com",
+):
+    client_options = {"api_endpoint": api_endpoint}
+    # Initialize client that will be used to create and send requests.
+    # This client only needs to be created once, and can be reused for
+    # multiple requests.
+    client = aiplatform.gapic.PipelineServiceClient(
+        client_options=client_options
+    )
+
+    # input_data_config
+    input_data_config = {
+        "dataset_id": dataset_id,
+        "annotation_schema_uri": annotation_schema_uri,
+        "gcs_destination": {"output_uri_prefix": base_output_uri_prefix},
+    }
+
+    # training_task_definition
+    custom_task_definition = (
+        "gs://google-cloud-aiplatform/schema/"
+        "trainingjob/definition/custom_task_1.0.0.yaml"
+    )
+
+    # training_task_inputs
+    training_container_spec = {
+        "imageUri": training_container_spec_image_uri,
+        # AIP_MODEL_DIR is set by the service according to baseOutputDirectory.
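+        # (It usually resolves to a "model/" subdirectory under the base
+        # output prefix; treat the exact layout as service-defined.)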
+ "args": ["--model-dir=$(AIP_MODEL_DIR)",], + } + + training_worker_pool_spec = { + "replicaCount": 1, + "machineSpec": {"machineType": "n1-standard-8"}, + "containerSpec": training_container_spec, + } + + training_task_inputs_dict = { + "workerPoolSpecs": [training_worker_pool_spec], + "baseOutputDirectory": {"outputUriPrefix": base_output_uri_prefix}, + } + + training_task_inputs = json_format.ParseDict( + training_task_inputs_dict, Value()) + + # model_to_upload + model_container_spec = { + "image_uri": model_container_spec_image_uri, + "command": ["/bin/tensorflow_model_server"], + "args": [ + "--model_name=$(AIP_MODEL)", + "--model_base_path=$(AIP_STORAGE_URI)", + "--rest_api_port=8080", + "--port=8500", + "--file_system_poll_wait_seconds=31540000" + ], + } + + model = { + "display_name": model_display_name, + "container_spec": model_container_spec} + + training_pipeline = { + "display_name": display_name, + "input_data_config": input_data_config, + "training_task_definition": custom_task_definition, + "training_task_inputs": training_task_inputs, + "model_to_upload": model, + } + parent = f"projects/{project}/locations/{location}" + response = client.create_training_pipeline( + parent=parent, training_pipeline=training_pipeline + ) + print("response:", response) + + +# [END aiplatform_create_training_pipeline_custom_training_managed_dataset_sample] diff --git a/samples/snippets/create_training_pipeline_custom_training_managed_dataset_sample_test.py b/samples/snippets/create_training_pipeline_custom_training_managed_dataset_sample_test.py new file mode 100644 index 0000000000..85c6f22734 --- /dev/null +++ b/samples/snippets/create_training_pipeline_custom_training_managed_dataset_sample_test.py @@ -0,0 +1,107 @@ +# Copyright 2020 Google LLC +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# https://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+
+import os
+import uuid
+
+import pytest
+
+from google.cloud import aiplatform
+
+import helpers
+
+import create_training_pipeline_custom_training_managed_dataset_sample
+
+API_ENDPOINT = "us-central1-aiplatform.googleapis.com"
+
+PROJECT_ID = os.getenv("BUILD_SPECIFIC_GCLOUD_PROJECT")
+DISPLAY_NAME = f"temp_create_training_pipeline_custom_training_managed_dataset_test_{uuid.uuid4()}"
+MODEL_DISPLAY_NAME = f"Temp Model for {DISPLAY_NAME}"
+
+DATASET_ID = "1084241610289446912"  # permanent_50_flowers_dataset
+ANNOTATION_SCHEMA_URI = "gs://google-cloud-aiplatform/schema/dataset/annotation/image_classification_1.0.0.yaml"
+
+TRAINING_CONTAINER_SPEC_IMAGE_URI = "gcr.io/ucaip-test/custom-container-managed-dataset:latest"
+MODEL_CONTAINER_SPEC_IMAGE_URI = "gcr.io/cloud-aiplatform/prediction/tf-gpu.1-15:latest"
+
+BASE_OUTPUT_URI_PREFIX = "gs://ucaip-samples-us-central1/training_pipeline_output/custom_training_managed_dataset"
+
+
+@pytest.fixture
+def shared_state():
+    state = {}
+    yield state
+
+
+@pytest.fixture
+def pipeline_client():
+    client_options = {"api_endpoint": API_ENDPOINT}
+    pipeline_client = aiplatform.gapic.PipelineServiceClient(
+        client_options=client_options
+    )
+    yield pipeline_client
+
+
+@pytest.fixture
+def model_client():
+    client_options = {"api_endpoint": API_ENDPOINT}
+    model_client = aiplatform.gapic.ModelServiceClient(
+        client_options=client_options
+    )
+    yield model_client
+
+
+@pytest.fixture(scope="function", autouse=True)
+def teardown(shared_state, model_client, pipeline_client):
+    yield
+    model_client.delete_model(name=shared_state["model_name"])
+    pipeline_client.delete_training_pipeline(
+        name=shared_state["training_pipeline_name"]
+    )
+
+
+def test_create_training_pipeline_custom_training_managed_dataset_sample(
+    capsys, shared_state, pipeline_client
+):
+    create_training_pipeline_custom_training_managed_dataset_sample.create_training_pipeline_custom_training_managed_dataset_sample(
+        project=PROJECT_ID,
+        display_name=DISPLAY_NAME,
+        model_display_name=MODEL_DISPLAY_NAME,
+        dataset_id=DATASET_ID,
+        annotation_schema_uri=ANNOTATION_SCHEMA_URI,
+        training_container_spec_image_uri=TRAINING_CONTAINER_SPEC_IMAGE_URI,
+        model_container_spec_image_uri=MODEL_CONTAINER_SPEC_IMAGE_URI,
+        base_output_uri_prefix=BASE_OUTPUT_URI_PREFIX,
+    )
+
+    out, _ = capsys.readouterr()
+
+    # Save the resource name of the newly created training pipeline.
+    shared_state["training_pipeline_name"] = helpers.get_name(out)
+
+    # Poll until the pipeline succeeds because we want to test the
+    # model_upload step as well.
+    helpers.wait_for_job_state(
+        get_job_method=pipeline_client.get_training_pipeline,
+        name=shared_state["training_pipeline_name"],
+        expected_state="SUCCEEDED",
+        timeout=1800,
+        freq=20,
+    )
+
+    training_pipeline = pipeline_client.get_training_pipeline(
+        name=shared_state["training_pipeline_name"]
+    )
+
+    # Check that the model has indeed been uploaded.
+    assert training_pipeline.model_to_upload.name != ""
+
+    shared_state["model_name"] = training_pipeline.model_to_upload.name
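
Reviewer note: the test drives output parsing and polling through a local
`helpers` module that is not included in this patch. For orientation only,
here is a minimal sketch of what `get_name` and `wait_for_job_state` could
look like, inferred purely from the call sites above; the actual shared
helpers in samples/snippets may differ.

    # Hypothetical stand-in for the shared test helpers (not part of this patch).
    import re
    import time


    def get_name(out):
        # The sample prints the full TrainingPipeline proto, which contains a
        # line like: name: "projects/.../trainingPipelines/...". Return the
        # first such resource name found in the captured stdout.
        match = re.search(r'name: "([^"]+)"', out)
        return match.group(1) if match else ""


    def wait_for_job_state(get_job_method, name, expected_state="SUCCEEDED",
                           timeout=1800, freq=20):
        # Poll the resource every `freq` seconds until its state string
        # contains `expected_state`, or give up after `timeout` seconds.
        deadline = time.time() + timeout
        while time.time() < deadline:
            job = get_job_method(name=name)
            if expected_state in str(job.state):
                return
            time.sleep(freq)
        raise TimeoutError(
            f"{name} did not reach {expected_state} within {timeout}s"
        )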