aws
diff --git a/‎src/sagemaker/image_uris.py
Lines changed: 0 additions & 1 deletion b/‎src/sagemaker/image_uris.py
Lines changed: 0 additions & 1 deletion
diff --git a/‎src/sagemaker/modules/testing_notebooks/model_builder_handshake.ipynb
Lines changed: 262 additions & 65 deletions b/‎src/sagemaker/modules/testing_notebooks/model_builder_handshake.ipynb
Lines changed: 262 additions & 65 deletions
@@ -609,7 +609,6 @@ def _validate_py_version_and_set_if_needed(py_version, version_config, framework
 
 def _validate_arg(arg, available_options, arg_name):
     """Checks if the arg is in the available options, and raises a ``ValueError`` if not."""
-    print("VALIDATE")
     if arg not in available_options:
         raise ValueError(
             "Unsupported {arg_name}: {arg}. You may need to upgrade your SDK version "
 
@@ -1,74 +1,174 @@
 {
  "cells": [
   {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "eca12282",
    "metadata": {},
-   "outputs": [],
+   "cell_type": "markdown",
    "source": [
-    "! pip install \"pydantic>=2.0.0\" sagemaker-core"
-   ]
+    "# Model Builder Redesign\n",
+    "## This notebook highlights the new changes made to ModelBuilder and related utilities\n",
+    "\n",
+    "- Latest Container Image Utility function\n",
+    "- Handshake with ModelTrainer \n",
+    "- Unified Deployment from ModelBuilder"
+   ],
+   "id": "609dabdc97ce0a62"
   },
   {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "756ebbf2",
    "metadata": {},
+   "cell_type": "code",
+   "source": "alias = \"user\"",
+   "id": "54b0ea46e1886184",
    "outputs": [],
-   "source": [
-    "! pip install sagemaker-2.232.4.dev0.tar.gz"
-   ]
+   "execution_count": null
   },
   {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## Initial Setup",
+   "id": "b421db5dfb9a7fa7"
+  },
+  {
+   "metadata": {},
    "cell_type": "code",
-   "execution_count": null,
-   "id": "initial_id",
-   "metadata": {
-    "collapsed": true
-   },
-   "outputs": [],
    "source": [
-    "from sagemaker_core.main.shapes import TrainingJob\n",
-    "\n",
     "from sagemaker import Session, get_execution_role\n",
     "\n",
     "sagemaker_session = Session()\n",
     "role = get_execution_role()\n",
     "region = sagemaker_session.boto_region_name\n",
     "bucket = sagemaker_session.default_bucket()"
-   ]
+   ],
+   "id": "30656ece22011af6",
+   "outputs": [],
+   "execution_count": null
   },
   {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "4b3a4f7d1713685f",
    "metadata": {},
+   "cell_type": "code",
+   "source": [
+    "import os\n",
+    "\n",
+    "import pandas as pd\n",
+    "from sklearn.datasets import load_iris\n",
+    "from sklearn.model_selection import train_test_split\n",
+    "\n",
+    "# Prepare Data\n",
+    "\n",
+    "# Load the iris dataset into a DataFrame and append the label as a 'target' column.\n",
+    "iris = load_iris()\n",
+    "iris_df = pd.DataFrame(iris.data, columns=iris.feature_names)\n",
+    "iris_df['target'] = iris.target\n",
+    "\n",
+    "# Make sure the local output directory exists before the CSV files are written below.\n",
+    "os.makedirs('./data', exist_ok=True)\n",
+    "\n",
+    "iris_df = iris_df[['target'] + [col for col in iris_df.columns if col != 'target']]\n",
+    "\n",
+    "train_data, test_data = train_test_split(iris_df, test_size=0.2, random_state=42)\n",
+    "\n",
+    "train_data.to_csv('./data/train.csv', index=False, header=False)\n",
+    "test_data.to_csv('./data/test.csv', index=False, header=False)\n",
+    "\n",
+    "# Remove the target column from the testing data. We will use this to call invoke_endpoint later\n",
+    "test_data_no_target = test_data.drop('target', axis=1)\n",
+    "\n",
+    "prefix = \"DEMO-scikit-iris\"\n",
+    "TRAIN_DATA = \"train.csv\"\n",
+    "TEST_DATA = \"test.csv\"\n",
+    "DATA_DIRECTORY = \"data\"\n",
+    "\n",
+    "train_input = sagemaker_session.upload_data(\n",
+    "    DATA_DIRECTORY, bucket=bucket, key_prefix=\"{}/{}\".format(prefix, DATA_DIRECTORY)\n",
+    ")\n",
+    "\n",
+    "\n",
+    "s3_input_path = \"s3://{}/{}/data/{}\".format(bucket, prefix, TRAIN_DATA)\n",
+    "s3_output_path = \"s3://{}/{}/output\".format(bucket, prefix)\n",
+    "\n",
+    "s3_test_path = \"s3://{}/{}/data/{}\".format(bucket, prefix, TEST_DATA)\n",
+    "\n",
+    "print(s3_input_path)\n",
+    "print(s3_output_path)"
+   ],
+   "id": "d0ea8169b21eaa29",
    "outputs": [],
+   "execution_count": null
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": [
+    "\n",
+    "# Integration with ModelTrainer\n",
+    "\n",
+    "The handshake between ModelTrainer and ModelBuilder is seamless, as shown in this example. The ModelTrainer object is fed directly into the `model` attribute of ModelBuilder through resource chaining. Fetching of the model artifacts is done internally within the ModelBuilder.\n",
+    "\n",
+    "Note: \n",
+    "- Other than the ModelTrainer, the ModelBuilder also supports chaining of attributes such as Estimator or sagemaker-core's TrainingJob into the model attribute. \n",
+    "\n",
+    "In addition, image retrieval for a particular framework has been upgraded: the enhanced `image_uris.retrieve()` method automatically fetches the latest version of an image if no version is provided.\n"
+   ],
+   "id": "1dc5055ba5ccb2bb"
+  },
+  {
+   "metadata": {},
+   "cell_type": "code",
    "source": [
     "\n",
-    "from sagemaker.modules.configs import SourceCode\n",
+    "from sagemaker import image_uris\n",
+    "from sagemaker_core.main.shapes import Channel, DataSource, S3DataSource, OutputDataConfig, \\\n",
+    "    StoppingCondition\n",
     "from sagemaker.modules.train.model_trainer import ModelTrainer\n",
     "\n",
-    "xgboost_image = \"433757028032.dkr.ecr.us-west-2.amazonaws.com/xgboost:latest\"\n",
+    "# Resolve the XGBoost training image for the session's own region (no version is passed).\n",
+    "# A hard-coded region would point at the wrong registry whenever the notebook runs outside us-west-2.\n",
+    "xgboost_image = image_uris.retrieve(framework=\"xgboost\", region=region, image_scope=\"training\")\n",
+    "print(xgboost_image)\n",
     "\n",
-    "source_code = SourceCode(\n",
-    "    command=\"echo 'Hello World' && env\",\n",
-    ")\n",
     "model_trainer = ModelTrainer(\n",
+    "    base_job_name=f'{alias}-mb-handshake',\n",
+    "    hyperparameters={\n",
+    "        'objective': 'multi:softmax',\n",
+    "        'num_class': '3',\n",
+    "        'num_round': '10',\n",
+    "        'eval_metric': 'merror'\n",
+    "    },\n",
     "    training_image=xgboost_image,\n",
-    "    source_code=source_code,\n",
+    "    training_input_mode='File',\n",
+    "    role=role,\n",
+    "    output_data_config=OutputDataConfig(\n",
+    "        s3_output_path=s3_output_path\n",
+    "    ),\n",
+    "    stopping_condition=StoppingCondition(\n",
+    "        max_runtime_in_seconds=600\n",
+    "    )\n",
     ")\n",
     "\n",
-    "model_trainer.train()"
-   ]
+    "model_trainer.train(input_data_config=[\n",
+    "    Channel(\n",
+    "        channel_name='train',\n",
+    "        content_type='csv',\n",
+    "        compression_type='None',\n",
+    "        record_wrapper_type='None',\n",
+    "        data_source=DataSource(\n",
+    "            s3_data_source=S3DataSource(\n",
+    "                s3_data_type='S3Prefix',\n",
+    "                s3_uri=s3_input_path,\n",
+    "                s3_data_distribution_type='FullyReplicated'\n",
+    "            )\n",
+    "        )\n",
+    "    )\n",
+    "], )"
+   ],
+   "id": "4b3a4f7d1713685f",
+   "outputs": [],
+   "execution_count": null
   },
   {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "295a16ef277257a0",
    "metadata": {},
-   "outputs": [],
+   "cell_type": "markdown",
+   "source": "",
+   "id": "96be4afa22c64350"
+  },
+  {
+   "metadata": {},
+   "cell_type": "code",
    "source": [
     "import numpy as np\n",
     "from sagemaker.serve.builder.schema_builder import SchemaBuilder\n",
@@ -96,54 +196,151 @@
     "        predictions = np.argmax(prediction_probabilities, axis=1)\n",
     "        return predictions\n",
     "\n",
+    "\n",
     "model_builder = ModelBuilder(\n",
-    "    model=model_trainer, # ModelTrainer object passed onto ModelBuilder directly \n",
+    "    model=model_trainer,  # ModelTrainer object passed onto ModelBuilder directly \n",
     "    role_arn=role,\n",
     "    image_uri=xgboost_image,\n",
     "    inference_spec=XGBoostSpec(),\n",
     "    schema_builder=schema_builder,\n",
     "    instance_type=\"ml.c6i.xlarge\"\n",
     ")\n",
-    "model=model_builder.build()\n",
-    "predictor=model_builder.deploy()\n",
-    "\n",
-    "predictor\n",
-    "assert model.model_data == model_trainer._latest_training_job.model_artifacts.s3_model_artifacts\n",
-    "\n",
-    "print(model.model_data)"
-   ]
+    "model = model_builder.build()"
+   ],
+   "id": "295a16ef277257a0",
+   "outputs": [],
+   "execution_count": null
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "Once the model has been built, it can be deployed directly through the `model_builder.deploy()` method. This abstracts away information that previously had to be supplied separately in the workflows for different deployment modes. The `deploy()` method takes an optional parameter, `inference_config`, which determines the attributes for modes such as serverless, async, batch, and multi-model/multi-container endpoints. If `inference_config` is not provided, the default real-time deployment is carried out.",
+   "id": "99b403edaf616ef0"
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## ModelBuilder - Real-Time Deployment",
+   "id": "44416566576e26df"
   },
   {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "935ea8486278d7b1",
    "metadata": {},
+   "cell_type": "code",
+   "source": [
+    "predictor = model_builder.deploy(endpoint_name=f\"{alias}-xgboost-deploy-realtime\")\n",
+    "sklearn_input = np.array([1.0, 2.0, 3.0, 4.0])\n",
+    "result = predictor.predict(sklearn_input)\n",
+    "print(result)"
+   ],
+   "id": "ab43000f6bd6018b",
    "outputs": [],
+   "execution_count": null
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## ModelBuilder - Serverless Deployment\n",
+   "id": "fbd0e6f6e92d0aeb"
+  },
+  {
+   "metadata": {},
+   "cell_type": "code",
    "source": [
-    "training_job: TrainingJob = model_trainer._latest_training_job\n",
-    "\n",
-    "model_builder = ModelBuilder(\n",
-    "    model=training_job, # Sagemaker core's TrainingJob object passed onto ModelBuilder directly \n",
-    "    role_arn=role,\n",
-    "    image_uri=xgboost_image,\n",
-    "    schema_builder=schema_builder,\n",
-    "    inference_spec=XGBoostSpec(),\n",
-    "    instance_type=\"ml.c6i.xlarge\"\n",
-    ")\n",
-    "model=model_builder.build()\n",
+    "from sagemaker.serverless.serverless_inference_config import ServerlessInferenceConfig\n",
     "\n",
-    "assert model.model_data == training_job.model_artifacts.s3_model_artifacts\n",
+    "predictor = model_builder.deploy(endpoint_name=f\"{alias}-xgboost-deploy-serverless\",\n",
+    "                                 inference_config=ServerlessInferenceConfig(memory_size_in_mb=2048))\n",
+    "sklearn_input = np.array([1.0, 2.0, 3.0, 4.0])\n",
+    "result = predictor.predict(sklearn_input)\n",
+    "print(result)"
+   ],
+   "id": "40d3c9973d2d8934",
+   "outputs": [],
+   "execution_count": null
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## ModelBuilder - Async Deployment\n",
+   "id": "93818038782f105d"
+  },
+  {
+   "metadata": {},
+   "cell_type": "code",
+   "source": [
+    "from sagemaker.async_inference.async_inference_config import AsyncInferenceConfig\n",
+    "from sagemaker.s3_utils import s3_path_join\n",
     "\n",
-    "print(model.model_data)"
-   ]
+    "# Deploy with an async inference config whose output path is an S3 URI under `bucket`.\n",
+    "predictor = model_builder.deploy(\n",
+    "    endpoint_name=f\"{alias}-xgboost-deploy-async\",\n",
+    "    inference_config=AsyncInferenceConfig(\n",
+    "        output_path=s3_path_join(\"s3://\", bucket, \"async_inference/output\")\n",
+    "    ),\n",
+    ")\n",
+    "sklearn_input = np.array([1.0, 2.0, 3.0, 4.0])\n",
+    "result = predictor.predict(sklearn_input)\n",
+    "print(result)"
+   ],
+   "id": "77e7104aaa9d6da2",
+   "outputs": [],
+   "execution_count": null
   },
   {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## ModelBuilder - Batch Deployment\n",
+   "id": "2ff3e043b5f5f8d7"
+  },
+  {
+   "metadata": {},
    "cell_type": "code",
-   "execution_count": null,
-   "id": "757180da84407a1a",
+   "source": [
+    "from sagemaker.batch_inference.batch_transform_inference_config import BatchTransformInferenceConfig\n",
+    "from sagemaker.s3_utils import s3_path_join\n",
+    "\n",
+    "# Deploy with a batch transform config; the call's result is bound to `transformer` and printed.\n",
+    "transformer = model_builder.deploy(\n",
+    "    endpoint_name=f\"{alias}-xgboost-deploy-batch\",\n",
+    "    inference_config=BatchTransformInferenceConfig(\n",
+    "        instance_count=1,\n",
+    "        instance_type='ml.m5.large',\n",
+    "        output_path=s3_path_join(\"s3://\", bucket, \"batch_inference/output\"),\n",
+    "        test_data_s3_path=s3_test_path,\n",
+    "    ),\n",
+    ")\n",
+    "print(transformer)"
+   ],
+   "id": "3ef3febc0f840133",
+   "outputs": [],
+   "execution_count": null
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## ModelBuilder - Multi-Model Endpoint Deployment\n",
+   "id": "66e103b7292694eb"
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "",
+   "id": "a1c4d43bbd23efec"
+  },
+  {
    "metadata": {},
+   "cell_type": "code",
+   "source": [
+    "from sagemaker.compute_resource_requirements.resource_requirements import ResourceRequirements\n",
+    "\n",
+    "predictor = model_builder.deploy(endpoint_name=f\"{alias}-xgboost-deploy-multi-model\",\n",
+    "                                 inference_config=ResourceRequirements(\n",
+    "                                     requests={\n",
+    "                                         \"num_cpus\": 0.5,\n",
+    "                                         \"memory\": 512,\n",
+    "                                         \"copies\": 2,\n",
+    "                                     },\n",
+    "                                     limits={},\n",
+    "                                 ))\n",
+    "sklearn_input = np.array([1.0, 2.0, 3.0, 4.0])\n",
+    "result = predictor.predict(sklearn_input)\n",
+    "print(result)"
+   ],
+   "id": "f3c622148377c964",
    "outputs": [],
-   "source": []
+   "execution_count": null
   }
  ],
  "metadata": {