)]\n"
]
}
],
"source": [
"from sagemaker.feature_store.feature_definition import FeatureDefinition\n",
"from sagemaker.feature_store.feature_definition import FeatureTypeEnum\n",
"\n",
"default_feature_type = FeatureTypeEnum.STRING\n",
"column_to_feature_type_mapping = {\n",
" \"float\": FeatureTypeEnum.FRACTIONAL,\n",
" \"long\": FeatureTypeEnum.INTEGRAL\n",
"}\n",
"\n",
"feature_definitions = [\n",
" FeatureDefinition(\n",
" feature_name=column_schema['name'], \n",
" feature_type=column_to_feature_type_mapping.get(column_schema['type'], default_feature_type)\n",
" ) for column_schema in column_schemas\n",
"]\n",
"logger.info(f'feature definitions: {feature_definitions}')"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Configure Feature Group\n",
"\n",
" 💡 Configurable Settings \n",
"\n",
"1. feature_group_name: name of the feature group.\n",
"1. feature_store_offline_s3_uri: SageMaker FeatureStore writes the data in the OfflineStore of a FeatureGroup to a S3 location owned by you.\n",
"1. enable_online_store: controls if online store is enabled. Enabling the online store allows quick access to the latest value for a Record via the GetRecord API.\n",
"1. iam_role: IAM role for executing the processing job.\n",
"1. table_format: Amazon SageMaker Feature Store supports the AWS Glue and Apache Iceberg table formats for the offline store. \n",
"
"
]
},
{
"cell_type": "code",
"execution_count": 14,
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"# Calculate current_timestamp to create unique entries\n",
"current_timestamp = strftime('%m-%d-%H-%M-%S', gmtime())"
]
},
{
"cell_type": "code",
"execution_count": 15,
"metadata": {
"tags": []
},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"Feature Group Name: fscw-orders-03-30-19-21-40\n"
]
}
],
"source": [
"# flow name and an unique ID for this export (used later as the processing job name for the export)\n",
"flow_name = \"orders\"\n",
"flow_export_name = f'DWF-Orders'\n",
"\n",
"# feature group name, with flow_name and an unique id. You can give it a customized name\n",
"feature_group_name = f\"{fs_champions_workshop_prefix}-{flow_name}-{current_timestamp}\"\n",
"logger.info(f'Feature Group Name: {feature_group_name}')\n",
"\n",
"# SageMaker FeatureStore writes the data in the OfflineStore of a FeatureGroup to a \n",
"# S3 location owned by you.\n",
"feature_store_offline_s3_uri = 's3://' + bucket\n",
"\n",
"# controls if online store is enabled. Enabling the online store allows quick access to \n",
"# the latest value for a Record via the GetRecord API.\n",
"enable_online_store = True"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Initialize Feature Group"
]
},
{
"cell_type": "code",
"execution_count": 16,
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"# Initialize Boto3 session that is required to create feature group\n",
"import boto3\n",
"from sagemaker.session import Session\n",
"\n",
"region = boto3.Session().region_name\n",
"boto_session = boto3.Session(region_name=region)\n",
"\n",
"sagemaker_client = boto_session.client(service_name='sagemaker', region_name=region)\n",
"featurestore_runtime = boto_session.client(service_name='sagemaker-featurestore-runtime', region_name=region)\n",
"\n",
"feature_store_session = Session(\n",
" boto_session=boto_session,\n",
" sagemaker_client=sagemaker_client,\n",
" sagemaker_featurestore_runtime_client=featurestore_runtime\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 17,
"metadata": {
"tags": []
},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"Feature Group Name: fscw-orders-03-30-17-02\n",
"Create Feature Group: False\n"
]
}
],
"source": [
"#Check if we use the persisted feature store name or create a new one\n",
"if orders_feature_group_name is None:\n",
" create_new_feature_group = True\n",
"elif create_new_feature_group is False:\n",
" feature_group_name = orders_feature_group_name \n",
"\n",
"logger.info(f'Feature Group Name: {feature_group_name}')\n",
"logger.info(f'Create Feature Group: {create_new_feature_group}')"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Feature group is initialized and created below"
]
},
{
"cell_type": "code",
"execution_count": 18,
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"from sagemaker.feature_store.feature_group import FeatureGroup\n",
"from sagemaker.feature_store.inputs import TableFormatEnum\n",
"\n",
"if create_new_feature_group is True:\n",
" feature_group = FeatureGroup(\n",
" name=feature_group_name, sagemaker_session=feature_store_session, feature_definitions=feature_definitions)\n",
"\n",
" feature_group.create(\n",
" s3_uri=feature_store_offline_s3_uri,\n",
" record_identifier_name=record_identifier_feature_name,\n",
" event_time_feature_name=event_time_feature_name,\n",
" role_arn=iam_role,\n",
" enable_online_store=enable_online_store,\n",
" table_format=TableFormatEnum.ICEBERG # or GLUE\n",
" )"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Invoke the Feature Store API to create the feature group and wait until it is ready"
]
},
{
"cell_type": "code",
"execution_count": 19,
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"import time\n",
"def wait_for_feature_group_creation_complete(feature_group):\n",
" \"\"\"Helper function to wait for the completions of creating a feature group\"\"\"\n",
" status = feature_group.describe().get(\"FeatureGroupStatus\")\n",
" while status == \"Creating\":\n",
" print(\"Waiting for Feature Group Creation\")\n",
" time.sleep(5)\n",
" status = feature_group.describe().get(\"FeatureGroupStatus\")\n",
" if status != \"Created\":\n",
" raise SystemExit(f\"Failed to create feature group {feature_group.name}: {status}\")\n",
" print(f\"FeatureGroup {feature_group.name} successfully created.\")"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Create Feature Group"
]
},
{
"cell_type": "code",
"execution_count": 20,
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"if create_new_feature_group is True:\n",
" wait_for_feature_group_creation_complete(feature_group=feature_group)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Now that the feature group is created, You will use a processing job to process your \n",
" data at scale and ingest the transformed data into this feature group."
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Verify created or existing feature group"
]
},
{
"cell_type": "code",
"execution_count": 21,
"metadata": {
"tags": []
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"{'FeatureGroupArn': 'arn:aws:sagemaker:us-west-2:227246955871:feature-group/fscw-orders-03-30-17-02', 'FeatureGroupName': 'fscw-orders-03-30-17-02', 'RecordIdentifierFeatureName': 'order_id', 'EventTimeFeatureName': 'event_time', 'FeatureDefinitions': [{'FeatureName': 'order_id', 'FeatureType': 'String'}, {'FeatureName': 'customer_id', 'FeatureType': 'String'}, {'FeatureName': 'product_id', 'FeatureType': 'String'}, {'FeatureName': 'purchase_amount', 'FeatureType': 'Fractional'}, {'FeatureName': 'is_reordered', 'FeatureType': 'Integral'}, {'FeatureName': 'event_time', 'FeatureType': 'String'}, {'FeatureName': 'n_days_since_last_purchase', 'FeatureType': 'Fractional'}], 'CreationTime': datetime.datetime(2023, 3, 30, 17, 2, 46, 972000, tzinfo=tzlocal()), 'OnlineStoreConfig': {'EnableOnlineStore': True}, 'OfflineStoreConfig': {'S3StorageConfig': {'S3Uri': 's3://sagemaker-us-west-2-227246955871/sagemaker-feature-store', 'ResolvedOutputS3Uri': 's3://sagemaker-us-west-2-227246955871/sagemaker-feature-store/227246955871/sagemaker/us-west-2/offline-store/fscw-orders-03-30-17-02-1680195766/data'}, 'DisableGlueTableCreation': False, 'DataCatalogConfig': {'TableName': 'fscw_orders_03_30_17_02_1680195766', 'Catalog': 'AwsDataCatalog', 'Database': 'SageMaker_FeatureStore'}, 'TableFormat': 'Iceberg'}, 'RoleArn': 'arn:aws:iam::227246955871:role/service-role/AmazonSageMaker-ExecutionRole-20220810T165739', 'FeatureGroupStatus': 'Created', 'OfflineStoreStatus': {'Status': 'Active'}, 'OnlineStoreTotalSizeBytes': 0, 'ResponseMetadata': {'RequestId': 'c71bea09-f8f8-40c0-98a0-2447935aa952', 'HTTPStatusCode': 200, 'HTTPHeaders': {'x-amzn-requestid': 'c71bea09-f8f8-40c0-98a0-2447935aa952', 'content-type': 'application/x-amz-json-1.1', 'content-length': '1862', 'date': 'Thu, 30 Mar 2023 19:21:56 GMT'}, 'RetryAttempts': 0}}\n"
]
}
],
"source": [
"# Use Describe command to get the details of the feature group\n",
"response = sagemaker_client.describe_feature_group(FeatureGroupName = feature_group_name)\n",
"print(response)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Creating a workflow using Data Wrangler (OPTIONAL)\n",
"[SKIP this section](#Inputs-and-Outputs)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### ** BEGIN **\n",
"\n",
"##### Follow the below steps to create the dwf-orders.flow using Data Wrangler (DW)\n",
"\n",
" #### 1. Please follow these steps for Opening DW \n",
""
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
" #### 2. Please follow these steps to open S3 as your source. \n",
""
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
" #### 3. Please follow these steps to navigate to the desired S3 bucket/folder path to import the dataset from your source. \n",
" "
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
" #### 4. Please follow these steps to add a 'Transform' to your imported dataset. \n",
"\n",
" "
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
" #### 5. Please follow these steps to navigate to the desired transform to apply to a source column. \n",
" \n",
" "
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
" #### 6. Please follow these steps to 'Export' the created workflow to create a notebook that would ingest the data in to a feature store.. \n",
"\n",
" "
]
},
{
"attachments": {
"image.png": {
"image/png": ""
}
},
"cell_type": "markdown",
"metadata": {},
"source": [
" #### A notebook is generated as shown below \n",
"\n",
" "
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
" #### 7. Please follow these steps to copy the value from the Output name variable (as shown below) that is auto-generated from the selected node's ID from the flowfile. \n",
"\n",
" "
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
" #### 8. Please follow these steps to navigate to 'Save As' option to rename the Workflow file to 'orders.flow' \n",
" \n",
" \n",
" "
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
""
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## ** END ** Creating a workflow using Data Wrangler (OPTIONAL)\n",
"\n",
"\n",
"\n",
"\n",
"\n"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"# Inputs and Outputs\n",
"\n",
"The below settings configure the inputs and outputs for the flow export.\n",
"\n",
" 💡 Configurable Settings \n",
"\n",
"In Input - Source you can configure the data sources that will be used as input by Data Wrangler\n",
"\n",
"1. For S3 sources, configure the source attribute that points to the input S3 prefixes\n",
"2. For all other sources, configure attributes like query_string, database in the source's \n",
"DatasetDefinition object.\n",
"\n",
"If you modify the inputs the provided data must have the same schema and format as the data used in the Flow. \n",
"You should also re-execute the cells in this section if you have modified the settings in any data sources.\n",
"
"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"from sagemaker.processing import ProcessingInput, ProcessingOutput\n",
"from sagemaker.dataset_definition.inputs import AthenaDatasetDefinition, DatasetDefinition, RedshiftDatasetDefinition\n",
"\n",
"data_sources = []"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Input: S3 Source: orders.csv"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"ordersfilename='orders.csv'\n",
"# You can override this to point to other dataset on S3\n",
"orders_datasource = f'{bucketlocation}{ordersfilename}'\n",
"%store orders_datasource\n",
"print(f\"Data source: {orders_datasource}\")\n",
"\n",
"data_sources.append(ProcessingInput(\n",
" source=orders_datasource, \n",
" destination=f'/opt/ml/processing/{ordersfilename}',\n",
" input_name=ordersfilename,\n",
" s3_data_type=\"S3Prefix\",\n",
" s3_input_mode=\"File\",\n",
" s3_data_distribution_type=\"FullyReplicated\"\n",
"))"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Output: Feature Store \n",
"\n",
"##### Use the link below if you want to go back and create a Data Wrangler flow\n",
"[Create Data Wrangler Workflow](#Creating-a-workflow-using-Data-Wrangler-(OPTIONAL))"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Below are the inputs required by the SageMaker Python SDK to launch a processing job with feature store as an output."
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"\n",
"
Warning!!!
\n",
"
The output_name variable shown below should be configured only if you created your own flow file using Data Wrangler and have overwritten the original file.
\n",
"
Use the value copied from Step-7 of the process used to create the DW flow.
\n",
"
"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"# Output name is auto-generated from the select node's ID + output name from the flow file.\n",
"output_name = None #Use the Node ID from the provided DW flow file.\n",
"if output_name is None: \n",
" output_name = \"739f8413-3a63-42c3-99a0-fa678a68c2d6.default\"\n",
"logger.info(f'output_name = {output_name}')"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"from sagemaker.processing import FeatureStoreOutput\n",
"\n",
"processing_job_output = ProcessingOutput(\n",
" output_name=output_name,\n",
" app_managed=True,\n",
" feature_store_output=FeatureStoreOutput(feature_group_name=feature_group_name),\n",
")"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Upload Flow to S3\n",
"\n",
"To use the Data Wrangler as an input to the processing job, first upload your flow file to Amazon S3."
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"import os\n",
"import json\n",
"import boto3\n",
"\n",
"# name of the flow file which should exist in the current notebook working directory\n",
"flow_file_name = f'{flow_name}.flow'\n",
"\n",
"# Load .flow file from current notebook working directory \n",
"!echo \"Loading flow file from current notebook working directory: $PWD\"\n",
"\n",
"#Read file from current notebook working directory\n",
"with open(flow_file_name) as f:\n",
" flow = json.load(f)\n",
"\n",
"# Upload flow to S3\n",
"s3_client = boto3.client(\"s3\")\n",
"orders_flow_file=f'{workshopfolder}data_wrangler_flows/{flow_export_name}.flow'\n",
"s3_client.upload_file(flow_file_name, bucket, orders_flow_file)\n",
"flow_s3_uri = f's3://{bucket}/{orders_flow_file}'\n",
"print(f\"Data Wrangler flow {flow_file_name} uploaded to {flow_s3_uri}\")"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"The Data Wrangler Flow is also provided to the Processing Job as an input source which we configure below."
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"## Input - Flow: DWF-Orders.flow\n",
"flow_input = ProcessingInput(\n",
" source=flow_s3_uri,\n",
" destination=\"/opt/ml/processing/flow\",\n",
" input_name=\"flow\",\n",
" s3_data_type=\"S3Prefix\",\n",
" s3_input_mode=\"File\",\n",
" s3_data_distribution_type=\"FullyReplicated\"\n",
")"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"# Run Processing Job \n",
"## Job Configurations\n",
"\n",
" 💡 Configurable Settings \n",
"\n",
"You can configure the following settings for Processing Jobs. If you change any configurations you will \n",
"need to re-execute this and all cells below it by selecting the Run menu above and click \n",
"Run Selected Cells and All Below\n",
"\n",
"1. IAM role for executing the processing job. \n",
"2. A unique name of the processing job. Give a unique name every time you re-execute processing jobs\n",
"3. Data Wrangler Container URL.\n",
"4. Instance count, instance type and storage volume size in GB.\n",
"5. Content type for each output. Data Wrangler supports CSV as default and Parquet.\n",
"6. Network Isolation settings\n",
"
"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"import uuid\n",
"\n",
"# IAM role for executing the processing job.\n",
"iam_role = sagemaker.get_execution_role()\n",
"\n",
"# Unique processing job name. Give a unique name every time you re-execute processing jobs\n",
"flow_export_id = f\"{strftime('%d-%H-%M-%S', gmtime())}-{str(uuid.uuid4())[:8]}\"\n",
"processing_job_name = f\"data-wrangler-flow-processing-{flow_export_id}\"\n",
"print(f\"Processing job name: {processing_job_name}\")\n",
"%store processing_job_name\n",
"\n",
"# Data Wrangler Container URL.\n",
"container_id = get_container(region)\n",
"print(f\"container_id: {container_id}\")\n",
"container_uri = f'{container_id}.dkr.ecr.{region}.amazonaws.com/sagemaker-data-wrangler-container:1.x'\n",
"print(f\"container_uri: {container_uri}\")\n",
"\n",
"# Processing Job Instance count and instance type.\n",
"instance_count = 2\n",
"instance_type = \"ml.m5.4xlarge\"\n",
"\n",
"# Size in GB of the EBS volume to use for storing data during processing\n",
"volume_size_in_gb = 30\n",
"\n",
"# Content type for each output. Data Wrangler supports CSV as default and Parquet.\n",
"output_content_type = \"CSV\"\n",
"\n",
"# Network Isolation mode; default is off\n",
"enable_network_isolation = False\n",
"\n",
"# Output configuration used as processing job container arguments \n",
"output_config = {\n",
" output_name: {\n",
" \"content_type\": output_content_type\n",
" }\n",
"}"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Create and Execute Processing Job\n",
"\n",
"To launch a Processing Job, you will use the SageMaker Python SDK to create a Processor function."
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"from sagemaker.processing import Processor\n",
"from sagemaker.network import NetworkConfig\n",
"\n",
"processor = Processor(\n",
" role=iam_role,\n",
" image_uri=container_uri,\n",
" instance_count=instance_count,\n",
" instance_type=instance_type,\n",
" volume_size_in_gb=volume_size_in_gb,\n",
" network_config=NetworkConfig(enable_network_isolation=enable_network_isolation),\n",
" sagemaker_session=sess\n",
")\n",
"\n",
"# Start Job\n",
"processor.run(\n",
" inputs=[flow_input] + data_sources, \n",
" outputs=[processing_job_output],\n",
" arguments=[f\"--output-config '{json.dumps(output_config)}'\"],\n",
" wait=False,\n",
" logs=False,\n",
" job_name=processing_job_name\n",
")"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Job Status\n",
"\n",
"Below you wait for processing job to finish. If it finishes successfully, your feature group should be populated \n",
"with transformed feature values. In addition the raw parameters used by the Processing Job will be printed."
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"job_result = sess.wait_for_processing_job(processing_job_name)\n",
"logger.info(f'Job result={job_result}') "
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"You can check the status of your processing job as shown below. In case of errors, the log can be very helpful to debug.\n",
"\n",
""
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Verify Processing Job Results"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"import random\n",
"\n",
"order_id = f'O{random.randint(1, 5000)}'\n",
"logger.info(f\"order_id={order_id}\") \n",
"\n",
"featurestore_runtime_client = sess.boto_session.client('sagemaker-featurestore-runtime', region_name=region)\n",
"# Verify Processing Job Results by querying Feature Store\n",
"feature_record = featurestore_runtime_client.get_record(FeatureGroupName=feature_group_name, RecordIdentifierValueAsString=order_id)\n",
"logger.info(f\"Feature Record={feature_record}\") "
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Storing Variable Values"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"# Storing the values of the Orders Feature Groupname and DW outputname\n",
"%store output_name\n",
"%store feature_group_name\n",
"processing_job = sagemaker.processing.ProcessingJob.from_processing_name(sess, processing_job_name)\n",
"processing_job_description = processing_job.describe()\n",
"%store processing_job_description\n",
"# These variables will be used by Module-6 & Module-8"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"You can view newly created feature group in Studio, refer to [Use Amazon SageMaker Feature Store with Amazon SageMaker Studio](https://docs.aws.amazon.com/sagemaker/latest/dg/feature-store-use-with-studio.html)\n",
"for detailed guide. [Learn more about SageMaker Feature Store](https://github.com/aws/amazon-sagemaker-examples/tree/master/sagemaker-featurestore)"
]
}
],
"metadata": {
"availableInstances": [
{
"_defaultOrder": 0,
"_isFastLaunch": true,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 4,
"name": "ml.t3.medium",
"vcpuNum": 2
},
{
"_defaultOrder": 1,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 8,
"name": "ml.t3.large",
"vcpuNum": 2
},
{
"_defaultOrder": 2,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 16,
"name": "ml.t3.xlarge",
"vcpuNum": 4
},
{
"_defaultOrder": 3,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 32,
"name": "ml.t3.2xlarge",
"vcpuNum": 8
},
{
"_defaultOrder": 4,
"_isFastLaunch": true,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 8,
"name": "ml.m5.large",
"vcpuNum": 2
},
{
"_defaultOrder": 5,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 16,
"name": "ml.m5.xlarge",
"vcpuNum": 4
},
{
"_defaultOrder": 6,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 32,
"name": "ml.m5.2xlarge",
"vcpuNum": 8
},
{
"_defaultOrder": 7,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 64,
"name": "ml.m5.4xlarge",
"vcpuNum": 16
},
{
"_defaultOrder": 8,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 128,
"name": "ml.m5.8xlarge",
"vcpuNum": 32
},
{
"_defaultOrder": 9,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 192,
"name": "ml.m5.12xlarge",
"vcpuNum": 48
},
{
"_defaultOrder": 10,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 256,
"name": "ml.m5.16xlarge",
"vcpuNum": 64
},
{
"_defaultOrder": 11,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 384,
"name": "ml.m5.24xlarge",
"vcpuNum": 96
},
{
"_defaultOrder": 12,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 8,
"name": "ml.m5d.large",
"vcpuNum": 2
},
{
"_defaultOrder": 13,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 16,
"name": "ml.m5d.xlarge",
"vcpuNum": 4
},
{
"_defaultOrder": 14,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 32,
"name": "ml.m5d.2xlarge",
"vcpuNum": 8
},
{
"_defaultOrder": 15,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 64,
"name": "ml.m5d.4xlarge",
"vcpuNum": 16
},
{
"_defaultOrder": 16,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 128,
"name": "ml.m5d.8xlarge",
"vcpuNum": 32
},
{
"_defaultOrder": 17,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 192,
"name": "ml.m5d.12xlarge",
"vcpuNum": 48
},
{
"_defaultOrder": 18,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 256,
"name": "ml.m5d.16xlarge",
"vcpuNum": 64
},
{
"_defaultOrder": 19,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 384,
"name": "ml.m5d.24xlarge",
"vcpuNum": 96
},
{
"_defaultOrder": 20,
"_isFastLaunch": false,
"category": "General purpose",
"gpuNum": 0,
"hideHardwareSpecs": true,
"memoryGiB": 0,
"name": "ml.geospatial.interactive",
"supportedImageNames": [
"sagemaker-geospatial-v1-0"
],
"vcpuNum": 0
},
{
"_defaultOrder": 21,
"_isFastLaunch": true,
"category": "Compute optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 4,
"name": "ml.c5.large",
"vcpuNum": 2
},
{
"_defaultOrder": 22,
"_isFastLaunch": false,
"category": "Compute optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 8,
"name": "ml.c5.xlarge",
"vcpuNum": 4
},
{
"_defaultOrder": 23,
"_isFastLaunch": false,
"category": "Compute optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 16,
"name": "ml.c5.2xlarge",
"vcpuNum": 8
},
{
"_defaultOrder": 24,
"_isFastLaunch": false,
"category": "Compute optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 32,
"name": "ml.c5.4xlarge",
"vcpuNum": 16
},
{
"_defaultOrder": 25,
"_isFastLaunch": false,
"category": "Compute optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 72,
"name": "ml.c5.9xlarge",
"vcpuNum": 36
},
{
"_defaultOrder": 26,
"_isFastLaunch": false,
"category": "Compute optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 96,
"name": "ml.c5.12xlarge",
"vcpuNum": 48
},
{
"_defaultOrder": 27,
"_isFastLaunch": false,
"category": "Compute optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 144,
"name": "ml.c5.18xlarge",
"vcpuNum": 72
},
{
"_defaultOrder": 28,
"_isFastLaunch": false,
"category": "Compute optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 192,
"name": "ml.c5.24xlarge",
"vcpuNum": 96
},
{
"_defaultOrder": 29,
"_isFastLaunch": true,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 16,
"name": "ml.g4dn.xlarge",
"vcpuNum": 4
},
{
"_defaultOrder": 30,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 32,
"name": "ml.g4dn.2xlarge",
"vcpuNum": 8
},
{
"_defaultOrder": 31,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 64,
"name": "ml.g4dn.4xlarge",
"vcpuNum": 16
},
{
"_defaultOrder": 32,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 128,
"name": "ml.g4dn.8xlarge",
"vcpuNum": 32
},
{
"_defaultOrder": 33,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 4,
"hideHardwareSpecs": false,
"memoryGiB": 192,
"name": "ml.g4dn.12xlarge",
"vcpuNum": 48
},
{
"_defaultOrder": 34,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 256,
"name": "ml.g4dn.16xlarge",
"vcpuNum": 64
},
{
"_defaultOrder": 35,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 61,
"name": "ml.p3.2xlarge",
"vcpuNum": 8
},
{
"_defaultOrder": 36,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 4,
"hideHardwareSpecs": false,
"memoryGiB": 244,
"name": "ml.p3.8xlarge",
"vcpuNum": 32
},
{
"_defaultOrder": 37,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 8,
"hideHardwareSpecs": false,
"memoryGiB": 488,
"name": "ml.p3.16xlarge",
"vcpuNum": 64
},
{
"_defaultOrder": 38,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 8,
"hideHardwareSpecs": false,
"memoryGiB": 768,
"name": "ml.p3dn.24xlarge",
"vcpuNum": 96
},
{
"_defaultOrder": 39,
"_isFastLaunch": false,
"category": "Memory Optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 16,
"name": "ml.r5.large",
"vcpuNum": 2
},
{
"_defaultOrder": 40,
"_isFastLaunch": false,
"category": "Memory Optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 32,
"name": "ml.r5.xlarge",
"vcpuNum": 4
},
{
"_defaultOrder": 41,
"_isFastLaunch": false,
"category": "Memory Optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 64,
"name": "ml.r5.2xlarge",
"vcpuNum": 8
},
{
"_defaultOrder": 42,
"_isFastLaunch": false,
"category": "Memory Optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 128,
"name": "ml.r5.4xlarge",
"vcpuNum": 16
},
{
"_defaultOrder": 43,
"_isFastLaunch": false,
"category": "Memory Optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 256,
"name": "ml.r5.8xlarge",
"vcpuNum": 32
},
{
"_defaultOrder": 44,
"_isFastLaunch": false,
"category": "Memory Optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 384,
"name": "ml.r5.12xlarge",
"vcpuNum": 48
},
{
"_defaultOrder": 45,
"_isFastLaunch": false,
"category": "Memory Optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 512,
"name": "ml.r5.16xlarge",
"vcpuNum": 64
},
{
"_defaultOrder": 46,
"_isFastLaunch": false,
"category": "Memory Optimized",
"gpuNum": 0,
"hideHardwareSpecs": false,
"memoryGiB": 768,
"name": "ml.r5.24xlarge",
"vcpuNum": 96
},
{
"_defaultOrder": 47,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 16,
"name": "ml.g5.xlarge",
"vcpuNum": 4
},
{
"_defaultOrder": 48,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 32,
"name": "ml.g5.2xlarge",
"vcpuNum": 8
},
{
"_defaultOrder": 49,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 64,
"name": "ml.g5.4xlarge",
"vcpuNum": 16
},
{
"_defaultOrder": 50,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 128,
"name": "ml.g5.8xlarge",
"vcpuNum": 32
},
{
"_defaultOrder": 51,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 1,
"hideHardwareSpecs": false,
"memoryGiB": 256,
"name": "ml.g5.16xlarge",
"vcpuNum": 64
},
{
"_defaultOrder": 52,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 4,
"hideHardwareSpecs": false,
"memoryGiB": 192,
"name": "ml.g5.12xlarge",
"vcpuNum": 48
},
{
"_defaultOrder": 53,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 4,
"hideHardwareSpecs": false,
"memoryGiB": 384,
"name": "ml.g5.24xlarge",
"vcpuNum": 96
},
{
"_defaultOrder": 54,
"_isFastLaunch": false,
"category": "Accelerated computing",
"gpuNum": 8,
"hideHardwareSpecs": false,
"memoryGiB": 768,
"name": "ml.g5.48xlarge",
"vcpuNum": 192
}
],
"instance_type": "ml.t3.medium",
"kernelspec": {
"display_name": "Python 3 (Data Science)",
"language": "python",
"name": "python3__SAGEMAKER_INTERNAL__arn:aws:sagemaker:us-west-2:236514542706:image/datascience-1.0"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.7.10"
}
},
"nbformat": 4,
"nbformat_minor": 4
}