-
Notifications
You must be signed in to change notification settings - Fork 1.2k
feature: allow setting the default bucket in Session #1176
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -76,7 +76,13 @@ class Session(object): # pylint: disable=too-many-public-methods | |
bucket based on a naming convention which includes the current AWS account ID. | ||
""" | ||
|
||
def __init__(self, boto_session=None, sagemaker_client=None, sagemaker_runtime_client=None): | ||
def __init__( | ||
self, | ||
boto_session=None, | ||
sagemaker_client=None, | ||
sagemaker_runtime_client=None, | ||
default_bucket=None, | ||
): | ||
"""Initialize a SageMaker ``Session``. | ||
|
||
Args: | ||
|
@@ -91,13 +97,25 @@ def __init__(self, boto_session=None, sagemaker_client=None, sagemaker_runtime_c | |
``InvokeEndpoint`` calls to Amazon SageMaker (default: None). Predictors created | ||
using this ``Session`` use this client. If not provided, one will be created using | ||
this instance's ``boto_session``. | ||
default_bucket (str): The default Amazon S3 bucket to be used by this session. | ||
This will be created the next time an Amazon S3 bucket is needed (by calling | ||
:func:`default_bucket`). | ||
If not provided, a default bucket will be created based on the following format: | ||
"sagemaker-{region}-{aws-account-id}". | ||
Example: "sagemaker-my-custom-bucket". | ||
|
||
""" | ||
self._default_bucket = None | ||
self._default_bucket_name_override = default_bucket | ||
|
||
# currently is used for local_code in local mode | ||
self.config = None | ||
|
||
self._initialize(boto_session, sagemaker_client, sagemaker_runtime_client) | ||
self._initialize( | ||
boto_session=boto_session, | ||
sagemaker_client=sagemaker_client, | ||
sagemaker_runtime_client=sagemaker_runtime_client, | ||
) | ||
Comment on lines +114 to +118
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Comment: "guessing" — There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Comment: "Don't think so? Based on my git hooks, I wouldn't have been able to commit it if black-check didn't return 1. Edit: return 0 *" — There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Comment: "never mind. it looked strange to me that there should be any diff remaining in this part of the code, and my understanding was that black had a strict threshold for when it moved to multiple lines (for these kinds of cases)" |
||
|
||
def _initialize(self, boto_session, sagemaker_client, sagemaker_runtime_client): | ||
"""Initialize this SageMaker Session. | ||
|
@@ -315,10 +333,13 @@ def default_bucket(self): | |
return self._default_bucket | ||
|
||
region = self.boto_session.region_name | ||
account = self.boto_session.client( | ||
"sts", region_name=region, endpoint_url=sts_regional_endpoint(region) | ||
).get_caller_identity()["Account"] | ||
default_bucket = "sagemaker-{}-{}".format(region, account) | ||
|
||
default_bucket = self._default_bucket_name_override | ||
if not default_bucket: | ||
account = self.boto_session.client( | ||
"sts", region_name=region, endpoint_url=sts_regional_endpoint(region) | ||
).get_caller_identity()["Account"] | ||
default_bucket = "sagemaker-{}-{}".format(region, account) | ||
|
||
s3 = self.boto_session.resource("s3") | ||
try: | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,50 @@ | ||
# Copyright 2019 Amazon.com, Inc. or its affiliates. All Rights Reserved. | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"). You | ||
# may not use this file except in compliance with the License. A copy of | ||
# the License is located at | ||
# | ||
# http://aws.amazon.com/apache2.0/ | ||
# | ||
# or in the "license" file accompanying this file. This file is | ||
# distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF | ||
# ANY KIND, either express or implied. See the License for the specific | ||
# language governing permissions and limitations under the License. | ||
from __future__ import absolute_import | ||
|
||
import boto3 | ||
from botocore.config import Config | ||
|
||
from sagemaker import Session | ||
|
||
DEFAULT_REGION = "us-west-2" | ||
CUSTOM_BUCKET_NAME = "this-bucket-should-not-exist" | ||
|
||
|
||
def test_sagemaker_session_does_not_create_bucket_on_init(
    sagemaker_client_config, sagemaker_runtime_config, boto_config
):
    """Check that passing ``default_bucket`` to ``Session`` does not create the bucket eagerly.

    A ``Session`` is constructed with ``default_bucket=CUSTOM_BUCKET_NAME`` and the test
    then asserts that S3 reports no creation date for that bucket, i.e. construction alone
    did not create it.

    Args:
        sagemaker_client_config: Keyword arguments for the ``sagemaker`` boto client
            (used with ``**`` and ``setdefault``, so a dict-like fixture is assumed).
        sagemaker_runtime_config: Keyword arguments for the ``sagemaker-runtime`` boto
            client; when falsy, no runtime client is passed to the ``Session``.
        boto_config: Keyword arguments for ``boto3.Session``; when falsy, a session in
            ``DEFAULT_REGION`` is used instead.
    """
    boto_session = (
        boto3.Session(**boto_config) if boto_config else boto3.Session(region_name=DEFAULT_REGION)
    )

    # Make sure a retry policy is always present on the SageMaker client.
    # NOTE(review): after this ``setdefault`` the config dict is never empty, so the
    # ``else None`` branch below is not taken; kept as-is to preserve the original shape.
    sagemaker_client_config.setdefault("config", Config(retries=dict(max_attempts=10)))
    sagemaker_client = (
        boto_session.client("sagemaker", **sagemaker_client_config)
        if sagemaker_client_config
        else None
    )
    runtime_client = (
        boto_session.client("sagemaker-runtime", **sagemaker_runtime_config)
        if sagemaker_runtime_config
        else None
    )

    # Only construct the session; nothing here should touch S3.
    Session(
        boto_session=boto_session,
        sagemaker_client=sagemaker_client,
        sagemaker_runtime_client=runtime_client,
        default_bucket=CUSTOM_BUCKET_NAME,
    )

    # Inspect S3 through the SAME boto session that the SageMaker ``Session`` was given.
    # Using the process-wide default session (``boto3.resource``) could look at a
    # different account/region than ``boto_config`` selects and pass vacuously.
    s3 = boto_session.resource("s3")
    assert s3.Bucket(CUSTOM_BUCKET_NAME).creation_date is None
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
nit: if you want the "example" block to be formatted, you need a newline before it. (if you were going for having it in the same paragraph, then ignore this comment.)
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Gotcha. I actually want this example to match default_bucket's param precisely.