sagemaker-python-sdk/tests/integ/test_rl.py at master · devopsgitpython/sagemaker-python-sdk

132 lines (107 loc) · 4.54 KB
# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
# Licensed under the Apache License, Version 2.0 (the "License"). You
# may not use this file except in compliance with the License. A copy of
# the License is located at
#     http://aws.amazon.com/apache2.0/
# or in the "license" file accompanying this file. This file is
# distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF
# ANY KIND, either express or implied. See the License for the specific
# language governing permissions and limitations under the License.
from __future__ import absolute_import
import numpy
import pytest
from sagemaker.rl import RLEstimator, RLFramework, RLToolkit
from sagemaker.utils import sagemaker_timestamp, unique_name_from_base
from tests.integ import DATA_DIR, RL_SUPPORTED_REGIONS, test_region
from tests.integ.timeout import timeout, timeout_and_delete_endpoint_by_name
@pytest.mark.release
def test_coach_mxnet(sagemaker_session, coach_mxnet_latest_version, cpu_instance_type):
    estimator = _test_coach(
        sagemaker_session, RLFramework.MXNET, coach_mxnet_latest_version, cpu_instance_type
    job_name = unique_name_from_base("test-coach-mxnet")
    with timeout(minutes=15):
        estimator.fit(wait="False", job_name=job_name)
        estimator = RLEstimator.attach(
            estimator.latest_training_job.name, sagemaker_session=sagemaker_session
    endpoint_name = "test-mxnet-coach-deploy-{}".format(sagemaker_timestamp())
    with timeout_and_delete_endpoint_by_name(endpoint_name, sagemaker_session):
        predictor = estimator.deploy(
            1, cpu_instance_type, entry_point="mxnet_deploy.py", endpoint_name=endpoint_name
        observation = numpy.asarray([0, 0, 0, 0])
        action = predictor.predict(observation)
    assert 0 < action[0][0] < 1
    assert 0 < action[0][1] < 1
@pytest.mark.skipif(
    test_region() not in RL_SUPPORTED_REGIONS,
    reason="Updated RL images aren't in {}".format(test_region()),
def test_coach_tf(sagemaker_session, coach_tensorflow_latest_version, cpu_instance_type):
    estimator = _test_coach(
        sagemaker_session,
        RLFramework.TENSORFLOW,
        coach_tensorflow_latest_version,
        cpu_instance_type,
    job_name = unique_name_from_base("test-coach-tf")
    with timeout(minutes=15):
        estimator.fit(job_name=job_name)
    endpoint_name = "test-tf-coach-deploy-{}".format(sagemaker_timestamp())
    with timeout_and_delete_endpoint_by_name(endpoint_name, sagemaker_session):
        predictor = estimator.deploy(1, cpu_instance_type)
        observation = numpy.asarray([0, 0, 0, 0])
        action = predictor.predict(observation)
    assert action == {"predictions": [[0.5, 0.5]]}
def _test_coach(sagemaker_session, rl_framework, rl_coach_version, cpu_instance_type):
    source_dir = os.path.join(DATA_DIR, "coach_cartpole")
    dependencies = [os.path.join(DATA_DIR, "sagemaker_rl")]
    cartpole = "train_coach.py"
    return RLEstimator(
        toolkit=RLToolkit.COACH,
        toolkit_version=rl_coach_version,
        framework=rl_framework,
        entry_point=cartpole,
        source_dir=source_dir,
        role="SageMakerRole",
        instance_count=1,
        instance_type=cpu_instance_type,
        sagemaker_session=sagemaker_session,
        dependencies=dependencies,
        hyperparameters={
            "save_model": 1,
            "RLCOACH_PRESET": "preset_cartpole_clippedppo",
            "rl.agent_params.algorithm.discount": 0.9,
            "rl.evaluation_steps:EnvironmentEpisodes": 1,
@pytest.mark.skipif(
    test_region() not in RL_SUPPORTED_REGIONS,
    reason="Updated RL images aren't in {}".format(test_region()),
@pytest.mark.release
def test_ray_tf(sagemaker_session, ray_tensorflow_latest_version, cpu_instance_type):
    source_dir = os.path.join(DATA_DIR, "ray_cartpole")
    cartpole = "train_ray.py"
    estimator = RLEstimator(
        entry_point=cartpole,
        source_dir=source_dir,
        toolkit=RLToolkit.RAY,
        framework=RLFramework.TENSORFLOW,
        toolkit_version=ray_tensorflow_latest_version,
        sagemaker_session=sagemaker_session,
        role="SageMakerRole",
        instance_type=cpu_instance_type,
        instance_count=1,
    job_name = unique_name_from_base("test-ray-tf")
    with timeout(minutes=15):
        estimator.fit(job_name=job_name)
    with pytest.raises(NotImplementedError) as e:
        estimator.deploy(1, cpu_instance_type)
    assert "Automatic deployment of Ray models is not currently available" in str(e.value)
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

test_rl.py

Latest commit

History

test_rl.py

File metadata and controls