# Source code for sagemaker.core.compute_resource_requirements.resource_requirements
# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"). You
# may not use this file except in compliance with the License. A copy of
# the License is located at
#
# http://aws.amazon.com/apache2.0/
#
# or in the "license" file accompanying this file. This file is
# distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF
# ANY KIND, either express or implied. See the License for the specific
# language governing permissions and limitations under the License.
"""Defines the ResourceRequirements class that configures the compute resources for the Model."""
from __future__ import absolute_import
import logging
from typing import Optional, Dict
from sagemaker.core.common_utils import stringify_object
# Module-level logger obtained under the fixed "sagemaker" logger name
# (rather than ``__name__``). It is not referenced by the code visible here.
LOGGER = logging.getLogger("sagemaker")
# [docs]
class ResourceRequirements(object):
    """Configures the compute resources for a Model.

    The raw ``requests`` and ``limits`` dicts are stored unchanged, and the
    recognized keys are additionally exposed as the attributes
    ``num_accelerators``, ``num_cpus``, ``min_memory``, ``max_memory`` and
    ``copy_count``.
    """

    def __init__(
        self,
        requests: Optional[Dict[str, int]] = None,
        limits: Optional[Dict[str, int]] = None,
    ):
        """Initializes a ResourceRequirements object for an Amazon SageMaker inference component.

        Args:
            requests (dict): Basic resources to be requested. Recognized keys are
                ``num_accelerators``, ``num_cpus``, ``memory`` (in MB) and
                ``copies``. Any other key (e.g. ``accelerator_memory``) is kept
                in ``self.requests`` but is not mapped to an attribute here.
            limits (dict): Max resource limit to be requested. The only
                recognized key is ``memory`` (in MB).

        Example:
            requests = {
                "num_cpus": 1,
                "memory": 1024,
                "copies": 5
            },
            limits = {
                "memory": 2048
            }
        """
        # Keep the caller's dicts as-is; __eq__ compares these raw values.
        self.requests = requests
        self.limits = limits

        # Treat a missing (None) or empty dict uniformly so that every lookup
        # below falls back to its default.
        requested = requests or {}
        capped = limits or {}

        self.num_accelerators: Optional[int] = requested.get("num_accelerators")
        self.num_cpus: Optional[int] = requested.get("num_cpus")
        self.min_memory: Optional[int] = requested.get("memory")
        self.max_memory: Optional[int] = capped.get("memory")
        # A single copy is assumed when the caller does not specify "copies".
        self.copy_count = requested.get("copies", 1)

    def __str__(self) -> str:
        """Overriding str(*) method to make more human-readable."""
        return stringify_object(self)

    def __eq__(self, other) -> bool:
        """Implement equal method for easy unit testing.

        Two instances are equal when both their ``requests`` and ``limits``
        dicts are equal. Comparing against an object that is not a
        ``ResourceRequirements`` returns ``NotImplemented`` (so ``==`` evaluates
        to ``False``) instead of raising ``AttributeError``.
        """
        if not isinstance(other, ResourceRequirements):
            return NotImplemented
        return self.requests == other.requests and self.limits == other.limits

    def get_compute_resource_requirements(self) -> dict:
        """Returns a dict of resource requirements.

        ``MinMemoryRequiredInMb`` is always present (its value is ``None`` when
        no memory request was given). ``MaxMemoryRequiredInMb``,
        ``NumberOfCpuCoresRequired`` and ``NumberOfAcceleratorDevicesRequired``
        are added only when the corresponding value is truthy, i.e. neither
        ``None`` nor ``0``.
        """
        resource_requirements = {
            "MinMemoryRequiredInMb": self.min_memory,
        }

        optional_entries = (
            ("MaxMemoryRequiredInMb", self.max_memory),
            ("NumberOfCpuCoresRequired", self.num_cpus),
            ("NumberOfAcceleratorDevicesRequired", self.num_accelerators),
        )
        for key, value in optional_entries:
            if value:
                resource_requirements[key] = value

        return resource_requirements