Skip to content

Commit

Permalink
Format
Browse files: browse the repository at this point in the history
  • Loading branch information
samruds committed Mar 20, 2024
1 parent 9e64c40 commit 650d40e
Show file tree
Hide file tree
Showing 2 changed files with 13 additions and 6 deletions.
18 changes: 12 additions & 6 deletions src/sagemaker/serve/builder/model_builder.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -43,8 +43,11 @@
from sagemaker.serve.utils import task
from sagemaker.serve.utils.exceptions import TaskNotFoundException
from sagemaker.serve.utils.predictors import _get_local_mode_predictor
from sagemaker.serve.utils.hardware_detector import _get_gpu_info, _get_gpu_info_fallback,\
_total_inference_model_size_mib
from sagemaker.serve.utils.hardware_detector import (
_get_gpu_info,
_get_gpu_info_fallback,
_total_inference_model_size_mib,
)
from sagemaker.serve.detector.image_detector import (
auto_detect_container,
_detect_framework_and_version,
Expand Down Expand Up @@ -724,12 +727,15 @@ def _can_fit_on_single_gpu(self) -> Type[bool]:
"""
try:
single_gpu_size_mib = self._try_fetch_gpu_info()
if _total_inference_model_size_mib(self.model, self.env_vars.get("dtypes", "float32")) \
<= single_gpu_size_mib:
if (
_total_inference_model_size_mib(self.model, self.env_vars.get("dtypes", "float32"))
<= single_gpu_size_mib
):
logger.info(
"Total inference model size MIB %s, single GPU size for instance MIB %s",
_total_inference_model_size_mib(self.model, self.env_vars.get("dtypes",
"float32")),
_total_inference_model_size_mib(
self.model, self.env_vars.get("dtypes", "float32")
),
single_gpu_size_mib,
)
return True
Expand Down
1 change: 1 addition & 0 deletions src/sagemaker/serve/utils/hardware_detector.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -33,6 +33,7 @@
"size calculations e.g. pip install 'sagemaker[huggingface]'"
)


def _get_gpu_info(instance_type: str, session: Session) -> Tuple[int, int]:
"""Get GPU info for the provided instance
Expand Down

0 comments on commit 650d40e

Please sign in to comment.