Skip to content

Commit ff8f223

Browse files
committed
Return predictor from deploy method via super
1 parent 3e8b430 commit ff8f223

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

src/sagemaker/djl_inference/model.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -32,7 +32,7 @@
3232

3333
logger = logging.getLogger("sagemaker")
3434

35-
35+
# DJL Serving uses log4j, so we convert python logging name to log4j equivalent
3636
LOG_LEVEL_MAP = {
3737
logging.INFO: "info",
3838
logging.DEBUG: "debug",
@@ -200,7 +200,7 @@ def deploy(
200200
f"with GPUs. Supported instance families are {defaults.ALLOWED_INSTANCE_FAMILIES}"
201201
)
202202

203-
super(DJLLargeModel, self).deploy(
203+
return super(DJLLargeModel, self).deploy(
204204
initial_instance_count=initial_instance_count,
205205
instance_type=instance_type,
206206
serializer=serializer,
@@ -447,8 +447,8 @@ def __init__(
447447
self.engine = DJLEngine.HUGGINGFACE_ACCELERATE
448448
self.device_id = device_id
449449
self.device_map = device_map
450-
self.load_in_8bit = (load_in_8bit,)
451-
self.low_cpu_mem_usage = (low_cpu_mem_usage,)
450+
self.load_in_8bit = load_in_8bit
451+
self.low_cpu_mem_usage = low_cpu_mem_usage
452452

453453
def generate_serving_properties(self, serving_properties={}) -> Dict[str, str]:
454454
serving_properties = super(HuggingfaceAccelerateModel, self).generate_serving_properties()

0 commit comments

Comments
 (0)