Skip to content

Commit 58b37b0

Browse files
committed
change: Enable default model_fn for CPU and GPU
1 parent f498c2f commit 58b37b0

File tree

1 file changed

+8
-4
lines changed

1 file changed

+8
-4
lines changed

src/sagemaker_pytorch_serving_container/default_pytorch_inference_handler.py

Lines changed: 8 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -49,10 +49,14 @@ def default_model_fn(self, model_dir):
4949
# Client-framework is CPU only. But model will run in Elastic Inference server with CUDA.
5050
return torch.jit.load(model_path, map_location=torch.device('cpu'))
5151
else:
52-
raise NotImplementedError(textwrap.dedent("""
53-
Please provide a model_fn implementation.
54-
See documentation for model_fn at https://github.com/aws/sagemaker-python-sdk
55-
"""))
52+
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
53+
model_path = os.path.join(model_dir, DEFAULT_MODEL_FILENAME)
54+
if not os.path.exists(model_path):
55+
raise FileNotFoundError("Failed to load model with default model_fn: missing file {}."
56+
.format(DEFAULT_MODEL_FILENAME))
57+
model = torch.jit.load(model_path, map_location=device)
58+
model = model.to(device)
59+
return model
5660

5761
def default_input_fn(self, input_data, content_type):
5862
"""A default input_fn that can handle JSON, CSV and NPZ formats.

0 commit comments

Comments (0)