update doc

pytorch · Feb 8, 2022 · 9b91d20 · 9b91d20
1 parent 3ac4296
commit 9b91d20
Showing 1 changed file with 94 additions and 0 deletions.
diff --git a/docs/management_api.md b/docs/management_api.md
@@ -285,6 +285,100 @@ curl http://localhost:8081/models/noop/all
 ]
 ```
 
+`GET /models/{model_name}/{model_version}?customized=true`
+or 
+`GET /models/{model_name}?customized=true`
+
+Use the Describe Model API to get the detailed runtime status and customized metadata of a specific version of a model. To return customized metadata, the model's handler needs to do the following:
+* Implement the functions `_is_describe` and `describe_handle`. For example:
+```
+    def _is_describe(self):
+        if self.context and self.context.get_request_header(0, "describe"):
+            if self.context.get_request_header(0, "describe") == "True":
+                return True
+        return False
+
+    def describe_handle(self):
+        """Customized describe handler
+        Returns:
+            dict : A dictionary response.
+        """
+        output_describe = None
+
+        logger.info("Collect customized metadata")
+
+        return output_describe
+```
+* Call the functions `_is_describe` and `describe_handle` in `handle`. For example:
+```
+def handle(self, data, context):
+        """Entry point for default handler. It takes the data from the input request and returns
+           the predicted outcome for the input.
+        Args:
+            data (list): The input data that needs to be made a prediction request on.
+            context (Context): It is a JSON Object containing information pertaining to
+                               the model artefacts parameters.
+        Returns:
+            list : Returns a list of dictionary with the predicted response.
+        """
+
+        # It can be used for pre or post processing if needed as additional request
+        # information is available in context
+        start_time = time.time()
+
+        self.context = context
+        metrics = self.context.metrics
+
+        is_profiler_enabled = os.environ.get("ENABLE_TORCH_PROFILER", None)
+        if is_profiler_enabled:
+            output, _ = self._infer_with_profiler(data=data)
+        else:
+            if self._is_describe():
+                output = [self.describe_handle()]
+            else:
+                data_preprocess = self.preprocess(data)
+
+                if not self._is_explain():
+                    output = self.inference(data_preprocess)
+                    output = self.postprocess(output)
+                else:
+                    output = self.explain_handle(data_preprocess, data)
+
+        stop_time = time.time()
+        metrics.add_time('HandlerTime', round(
+            (stop_time - start_time) * 1000, 2), None, 'ms')
+        return output
+```
+`ts/torch_handler/base_handler.py` implements the functions above. Here is an example request and its response:
+```bash
+curl http://localhost:8081/models/noop-customized/1.0?customized=true
+[
+    {
+        "modelName": "noop-customized",
+        "modelVersion": "1.0",
+        "modelUrl": "noop-customized.mar",
+        "runtime": "python",
+        "minWorkers": 1,
+        "maxWorkers": 1,
+        "batchSize": 1,
+        "maxBatchDelay": 100,
+        "loadedAtStartup": false,
+        "workers": [
+          {
+            "id": "9010",
+            "startTime": "2022-02-08T11:03:20.974Z",
+            "status": "READY",
+            "memoryUsage": 0,
+            "pid": 98972,
+            "gpu": false,
+            "gpuUsage": "N/A"
+          }
+        ],
+        "customizedMetadata": "{\n  \"data1\": \"1\",\n  \"data2\": \"2\"\n}"
+     }
+]
+```
+
 ## Unregister a model
 
 This API follows the [ManagementAPIsService.UnregisterModel](https://github.com/pytorch/serve/blob/master/frontend/server/src/main/resources/proto/management.proto) gRPC API. It returns the status of a model in the ModelServer.