[ML] Update trained model inference endpoint #556

Merged: 4 commits on Jul 11, 2023
2 changes: 1 addition & 1 deletion README.md
@@ -245,7 +245,7 @@ The `--start` argument will deploy the model with one allocation and one
thread per allocation, which will not offer good performance. When starting
the model deployment using the ML UI in Kibana or the Elasticsearch
[API](https://www.elastic.co/guide/en/elasticsearch/reference/current/start-trained-model-deployment.html)
-you will be able to set the threading options to make best use of your
+you will be able to set the threading options to make the best use of your
hardware.

(The README's Python usage example follows at this point; the remaining lines of the hunk are collapsed in the diff.)
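For context on the threading options mentioned in the README text above (not part of this diff), a deployment can be started with explicit allocation and thread counts instead of the single-allocation, single-thread defaults of `--start`. A minimal sketch, assuming an elasticsearch-py 8.x client, a reachable cluster at localhost:9200, and an illustrative model ID:

```python
# Sketch only: start a trained model deployment with explicit threading
# options, rather than the one-allocation / one-thread default of --start.
from elasticsearch import Elasticsearch

client = Elasticsearch("http://localhost:9200")  # connection details are assumed

client.ml.start_trained_model_deployment(
    model_id="elastic__distilbert-base-uncased-finetuned-sst-2-english",  # illustrative model ID
    number_of_allocations=2,     # independent copies of the model serving requests
    threads_per_allocation=4,    # threads used by each copy for a single inference
    wait_for="started",          # block until the deployment is usable
)
```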
2 changes: 1 addition & 1 deletion eland/ml/pytorch/_pytorch_model.py
@@ -134,7 +134,7 @@ def infer(
__body: Dict[str, Any] = {}
__body["docs"] = docs

-__path = f"/_ml/trained_models/{_quote(self.model_id)}/deployment/_infer"
+__path = f"/_ml/trained_models/{_quote(self.model_id)}/_infer"
__query: Dict[str, Any] = {}
__query["timeout"] = timeout
__headers = {"accept": "application/json", "content-type": "application/json"}
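The dropped `/deployment` path segment points eland's `infer` helper at the trained model inference URL, `POST /_ml/trained_models/<model_id>/_infer`. As a rough illustration, the same endpoint can be exercised directly through the high-level Python client (assuming elasticsearch-py 8.x, a local cluster, and an illustrative model ID and document):

```python
# Sketch only: call the inference endpoint that the updated __path targets,
# i.e. POST /_ml/trained_models/<model_id>/_infer.
from elasticsearch import Elasticsearch

client = Elasticsearch("http://localhost:9200")  # connection details are assumed

response = client.ml.infer_trained_model(
    model_id="elastic__distilbert-base-uncased-finetuned-sst-2-english",  # illustrative model ID
    docs=[{"text_field": "This movie was awesome!"}],  # one document per inference request entry
    timeout="10s",
)
print(response["inference_results"][0])
```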