[ML] Add inference results tests for PyTorch transformer models

2025-07-24 00:00:39 +08:00 · 2021-11-10 07:50:10 -05:00 · 2021-11-10 07:50:10 -05:00 · a3b0907c5b
commit a3b0907c5b
parent 66e3e4eaad
4 changed files with 99 additions and 4 deletions
--- a/.ci/jobs/defaults.yml
+++ b/.ci/jobs/defaults.yml
@ -24,7 +24,7 @@
    - inject:
        properties-content: HOME=$JENKINS_HOME
    concurrent: true
-    node: ubuntu
+    node: flyweight
    scm:
    - git:
        name: origin
--- a/.ci/run-elasticsearch.sh
+++ b/.ci/run-elasticsearch.sh
@ -121,6 +121,7 @@ if [[ "$ELASTICSEARCH_VERSION" != *oss* ]]; then
    --env xpack.security.enabled=false
    --env xpack.security.http.ssl.enabled=false
    --env xpack.security.transport.ssl.enabled=false
+    --env xpack.ml.max_machine_memory_percent=90
 END
 ))
 fi
--- a/eland/ml/pytorch/_pytorch_model.py
+++ b/eland/ml/pytorch/_pytorch_model.py
@ -96,8 +96,8 @@ class PyTorchModel:
    ) -> None:
        # TODO: Implement some pre-flight checks on config, vocab, and model
        self.put_config(config_path)
-        self.put_vocab(vocab_path)
        self.put_model(model_path, chunk_size)
+        self.put_vocab(vocab_path)
    def infer(
        self, body: Dict[str, Any], timeout: str = DEFAULT_TIMEOUT
@ -106,14 +106,14 @@ class PyTorchModel:
            "POST",
            f"/_ml/trained_models/{self.model_id}/deployment/_infer",
            body=body,
-            params={"timeout": timeout},
+            params={"timeout": timeout, "request_timeout": 60},
        )
    def start(self, timeout: str = DEFAULT_TIMEOUT) -> None:
        self._client.transport.perform_request(
            "POST",
            f"/_ml/trained_models/{self.model_id}/deployment/_start",
-            params={"timeout": timeout, "wait_for": "started"},
+            params={"timeout": timeout, "request_timeout": 60, "wait_for": "started"},
        )
    def stop(self) -> None:
--- a/tests/ml/pytorch/test_pytorch_model_pytest.py
+++ b/tests/ml/pytorch/test_pytorch_model_pytest.py
@ -0,0 +1,94 @@
 #  Licensed to Elasticsearch B.V. under one or more contributor
 #  license agreements. See the NOTICE file distributed with
 #  this work for additional information regarding copyright
 #  ownership. Elasticsearch B.V. licenses this file to you under
 #  the Apache License, Version 2.0 (the "License"); you may
 #  not use this file except in compliance with the License.
 #  You may obtain a copy of the License at
 #
 # 	http://www.apache.org/licenses/LICENSE-2.0
 #
 #  Unless required by applicable law or agreed to in writing,
 #  software distributed under the License is distributed on an
 #  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 #  KIND, either express or implied.  See the License for the
 #  specific language governing permissions and limitations
 #  under the License.
 import tempfile
 import pytest
 try:
    import sklearn  # noqa: F401
    HAS_SKLEARN = True
 except ImportError:
    HAS_SKLEARN = False
 try:
    import transformers  # noqa: F401
    from eland.ml.pytorch import PyTorchModel
    from eland.ml.pytorch.transformers import TransformerModel
    HAS_TRANSFORMERS = True
 except ImportError:
    HAS_TRANSFORMERS = False
 from tests import ES_TEST_CLIENT, ES_VERSION
 # Module-level pytest marks (pytest applies ``pytestmark`` to every test in
 # this module). The tests are skipped when the cluster is older than 8.0.0 or
 # when either optional dependency failed to import in the guards above.
 pytestmark = [
    pytest.mark.skipif(
        ES_VERSION < (8, 0, 0),
        reason="This test requires at least Elasticsearch version 8.0.0",
    ),
    pytest.mark.skipif(
        not HAS_SKLEARN, reason="This test requires 'scikit-learn' package to run"
    ),
    pytest.mark.skipif(
        not HAS_TRANSFORMERS, reason="This test requires 'transformers' package to run"
    ),
 ]
 # Parametrization table for the inference test. Each entry is a 4-tuple of
 # (model_id, task, text_input, expected predicted value); the teardown
 # fixture below also walks this list and uses only the first element.
 TEXT_PREDICTION_MODELS = [
    (
        "distilbert-base-uncased",
        "fill_mask",
        "[MASK] is the capital of France.",
        "paris",
    )
 ]
@pytest.fixture(scope="function", autouse=True)
def setup_and_tear_down():
    """Wrap every test with ML debug logging and model cleanup.

    Before the test, a transient cluster setting raises the
    ``org.elasticsearch.xpack.ml`` logger to DEBUG. After the test, every
    model listed in ``TEXT_PREDICTION_MODELS`` is stopped and deleted.
    """
    ml_debug_logging = {"transient": {"logger.org.elasticsearch.xpack.ml": "DEBUG"}}
    ES_TEST_CLIENT.cluster.put_settings(body=ml_debug_logging)

    yield

    for hub_model_id, _task, _text_input, _expected in TEXT_PREDICTION_MODELS:
        # Derive the Elasticsearch-side id: "/" becomes "__", lowercased and
        # capped at 64 characters (presumably mirrors
        # TransformerModel.elasticsearch_model_id() -- confirm).
        es_model_id = hub_model_id.replace("/", "__").lower()[:64]
        deployed = PyTorchModel(ES_TEST_CLIENT, es_model_id)
        deployed.stop()
        deployed.delete()
 def download_model_and_start_deployment(tmp_dir, quantize, model_id, task):
    """Export a transformer model, import it into Elasticsearch and start it.

    ``model_id``, ``task`` and ``quantize`` are passed straight to
    ``TransformerModel``; its saved artefacts are written under ``tmp_dir``.
    Returns the started ``PyTorchModel`` handle.
    """
    print("Loading HuggingFace transformer tokenizer and model")
    transformer = TransformerModel(model_id, task, quantize)
    model_path, config_path, vocab_path = transformer.save(tmp_dir)

    deployment = PyTorchModel(ES_TEST_CLIENT, transformer.elasticsearch_model_id())
    # Stop and delete before importing -- presumably to clear anything left
    # behind under the same id by an earlier run (TODO confirm).
    deployment.stop()
    deployment.delete()

    print(f"Importing model: {deployment.model_id}")
    deployment.import_model(model_path, config_path, vocab_path)
    deployment.start()
    return deployment
 class TestPytorchModel:
    """Inference checks against PyTorch models deployed to the test cluster."""

    @pytest.mark.parametrize("model_id,task,text_input,value", TEXT_PREDICTION_MODELS)
    def test_text_classification(self, model_id, task, text_input, value):
        """Deploy the model, run one inference and compare the prediction."""
        request_body = {"docs": [{"text_field": text_input}]}
        with tempfile.TemporaryDirectory() as workspace:
            deployed = download_model_and_start_deployment(
                workspace, True, model_id, task
            )
            response = deployed.infer(request_body)
            assert response["predicted_value"] == value