extras: add vllm,bark,vall-e-x tests, bump diffusers (#1422)

* tests: add vllm Signed-off-by: Ettore Di Giacinto <mudler@users.noreply.github.com> * tests: Add vall-e-x tests * Add bark tests * bump diffusers --------- Signed-off-by: Ettore Di Giacinto <mudler@users.noreply.github.com>
2025-05-20 10:35:01 +00:00 · 2023-12-11 18:39:26 -05:00 · 2023-12-11 18:39:26 -05:00 · 9aa2a7ca13
commit 9aa2a7ca13
parent e80cbca6b0
13 changed files with 344 additions and 40 deletions
--- a/backend/python/vllm/Makefile
+++ b/backend/python/vllm/Makefile
@ -9,3 +9,9 @@ run:
 	@echo "Running vllm..."
 	bash run.sh
 	@echo "vllm run."
+
+.PHONY: test
+test:
+	@echo "Testing vllm..."
+	bash test.sh
+	@echo "vllm tested."
--- a/backend/python/vllm/test.sh
+++ b/backend/python/vllm/test.sh
@ -0,0 +1,11 @@
+#!/bin/bash
+##
+## A bash script wrapper that runs the vllm backend unit tests with conda
+
+# Activate conda environment
+source activate vllm
+
+# get the directory where the bash script is located
+DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" >/dev/null 2>&1 && pwd )"
+
+python -m unittest $DIR/test_backend_vllm.py
--- a/backend/python/vllm/test_backend_vllm.py
+++ b/backend/python/vllm/test_backend_vllm.py
@ -21,13 +21,13 @@ class TestBackendServicer(unittest.TestCase):
    """
    def setUp(self):
        self.service = subprocess.Popen(["python", "backend_vllm.py", "--addr", "localhost:50051"])
+        time.sleep(10)

    def tearDown(self) -> None:
        self.service.terminate()
        self.service.wait()

    def test_server_startup(self):
-        time.sleep(2)
        try:
            self.setUp()
            with grpc.insecure_channel("localhost:50051") as channel:
@ -39,3 +39,38 @@ class TestBackendServicer(unittest.TestCase):
            self.fail("Server failed to start")
        finally:
            self.tearDown()
+    def test_load_model(self):
+        """
+        This method tests if the model is loaded successfully
+        """
+        try:
+            self.setUp()
+            with grpc.insecure_channel("localhost:50051") as channel:
+                stub = backend_pb2_grpc.BackendStub(channel)
+                response = stub.LoadModel(backend_pb2.ModelOptions(Model="facebook/opt-125m"))
+                self.assertTrue(response.success)
+                self.assertEqual(response.message, "Model loaded successfully")
+        except Exception as err:
+            print(err)
+            self.fail("LoadModel service failed")
+        finally:
+            self.tearDown()
+
+    def test_text(self):
+        """
+        This method tests if text is generated successfully from a prompt
+        """
+        try:
+            self.setUp()
+            with grpc.insecure_channel("localhost:50051") as channel:
+                stub = backend_pb2_grpc.BackendStub(channel)
+                response = stub.LoadModel(backend_pb2.ModelOptions(Model="facebook/opt-125m"))
+                self.assertTrue(response.success)
+                req = backend_pb2.PredictOptions(prompt="The capital of France is")
+                resp = stub.Predict(req)
+                self.assertIsNotNone(resp.message)
+        except Exception as err:
+            print(err)
+            self.fail("text service failed")
+        finally:
+            self.tearDown()