Fedir Zadniprovskyi 2024-12-22
chore: adjust model manager test sleep delay
@2e7d12b0de68a4612f0fe821bca43eac543135c0
src/faster_whisper_server/api_models.py
--- src/faster_whisper_server/api_models.py
+++ src/faster_whisper_server/api_models.py
@@ -69,7 +69,7 @@
                 end=segment.end,
                 text=segment.text,
                 tokens=segment.tokens,
-                temperature=segment.temperature,
+                temperature=segment.temperature or 0,  # FIXME: hardcoded fallback to 0 when segment.temperature is None
                 avg_logprob=segment.avg_logprob,
                 compression_ratio=segment.compression_ratio,
                 no_speech_prob=segment.no_speech_prob,
tests/model_manager_test.py
--- tests/model_manager_test.py
+++ tests/model_manager_test.py
@@ -20,7 +20,7 @@
         await aclient.post(f"/api/ps/{model}")
         res = (await aclient.get("/api/ps")).json()
         assert len(res["models"]) == 1
-        await asyncio.sleep(ttl + 1)
+        await asyncio.sleep(ttl + 1)  # wait for the model to be unloaded
         res = (await aclient.get("/api/ps")).json()
         assert len(res["models"]) == 0
 
@@ -35,7 +35,7 @@
         await aclient.post(f"/api/ps/{model}")
         res = (await aclient.get("/api/ps")).json()
         assert len(res["models"]) == 1
-        await asyncio.sleep(ttl - 2)
+        await asyncio.sleep(ttl - 2)  # sleep for less than the ttl. The model should not be unloaded
         res = (await aclient.get("/api/ps")).json()
         assert len(res["models"]) == 1
 
@@ -48,11 +48,11 @@
         ).json()
         res = (await aclient.get("/api/ps")).json()
         assert len(res["models"]) == 1
-        await asyncio.sleep(ttl - 2)
+        await asyncio.sleep(ttl - 2)  # sleep for less than the ttl. The model should not be unloaded
         res = (await aclient.get("/api/ps")).json()
         assert len(res["models"]) == 1
 
-        await asyncio.sleep(3)
+        await asyncio.sleep(3)  # sleep for a bit more. The model should be unloaded
         res = (await aclient.get("/api/ps")).json()
         assert len(res["models"]) == 0
 
@@ -80,7 +80,7 @@
                 "/v1/audio/transcriptions", files={"file": ("audio.wav", data, "audio/wav")}, data={"model": model}
             )
         )
-        await asyncio.sleep(0.01)
+        await asyncio.sleep(0.1)  # wait for the server to start processing the request
         res = await aclient.delete(f"/api/ps/{model}")
         assert res.status_code == 409
 
Add a comment
List