Added a lock to avoid two inferences running at the same time, and added corresponding support for asynchronous-generator-based models

This commit is contained in:
faraphel 2025-01-10 19:11:48 +01:00
parent c6d779f591
commit 775c78c6cb
4 changed files with 19 additions and 12 deletions

View file

@@ -1,4 +1,3 @@
import json
import typing
@@ -8,5 +7,5 @@ def load(model) -> None:
def unload(model) -> None:
    """Tear down resources held by *model*.

    Placeholder implementation: there is nothing to release yet, so this
    intentionally does nothing and returns ``None``.
    """
    return None
def infer(model, file) -> typing.Iterator[bytes]:
    """Run a (placeholder) inference and yield the result as UTF-8 bytes.

    Ignores *model* and *file*; emits a single fixed JSON payload so the
    streaming interface can be exercised end to end.
    """
    payload = {"hello": "world!"}
    yield json.dumps(payload).encode("utf-8")
async def infer(model, file) -> typing.AsyncIterator[bytes]:
    """Asynchronously yield the inference result for *file*.

    Placeholder echo model: ignores *model*, awaits ``file.read()`` once,
    and yields the raw bytes back as a single chunk.
    """
    contents = await file.read()
    yield contents