Преглед на файлове

fix: update request handling to pass state from send_one_request to wait_one_response

myhloli преди 5 месеца
родител
ревизия
a49c605f12
променен е 1 файл, в който са добавени 4 реда и са изтрити 4 реда
  1. 4 4
      mineru/model/vlm_sglang_model/engine.py

+ 4 - 4
mineru/model/vlm_sglang_model/engine.py

@@ -183,8 +183,8 @@ async def _one_request(
     created_time: Optional[float],
 ):
     tokenized_obj = await self._tokenize_one_request(obj)
-    self._send_one_request(obj, tokenized_obj, created_time)
-    async for out in self._wait_one_response(obj, request):
+    state = self._send_one_request(obj, tokenized_obj, created_time)
+    async for out in self._wait_one_response(obj, state, request):
         yield out
 
 
@@ -256,8 +256,8 @@ async def _generate_request(
         is_single = obj.is_single
         if is_single:
             tokenized_obj = await self._tokenize_one_request(obj)
-            self._send_one_request(obj, tokenized_obj, created_time)
-            async for response in self._wait_one_response(obj, request):
+            state = self._send_one_request(obj, tokenized_obj, created_time)
+            async for response in self._wait_one_response(obj, state, request):
                 yield response
         else:
             async for response in _handle_batch_request(self, obj, request, created_time):