This repository was archived by the owner on Aug 1, 2024. It is now read-only.

Commit 4b9f210

add async operations for completions
1 parent: 6bbbf5c

3 files changed (+57 lines, -3 lines)


poetry.lock

Lines changed: 1 addition & 1 deletion. Generated file; the diff is not rendered by default.

pyproject.toml

Lines changed: 1 addition & 1 deletion

```diff
@@ -14,7 +14,7 @@ tenacity = "^8.2.3"
 requests = "^2.31.0"
 pydantic = "^2.5.2"
 pydantic-settings = "^2.1.0"
-pandas = "^2.1.3"
+pandas = "*"
 aiohttp = "^3.8.1"
 
 
```

src/vendi/completions/completions.py

Lines changed: 55 additions & 1 deletion
```diff
@@ -165,7 +165,7 @@ async def acreate(
     async def acreate_many(
         self,
         requests: list[CompletionRequest],
-    ) -> List[ChatCompletion]:
+    ) -> List[ChatCompletion] | List[VendiCompletionResponse]:
         """
         Create multiple completions on different models with the same prompt and parameters
         requests: A list of completion requests
```
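The widened annotation means callers can no longer assume every element is a `ChatCompletion`. A minimal handling sketch follows; the `completions` client instance and the `CompletionRequest` fields are assumptions for illustration, while `acreate_many` and its return types come from the hunk above:

```python
# Hedged sketch: `completions` (a client instance) and the CompletionRequest
# fields are assumed for illustration; acreate_many and its widened return
# annotation are taken from the diff above.
import asyncio

async def main() -> None:
    results = await completions.acreate_many(
        requests=[
            CompletionRequest(model="model-a", prompt="hello"),  # fields assumed
            CompletionRequest(model="model-b", prompt="hello"),
        ]
    )
    # Elements may be ChatCompletion or VendiCompletionResponse, so branch
    # on the concrete type before reading type-specific fields.
    for item in results:
        if isinstance(item, ChatCompletion):
            ...
        else:  # VendiCompletionResponse
            ...

asyncio.run(main())
```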
```diff
@@ -254,6 +254,36 @@ def run_batch_job(
             time.sleep(poll_interval)
         return job
 
+    async def arun_batch_job(
+        self,
+        dataset_id: uuid.UUID,
+        model_parameters: list[ModelParameters],
+        wait_until_complete: bool = False,
+        timeout: int = 3000,
+        poll_interval: int = 5,
+    ) -> BatchInference:
+        _res = await self.__aclient.post(
+            path="/platform/v1/inference/batch/",
+            json={
+                "dataset_id": str(dataset_id),
+                "model_parameters": [{**i.model_dump(), **i.model_extra} for i in model_parameters]
+            }
+        )
+        job = BatchInference(**_res)
+
+        if wait_until_complete:
+            start_time = time.time()
+            while True:
+                job = await self._aget_batch_job(job.id)
+                if job.status in [BatchInferenceStatus.COMPLETED, BatchInferenceStatus.FAILED]:
+                    return job
+                if time.time() - start_time > timeout:
+                    raise TimeoutError(
+                        "The batch job did not complete within the specified timeout. "
+                        "You can still check its status by using the batch_job_status method.")
+
+                await asyncio.sleep(poll_interval)
+
     def __post_batch_job(self, dataset_id: uuid.UUID, model_parameters: list[ModelParameters]) -> BatchInference:
         res = self.__client.post(
             uri="/platform/v1/inference/batch/",
```
```diff
@@ -280,3 +310,27 @@ def _get_batch_job(self, batch_inference_id: uuid.UUID) -> BatchInference:
             uri=f"/platform/v1/inference/batch/{batch_inference_id}"
         )
         return BatchInference(**res)
+
+    async def _aget_batch_job(self, batch_inference_id: uuid.UUID) -> BatchInference:
+        """
+        Get a batch inference job by ID
+        """
+        res = await self.__aclient.get(
+            path=f"/platform/v1/inference/batch/{batch_inference_id}"
+        )
+        return BatchInference(**res)
+
+    def list_batch_jobs(self) -> List[BatchInference]:
+        """
+        Get all batch inferences
+        """
+        res = self.__client.get(
+            uri="/platform/v1/inference/batch/"
+        )
+        return [BatchInference(**i) for i in res]
+
+    def delete_batch_job(self, batch_id: uuid.UUID):
+        """
+        Delete a batch inference job
+        """
+        return self.__client.delete(f"/platform/v1/inference/batch/{batch_id}")
```
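The remaining additions round out the batch API: the private async getter `_aget_batch_job` that backs the polling loop above, plus synchronous list and delete methods. A short sketch of the synchronous pair, again assuming a `completions` client instance:

```python
# Hedged sketch: `completions` is an assumed client instance; the methods
# and the BatchInference fields used here appear in the diff above.
jobs = completions.list_batch_jobs()   # returns List[BatchInference]
for job in jobs:
    print(job.id, job.status)

# Remove a job that is no longer needed.
completions.delete_batch_job(jobs[0].id)
```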
