Fix dangling asyncio tasks

aight
2024-11-25 16:13:58 +01:00 · 2023-10-08 23:05:03 +03:00 · 2023-10-08 21:53:27 +02:00
4 changed files with 22 additions and 7 deletions
--- a/.vscode/settings.json
+++ b/.vscode/settings.json
@@ -7,9 +7,9 @@
        "**/.DS_Store": true,
        "**/Thumbs.db": true,
        "**/__pycache__": true,
-        "**/*.css.map": true,
        "**/.vscode": true,
        "**/*.map": true,
+        "**/*.css.map": true,
        "tests/__pycache__": true
    },
    "hide-files.files": [
--- a/api/config/config.yml
+++ b/api/config/config.yml
@@ -6,10 +6,9 @@ costs:
  other: 5

  chat-models:
-    gpt-4-32k-azure: 100
+    gpt-4-32k: 200
    gpt-4: 50
-    gpt-4-azure: 10
-    gpt-3: 5
+    gpt-3: 10

 ## Roles Explanation

--- a/api/responder.py
+++ b/api/responder.py
@@ -7,6 +7,7 @@ import aiohttp
 import asyncio
 import starlette

+from typing import Any, Coroutine, Set
 from rich import print
 from dotenv import load_dotenv

@@ -23,6 +24,19 @@ CRITICAL_API_ERRORS = ['invalid_api_key', 'account_deactivated']

 keymanager = providerkeys.manager

+background_tasks: Set[asyncio.Task[Any]] = set()
+
+
+def create_background_task(coro: Coroutine[Any, Any, Any]) -> None:
+    """asyncio.create_task, which prevents the task from being garbage collected.
+
+    https://docs.python.org/3/library/asyncio-task.html#asyncio.create_task
+    """
+    task = asyncio.create_task(coro)
+    background_tasks.add(task)
+    task.add_done_callback(background_tasks.discard)
+
+
 async def respond(
    path: str='/v1/chat/completions',
    user: dict=None,
@@ -147,13 +161,15 @@ async def respond(
                                print('[!] too many requests')
                                continue

+                        chunk_no = 0
                        async for chunk in response.content.iter_any():
+                            chunk_no += 1
                            chunk = chunk.decode('utf8').strip()

                            if 'azure' in provider_name:
                                chunk = chunk.strip().replace('data: ', '')

-                                if not chunk or 'prompt_filter_results' in chunk:
+                                if not chunk or chunk_no == 1:
                                    continue

                            yield chunk + '\n\n'
@@ -172,7 +188,7 @@ async def respond(
    if (not is_stream) and server_json_response:
        yield json.dumps(server_json_response)

-    asyncio.create_task(
+    create_background_task(
        after_request.after_request(
            incoming_request=incoming_request,
            target_request=target_request,
--- a/checks/client.py
+++ b/checks/client.py
@@ -216,7 +216,7 @@ async def demo():
            raise ConnectionError('API Server is not running.')

        for func in [
-            # test_chat_non_stream_gpt4,
+            test_chat_non_stream_gpt4,
            test_chat_stream_gpt3
        ]:
            print(f'[*] {func.__name__}')
Author	SHA1	Message	Date
monosans	007e078fb6	Fix dangling asyncio tasks	2023-10-08 23:05:03 +03:00
nsde	a6af7bd1a4	aight	2023-10-08 21:53:27 +02:00