Update streaming to work & change stats to class

add comments to streaming.py
massive cleanup of streaming (i think this works?)
2024-11-25 20:33:58 +01:00 · 2023-08-13 21:42:38 +05:00 · 2023-08-13 21:29:45 +05:00 · 2023-08-13 21:26:35 +05:00 · 2023-08-13 21:19:56 +05:00 · 2023-08-13 20:16:33 +05:00
9 changed files with 175 additions and 190 deletions
--- a/api/db/logs.py
+++ b/api/db/logs.py
@ -24,11 +24,24 @@ async def _get_collection(collection_name: str):
    return conn['nova-core'][collection_name]

 async def replacer(text: str, dict_: dict) -> str:
+    # This seems to exist for a very specific and dumb purpose :D
    for k, v in dict_.items():
        text = text.replace(k, v)
    return text

 async def log_api_request(user: dict, incoming_request, target_url: str):
+    """Logs the API Request into the database.
+    No input prompt is logged, however data such as IP & useragent is noted.
+    This would be useful for security reasons. Other minor data is also collected.
+
+    Args:
+        user (dict): User dict object
+        incoming_request (_type_): Request
+        target_url (str): The URL the API request was targeted at.
+
+    Returns:
+        _type_: _description_
+    """
    db = await _get_collection('logs')
    payload = {}

--- a/api/db/stats.py
+++ b/api/db/stats.py
@ -17,6 +17,17 @@ async def _get_collection(collection_name: str):

 ## Statistics

+class Stats:
+    """
+    ### The manager for all statistics tracking
+    Stats tracked:
+    - Dates
+    - IPs
+    - Target URLs
+    - Tokens
+    - Models
+    - URL Paths
+    """
    async def add_date():
        date = datetime.datetime.now(pytz.timezone('GMT')).strftime('%Y.%m.%d')
        year, month, day = date.split('.')
@ -51,5 +62,5 @@ async def get_value(obj_filter):
        return await db.find_one({obj_filter})

 if __name__ == '__main__':
-    asyncio.run(add_date())
-    asyncio.run(add_path('/__demo/test'))
+    asyncio.run(Stats.add_date())
+    asyncio.run(Stats.add_path('/__demo/test'))
--- a/api/db/users.py
+++ b/api/db/users.py
@ -20,7 +20,14 @@ async def _get_collection(collection_name: str):
    return conn['nova-core'][collection_name]

 async def create(discord_id: str='') -> dict:
-    """Adds a new user to the MongoDB collection."""
+    """Add a user to the mongodb
+
+    Args:
+        discord_id (str): Defaults to ''.
+
+    Returns:
+        dict: The user object
+    """

    chars = string.ascii_letters + string.digits

--- a/api/load_balancing.py
+++ b/api/load_balancing.py
@ -10,7 +10,9 @@ async def _get_module_name(module) -> str:
    return name

 async def balance_chat_request(payload: dict) -> dict:
-    """Load balance the chat completion request between chat providers.
+    """
+    ### Load balance the chat completion request between chat providers.
+    Providers are sorted by streaming and models. Target (provider.chat_completion) is returned
    """

    providers_available = []
@ -36,7 +38,9 @@ async def balance_chat_request(payload: dict) -> dict:
    return target

 async def balance_organic_request(request: dict) -> dict:
-    """Load balnace to non-chat completion request between other "organic" providers which respond in the desired format already.
+    """
+    ### Load balance non-chat completion request
+    Balances between other "organic" providers which respond in the desired format already.
    Organic providers are used for non-chat completions, such as moderation and other paths.    
    """
    providers_available = []
--- a/api/main.py
+++ b/api/main.py
@ -31,7 +31,9 @@ async def startup_event():

@app.get('/')
 async def root():
-    """Returns the root endpoint."""
+    """
+    Returns the root endpoint.
+    """

    return {
        'status': 'ok',
--- a/api/proxies.py
+++ b/api/proxies.py
@ -63,7 +63,11 @@ class Proxy:

    @property
    def connector(self):
-        """Returns an aiohttp_socks.ProxyConnector object. Which can be used in aiohttp.ClientSession."""
+        """
+        ### Returns a proxy connector
+        Returns an aiohttp_socks.ProxyConnector object. 
+        This can be used in aiohttp.ClientSession.
+        """

        proxy_types = {
            'http': aiohttp_socks.ProxyType.HTTP,
--- a/api/streaming.py
+++ b/api/streaming.py
@ -15,7 +15,8 @@ import proxies
 import provider_auth
 import load_balancing

-from db import logs, users, stats
+from db import logs, users
+from db.stats import Stats
 from helpers import network, chat, errors

 load_dotenv()
@ -30,6 +31,33 @@ DEMO_PAYLOAD = {
    ]
 }

+async def process_response(response, is_chat, chat_id, model, target_request):
+    """Processes chunks from streaming and yields the ones to forward.
+
+    Async generator. Only chat chunks containing a JSON object are forwarded;
+    every forwarded chunk is terminated by a blank line.
+
+    Args:
+        response (_type_): The response; its content is read via iter_any()
+        is_chat (bool): If there is 'chat/completions' in path
+        chat_id (_type_): ID of chat with bot, replaces the provider's own ID
+        model (_type_): What AI model it is
+        target_request (dict): The balanced request; 'module' names the provider
+
+    Yields:
+        str: The processed chunk followed by a blank line.
+    """
+    async for chunk in response.content.iter_any():
+        chunk = chunk.decode("utf8").strip()
+        send = False
+
+        if is_chat and '{' in chunk:
+            data = json.loads(chunk.split('data: ')[1])
+            chunk = chunk.replace(data['id'], chat_id)
+            send = True
+
+            if target_request['module'] == 'twa' and data.get('text'):
+                # Forward the provider's text itself, not the literal list ['text'].
+                chunk = await chat.create_chat_chunk(chat_id=chat_id, model=model, content=data['text'])
+
+            # Empty deltas and the bare role announcement carry no content.
+            if (not data['choices'][0]['delta']) or data['choices'][0]['delta'] == {'role': 'assistant'}:
+                send = False
+
+        if send and chunk:
+            yield chunk + '\n\n'
+
 async def stream(
    path: str='/v1/chat/completions',
    user: dict=None,
@ -38,6 +66,17 @@ async def stream(
    input_tokens: int=0,
    incoming_request: starlette.requests.Request=None,
 ):
+    """Stream the completions request. Sends data in chunks
+
+    Args:
+        path (str, optional): URL Path. Defaults to '/v1/chat/completions'.
+        user (dict, optional): User object (dict) Defaults to None.
+        payload (dict, optional): Payload. Defaults to None.
+        credits_cost (int, optional): Cost of the credits of the request. Defaults to 0.
+        input_tokens (int, optional): Total tokens calculated with tokenizer. Defaults to 0.
+        incoming_request (starlette.requests.Request, optional): Incoming request. Defaults to None.
+    """
+
    is_chat = False
    is_stream = payload.get('stream', False)

@ -45,34 +84,16 @@ async def stream(
        is_chat = True
        model = payload['model']

-    # Chat completions always have the same beginning
    if is_chat and is_stream:
        chat_id = await chat.create_chat_id()
+        yield await chat.create_chat_chunk(chat_id=chat_id, model=model, content=chat.CompletionStart)
+        yield await chat.create_chat_chunk(chat_id=chat_id, model=model, content=None)

-        chunk = await chat.create_chat_chunk(
-            chat_id=chat_id,
-            model=model,
-            content=chat.CompletionStart
-        )
-        yield chunk
+    json_response = {'error': 'No JSON response could be received'}

-        chunk = await chat.create_chat_chunk(
-            chat_id=chat_id,
-            model=model,
-            content=None
-        )
-
-        yield chunk
-
-    json_response = {
-        'error': 'No JSON response could be received'
-    }
-
-    # Try to get a response from the API
    for _ in range(5):
-        headers = {
-            'Content-Type': 'application/json'
-        }
+        headers = {'Content-Type': 'application/json'}
+

        # Load balancing
        # If the request is a chat completion, then we need to load balance between chat providers
@ -82,7 +103,8 @@ async def stream(
            if is_chat:
                target_request = await load_balancing.balance_chat_request(payload)
            else:
-                # "organic" means that it's not using a reverse engineered front-end, but rather ClosedAI's API directly
+                
+                # In this case we are doing an organic request. "organic" means that it's not using a reverse-engineered front-end, but rather ClosedAI's API directly
                # churchless.tech is an example of an organic provider, because it redirects the request to ClosedAI.
                target_request = await load_balancing.balance_organic_request({
                    'method': incoming_request.method,
@ -92,19 +114,12 @@ async def stream(
                    'cookies': incoming_request.cookies
                })
        except ValueError as exc:
-            # Error load balancing? Send a webhook to the admins
            webhook = dhooks.Webhook(os.getenv('DISCORD_WEBHOOK__API_ISSUE'))
            webhook.send(content=f'API Issue: **`{exc}`**\nhttps://i.imgflip.com/7uv122.jpg')
-
-            yield await errors.yield_error(
-                500,
-                'Sorry, the API has no working keys anymore.',
-                'The admins have been messaged automatically.'
-            )
+            yield await errors.yield_error(500, 'Sorry, the API has no working keys anymore.', 'The admins have been messaged automatically.')
            return

-        for k, v in target_request.get('headers', {}).items():
-            target_request['headers'][k] = v
+        target_request['headers'].update(target_request.get('headers', {}))

        if target_request['method'] == 'GET' and not payload:
            target_request['payload'] = None
@ -116,22 +131,16 @@ async def stream(
                async with session.request(
                    method=target_request.get('method', 'POST'),
                    url=target_request['url'],
-
                    data=target_request.get('data'),
                    json=target_request.get('payload'),
-
                    headers=target_request.get('headers', {}),
                    cookies=target_request.get('cookies'),
-
                    ssl=False,
-
                    timeout=aiohttp.ClientTimeout(total=float(os.getenv('TRANSFER_TIMEOUT', '120'))),
                ) as response:
-                    # if the answer is JSON
                    if response.content_type == 'application/json':
                        data = await response.json()

-                        # Invalidate the key if it's not working
                        if data.get('code') == 'invalid_api_key':
                            await provider_auth.invalidate_key(target_request.get('provider_auth'))
                            continue
@ -139,52 +148,15 @@ async def stream(
                        if response.ok:
                            json_response = data

-                    # if the answer is a stream
                    if is_stream:
                        try:
                            response.raise_for_status()
                        except Exception as exc:
-                            # Rate limit? Balance again
                            if 'Too Many Requests' in str(exc):
                                continue

-                        try:
-                            # process the response chunks
-                            async for chunk in response.content.iter_any():
-                                send = False
-                                chunk = f'{chunk.decode("utf8")}\n\n'
-
-                                if is_chat and '{' in chunk:
-                                    # parse the JSON
-                                    data = json.loads(chunk.split('data: ')[1])
-                                    chunk = chunk.replace(data['id'], chat_id)
-                                    send = True
-
-                                    # create a custom chunk if we're using specific providers
-                                    if target_request['module'] == 'twa' and data.get('text'):
-                                        chunk = await chat.create_chat_chunk(
-                                            chat_id=chat_id,
-                                            model=model,
-                                            content=['text']
-                                        )
-
-                                    # don't send empty/unnecessary messages
-                                    if (not data['choices'][0]['delta']) or data['choices'][0]['delta'] == {'role': 'assistant'}:
-                                        send = False
-
-                                # send the chunk
-                                if send and chunk.strip():
-                                    final_chunk = chunk.strip().replace('data: [DONE]', '') + '\n\n'
-                                    yield final_chunk
-
-                        except Exception as exc:
-                            if 'Connection closed' in str(exc):
-                                yield await errors.yield_error(
-                                    500,
-                                    'Sorry, there was an issue with the connection.',
-                                    'Please first check if the issue on your end. If this error repeats, please don\'t heistate to contact the staff!.'
-                                )
-                                return
+                        async for chunk in process_response(response, is_chat, chat_id, model, target_request):
+                            yield chunk

                    break

@ -192,44 +164,27 @@ async def stream(
                print('[!] Proxy error:', exc)
                continue

-    # Chat completions always have the same ending
    if is_chat and is_stream:
-        chunk = await chat.create_chat_chunk(
-            chat_id=chat_id,
-            model=model,
-            content=chat.CompletionStop
-        )
-        yield chunk
+        yield await chat.create_chat_chunk(chat_id=chat_id, model=model, content=chat.CompletionStop)
        yield 'data: [DONE]\n\n'

-    # If the response is JSON, then we need to yield it like this
    if not is_stream and json_response:
        yield json.dumps(json_response)

-    # DONE WITH REQUEST, NOW LOGGING ETC.
-
    if user and incoming_request:
-        await logs.log_api_request(
-            user=user,
-            incoming_request=incoming_request,
-            target_url=target_request['url']
-        )
+        await logs.log_api_request(user=user, incoming_request=incoming_request, target_url=target_request['url'])

    if credits_cost and user:
-        await users.update_by_id(user['_id'], {
-            '$inc': {'credits': -credits_cost}
-        })
+        await users.update_by_id(user['_id'], {'$inc': {'credits': -credits_cost}})

    ip_address = await network.get_ip(incoming_request)
-
-    await stats.add_date()
-    await stats.add_ip_address(ip_address)
-    await stats.add_path(path)
-    await stats.add_target(target_request['url'])
-
+    await Stats.add_date()
+    await Stats.add_ip_address(ip_address)
+    await Stats.add_path(path)
+    await Stats.add_target(target_request['url'])
    if is_chat:
-        await stats.add_model(model)
-        await stats.add_tokens(input_tokens, model)
+        await Stats.add_model(model)
+        await Stats.add_tokens(input_tokens, model)

 if __name__ == '__main__':
    asyncio.run(stream())
--- a/api/transfer.py
+++ b/api/transfer.py
@ -20,87 +20,67 @@ with open('config/credits.yml', encoding='utf8') as f:
    credits_config = yaml.safe_load(f)

 async def handle(incoming_request):
-    """Transfer a streaming response from the incoming request to the target endpoint"""
+    """
+    ### Transfer a streaming response 
+    Takes the request from the incoming request to the target endpoint.
+    Checks method, token amount, auth and cost along with if request is NSFW.
+    """
    
    path = incoming_request.url.path.replace('v1/v1/', 'v1/')

-    # METHOD
-    if incoming_request.method not in ['GET', 'POST', 'PUT', 'DELETE', 'PATCH']:
-        return await errors.error(405, f'Method "{incoming_request.method}" is not allowed.', 'Change the request method to the correct one.')
+    allowed_methods = {'GET', 'POST', 'PUT', 'DELETE', 'PATCH'}
+    method = incoming_request.method
+
+    if method not in allowed_methods:
+        return await errors.error(405, f'Method "{method}" is not allowed.', 'Change the request method to the correct one.')

-    # PAYLOAD
-    try:
    payload = await incoming_request.json()
-    except json.decoder.JSONDecodeError:
-        payload = {}

-    # Tokenise w/ tiktoken
    try:
-        input_tokens = await tokens.count_for_messages(payload['messages'])
+        input_tokens = await tokens.count_for_messages(payload.get('messages', []))
    except (KeyError, TypeError):
        input_tokens = 0

-    # Check user auth
    received_key = incoming_request.headers.get('Authorization')

-    if not received_key:
+    if not received_key or not received_key.startswith('Bearer '):
        return await errors.error(401, 'No NovaAI API key given!', 'Add "Authorization: Bearer nv-..." to your request headers.')

-    if received_key.startswith('Bearer '):
-        received_key = received_key.split('Bearer ')[1]
+    user = await users.by_api_key(received_key.split('Bearer ')[1].strip())

-    user = await users.by_api_key(received_key.strip())
-
-    if not user:
-        return await errors.error(401, 'Invalid NovaAI API key!', 'Create a new NovaOSS API key.')
+    if not user or not user['status']['active']:
+        return await errors.error(401, 'Invalid or inactive NovaAI API key!', 'Create a new NovaOSS API key or reactivate your account.')

    ban_reason = user['status']['ban_reason']
    if ban_reason:
        return await errors.error(403, f'Your NovaAI account has been banned. Reason: "{ban_reason}".', 'Contact the staff for an appeal.')

-    if not user['status']['active']:
-        return await errors.error(418, 'Your NovaAI account is not active (paused).', 'Simply re-activate your account using a Discord command or the web panel.')
-
-    if '/models' in path:
+    path_contains_models = '/models' in path
+    if path_contains_models:
        return fastapi.responses.JSONResponse(content=models_list)

-    # Calculate cost of tokens & check for nsfw prompts
    costs = credits_config['costs']
    cost = costs['other']

-    policy_violation = False
-
    if 'chat/completions' in path:
-        for model_name, model_cost in costs['chat-models'].items():
-            if model_name in payload['model']:
-                cost = model_cost
+        cost = costs['chat-models'].get(payload.get('model'), cost)

-        policy_violation = await moderation.is_policy_violated(payload['messages'])
-
-    elif '/moderations' in path:
-        pass
-
-    else:
-        inp = payload.get('input', payload.get('prompt'))
-
-        if inp:
-            if len(inp) > 2 and not inp.isnumeric():
+    policy_violation = False
+    if 'chat/completions' in path or ('input' in payload or 'prompt' in payload):
+        inp = payload.get('input', payload.get('prompt', ''))
+        if inp and len(inp) > 2 and not inp.isnumeric():
            policy_violation = await moderation.is_policy_violated(inp)

    if policy_violation:
        return await errors.error(400, f'The request contains content which violates this model\'s policies for "{policy_violation}".', 'We currently don\'t support any NSFW models.')

-
    role_cost_multiplier = credits_config['bonuses'].get(user['role'], 1)
    cost = round(cost * role_cost_multiplier)

    if user['credits'] < cost:
        return await errors.error(429, 'Not enough credits.', 'Wait or earn more credits. Learn more on our website or Discord server.')

-
-    # Send the completion request
-
-    if 'chat/completions' in path and not payload.get('stream') is True:
+    if 'chat/completions' in path and not payload.get('stream', False):
        payload['stream'] = False

    media_type = 'text/event-stream' if payload.get('stream', False) else 'application/json'
--- a/tests/main.py
+++ b/tests/main.py
@ -83,11 +83,20 @@ def test_models():
 def test_all():
    """Runs all tests."""

-    # print(test_server())
-    # print(test_api())
+    print("Running test on API server to check if its running..")
+    print(test_server())
+
+    print("Running a api endpoint to see if requests can go through...")
+    print(test_api())
+
+    print("Checking if the API works with the python library...")
    print(test_library())
-    # print(test_library_moderation())
-    # print(test_models())
+
+    print("Checking if the moderation endpoint works...")
+    print(test_library_moderation())
+
+    print("Checking if all models can be GET")
+    print(test_models())

 def test_api_moderation(model: str=MODEL, messages: List[dict]=None) -> dict:
    """Tests an API api_endpoint."""
Author	SHA1	Message	Date
Game_Time	bb1e9de563	Update streaming to work & change stats to class	2023-08-13 21:42:38 +05:00
Game_Time	885da2a27e	add comments to streaming.py	2023-08-13 21:29:45 +05:00
Game_Time	3e811f3e3b	massive cleanup of streaming (i think this works?)	2023-08-13 21:26:35 +05:00
Game_Time	def26f9104	clean up code a lot	2023-08-13 21:19:56 +05:00
Game_Time	8e70c25ee0	updating tests to add tests back since they were removed for some reason?	2023-08-13 20:16:33 +05:00
Game_Time	6ecc5f59ce	Codebase changes + a lot of commenting	2023-08-13 20:12:35 +05:00