# nova-api/api/streaming.py

"""This module contains the streaming logic for the API."""

import os
import json
import dhooks
import asyncio
import aiohttp
import starlette

from rich import print
from dotenv import load_dotenv
from python_socks._errors import ProxyError

import proxies
import provider_auth
import load_balancing

from db import logs, users, stats
from helpers import network, chat, errors

# Load variables from a local .env file into the environment so the
# os.getenv() lookups in stream() (webhook URL, transfer timeout) can see them.
load_dotenv()

# Sample chat-completion request body: one user message for the
# gpt-3.5-turbo model.
DEMO_PAYLOAD = dict(
    model='gpt-3.5-turbo',
    messages=[
        dict(role='user', content='1+1='),
    ],
)

async def stream(
    path: str='/v1/chat/completions',
    user: dict=None,
    payload: dict=None,
    credits_cost: int=0,
    input_tokens: int=0,
    incoming_request: starlette.requests.Request=None,
):
    """Forward a request to a load-balanced upstream provider and yield its response.

    This is an async generator. For streaming chat completions it yields a
    fixed opening pair of chunks, then the provider's chunks (with the
    provider's completion id replaced by a locally created chat id), then a
    closing chunk and a final ``data: [DONE]`` line. For non-streaming
    requests it yields a single JSON string.

    Up to five attempts are made. An attempt is retried when the provider
    reports ``invalid_api_key`` (the key is invalidated first), when a
    streaming request is answered with HTTP 429, or when the proxy connection
    fails. Once the response has been yielded, the request is logged, credits
    are deducted and usage statistics are recorded.

    Args:
        path: API path of the request. Paths containing ``chat/completions``
            are handled as chat requests.
        user: User document; ``user['_id']`` is used when deducting credits.
        payload: JSON body of the request. Chat requests must contain
            ``model``; a truthy ``stream`` key selects streaming mode. May be
            ``None``/empty for body-less requests.
        credits_cost: Number of credits to subtract from ``user`` afterwards.
        input_tokens: Token count recorded in the stats for chat requests.
        incoming_request: The original request. Its method and cookies are
            forwarded for non-chat requests, and it is passed on to the
            request log and the IP lookup.

    Yields:
        Response chunks: values created by ``chat.create_chat_chunk`` /
        ``errors.yield_error``, decoded provider chunks, or one JSON string
        for non-streaming requests.
    """
    is_chat = False
    # payload defaults to None and may be empty for body-less requests,
    # so guard before reading the stream flag from it.
    is_stream = payload.get('stream', False) if payload else False

    if 'chat/completions' in path:
        is_chat = True
        model = payload['model']

    # Chat completions always have the same beginning
    if is_chat and is_stream:
        chat_id = await chat.create_chat_id()

        chunk = await chat.create_chat_chunk(
            chat_id=chat_id,
            model=model,
            content=chat.CompletionStart
        )
        yield chunk

        chunk = await chat.create_chat_chunk(
            chat_id=chat_id,
            model=model,
            content=None
        )

        yield chunk

    # Fallback body for non-streaming requests when no usable JSON was received
    json_response = {
        'error': 'No JSON response could be received'
    }

    # Try to get a response from the API
    for _ in range(5):
        headers = {
            'Content-Type': 'application/json'
        }

        # Load balancing
        # If the request is a chat completion, then we need to load balance between chat providers
        # If the request is an organic request, then we need to load balance between organic providers

        try:
            if is_chat:
                target_request = await load_balancing.balance_chat_request(payload)
            else:
                # "organic" means that it's not using a reverse engineered front-end, but rather ClosedAI's API directly
                # churchless.tech is an example of an organic provider, because it redirects the request to ClosedAI.
                target_request = await load_balancing.balance_organic_request({
                    'method': incoming_request.method,
                    'path': path,
                    'payload': payload,
                    'headers': headers,
                    'cookies': incoming_request.cookies
                })
        except ValueError as exc:
            # Error load balancing? Send a webhook to the admins
            # NOTE(review): this looks like a synchronous HTTP call inside an async
            # function - confirm it cannot stall the event loop.
            webhook = dhooks.Webhook(os.getenv('DISCORD_WEBHOOK__API_ISSUE'))
            webhook.send(content=f'API Issue: **`{exc}`**\nhttps://i.imgflip.com/7uv122.jpg')

            yield await errors.yield_error(
                500,
                'Sorry, the API has no working keys anymore.',
                'The admins have been messaged automatically.'
            )
            return

        # NOTE(review): this loop writes every header back onto itself, so it has no
        # effect. Presumably the default `headers` above were meant to be merged in;
        # left unchanged until the intent is confirmed.
        for k, v in target_request.get('headers', {}).items():
            target_request['headers'][k] = v

        # Body-less GET: make sure no JSON body is sent upstream
        if target_request.get('method') == 'GET' and not payload:
            target_request['payload'] = None

        # We haven't done any requests as of right now, everything until now was just preparation
        # Here, we process the request
        async with aiohttp.ClientSession(connector=proxies.get_proxy().connector) as session:
            try:
                async with session.request(
                    method=target_request.get('method', 'POST'),
                    url=target_request['url'],

                    data=target_request.get('data'),
                    json=target_request.get('payload'),

                    headers=target_request.get('headers', {}),
                    cookies=target_request.get('cookies'),

                    # NOTE(review): certificate verification is disabled for upstream requests
                    ssl=False,

                    timeout=aiohttp.ClientTimeout(total=float(os.getenv('TRANSFER_TIMEOUT', '120'))),
                ) as response:
                    # if the answer is JSON
                    if response.content_type == 'application/json':
                        data = await response.json()

                        # Invalidate the key if it's not working
                        if data.get('code') == 'invalid_api_key':
                            await provider_auth.invalidate_key(target_request.get('provider_auth'))
                            continue

                        if response.ok:
                            json_response = data

                    # if the answer is a stream
                    if is_stream:
                        try:
                            response.raise_for_status()
                        except aiohttp.ClientResponseError as exc:
                            # Rate limit? Balance again.
                            # Checked via the status code instead of the reason text,
                            # which servers are free to change or omit.
                            if exc.status == 429:
                                continue

                        try:
                            # process the response chunks
                            # NOTE(review): iter_any() yields arbitrary byte slices, so a chunk
                            # may hold a partial or several SSE events; only the first
                            # `data: ` payload of each chunk is parsed here.
                            async for chunk in response.content.iter_any():
                                send = False
                                chunk = f'{chunk.decode("utf8")}\n\n'

                                if is_chat and '{' in chunk:
                                    # parse the JSON
                                    data = json.loads(chunk.split('data: ')[1])
                                    send = True

                                    # Replace the provider's completion id with ours;
                                    # custom providers may not send an id at all.
                                    provider_chat_id = data.get('id')
                                    if provider_chat_id:
                                        chunk = chunk.replace(provider_chat_id, chat_id)

                                    # create a custom chunk if we're using specific providers
                                    if target_request.get('module') == 'twa' and data.get('text'):
                                        chunk = await chat.create_chat_chunk(
                                            chat_id=chat_id,
                                            model=model,
                                            content=data['text']
                                        )

                                    # don't send empty/unnecessary messages
                                    # (only applies to chunks that carry `choices`)
                                    choices = data.get('choices')
                                    if choices:
                                        delta = choices[0].get('delta')
                                        if not delta or delta == {'role': 'assistant'}:
                                            send = False

                                # send the chunk
                                if send and chunk.strip():
                                    # The terminating [DONE] marker is emitted once, after the loop
                                    final_chunk = chunk.strip().replace('data: [DONE]', '') + '\n\n'
                                    yield final_chunk

                        except Exception as exc:
                            if 'Connection closed' in str(exc):
                                yield await errors.yield_error(
                                    500,
                                    'Sorry, there was an issue with the connection.',
                                    'Please first check if the issue on your end. If this error repeats, please don\'t heistate to contact the staff!.'
                                )
                                return

                            # Any other failure ends the provider stream early; log it
                            # instead of dropping it silently.
                            print('[!] Streaming error:', exc)

                    break

            except ProxyError as exc:
                print('[!] Proxy error:', exc)
                continue

    # Chat completions always have the same ending
    if is_chat and is_stream:
        chunk = await chat.create_chat_chunk(
            chat_id=chat_id,
            model=model,
            content=chat.CompletionStop
        )
        yield chunk
        yield 'data: [DONE]\n\n'

    # If the response is JSON, then we need to yield it like this
    if not is_stream and json_response:
        yield json.dumps(json_response)

    # DONE WITH REQUEST, NOW LOGGING ETC.

    if user and incoming_request:
        await logs.log_api_request(
            user=user,
            incoming_request=incoming_request,
            target_url=target_request['url']
        )

    # NOTE(review): reached even when every attempt above failed, so credits are
    # deducted without checking that the upstream call succeeded - confirm intended.
    if credits_cost and user:
        await users.update_by_id(user['_id'], {
            '$inc': {'credits': -credits_cost}
        })

    ip_address = await network.get_ip(incoming_request)

    await stats.add_date()
    await stats.add_ip_address(ip_address)
    await stats.add_path(path)
    await stats.add_target(target_request['url'])

    if is_chat:
        await stats.add_model(model)
        await stats.add_tokens(input_tokens, model)

if __name__ == '__main__':
    # stream() is an async generator, which asyncio.run() cannot run directly
    # (it requires a coroutine), so drain it inside a small coroutine.
    async def _run_demo():
        """Send the sample chat payload through stream() and print each chunk."""
        async for demo_chunk in stream(payload=DEMO_PAYLOAD):
            print(demo_chunk)

    asyncio.run(_run_demo())
Added more documentation 2023-08-12 17:49:31 +02:00			`"""This module contains the streaming logic for the API."""`

some stuff idfk 2023-08-04 03:30:56 +02:00			`import os`
proxies have issues 2023-08-04 17:29:49 +02:00			`import json`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`import dhooks`
some stuff idfk 2023-08-04 03:30:56 +02:00			`import asyncio`
			`import aiohttp`
			`import starlette`

proxies have issues 2023-08-04 17:29:49 +02:00			`from rich import print`
some stuff idfk 2023-08-04 03:30:56 +02:00			`from dotenv import load_dotenv`
some thingies 2023-08-05 02:30:42 +02:00			`from python_socks._errors import ProxyError`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`import proxies`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`import provider_auth`
some stuff idfk 2023-08-04 03:30:56 +02:00			`import load_balancing`

			`from db import logs, users, stats`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`from helpers import network, chat, errors`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`load_dotenv()`

			`DEMO_PAYLOAD = {`
			`'model': 'gpt-3.5-turbo',`
			`'messages': [`
			`{`
			`'role': 'user',`
			`'content': '1+1='`
			`}`
			`]`
			`}`

			`async def stream(`
			`path: str='/v1/chat/completions',`
			`user: dict=None,`
			`payload: dict=None,`
			`credits_cost: int=0,`
			`input_tokens: int=0,`
			`incoming_request: starlette.requests.Request=None,`
			`):`
proxies have issues 2023-08-04 17:29:49 +02:00			`is_chat = False`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`is_stream = payload.get('stream', False)`
some stuff idfk 2023-08-04 03:30:56 +02:00
proxies have issues 2023-08-04 17:29:49 +02:00			`if 'chat/completions' in path:`
			`is_chat = True`
			`model = payload['model']`
some stuff idfk 2023-08-04 03:30:56 +02:00
Added more documentation 2023-08-12 17:49:31 +02:00			`# Chat completions always have the same beginning`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`if is_chat and is_stream:`
			`chat_id = await chat.create_chat_id()`

moderation is done yay 2023-08-06 21:42:07 +02:00			`chunk = await chat.create_chat_chunk(`
proxies have issues 2023-08-04 17:29:49 +02:00			`chat_id=chat_id,`
			`model=model,`
			`content=chat.CompletionStart`
			`)`
moderation is done yay 2023-08-06 21:42:07 +02:00			`yield chunk`
some stuff idfk 2023-08-04 03:30:56 +02:00
moderation is done yay 2023-08-06 21:42:07 +02:00			`chunk = await chat.create_chat_chunk(`
some thingies 2023-08-05 02:30:42 +02:00			`chat_id=chat_id,`
			`model=model,`
			`content=None`
			`)`
some stuff idfk 2023-08-04 03:30:56 +02:00
moderation is done yay 2023-08-06 21:42:07 +02:00			`yield chunk`

			`json_response = {`
			`'error': 'No JSON response could be received'`
			`}`

Added more documentation 2023-08-12 17:49:31 +02:00			`# Try to get a response from the API`
moderation is done yay 2023-08-06 21:42:07 +02:00			`for _ in range(5):`
proxies have issues 2023-08-04 17:29:49 +02:00			`headers = {`
			`'Content-Type': 'application/json'`
			`}`

Added more documentation 2023-08-12 17:49:31 +02:00			`# Load balancing`
			`# If the request is a chat completion, then we need to load balance between chat providers`
			`# If the request is an organic request, then we need to load balance between organic providers`

sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`try:`
			`if is_chat:`
			`target_request = await load_balancing.balance_chat_request(payload)`
			`else:`
Added more documentation 2023-08-12 17:49:31 +02:00			`# "organic" means that it's not using a reverse engineered front-end, but rather ClosedAI's API directly`
			`# churchless.tech is an example of an organic provider, because it redirects the request to ClosedAI.`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`target_request = await load_balancing.balance_organic_request({`
			`'method': incoming_request.method,`
			`'path': path,`
			`'payload': payload,`
			`'headers': headers,`
			`'cookies': incoming_request.cookies`
			`})`
			`except ValueError as exc:`
Added more documentation 2023-08-12 17:49:31 +02:00			`# Error load balancing? Send a webhook to the admins`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`webhook = dhooks.Webhook(os.getenv('DISCORD_WEBHOOK__API_ISSUE'))`
			webhook.send(content=f'API Issue: `{exc}`\nhttps://i.imgflip.com/7uv122.jpg')
Added more documentation 2023-08-12 17:49:31 +02:00
a few more nice changes 2023-08-12 18:05:53 +02:00			`yield await errors.yield_error(`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`500,`
			`'Sorry, the API has no working keys anymore.',`
			`'The admins have been messaged automatically.'`
			`)`
idk 2023-08-06 12:46:41 +02:00			`return`
some thingies 2023-08-05 02:30:42 +02:00
proxies have issues 2023-08-04 17:29:49 +02:00			`for k, v in target_request.get('headers', {}).items():`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`target_request['headers'][k] = v`

			`if target_request['method'] == 'GET' and not payload:`
			`target_request['payload'] = None`
proxies have issues 2023-08-04 17:29:49 +02:00
Added more documentation 2023-08-12 17:49:31 +02:00			`# We haven't done any requests as of right now, everything until now was just preparation`
			`# Here, we process the request`
			`async with aiohttp.ClientSession(connector=proxies.get_proxy().connector) as session:`
some thingies 2023-08-05 02:30:42 +02:00			`try:`
			`async with session.request(`
			`method=target_request.get('method', 'POST'),`
			`url=target_request['url'],`

			`data=target_request.get('data'),`
			`json=target_request.get('payload'),`

Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`headers=target_request.get('headers', {}),`
some thingies 2023-08-05 02:30:42 +02:00			`cookies=target_request.get('cookies'),`

			`ssl=False,`

			`timeout=aiohttp.ClientTimeout(total=float(os.getenv('TRANSFER_TIMEOUT', '120'))),`
			`) as response:`
Added more documentation 2023-08-12 17:49:31 +02:00			`# if the answer is JSON`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`if response.content_type == 'application/json':`
			`data = await response.json()`
moderation is done yay 2023-08-06 21:42:07 +02:00
Added more documentation 2023-08-12 17:49:31 +02:00			`# Invalidate the key if it's not working`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`if data.get('code') == 'invalid_api_key':`
			`await provider_auth.invalidate_key(target_request.get('provider_auth'))`
some thingies 2023-08-05 02:30:42 +02:00			`continue`
some stuff idfk 2023-08-04 03:30:56 +02:00
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`if response.ok:`
			`json_response = data`

Added more documentation 2023-08-12 17:49:31 +02:00			`# if the answer is a stream`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`if is_stream:`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`try:`
			`response.raise_for_status()`
			`except Exception as exc:`
Added more documentation 2023-08-12 17:49:31 +02:00			`# Rate limit? Balance again`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`if 'Too Many Requests' in str(exc):`
			`continue`

sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`try:`
Added more documentation 2023-08-12 17:49:31 +02:00			`# process the response chunks`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`async for chunk in response.content.iter_any():`
			`send = False`
			`chunk = f'{chunk.decode("utf8")}\n\n'`

			`if is_chat and '{' in chunk:`
Added more documentation 2023-08-12 17:49:31 +02:00			`# parse the JSON`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`data = json.loads(chunk.split('data: ')[1])`
moderation is done yay 2023-08-06 21:42:07 +02:00			`chunk = chunk.replace(data['id'], chat_id)`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`send = True`

Added more documentation 2023-08-12 17:49:31 +02:00			`# create a custom chunk if we're using specific providers`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`if target_request['module'] == 'twa' and data.get('text'):`
moderation is done yay 2023-08-06 21:42:07 +02:00			`chunk = await chat.create_chat_chunk(`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`chat_id=chat_id,`
			`model=model,`
			`content=['text']`
			`)`

Added more documentation 2023-08-12 17:49:31 +02:00			`# don't send empty/unnecessary messages`
			`if (not data['choices'][0]['delta']) or data['choices'][0]['delta'] == {'role': 'assistant'}:`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`send = False`
Added more documentation 2023-08-12 17:49:31 +02:00
			`# send the chunk`
Very slight streaming improvements 2023-08-11 21:21:38 +02:00			`if send and chunk.strip():`
moderation is done yay 2023-08-06 21:42:07 +02:00			`final_chunk = chunk.strip().replace('data: [DONE]', '') + '\n\n'`
			`yield final_chunk`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00
			`except Exception as exc:`
			`if 'Connection closed' in str(exc):`
a few more nice changes 2023-08-12 18:05:53 +02:00			`yield await errors.yield_error(`
moderation is done yay 2023-08-06 21:42:07 +02:00			`500,`
			`'Sorry, there was an issue with the connection.',`
			`'Please first check if the issue on your end. If this error repeats, please don\'t heistate to contact the staff!.'`
			`)`
			`return`
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`break`
proxies have issues 2023-08-04 17:29:49 +02:00
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`except ProxyError as exc:`
Added more documentation 2023-08-12 17:49:31 +02:00			`print('[!] Proxy error:', exc)`
some thingies 2023-08-05 02:30:42 +02:00			`continue`
proxies have issues 2023-08-04 17:29:49 +02:00
Added more documentation 2023-08-12 17:49:31 +02:00			`# Chat completions always have the same ending`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`if is_chat and is_stream:`
moderation is done yay 2023-08-06 21:42:07 +02:00			`chunk = await chat.create_chat_chunk(`
proxies have issues 2023-08-04 17:29:49 +02:00			`chat_id=chat_id,`
			`model=model,`
			`content=chat.CompletionStop`
			`)`
moderation is done yay 2023-08-06 21:42:07 +02:00			`yield chunk`
some thingies 2023-08-05 02:30:42 +02:00			`yield 'data: [DONE]\n\n'`
some stuff idfk 2023-08-04 03:30:56 +02:00
Added more documentation 2023-08-12 17:49:31 +02:00			`# If the response is JSON, then we need to yield it like this`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`if not is_stream and json_response:`
moderation is done yay 2023-08-06 21:42:07 +02:00			`yield json.dumps(json_response)`

Added more documentation 2023-08-12 17:49:31 +02:00			`# DONE WITH REQUEST, NOW LOGGING ETC.`
moderation is done yay 2023-08-06 21:42:07 +02:00
			`if user and incoming_request:`
			`await logs.log_api_request(`
			`user=user,`
			`incoming_request=incoming_request,`
			`target_url=target_request['url']`
			`)`

			`if credits_cost and user:`
			`await users.update_by_id(user['_id'], {`
			`'$inc': {'credits': -credits_cost}`
			`})`

			`ip_address = await network.get_ip(incoming_request)`

			`await stats.add_date()`
			`await stats.add_ip_address(ip_address)`
			`await stats.add_path(path)`
			`await stats.add_target(target_request['url'])`

			`if is_chat:`
			`await stats.add_model(model)`
			`await stats.add_tokens(input_tokens, model)`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00
some stuff idfk 2023-08-04 03:30:56 +02:00			`if __name__ == '__main__':`
			`asyncio.run(stream())`