nova-api/api/responder.py

"""This module contains the streaming logic for the API."""

import os
import json
import yaml
import dhooks
import asyncio
import aiohttp
import starlette

from rich import print
from dotenv import load_dotenv

import proxies
import provider_auth
import after_request
import load_balancing

from helpers import network, chat, errors

load_dotenv()

async def respond(
    path: str='/v1/chat/completions',
    user: dict=None,
    payload: dict=None,
    credits_cost: int=0,
    input_tokens: int=0,
    incoming_request: starlette.requests.Request=None,
):
    """Forward a request to a load-balanced provider and relay its answer.

    This is an async generator. For ``text/event-stream`` provider responses
    it yields every received chunk (stripped, followed by a blank line); for
    successful JSON responses it yields the whole body once as a JSON string.

    Up to 10 attempts are made. Each attempt asks ``load_balancing`` for a
    fresh target request, so a retry may hit a different provider. An attempt
    is retried when the provider answers with HTTP 429, when the response body
    mentions ``invalid_api_key`` / ``account_deactivated`` (the key is
    invalidated first), or when the request raises an exception.

    Args:
        path: API path of the incoming request. Paths containing
            ``chat/completions`` are handled as chat requests.
        user: Passed through unchanged to ``after_request.after_request``.
        payload: JSON body of the incoming request. For chat requests it must
            contain a ``'model'`` key.
        credits_cost: Passed through to ``after_request.after_request``.
        input_tokens: Passed through to ``after_request.after_request``.
        incoming_request: The original request; its method and cookies are
            forwarded for non-chat requests.

    Yields:
        str: streamed chunks, a single JSON document, or a JSON error produced
        by ``errors.yield_error``.

    Note:
        ``after_request.after_request`` is only called when an attempt
        completed; every error path returns before it.
    """

    # Local import: only the streaming branch below needs it.
    import codecs

    is_chat = False

    model = None
    is_stream = False

    if 'chat/completions' in path:
        is_chat = True
        model = payload['model']

    json_response = {}

    headers = {
        'Content-Type': 'application/json',
        'User-Agent': 'axios/0.21.1',
    }

    for _ in range(10):
        # Load balancing: randomly selecting a suitable provider
        # If the request is a chat completion, then we need to load balance between chat providers
        # If the request is an organic request, then we need to load balance between organic providers
        try:
            if is_chat:
                target_request = await load_balancing.balance_chat_request(payload)
            else:

                # In this case we are doing an organic request. "organic" means that it's not using a reverse engineered front-end, but rather ClosedAI's API directly
                # churchless.tech is an example of an organic provider, because it redirects the request to ClosedAI.
                target_request = await load_balancing.balance_organic_request({
                    'method': incoming_request.method,
                    'path': path,
                    'payload': payload,
                    'headers': headers,
                    'cookies': incoming_request.cookies
                })
        except ValueError as exc:
            # The balancer raising ValueError is treated as "no usable provider/key".
            # Only the listed models notify the admins and answer with an error;
            # for any other model the generator ends without yielding anything.
            if model in ['gpt-3.5-turbo', 'gpt-4', 'gpt-4-32k']:
                # NOTE(review): dhooks' send() looks like a synchronous call - confirm it
                # does not block the event loop for long.
                webhook = dhooks.Webhook(os.environ['DISCORD_WEBHOOK__API_ISSUE'])
                webhook.send(content=f'API Issue: **`{exc}`**\nhttps://i.imgflip.com/7uv122.jpg')
                yield await errors.yield_error(500, 'Sorry, the API has no working keys anymore.', 'The admins have been messaged automatically.')
            return

        # Make sure a headers entry exists. (Merging the dict into itself, as was done
        # before, changed nothing and raised KeyError when the entry was missing.)
        target_request.setdefault('headers', {})

        # Same default as the one used for the actual request below.
        if target_request.get('method', 'POST') == 'GET' and not payload:
            target_request['payload'] = None

        # We haven't done any requests as of right now, everything until now was just preparation
        # Here, we process the request
        async with aiohttp.ClientSession(connector=proxies.get_proxy().connector) as session:
            try:
                async with session.request(
                    method=target_request.get('method', 'POST'),
                    url=target_request['url'],
                    data=target_request.get('data'),
                    json=target_request.get('payload'),
                    headers=target_request.get('headers', {}),
                    cookies=target_request.get('cookies'),
                    # NOTE(review): ssl=False turns off certificate verification.
                    ssl=False,
                    timeout=aiohttp.ClientTimeout(
                        connect=0.3,
                        total=float(os.getenv('TRANSFER_TIMEOUT', '500'))
                    ),
                ) as response:
                    is_stream = response.content_type == 'text/event-stream'

                    # Rate-limited: try again with a freshly balanced target.
                    if response.status == 429:
                        continue

                    if response.content_type == 'application/json':
                        data = await response.json()

                        if 'method_not_supported' in str(data):
                            # Hand the error to the client the same way the other error
                            # paths of this generator do, and stop: retrying cannot help.
                            yield await errors.yield_error(500, 'Sorry, this endpoint does not support this method.', data['error']['message'])
                            return

                        if 'invalid_api_key' in str(data) or 'account_deactivated' in str(data):
                            print('[!] invalid api key', target_request.get('provider_auth'))
                            await provider_auth.invalidate_key(target_request.get('provider_auth'))
                            continue

                        if response.ok:
                            json_response = data

                    if is_stream:
                        try:
                            response.raise_for_status()
                        except Exception as exc:
                            # Only rate limiting triggers a retry; any other error status
                            # is ignored and the provider's body is streamed as-is.
                            if 'Too Many Requests' in str(exc):
                                continue

                        # Chunks from iter_any() may end in the middle of a multi-byte
                        # UTF-8 character, so decode incrementally instead of per chunk.
                        decoder = codecs.getincrementaldecoder('utf8')()

                        async for chunk in response.content.iter_any():
                            text = decoder.decode(chunk)

                            if not text:
                                # Whole chunk was an incomplete character; wait for the rest.
                                continue

                            yield text.strip() + '\n\n'

                    # The attempt completed; leave the retry loop.
                    break

            except Exception as exc:
                # Don't fail silently: report what went wrong, then retry.
                print('[!] provider request failed, retrying:', type(exc).__name__, exc)
                continue
    else:
        # All attempts were used up without a completed request.
        yield await errors.yield_error(500, 'Sorry, the provider is not responding. We\'re possibly getting rate-limited.', 'Please try again later.')
        return

    if (not is_stream) and json_response:
        yield json.dumps(json_response)

    print(f'[+] {path} -> {model or ""}')

    await after_request.after_request(
        incoming_request=incoming_request,
        target_request=target_request,
        user=user,
        credits_cost=credits_cost,
        input_tokens=input_tokens,
        path=path,
        is_chat=is_chat,
        model=model,
    )
Added more documentation 2023-08-12 17:49:31 +02:00			`"""This module contains the streaming logic for the API."""`

some stuff idfk 2023-08-04 03:30:56 +02:00			`import os`
proxies have issues 2023-08-04 17:29:49 +02:00			`import json`
I don't even fkin know lmfao 2023-08-18 21:23:00 +02:00			`import yaml`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`import dhooks`
some stuff idfk 2023-08-04 03:30:56 +02:00			`import asyncio`
			`import aiohttp`
			`import starlette`

proxies have issues 2023-08-04 17:29:49 +02:00			`from rich import print`
some stuff idfk 2023-08-04 03:30:56 +02:00			`from dotenv import load_dotenv`

			`import proxies`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`import provider_auth`
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00			`import after_request`
some stuff idfk 2023-08-04 03:30:56 +02:00			`import load_balancing`

sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`from helpers import network, chat, errors`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`load_dotenv()`

I forgor 💀 2023-09-11 02:47:21 +02:00			`async def respond(`
some stuff idfk 2023-08-04 03:30:56 +02:00			`path: str='/v1/chat/completions',`
			`user: dict=None,`
			`payload: dict=None,`
			`credits_cost: int=0,`
			`input_tokens: int=0,`
			`incoming_request: starlette.requests.Request=None,`
			`):`
Codebase changes + a lot of commenting 2023-08-13 17:12:35 +02:00			`"""Stream the completions request. Sends data in chunks`
Ratelimit system 🎉 2023-08-14 10:47:03 +02:00			`If not streaming, it sends the result in its entirety.`
Codebase changes + a lot of commenting 2023-08-13 17:12:35 +02:00			`"""`
Ratelimit system 🎉 2023-08-14 10:47:03 +02:00
proxies have issues 2023-08-04 17:29:49 +02:00			`is_chat = False`
some stuff idfk 2023-08-04 03:30:56 +02:00
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00			`model = None`
Fixed function calling 2023-09-14 18:18:19 +02:00			`is_stream = False`
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00
proxies have issues 2023-08-04 17:29:49 +02:00			`if 'chat/completions' in path:`
			`is_chat = True`
			`model = payload['model']`
some stuff idfk 2023-08-04 03:30:56 +02:00
cool stuff or smth 2023-08-27 04:29:16 +02:00			`json_response = {}`
some stuff idfk 2023-08-04 03:30:56 +02:00
User agent fix 2023-08-25 19:13:39 +02:00			`headers = {`
			`'Content-Type': 'application/json',`
Fixed function calling 2023-09-14 18:18:19 +02:00			`'User-Agent': 'axios/0.21.1',`
User agent fix 2023-08-25 19:13:39 +02:00			`}`

Fixed function calling 2023-09-14 18:18:19 +02:00			`for _ in range(10):`
I don't even fkin know lmfao 2023-08-18 21:23:00 +02:00			`# Load balancing: randomly selecting a suitable provider`
add comments to streaming.py 2023-08-13 18:29:45 +02:00			`# If the request is a chat completion, then we need to load balance between chat providers`
			`# If the request is an organic request, then we need to load balance between organic providers`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`try:`
			`if is_chat:`
			`target_request = await load_balancing.balance_chat_request(payload)`
			`else:`
add comments to streaming.py 2023-08-13 18:29:45 +02:00
			`# In this case we are doing a organic request. "organic" means that it's not using a reverse engineered front-end, but rather ClosedAI's API directly`
			`# churchless.tech is an example of an organic provider, because it redirects the request to ClosedAI.`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`target_request = await load_balancing.balance_organic_request({`
			`'method': incoming_request.method,`
			`'path': path,`
			`'payload': payload,`
			`'headers': headers,`
			`'cookies': incoming_request.cookies`
			`})`
			`except ValueError as exc:`
No false notifications 2023-09-04 13:25:12 +02:00			`if model in ['gpt-3.5-turbo', 'gpt-4', 'gpt-4-32k']:`
			`webhook = dhooks.Webhook(os.environ['DISCORD_WEBHOOK__API_ISSUE'])`
			webhook.send(content=f'API Issue: `{exc}`\nhttps://i.imgflip.com/7uv122.jpg')
			`yield await errors.yield_error(500, 'Sorry, the API has no working keys anymore.', 'The admins have been messaged automatically.')`
idk 2023-08-06 12:46:41 +02:00			`return`
some thingies 2023-08-05 02:30:42 +02:00
massive cleanup of streaming (i think this works?) 2023-08-13 18:26:35 +02:00			`target_request['headers'].update(target_request.get('headers', {}))`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00
			`if target_request['method'] == 'GET' and not payload:`
			`target_request['payload'] = None`
proxies have issues 2023-08-04 17:29:49 +02:00
add comments to streaming.py 2023-08-13 18:29:45 +02:00			`# We haven't done any requests as of right now, everything until now was just preparation`
			`# Here, we process the request`
Added more documentation 2023-08-12 17:49:31 +02:00			`async with aiohttp.ClientSession(connector=proxies.get_proxy().connector) as session:`
some thingies 2023-08-05 02:30:42 +02:00			`try:`
			`async with session.request(`
			`method=target_request.get('method', 'POST'),`
			`url=target_request['url'],`
			`data=target_request.get('data'),`
			`json=target_request.get('payload'),`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`headers=target_request.get('headers', {}),`
some thingies 2023-08-05 02:30:42 +02:00			`cookies=target_request.get('cookies'),`
			`ssl=False,`
Some fixes? 2023-08-16 15:06:16 +02:00			`timeout=aiohttp.ClientTimeout(`
Fixed function calling 2023-09-14 18:18:19 +02:00			`connect=0.3,`
Changed timeout to 500 2023-09-10 16:22:46 +02:00			`total=float(os.getenv('TRANSFER_TIMEOUT', '500'))`
Some fixes? 2023-08-16 15:06:16 +02:00			`),`
some thingies 2023-08-05 02:30:42 +02:00			`) as response:`
Fixed function calling 2023-09-14 18:18:19 +02:00			`is_stream = response.content_type == 'text/event-stream'`
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00
I think I fixed the errors 2023-08-23 23:26:43 +02:00			`if response.status == 429:`
			`continue`

Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`if response.content_type == 'application/json':`
			`data = await response.json()`
moderation is done yay 2023-08-06 21:42:07 +02:00
Fixed non-stream responses 2023-09-06 11:44:29 +02:00			`if 'method_not_supported' in str(data):`
			`await errors.error(500, 'Sorry, this endpoint does not support this method.', data['error']['message'])`

Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00			`if 'invalid_api_key' in str(data) or 'account_deactivated' in str(data):`
			`print('[!] invalid api key', target_request.get('provider_auth'))`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`await provider_auth.invalidate_key(target_request.get('provider_auth'))`
some thingies 2023-08-05 02:30:42 +02:00			`continue`
some stuff idfk 2023-08-04 03:30:56 +02:00
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`if response.ok:`
			`json_response = data`

sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`if is_stream:`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`try:`
			`response.raise_for_status()`
			`except Exception as exc:`
			`if 'Too Many Requests' in str(exc):`
			`continue`

Fixed function calling 2023-09-14 18:18:19 +02:00			`async for chunk in response.content.iter_any():`
			`chunk = chunk.decode('utf8').strip()`
			`yield chunk + '\n\n'`
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`break`
proxies have issues 2023-08-04 17:29:49 +02:00
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00			`except Exception as exc:`
cool stuff or smth 2023-08-27 04:29:16 +02:00			`continue`

Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00			`if (not json_response) and is_chat:`
cool stuff or smth 2023-08-27 04:29:16 +02:00			`print('[!] chat response is empty')`
Resolved some issues 2023-08-24 14:57:36 +02:00			`continue`
Fixed non-stream responses 2023-09-06 11:44:29 +02:00			`else:`
Fixed function calling 2023-09-14 18:18:19 +02:00			`yield await errors.yield_error(500, 'Sorry, the provider is not responding. We\'re possibly getting rate-limited.', 'Please try again later.')`
Fixed non-stream responses 2023-09-06 11:44:29 +02:00			`return`
Resolved some issues 2023-08-24 14:57:36 +02:00
Fixed non-stream responses 2023-09-06 11:44:29 +02:00			`if (not is_stream) and json_response:`
moderation is done yay 2023-08-06 21:42:07 +02:00			`yield json.dumps(json_response)`

Fixed function calling 2023-09-14 18:18:19 +02:00			`print(f'[+] {path} -> {model or ""}')`

Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00			`await after_request.after_request(`
			`incoming_request=incoming_request,`
			`target_request=target_request,`
			`user=user,`
			`credits_cost=credits_cost,`
			`input_tokens=input_tokens,`
			`path=path,`
			`is_chat=is_chat,`
			`model=model,`
			`)`