# nova-api/api/load_balancing.py

import random
import asyncio
from db.key_validation import cached_key_is_rated

import providers

async def _get_module_name(module) -> str:
    """
    ### Short name of a module
    Returns the part of `module.__name__` after its last dot,
    or the whole name when it contains no dot.
    """
    # rpartition leaves the full string in the last slot when no '.' is found.
    return module.__name__.rpartition('.')[-1]

async def balance_chat_request(payload: dict) -> dict:
    """
    ### Pick a chat provider for the request and build its target.
    Candidate providers are the modules in `providers.MODULES` that list
    `payload['model']` in their `MODELS` and, when `payload['stream']` is truthy,
    have `STREAMING` set. One candidate is chosen at random and its
    `chat_completion(**payload)` result is returned with the provider's short
    module name stored under `'module'`.

    While `cached_key_is_rated` reports the target's `'provider_auth'` key as rated
    (presumably rate limited - confirm in db.key_validation), the same provider is
    asked for a new target. There is no upper bound on these retries.

    Raises `ValueError` when no provider offers the requested model.
    """

    candidates = [
        module
        for module in providers.MODULES
        if (not payload['stream'] or module.STREAMING)
        and payload['model'] in module.MODELS
    ]

    if not candidates:
        raise ValueError(f'The model "{payload["model"]}" is not available. MODEL_UNAVAILABLE')

    chosen = random.choice(candidates)
    target = await chosen.chat_completion(**payload)

    # Keep requesting a fresh target from the chosen provider until its key is not rated.
    while await cached_key_is_rated(target.get('provider_auth')):
        target = await chosen.chat_completion(**payload)

    target['module'] = await _get_module_name(chosen)

    return target

async def balance_organic_request(request: dict) -> dict:
    """
    ### Load balance non-chat completion request
    Balances between other "organic" providers which respond in the desired format already.
    Organic providers are used for non-chat completions, such as moderation and other paths.

    Only modules in `providers.MODULES` with `ORGANIC` set are considered. When
    `request['path']` contains `/moderations`, the module must also have `MODERATIONS` set.

    Args:
        request: Request description. `request['path']` is read. If `request['headers']`
            is missing or empty, it is set in place to a JSON `Content-Type` default.

    Returns:
        The dict produced by the chosen provider's `organify(request)`, with the
        provider's short module name stored under `'module'`.

    Raises:
        ValueError: If no provider is able to serve the request.
    """
    if not request.get('headers'):
        request['headers'] = {
            'Content-Type': 'application/json'
        }

    # The path does not change between providers, so check it once.
    is_moderation = '/moderations' in request['path']

    providers_available = [
        provider_module
        for provider_module in providers.MODULES
        if provider_module.ORGANIC
        and (not is_moderation or provider_module.MODERATIONS)
    ]

    # random.choice() raises a bare IndexError on an empty list; fail with a
    # descriptive error instead, mirroring balance_chat_request.
    if not providers_available:
        raise ValueError(f'No organic provider is available for the path "{request["path"]}".')

    provider = random.choice(providers_available)
    target = await provider.organify(request)

    target['module'] = await _get_module_name(provider)

    return target

if __name__ == '__main__':
    # Manual smoke run: balance a streaming gpt-3.5-turbo request and print the target URL.
    demo_payload = {'model': 'gpt-3.5-turbo', 'stream': True}
    demo_target = asyncio.run(balance_chat_request(payload=demo_payload))
    print(demo_target['url'])
some stuff idfk 2023-08-04 03:30:56 +02:00			`import random`
			`import asyncio`
Added key validation by API-key instead of IP Added rate limited keys getting logged in a database 2023-09-23 21:41:48 +02:00			`from db.key_validation import cached_key_is_rated`
some stuff idfk 2023-08-04 03:30:56 +02:00
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`import providers`
some stuff idfk 2023-08-04 03:30:56 +02:00
moderation is done yay 2023-08-06 21:42:07 +02:00			`async def _get_module_name(module) -> str:`
proxies have issues 2023-08-04 17:29:49 +02:00			`name = module.__name__`
			`if '.' in name:`
			`return name.split('.')[-1]`
			`return name`

some stuff idfk 2023-08-04 03:30:56 +02:00			`async def balance_chat_request(payload: dict) -> dict:`
Codebase changes + a lot of commenting 2023-08-13 17:12:35 +02:00			`"""`
			`### Load balance the chat completion request between chat providers.`
			`Providers are sorted by streaming and models. Target (provider.chat_completion) is returned`
			`"""`
moderation is done yay 2023-08-06 21:42:07 +02:00
some stuff idfk 2023-08-04 03:30:56 +02:00			`providers_available = []`

Added auto-rewards and invalid key system 2023-08-07 23:28:24 +02:00			`for provider_module in providers.MODULES:`
some stuff idfk 2023-08-04 03:30:56 +02:00			`if payload['stream'] and not provider_module.STREAMING:`
			`continue`

			`if payload['model'] not in provider_module.MODELS:`
			`continue`

			`providers_available.append(provider_module)`

some thingies 2023-08-05 02:30:42 +02:00			`if not providers_available:`
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`raise ValueError(f'The model "{payload["model"]}" is not available. MODEL_UNAVAILABLE')`
some thingies 2023-08-05 02:30:42 +02:00
some stuff idfk 2023-08-04 03:30:56 +02:00			`provider = random.choice(providers_available)`
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`target = await provider.chat_completion(**payload)`

Added key validation by API-key instead of IP Added rate limited keys getting logged in a database 2023-09-23 21:41:48 +02:00			`while True:`
			`key = target.get('provider_auth')`

			`if not await cached_key_is_rated(key):`
			`break`

			`else:`
			`target = await provider.chat_completion(**payload)`

moderation is done yay 2023-08-06 21:42:07 +02:00			`module_name = await _get_module_name(provider)`
			`target['module'] = module_name`
proxies have issues 2023-08-04 17:29:49 +02:00
			`return target`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`async def balance_organic_request(request: dict) -> dict:`
Codebase changes + a lot of commenting 2023-08-13 17:12:35 +02:00			`"""`
			`### Load balance non-chat completion request`
			`Balances between other "organic" providers which respond in the desired format already.`
			`Organic providers are used for non-chat completions, such as moderation and other paths.`
			`"""`
some stuff idfk 2023-08-04 03:30:56 +02:00			`providers_available = []`

moderation is done yay 2023-08-06 21:42:07 +02:00			`if not request.get('headers'):`
			`request['headers'] = {`
			`'Content-Type': 'application/json'`
			`}`

Added auto-rewards and invalid key system 2023-08-07 23:28:24 +02:00			`for provider_module in providers.MODULES:`
moderation is done yay 2023-08-06 21:42:07 +02:00			`if not provider_module.ORGANIC:`
			`continue`

			`if '/moderations' in request['path']:`
			`if not provider_module.MODERATIONS:`
			`continue`

			`providers_available.append(provider_module)`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`provider = random.choice(providers_available)`
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`target = await provider.organify(request)`
moderation is done yay 2023-08-06 21:42:07 +02:00
			`module_name = await _get_module_name(provider)`
			`target['module'] = module_name`
some stuff idfk 2023-08-04 03:30:56 +02:00
proxies have issues 2023-08-04 17:29:49 +02:00			`return target`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`if __name__ == '__main__':`
			`req = asyncio.run(balance_chat_request(payload={'model': 'gpt-3.5-turbo', 'stream': True}))`
			`print(req['url'])`