nova-api/api/handler.py

"""Does quite a few checks and prepares the incoming request for the target endpoint, so it can be streamed"""

import os
import json
import yaml
import time
import fastapi

from dotenv import load_dotenv

import responder
import moderation

from rich import print
from db.users import UserManager
from helpers import tokens, errors, network

# Load a local .env file into the process environment before any variable is read.
load_dotenv()

# Account lookup used by handle() to resolve an API key to a user document.
users = UserManager()

# Cached model catalogue: the whole document is what /v1/models returns,
# the flat ID list is what requested model names are validated against.
with open(os.path.join('cache', 'models.json'), encoding='utf8') as f:
    models_list = json.loads(f.read())
models = [entry['id'] for entry in models_list['data']]

# Service configuration; handle() reads the 'costs' and 'roles' sections.
with open(os.path.join('config', 'config.yml'), encoding='utf8') as f:
    config = yaml.safe_load(f)

# Optional key tag which, when present on a request, lets gpt-3 requests skip moderation.
moderation_debug_key_key = os.environ.get('MODERATION_DEBUG_KEY')

def _as_text(value) -> str:
    """Flatten a client-supplied JSON value into plain text.

    Strings are returned unchanged, ``None`` becomes an empty string, lists are
    flattened recursively (one item per line) and anything else is stringified.
    """
    if value is None:
        return ''
    if isinstance(value, str):
        return value
    if isinstance(value, list):
        return '\n'.join(_as_text(item) for item in value)
    return str(value)


def _substitute_variables(payload: dict, replacements: dict) -> dict:
    """Return *payload* with every ``[[name]]`` placeholder replaced by its value.

    The substitution runs on the serialized JSON text, so each value is
    JSON-escaped first; otherwise a quote or backslash inside a value would
    corrupt the document or let it rewrite neighbouring fields.
    """
    serialized = json.dumps(payload)

    for name, value in replacements.items():
        # json.dumps() of a string yields a quoted JSON literal; strip the quotes
        # because the placeholder already sits inside a JSON string.
        escaped = json.dumps(str(value))[1:-1]
        serialized = serialized.replace(f'[[{name}]]', escaped)

    return json.loads(serialized)


def _moderation_input(payload: dict) -> str:
    """Collect the text of *payload* that gets sent to the moderation check.

    Uses ``input`` (or ``prompt``) for plain requests. When ``messages`` is a
    list, the contents of all ``user`` messages replace it. Function
    descriptions are appended in either case.
    """
    text = ''

    if 'input' in payload or 'prompt' in payload:
        text = _as_text(payload.get('input', payload.get('prompt', '')))

    messages = payload.get('messages')
    if isinstance(messages, list):
        # Content may be null or a non-string, so it is normalised to text first.
        text = ''.join(
            _as_text(message.get('content')) + '\n'
            for message in messages
            if isinstance(message, dict) and message.get('role') == 'user'
        )

    functions = payload.get('functions')
    if isinstance(functions, list):
        text += '\n'.join(
            _as_text(function.get('description'))
            for function in functions
            if isinstance(function, dict)
        )

    return text


async def handle(incoming_request: fastapi.Request):
    """Validate an incoming API request and stream the upstream response.

    Steps, in order:
      1. Reject ``/dashboard`` and answer ``/v1/models`` from the cached list.
      2. Parse the JSON body (an unreadable or non-object body counts as ``{}``).
      3. Authenticate via the ``Authorization: Bearer <key>[#tags]`` header and
         check that the account is active, not banned and, for
         ``/enterprise/v1`` paths, listed in ``ENTERPRISE_KEYS``.
      4. Answer ``account/credits`` requests directly.
      5. Compute the credit cost (model cost times role multiplier) and make
         sure the user can afford it.
      6. Substitute ``[[variable]]`` placeholders unless the key carries the
         ``DISABLE_VARS`` tag.
      7. Run the moderation check on the user-supplied text.
      8. Fill in ``stream``/``model`` defaults for chat completions and verify
         that the requested model exists.

    Args:
        incoming_request: The request as received by FastAPI.

    Returns:
        A ``JSONResponse`` for the models/credits shortcuts, the result of
        ``errors.error(...)`` when a check fails, otherwise a
        ``StreamingResponse`` fed by ``responder.respond``.
    """

    path = incoming_request.url.path
    path = path.replace('/v1/v1', '/v1')

    ip_address = await network.get_ip(incoming_request)

    if '/dashboard' in path:
        # errors.error is awaited at every other call site; without the await
        # the caller would receive a bare coroutine instead of a response.
        return await errors.error(404, 'You can\'t access /dashboard.', 'This is a private endpoint.')

    if path.startswith('/v1/models'):
        return fastapi.responses.JSONResponse(content=models_list)

    try:
        payload = await incoming_request.json()
    except (json.decoder.JSONDecodeError, UnicodeDecodeError):
        payload = {}

    # Valid JSON that is not an object (list, string, number...) cannot be
    # processed below; treat it like an unreadable body.
    if not isinstance(payload, dict):
        payload = {}

    received_key = incoming_request.headers.get('Authorization')

    if not received_key or not received_key.startswith('Bearer '):
        return await errors.error(401, 'No NovaAI API key given!', 'Add \'Authorization: Bearer nv-...\' to your request headers.')

    # Everything after the first '#' in the header is a set of option tags.
    key_tags = ''

    if '#' in received_key:
        key_tags = received_key.split('#')[1]
        received_key = received_key.split('#')[0]

    user = await users.user_by_api_key(received_key.split('Bearer ')[1].strip())

    if not user or not user['status']['active']:
        return await errors.error(418, 'Invalid or inactive NovaAI API key!', 'Create a new NovaOSS API key or reactivate your account.')

    ban_reason = user['status']['ban_reason']
    if ban_reason:
        return await errors.error(403, f'Your NovaAI account has been banned. Reason: \'{ban_reason}\'.', 'Contact the staff for an appeal.')

    # Checking for enterprise status.
    # Default to '' so an unset ENTERPRISE_KEYS means "no enterprise keys"
    # instead of raising AttributeError on None.split().
    enterprise_keys = os.environ.get('ENTERPRISE_KEYS', '')
    if path.startswith('/enterprise/v1') and user.get('api_key') not in enterprise_keys.split():
        return await errors.error(403, 'Enterprise API is not available.', 'Contact the staff for an upgrade.')

    if 'account/credits' in path:
        return fastapi.responses.JSONResponse({'credits': user['credits']})

    costs = config['costs']
    cost = costs['other']

    if 'chat/completions' in path:
        cost = costs['chat-models'].get(payload.get('model'), cost)

    role = user.get('role', 'default')

    try:
        role_cost_multiplier = config['roles'][role]['bonus']
    except KeyError:
        role_cost_multiplier = 1

    cost = round(cost * role_cost_multiplier)

    if user['credits'] < cost:
        return await errors.error(429, 'Not enough credits.', 'Wait or earn more credits. Learn more on our website or Discord server.')

    if 'DISABLE_VARS' not in key_tags:
        requested_model = payload.get('model', 'unknown')

        replace_dict = {
            'timestamp': str(int(time.time())),
            'date': time.strftime('%Y-%m-%d'),
            'time': time.strftime('%H:%M:%S'),
            'datetime': time.strftime('%Y-%m-%d %H:%M:%S'),
            'model': requested_model if isinstance(requested_model, str) else 'unknown',
        }

        # Account details are only exposed when the key explicitly opts in.
        if 'ALLOW_INSECURE_VARS' in key_tags:
            replace_dict.update({
                'my.ip': ip_address,
                'my.id': str(user['_id']),
                'my.role': user.get('role', 'default'),
                'my.credits': str(user['credits']),
                'my.discord': user.get('auth', {}).get('discord', ''),
            })

        payload = _substitute_variables(payload, replace_dict)

    policy_violation = False

    # Moderation is skipped only for gpt-3 requests carrying the debug key tag.
    model_name = payload.get('model')
    skip_moderation = bool(
        moderation_debug_key_key
        and moderation_debug_key_key in key_tags
        and isinstance(model_name, str)
        and 'gpt-3' in model_name
    )

    if not skip_moderation and '/moderations' not in path:
        inp = _moderation_input(payload)

        # Very short or purely numeric inputs are not sent to moderation.
        if inp and len(inp) > 2 and not inp.isnumeric():
            policy_violation = await moderation.is_policy_violated(inp)

    if policy_violation:
        return await errors.error(
            400, f'The request contains content which violates this model\'s policies for <{policy_violation}>.',
            'We currently don\'t support any NSFW models.'
        )

    if 'chat/completions' in path and not payload.get('stream', False):
        payload['stream'] = False
    if 'chat/completions' in path and not payload.get('model'):
        payload['model'] = 'gpt-3.5-turbo'

    media_type = 'text/event-stream' if payload.get('stream', False) else 'application/json'

    if (model := payload.get('model')) not in models and model is not None:
        return await errors.error(404, 'Model not found.', 'Check the model name and try again.')

    return fastapi.responses.StreamingResponse(
        content=responder.respond(
            user=user,
            path=path,
            payload=payload,
            credits_cost=cost,
            input_tokens=0,
            incoming_request=incoming_request,
        ),
        media_type=media_type
    )
Added more documentation 2023-08-12 17:49:31 +02:00			`"""Does quite a few checks and prepares the incoming request for the target endpoint, so it can be streamed"""`
First actually working version I guess (streaming support) 2023-06-30 02:49:56 +02:00
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`import os`
Works for BetterGPT 2023-07-19 23:51:28 +02:00			`import json`
some stuff idfk 2023-08-04 03:30:56 +02:00			`import yaml`
Added variables 2023-08-29 01:18:55 +02:00			`import time`
moderation is done yay 2023-08-06 21:42:07 +02:00			`import fastapi`
First actually working version I guess (streaming support) 2023-06-30 02:49:56 +02:00
Fixed trademarks 2023-06-28 15:21:14 +02:00			`from dotenv import load_dotenv`
Added load balancer, MongoDB, improved proxy streaming support, more error messages, entire new world order 2023-08-03 01:46:49 +02:00
I forgor 💀 2023-09-11 02:47:21 +02:00			`import responder`
moderation is done yay 2023-08-06 21:42:07 +02:00			`import moderation`
Added load balancer, MongoDB, improved proxy streaming support, more error messages, entire new world order 2023-08-03 01:46:49 +02:00
User agent fix 2023-08-25 19:13:39 +02:00			`from rich import print`
Slight improvements/fixes 2023-08-15 13:55:12 +02:00			`from db.users import UserManager`
Resolved some issues 2023-08-24 14:57:36 +02:00			`from helpers import tokens, errors, network`
Fixed trademarks 2023-06-28 15:21:14 +02:00
			`load_dotenv()`

Resolved some issues 2023-08-24 14:57:36 +02:00			`users = UserManager()`
Refactor file operations 2023-10-06 09:37:16 +02:00			`with open(os.path.join('cache', 'models.json'), encoding='utf8') as f:`
			`models_list = json.load(f)`
Made the API return 404 if the model can't be found 2023-09-21 20:17:32 +02:00			`models = [model['id'] for model in models_list['data']]`
Models endpoint is now free and very quick 2023-08-09 11:43:05 +02:00
Refactor file operations 2023-10-06 09:37:16 +02:00			`with open(os.path.join('config', 'config.yml'), encoding='utf8') as f:`
Re-added rate limiting, fixed a bunch of issues 2023-08-17 13:11:35 +02:00			`config = yaml.safe_load(f)`
some stuff idfk 2023-08-04 03:30:56 +02:00
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`moderation_debug_key_key = os.getenv('MODERATION_DEBUG_KEY')`

cool stuff or smth 2023-08-27 04:29:16 +02:00			`async def handle(incoming_request: fastapi.Request):`
Added key validation by API-key instead of IP Added rate limited keys getting logged in a database 2023-09-23 21:41:48 +02:00			`"""Transfer a streaming response`
Codebase changes + a lot of commenting 2023-08-13 17:12:35 +02:00			`Takes the request from the incoming request to the target endpoint.`
			`Checks method, token amount, auth and cost along with if request is NSFW.`
			`"""`
Added key validation by API-key instead of IP Added rate limited keys getting logged in a database 2023-09-23 21:41:48 +02:00
			`path = incoming_request.url.path`
			`path = path.replace('/v1/v1', '/v1')`
First actually working version I guess (streaming support) 2023-06-30 02:49:56 +02:00
Resolved some issues 2023-08-24 14:57:36 +02:00			`ip_address = await network.get_ip(incoming_request)`

some stuff 2023-10-09 19:09:01 +02:00			`if '/dashboard' in path:`
			`return errors.error(404, 'You can\'t access /dashboard.', 'This is a private endpoint.')`

			`if path.startswith('/v1/models'):`
Quicker models endpoint 2023-08-19 17:53:48 +02:00			`return fastapi.responses.JSONResponse(content=models_list)`

Slight improvements/fixes 2023-08-15 13:55:12 +02:00			`try:`
			`payload = await incoming_request.json()`
			`except json.decoder.JSONDecodeError:`
			`payload = {}`
Small improvements 2023-08-30 20:55:31 +02:00			`except UnicodeDecodeError:`
			`payload = {}`
WIP 2023-07-25 02:42:53 +02:00
some stuff idfk 2023-08-04 03:30:56 +02:00			`received_key = incoming_request.headers.get('Authorization')`
Several improvements, about to change DB 2023-08-01 20:19:00 +02:00
clean up code a lot 2023-08-13 18:19:56 +02:00			`if not received_key or not received_key.startswith('Bearer '):`
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`return await errors.error(401, 'No NovaAI API key given!', 'Add \'Authorization: Bearer nv-...\' to your request headers.')`
Several improvements, about to change DB 2023-08-01 20:19:00 +02:00
Fix 2023-08-29 01:23:00 +02:00			`key_tags = ''`

Added variables 2023-08-29 01:18:55 +02:00			`if '#' in received_key:`
			`key_tags = received_key.split('#')[1]`
			`received_key = received_key.split('#')[0]`

Alotta changes. Setup managers and modified other files, cleaning up codebase. Created user.py class for future type usage. 2023-08-14 05:11:15 +02:00			`user = await users.user_by_api_key(received_key.split('Bearer ')[1].strip())`
Several improvements, about to change DB 2023-08-01 20:19:00 +02:00
clean up code a lot 2023-08-13 18:19:56 +02:00			`if not user or not user['status']['active']:`
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`return await errors.error(418, 'Invalid or inactive NovaAI API key!', 'Create a new NovaOSS API key or reactivate your account.')`
Added load balancer, MongoDB, improved proxy streaming support, more error messages, entire new world order 2023-08-03 01:46:49 +02:00
			`ban_reason = user['status']['ban_reason']`
			`if ban_reason:`
Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00			`return await errors.error(403, f'Your NovaAI account has been banned. Reason: \'{ban_reason}\'.', 'Contact the staff for an appeal.')`
Added load balancer, MongoDB, improved proxy streaming support, more error messages, entire new world order 2023-08-03 01:46:49 +02:00
Added key validation by API-key instead of IP Added rate limited keys getting logged in a database 2023-09-23 21:41:48 +02:00			`# Checking for enterprise status`
Added azure endpoints 2023-10-06 23:05:38 +02:00			`enterprise_keys = os.environ.get('ENTERPRISE_KEYS')`
			`if path.startswith('/enterprise/v1') and user.get('api_key') not in enterprise_keys.split():`
Added key validation by API-key instead of IP Added rate limited keys getting logged in a database 2023-09-23 21:41:48 +02:00			`return await errors.error(403, 'Enterprise API is not available.', 'Contact the staff for an upgrade.')`

Added /v1/accounts/credits 2023-09-22 02:38:21 +02:00			`if 'account/credits' in path:`
			`return fastapi.responses.JSONResponse({'credits': user['credits']})`

Re-added rate limiting, fixed a bunch of issues 2023-08-17 13:11:35 +02:00			`costs = config['costs']`
some stuff idfk 2023-08-04 03:30:56 +02:00			`cost = costs['other']`
Added load balancer, MongoDB, improved proxy streaming support, more error messages, entire new world order 2023-08-03 01:46:49 +02:00
some stuff idfk 2023-08-04 03:30:56 +02:00			`if 'chat/completions' in path:`
clean up code a lot 2023-08-13 18:19:56 +02:00			`cost = costs['chat-models'].get(payload.get('model'), cost)`
Added load balancer, MongoDB, improved proxy streaming support, more error messages, entire new world order 2023-08-03 01:46:49 +02:00
Added variables 2023-08-29 01:18:55 +02:00			`role = user.get('role', 'default')`

			`try:`
			`role_cost_multiplier = config['roles'][role]['bonus']`
			`except KeyError:`
			`role_cost_multiplier = 1`

			`cost = round(cost * role_cost_multiplier)`

			`if user['credits'] < cost:`
			`return await errors.error(429, 'Not enough credits.', 'Wait or earn more credits. Learn more on our website or Discord server.')`

Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`if 'DISABLE_VARS' not in key_tags:`
Small improvements 2023-08-30 20:55:31 +02:00			`payload_with_vars = json.dumps(payload)`

			`replace_dict = {`
			`'timestamp': str(int(time.time())),`
			`'date': time.strftime('%Y-%m-%d'),`
			`'time': time.strftime('%H:%M:%S'),`
			`'datetime': time.strftime('%Y-%m-%d %H:%M:%S'),`
			`'model': payload.get('model', 'unknown'),`
			`}`

			`if 'ALLOW_INSECURE_VARS' in key_tags:`
			`replace_dict.update({`
			`'my.ip': ip_address,`
			`'my.id': str(user['_id']),`
			`'my.role': user.get('role', 'default'),`
			`'my.credits': str(user['credits']),`
			`'my.discord': user.get('auth', {}).get('discord', ''),`
			`})`

			`for key, value in replace_dict.items():`
			`payload_with_vars = payload_with_vars.replace(f'[[{key}]]', value)`

			`payload = json.loads(payload_with_vars)`
Added variables 2023-08-29 01:18:55 +02:00
clean up code a lot 2023-08-13 18:19:56 +02:00			`policy_violation = False`
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`if not (moderation_debug_key_key and moderation_debug_key_key in key_tags and 'gpt-3' in payload.get('model', '')):`
			`if '/moderations' not in path:`
			`inp = ''`

			`if 'input' in payload or 'prompt' in payload:`
			`inp = payload.get('input', payload.get('prompt', ''))`
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`if isinstance(payload.get('messages'), list):`
Fixed function calling 2023-09-14 18:18:19 +02:00			`inp = ''`

			`for message in payload.get('messages', []):`
			`if message.get('role') == 'user':`
			`inp += message.get('content', '') + '\n'`

			`if 'functions' in payload:`
			`inp += '\n'.join([function.get('description', '') for function in payload.get('functions', [])])`
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`if inp and len(inp) > 2 and not inp.isnumeric():`
			`policy_violation = await moderation.is_policy_violated(inp)`
Added auto-rewards and invalid key system 2023-08-07 23:28:24 +02:00
Fixed some several issues with moderation, models etc. 2023-08-08 01:04:35 +02:00			`if policy_violation:`
Resolved some issues 2023-08-24 14:57:36 +02:00			`return await errors.error(`
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`400, f'The request contains content which violates this model\'s policies for <{policy_violation}>.',`
Resolved some issues 2023-08-24 14:57:36 +02:00			`'We currently don\'t support any NSFW models.'`
			`)`
some general changes 2023-08-12 17:56:21 +02:00
clean up code a lot 2023-08-13 18:19:56 +02:00			`if 'chat/completions' in path and not payload.get('stream', False):`
some stuff idfk 2023-08-04 03:30:56 +02:00			`payload['stream'] = False`
Special: halved GPT-3 credits cost (thanks for 1.000 members!) If no model is given, the API now defaults to gpt-3.5-turbo We now also support gpt-3.5-turbo-0301! Made provider code asynchronous New dependency requirement: aiofiles Staff now gets a notification when a provider key is invalid Internal improvements with log webhooks for staff Removed image model check 2023-09-02 21:15:55 +02:00			`if 'chat/completions' in path and not payload.get('model'):`
			`payload['model'] = 'gpt-3.5-turbo'`
Work in progess 2023-08-03 03:50:04 +02:00
moderation is done yay 2023-08-06 21:42:07 +02:00			`media_type = 'text/event-stream' if payload.get('stream', False) else 'application/json'`

Added /v1/accounts/credits 2023-09-22 02:38:21 +02:00			`if (model := payload.get('model')) not in models and model is not None:`
Made the API return 404 if the model can't be found 2023-09-21 20:17:32 +02:00			`return await errors.error(404, 'Model not found.', 'Check the model name and try again.')`

moderation is done yay 2023-08-06 21:42:07 +02:00			`return fastapi.responses.StreamingResponse(`
I forgor 💀 2023-09-11 02:47:21 +02:00			`content=responder.respond(`
some stuff idfk 2023-08-04 03:30:56 +02:00			`user=user,`
			`path=path,`
			`payload=payload,`
			`credits_cost=cost,`
Fixed function calling 2023-09-14 18:18:19 +02:00			`input_tokens=0,`
some stuff idfk 2023-08-04 03:30:56 +02:00			`incoming_request=incoming_request,`
			`),`
moderation is done yay 2023-08-06 21:42:07 +02:00			`media_type=media_type`
some stuff idfk 2023-08-04 03:30:56 +02:00			`)`