# nova-api/api/responder.py

"""This module contains the streaming logic for the API."""

import os
import json
import yaml
import ujson
import aiohttp
import asyncio
import starlette

from typing import Any, Coroutine, Set
from rich import print
from dotenv import load_dotenv

import proxies
import after_request
import load_balancing

from helpers import errors
from db import providerkeys
from helpers.tokens import count_tokens_for_messages

# Load variables from a local .env file (if present) into the process
# environment, so the os.getenv() lookups in this module can see them.
load_dotenv()

# Maximum number of upstream attempts respond() makes for a single request.
RETRIES = 10

# Error identifiers searched for in a provider's JSON response; a match makes
# respond() deactivate the provider key that was used for the attempt.
CRITICAL_API_ERRORS = ['invalid_api_key', 'account_deactivated']
# Shorthand for the provider key manager (used to rate-limit / deactivate keys).
keymanager = providerkeys.manager
# Strong references to in-flight background tasks; see create_background_task().
background_tasks: Set[asyncio.Task[Any]] = set()

# Parsed once at import time. The path is relative to the current working
# directory. respond() reads the 'costs' and 'roles' sections.
with open(os.path.join('config', 'config.yml'), encoding='utf8') as f:
    config = yaml.safe_load(f)

def create_background_task(coro: Coroutine[Any, Any, Any]) -> None:
    """Schedule ``coro`` as a task and keep it referenced until it finishes.

    The task is stored in the module-level ``background_tasks`` set and removed
    from it again by a done-callback, so a fire-and-forget task cannot be
    garbage collected while it is still running.

    https://docs.python.org/3/library/asyncio-task.html#asyncio.create_task
    """
    scheduled = asyncio.create_task(coro)
    # The callback only fires once the task has completed, so registering it
    # before storing the reference is equivalent to the reverse order.
    scheduled.add_done_callback(background_tasks.discard)
    background_tasks.add(scheduled)

async def respond(
    path: str='/v1/chat/completions',
    user: dict=None,
    payload: dict=None,
    incoming_request=None,
    overwrite_method=None
):
    """
    Forward a request to an upstream provider and yield the response.

    Up to RETRIES attempts are made, each against the target chosen by the
    load balancer. A streamed (text/event-stream) upstream response is
    re-yielded event by event; a JSON response is yielded once, in its
    entirety, as a JSON string. When the call originates from a real incoming
    request, the credit cost is computed afterwards and handed to
    after_request.after_request() as a background task.

    Args:
        path: API path being served. A path containing 'chat/completions' is
            treated as a chat request.
        user: The calling user's record; only its 'role' is read here.
        payload: JSON body to forward. Chat requests must contain 'model'.
        incoming_request: The original HTTP request, or None when respond()
            is called by other code (no billing happens in that case).
        overwrite_method: HTTP method to use instead of the incoming
            request's method.

    Yields:
        str: SSE events ('data: ...' followed by a blank line) when streaming,
        otherwise one JSON document. On failure, the value produced by
        errors.yield_error().
    """
    # Local import: decoder for UTF-8 sequences split across network chunks.
    import codecs

    is_chat = 'chat/completions' in path
    model = None

    if is_chat:
        model = payload['model']
    elif payload:
        # Non-chat payloads (e.g. image generation) can name a model too; the
        # billing branches below rely on it.
        model = payload.get('model')

    server_json_response = {}

    headers = {
        'Content-Type': 'application/json'
    }

    skipped_errors = {
        'no_provider_key': 0,
        'insufficient_quota': 0,
        'billing_not_active': 0,
        'critical_provider_error': 0,
        'timeout': 0,
        'other_errors': []
    }

    input_tokens = 0
    output_tokens = 0

    cookies = incoming_request.cookies if incoming_request else {}

    if overwrite_method:
        method = overwrite_method
    elif incoming_request:
        method = incoming_request.method
    else:
        # Internal call without an explicit method: use the same default the
        # upstream request below falls back to.
        method = 'POST'

    # Bound up front so the code after the loop never sees unbound names.
    provider_name = None
    provider_key = None
    target_request = None
    is_stream = False

    for _ in range(RETRIES):
        try:
            if is_chat:
                target_request = await load_balancing.balance_chat_request(payload)
            else:
                target_request = await load_balancing.balance_organic_request({
                    'method': method,
                    'path': path,
                    'payload': payload,
                    'headers': headers,
                    'cookies': cookies
                })

        except ValueError:
            yield await errors.yield_error(500, f'Sorry, the API has no active API keys for {model}.', 'Please use a different model.')
            return

        provider_auth = target_request.get('provider_auth')

        # Reset per attempt so credentials from a previous provider are never
        # reused when this target carries no 'provider_auth'.
        provider_name = None
        provider_key = None

        if provider_auth:
            # Format: '<provider name>><provider key>'
            auth_parts = provider_auth.split('>')
            provider_name = auth_parts[0]
            provider_key = auth_parts[1]

        if provider_key == '--NO_KEY--':
            skipped_errors['no_provider_key'] += 1
            continue

        # Make sure a 'headers' entry exists (the former self-update was a
        # no-op that raised KeyError when the key was missing).
        target_request.setdefault('headers', {})

        if target_request['method'] == 'GET' and not payload:
            target_request['payload'] = None

        connector = None

        if os.getenv('PROXY_HOST') or os.getenv('USE_PROXY_LIST', 'False').lower() == 'true':
            connector = proxies.get_proxy().connector

        async with aiohttp.ClientSession(connector=connector) as session:
            try:
                # NOTE(review): ssl=False disables TLS certificate verification
                # for the upstream call - confirm this is intentional.
                async with session.request(
                    method=target_request.get('method', 'POST'),
                    url=target_request['url'],
                    data=target_request.get('data'),
                    json=target_request.get('payload'),
                    headers=target_request.get('headers', {}),
                    cookies=target_request.get('cookies'),
                    ssl=False,
                    timeout=aiohttp.ClientTimeout(
                        connect=0.75,
                        total=float(os.getenv('TRANSFER_TIMEOUT', '500'))
                    )
                ) as response:
                    is_stream = response.content_type == 'text/event-stream'

                    if response.content_type == 'application/json':
                        client_json_response = await response.json()

                        try:
                            error_code = client_json_response['error']['code']
                        except (KeyError, TypeError):
                            # No error object, or 'error' is not a mapping.
                            error_code = ''

                        if error_code == 'method_not_supported':
                            yield await errors.yield_error(400, 'Sorry, this endpoint does not support this method.', 'Please use a different method.')
                            # Stop here: the request failed, so it must not
                            # fall through to the billing code below.
                            return

                        if error_code == 'insufficient_quota':
                            print('[!] insufficient quota')
                            # Take the key out of rotation for 24 hours.
                            await keymanager.rate_limit_key(provider_name, provider_key, 86400)
                            skipped_errors['insufficient_quota'] += 1
                            continue

                        if error_code == 'billing_not_active':
                            print('[!] billing not active')
                            await keymanager.deactivate_key(provider_name, provider_key, 'billing_not_active')
                            skipped_errors['billing_not_active'] += 1
                            continue

                        critical_error = False
                        response_text = str(client_json_response)
                        for error in CRITICAL_API_ERRORS:
                            if error in response_text:
                                await keymanager.deactivate_key(provider_name, provider_key, error)
                                critical_error = True

                        if critical_error:
                            print('[!] critical provider error')
                            skipped_errors['critical_provider_error'] += 1
                            continue

                        # NOTE(review): a non-OK JSON response with any other
                        # error leaves server_json_response empty, so nothing
                        # is yielded for it - confirm that is intended.
                        if response.ok:
                            if is_chat and not is_stream:
                                input_tokens = client_json_response['usage']['prompt_tokens']
                                output_tokens = client_json_response['usage']['completion_tokens']

                            server_json_response = client_json_response
                    elif response.content_type == 'text/plain':
                        data = (await response.read()).decode("utf-8")
                        print(f'[!] {data}')
                        # list.append() returns None; never assign its result.
                        skipped_errors['other_errors'].append(data)
                        continue

                    if is_stream:
                        input_tokens = await count_tokens_for_messages(payload['messages'], model=model)

                        chunk_no = 0
                        buffer = ''
                        # iter_any() can split a multi-byte character across
                        # two chunks; the incremental decoder holds back the
                        # incomplete tail until the rest arrives.
                        decoder = codecs.getincrementaldecoder('utf8')()

                        async for chunk in response.content.iter_any():
                            chunk_no += 1

                            chunk = decoder.decode(chunk)

                            if provider_name and 'azure' in provider_name:
                                chunk = chunk.replace('data: ', '', 1)

                                # The first chunk of an azure stream is skipped.
                                if not chunk.strip() or chunk_no == 1:
                                    continue

                            # Events are delimited by a blank line; buffer until
                            # at least one complete event is available.
                            buffer += chunk
                            while '\n\n' in buffer:
                                subchunk, buffer = buffer.split('\n\n', 1)

                                if not subchunk.strip():
                                    continue

                                if not subchunk.startswith('data: '):
                                    subchunk = 'data: ' + subchunk

                                subchunk = subchunk.rsplit('[DONE]', 1)[0]
                                subchunk += '\n\n'

                                yield subchunk

                        # The number of received chunks is used as the output
                        # token count for streamed responses.
                        output_tokens = chunk_no
                    break

            except aiohttp.client_exceptions.ServerTimeoutError:
                skipped_errors['timeout'] += 1
                continue
    else:
        # Every attempt was skipped: report only the counters that fired.
        skipped_errors = {k: v for k, v in skipped_errors.items() if ((isinstance(v, int) and v > 0) or (isinstance(v, list) and len(v) > 0))}
        skipped_errors['model'] = model
        skipped_errors['provider'] = provider_name
        print(f'[!] Skipped {RETRIES} errors:\n{skipped_errors}')

        skipped_errors = ujson.dumps(skipped_errors, indent=4)
        yield await errors.yield_error(500,
            f'Sorry, our API seems to have issues connecting to "{model}".',
            f'Please send this info to support: {skipped_errors}'
        )
        return

    if (not is_stream) and server_json_response:
        server_json_response['system_fingerprint'] = 'fp_' + os.urandom(5).hex()
        yield json.dumps(server_json_response)

    if incoming_request: # not called by other code, but actually a request
        role = user.get('role', 'default')
        model_multipliers = config['costs']
        model_multiplier = model_multipliers['other']

        if is_chat:
            model_multiplier = model_multipliers['chat-models'].get(payload.get('model'), model_multiplier)
            total_tokens = input_tokens + output_tokens
            credits_cost = total_tokens / 60
            credits_cost = round(credits_cost * model_multiplier)

            # Every chat request costs at least one credit.
            if credits_cost < 1:
                credits_cost = 1

            tokens = {'input': input_tokens, 'output': output_tokens, 'total': total_tokens}

        elif model == 'dall-e-2':
            credits_cost = 50
            tokens = {'input': 0,'output': 0,'total': credits_cost}

        elif model == 'dall-e-3':
            credits_cost = 100
            tokens = {'input': 0, 'output': 0, 'total': credits_cost}

        else:
            # Without this branch credits_cost/tokens were unbound for every
            # other endpoint and the function crashed after responding.
            # NOTE(review): assumes config['costs']['other'] is the flat
            # per-request price for non-chat endpoints - confirm.
            credits_cost = model_multiplier
            tokens = {'input': 0, 'output': 0, 'total': credits_cost}

        try:
            role_cost_multiplier = config['roles'][role]['bonus']
        except KeyError:
            role_cost_multiplier = 1

        credits_cost = round(credits_cost * role_cost_multiplier)

        create_background_task(
            after_request.after_request(
                provider=provider_name,
                incoming_request=incoming_request,
                target_request=target_request,
                user=user,
                credits_cost=credits_cost,
                tokens=tokens,
                path=path,
                is_chat=is_chat,
                model=model,
            )
        )
Added more documentation 2023-08-12 17:49:31 +02:00			`"""This module contains the streaming logic for the API."""`

some stuff idfk 2023-08-04 03:30:56 +02:00			`import os`
proxies have issues 2023-08-04 17:29:49 +02:00			`import json`
Added token-based credit cost 2023-10-16 23:34:54 +02:00			`import yaml`
pls dont abuse my api thnkx <3 2023-10-08 00:28:13 +02:00			`import ujson`
some stuff idfk 2023-08-04 03:30:56 +02:00			`import aiohttp`
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`import asyncio`
some stuff idfk 2023-08-04 03:30:56 +02:00			`import starlette`

Fix dangling asyncio tasks 2023-10-06 09:45:50 +02:00			`from typing import Any, Coroutine, Set`
proxies have issues 2023-08-04 17:29:49 +02:00			`from rich import print`
some stuff idfk 2023-08-04 03:30:56 +02:00			`from dotenv import load_dotenv`

			`import proxies`
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00			`import after_request`
some stuff idfk 2023-08-04 03:30:56 +02:00			`import load_balancing`

implemented key ratelimit checks 2023-10-02 21:09:39 +02:00			`from helpers import errors`
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`from db import providerkeys`
Added token-based credit cost 2023-10-16 23:34:54 +02:00			`from helpers.tokens import count_tokens_for_messages`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`load_dotenv()`

Various improvements. 2023-11-07 00:56:43 +01:00			`RETRIES = 10`

yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`CRITICAL_API_ERRORS = ['invalid_api_key', 'account_deactivated']`
			`keymanager = providerkeys.manager`
Fix dangling asyncio tasks 2023-10-06 09:45:50 +02:00			`background_tasks: Set[asyncio.Task[Any]] = set()`

Added token-based credit cost 2023-10-16 23:34:54 +02:00			`with open(os.path.join('config', 'config.yml'), encoding='utf8') as f:`
			`config = yaml.safe_load(f)`
Fix dangling asyncio tasks 2023-10-06 09:45:50 +02:00
			`def create_background_task(coro: Coroutine[Any, Any, Any]) -> None:`
Various improvements. 2023-11-07 00:56:43 +01:00			`"""Utilizes asyncio.create_task, which prevents the task from being garbage collected.`
Fix dangling asyncio tasks 2023-10-06 09:45:50 +02:00
			`https://docs.python.org/3/library/asyncio-task.html#asyncio.create_task`
			`"""`
			`task = asyncio.create_task(coro)`
			`background_tasks.add(task)`
			`task.add_done_callback(background_tasks.discard)`

I forgor 💀 2023-09-11 02:47:21 +02:00			`async def respond(`
some stuff idfk 2023-08-04 03:30:56 +02:00			`path: str='/v1/chat/completions',`
			`user: dict=None,`
			`payload: dict=None,`
Various improvements. 2023-11-07 00:56:43 +01:00			`incoming_request=None,`
			`overwrite_method=None`
some stuff idfk 2023-08-04 03:30:56 +02:00			`):`
Documented almost everything 2023-10-12 00:03:15 +02:00			`"""`
			`Stream the completions request. Sends data in chunks`
Ratelimit system 🎉 2023-08-14 10:47:03 +02:00			`If not streaming, it sends the result in its entirety.`
Codebase changes + a lot of commenting 2023-08-13 17:12:35 +02:00			`"""`
Ratelimit system 🎉 2023-08-14 10:47:03 +02:00
proxies have issues 2023-08-04 17:29:49 +02:00			`is_chat = False`
some stuff idfk 2023-08-04 03:30:56 +02:00
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00			`model = None`

proxies have issues 2023-08-04 17:29:49 +02:00			`if 'chat/completions' in path:`
			`is_chat = True`
			`model = payload['model']`
some stuff idfk 2023-08-04 03:30:56 +02:00
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`server_json_response = {}`
some stuff idfk 2023-08-04 03:30:56 +02:00
User agent fix 2023-08-25 19:13:39 +02:00			`headers = {`
Added key validation by API-key instead of IP Added rate limited keys getting logged in a database 2023-09-23 21:41:48 +02:00			`'Content-Type': 'application/json'`
User agent fix 2023-08-25 19:13:39 +02:00			`}`

some stuff 2023-10-09 19:09:01 +02:00			`skipped_errors = {`
Fixed API returning error if no provider available 2023-10-16 12:37:33 +02:00			`'no_provider_key': 0,`
some stuff 2023-10-09 19:09:01 +02:00			`'insufficient_quota': 0,`
			`'billing_not_active': 0,`
			`'critical_provider_error': 0,`
i luv u @Zapzatron <3 2023-10-25 21:09:49 +02:00			`'timeout': 0,`
			`'other_errors': []`
some stuff 2023-10-09 19:09:01 +02:00			`}`

Added token-based credit cost 2023-10-16 23:34:54 +02:00			`input_tokens = 0`
			`output_tokens = 0`

Various improvements. 2023-11-07 00:56:43 +01:00			`if incoming_request:`
			`cookies = incoming_request.cookies`
			`else:`
			`cookies = {}`

			`if overwrite_method:`
			`method = overwrite_method`
			`else:`
			`method = incoming_request.method`

			`for _ in range(RETRIES):`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`try:`
			`if is_chat:`
			`target_request = await load_balancing.balance_chat_request(payload)`
			`else:`
			`target_request = await load_balancing.balance_organic_request({`
Various improvements. 2023-11-07 00:56:43 +01:00			`'method': method,`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`'path': path,`
			`'payload': payload,`
			`'headers': headers,`
Various improvements. 2023-11-07 00:56:43 +01:00			`'cookies': cookies`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`})`
Added azure endpoints 2023-10-06 23:05:38 +02:00
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`except ValueError:`
Added key validation by API-key instead of IP Added rate limited keys getting logged in a database 2023-09-23 21:41:48 +02:00			`yield await errors.yield_error(500, f'Sorry, the API has no active API keys for {model}.', 'Please use a different model.')`
idk 2023-08-06 12:46:41 +02:00			`return`
some thingies 2023-08-05 02:30:42 +02:00
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`provider_auth = target_request.get('provider_auth')`

			`if provider_auth:`
			`provider_name = provider_auth.split('>')[0]`
			`provider_key = provider_auth.split('>')[1]`

Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00			`if provider_key == '--NO_KEY--':`
Fixed API returning error if no provider available 2023-10-16 12:37:33 +02:00			`skipped_errors['no_provider_key'] += 1`
			`continue`
Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00
massive cleanup of streaming (i think this works?) 2023-08-13 18:26:35 +02:00			`target_request['headers'].update(target_request.get('headers', {}))`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00
			`if target_request['method'] == 'GET' and not payload:`
			`target_request['payload'] = None`
proxies have issues 2023-08-04 17:29:49 +02:00
Minor fixes, really 2023-10-15 22:35:18 +02:00			`connector = None`

			`if os.getenv('PROXY_HOST') or os.getenv('USE_PROXY_LIST', 'False').lower() == 'true':`
			`connector = proxies.get_proxy().connector`

			`async with aiohttp.ClientSession(connector=connector) as session:`
some thingies 2023-08-05 02:30:42 +02:00			`try:`
			`async with session.request(`
			`method=target_request.get('method', 'POST'),`
			`url=target_request['url'],`
			`data=target_request.get('data'),`
			`json=target_request.get('payload'),`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`headers=target_request.get('headers', {}),`
some thingies 2023-08-05 02:30:42 +02:00			`cookies=target_request.get('cookies'),`
			`ssl=False,`
Some fixes? 2023-08-16 15:06:16 +02:00			`timeout=aiohttp.ClientTimeout(`
Added buffering, fixing a common chunk yielding issue 2023-10-08 23:56:32 +02:00			`connect=0.75,`
Changed timeout to 500 2023-09-10 16:22:46 +02:00			`total=float(os.getenv('TRANSFER_TIMEOUT', '500'))`
Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00			`)`
some thingies 2023-08-05 02:30:42 +02:00			`) as response:`
Fixed function calling 2023-09-14 18:18:19 +02:00			`is_stream = response.content_type == 'text/event-stream'`
Fixed moderation, cleanup and other performance changes 2023-08-28 00:58:32 +02:00
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`if response.content_type == 'application/json':`
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`client_json_response = await response.json()`
moderation is done yay 2023-08-06 21:42:07 +02:00
Added azure endpoints 2023-10-06 23:05:38 +02:00			`try:`
			`error_code = client_json_response['error']['code']`
			`except KeyError:`
			`error_code = ''`

			`if error_code == 'method_not_supported':`
			`yield await errors.yield_error(400, 'Sorry, this endpoint does not support this method.', 'Please use a different method.')`

			`if error_code == 'insufficient_quota':`
			`print('[!] insufficient quota')`
			`await keymanager.rate_limit_key(provider_name, provider_key, 86400)`
some stuff 2023-10-09 19:09:01 +02:00			`skipped_errors['insufficient_quota'] += 1`
Added azure endpoints 2023-10-06 23:05:38 +02:00			`continue`

			`if error_code == 'billing_not_active':`
			`print('[!] billing not active')`
			`await keymanager.deactivate_key(provider_name, provider_key, 'billing_not_active')`
some stuff 2023-10-09 19:09:01 +02:00			`skipped_errors['billing_not_active'] += 1`
Added azure endpoints 2023-10-06 23:05:38 +02:00			`continue`
Fixed non-stream responses 2023-09-06 11:44:29 +02:00
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`critical_error = False`
			`for error in CRITICAL_API_ERRORS:`
			`if error in str(client_json_response):`
			`await keymanager.deactivate_key(provider_name, provider_key, error)`
			`critical_error = True`
some stuff 2023-10-09 19:09:01 +02:00
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`if critical_error:`
some stuff 2023-10-09 19:09:01 +02:00			`print('[!] critical provider error')`
			`skipped_errors['critical_provider_error'] += 1`
some thingies 2023-08-05 02:30:42 +02:00			`continue`
some stuff idfk 2023-08-04 03:30:56 +02:00
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00			`if response.ok:`
Added token-based credit cost 2023-10-16 23:34:54 +02:00			`if is_chat and not is_stream:`
			`input_tokens = client_json_response['usage']['prompt_tokens']`
			`output_tokens = client_json_response['usage']['completion_tokens']`

yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`server_json_response = client_json_response`
i luv u @Zapzatron <3 2023-10-25 21:09:49 +02:00			`elif response.content_type == 'text/plain':`
			`data = (await response.read()).decode("utf-8")`
			`print(f'[!] {data}')`
			`skipped_errors['other_errors'] = skipped_errors['other_errors'].append(data)`
			`continue`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00			`if is_stream:`
Added token-based credit cost 2023-10-16 23:34:54 +02:00			`input_tokens = await count_tokens_for_messages(payload['messages'], model=model)`

aight 2023-10-08 21:53:27 +02:00			`chunk_no = 0`
Added buffering, fixing a common chunk yielding issue 2023-10-08 23:56:32 +02:00			`buffer = ''`

Various improvements. 2023-11-07 00:56:43 +01:00			`async for chunk in response.content.iter_any():`
aight 2023-10-08 21:53:27 +02:00			`chunk_no += 1`
Added buffering, fixing a common chunk yielding issue 2023-10-08 23:56:32 +02:00
			`chunk = chunk.decode('utf8')`
pls dont abuse my api thnkx <3 2023-10-08 00:28:13 +02:00
			`if 'azure' in provider_name:`
some stuff 2023-10-09 19:09:01 +02:00			`chunk = chunk.replace('data: ', '', 1)`
pls dont abuse my api thnkx <3 2023-10-08 00:28:13 +02:00
Added token-based credit cost 2023-10-16 23:34:54 +02:00			`if not chunk.strip() or chunk_no == 1:`
pls dont abuse my api thnkx <3 2023-10-08 00:28:13 +02:00			`continue`

Various improvements. 2023-11-07 00:56:43 +01:00			`buffer += chunk`
			`while '\n\n' in buffer:`
			`subchunk, buffer = buffer.split('\n\n', 1)`

			`if not subchunk.strip():`
			`continue`
Added buffering, fixing a common chunk yielding issue 2023-10-08 23:56:32 +02:00
some stuff 2023-10-09 19:09:01 +02:00			`if not subchunk.startswith('data: '):`
			`subchunk = 'data: ' + subchunk`
Added buffering, fixing a common chunk yielding issue 2023-10-08 23:56:32 +02:00
Various improvements. 2023-11-07 00:56:43 +01:00			`subchunk = subchunk.rsplit('[DONE]', 1)[0]`
			`subchunk += '\n\n'`

			`yield subchunk`
proxies have issues 2023-08-04 17:29:49 +02:00
Added token-based credit cost 2023-10-16 23:34:54 +02:00
			`output_tokens = chunk_no`
some thingies 2023-08-05 02:30:42 +02:00			`break`
proxies have issues 2023-08-04 17:29:49 +02:00
Added buffering, fixing a common chunk yielding issue 2023-10-08 23:56:32 +02:00			`except aiohttp.client_exceptions.ServerTimeoutError:`
some stuff 2023-10-09 19:09:01 +02:00			`skipped_errors['timeout'] += 1`
Added buffering, fixing a common chunk yielding issue 2023-10-08 23:56:32 +02:00			`continue`
Fixed non-stream responses 2023-09-06 11:44:29 +02:00			`else:`
Various improvements. 2023-11-07 00:56:43 +01:00			`skipped_errors = {k: v for k, v in skipped_errors.items() if ((isinstance(v, int) and v > 0) or (isinstance(v, list) and len(v) > 0))}`
			`skipped_errors['model'] = model`
			`skipped_errors['provider'] = provider_name`
			`print(f'[!] Skipped {RETRIES} errors:\n{skipped_errors}')`

some stuff 2023-10-09 19:09:01 +02:00			`skipped_errors = ujson.dumps(skipped_errors, indent=4)`
			`yield await errors.yield_error(500,`
Added token-based credit cost 2023-10-16 23:34:54 +02:00			`f'Sorry, our API seems to have issues connecting to "{model}".',`
some stuff 2023-10-09 19:09:01 +02:00			`f'Please send this info to support: {skipped_errors}'`
			`)`
Fixed non-stream responses 2023-09-06 11:44:29 +02:00			`return`
Resolved some issues 2023-08-24 14:57:36 +02:00
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`if (not is_stream) and server_json_response:`
Add system fingerprint to server JSON response 2023-11-07 01:05:00 +01:00			`server_json_response['system_fingerprint'] = f'fp_' + os.urandom(5).hex()`
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`yield json.dumps(server_json_response)`

Various improvements. 2023-11-07 00:56:43 +01:00			`if incoming_request: # not called by other code, but actually a request`
			`role = user.get('role', 'default')`
			`model_multipliers = config['costs']`
			`model_multiplier = model_multipliers['other']`
Added token-based credit cost 2023-10-16 23:34:54 +02:00
Various improvements. 2023-11-07 00:56:43 +01:00			`if is_chat:`
			`model_multiplier = model_multipliers['chat-models'].get(payload.get('model'), model_multiplier)`
			`total_tokens = input_tokens + output_tokens`
			`credits_cost = total_tokens / 60`
			`credits_cost = round(credits_cost * model_multiplier)`
Added token-based credit cost 2023-10-16 23:34:54 +02:00
Various improvements. 2023-11-07 00:56:43 +01:00			`if credits_cost < 1:`
			`credits_cost = 1`
Added token-based credit cost 2023-10-16 23:34:54 +02:00
Various improvements. 2023-11-07 00:56:43 +01:00			`tokens = {'input': input_tokens, 'output': output_tokens, 'total': total_tokens}`
Much cheaper API 2023-10-16 23:55:54 +02:00
Various improvements. 2023-11-07 00:56:43 +01:00			`elif model == 'dall-e-2':`
			`credits_cost = 50`
			`tokens = {'input': 0,'output': 0,'total': credits_cost}`

			`elif model == 'dall-e-3':`
			`credits_cost = 100`
			`tokens = {'input': 0, 'output': 0, 'total': credits_cost}`

			`try:`
			`role_cost_multiplier = config['roles'][role]['bonus']`
			`except KeyError:`
			`role_cost_multiplier = 1`


			`credits_cost = round(credits_cost * role_cost_multiplier)`

			`create_background_task(`
			`after_request.after_request(`
			`provider=provider_name,`
			`incoming_request=incoming_request,`
			`target_request=target_request,`
			`user=user,`
			`credits_cost=credits_cost,`
			`tokens=tokens,`
			`path=path,`
			`is_chat=is_chat,`
			`model=model,`
			`)`
yoooo everything works now 100% :fire: 2023-10-04 23:24:55 +02:00			`)`