some stuff idfk

2024-11-25 18:23:57 +01:00 · 2023-08-04 03:30:56 +02:00 · 2023-08-04 03:30:56 +02:00 · 72cea38d8d
parent e76d675dc6
commit 72cea38d8d
15 changed files with 323 additions and 146 deletions
--- a/README.md
+++ b/README.md
@ -77,21 +77,14 @@ Create a `.env` file, make sure not to reveal it to anyone, and fill in the requ
 - `PROXY_USER` (optional)
 - `PROXY_PASS` (optional)
 ### ClosedAI configuration
 - `CLOSEDAI_KEY`: the API key used to access the ClosedAI API
 - `CLOSEDAI_ENDPOINT` (defaults to `https://api.openai.com/v1`): the API endpoint which is used for the provider ClosedAI
 ### `ACTUAL_IPS` (optional)
 This is a security measure to make sure a proxy, VPN, Tor or any other IP hiding service is used by the host when accessing "Closed"AI's API.
 It is a space separated list of IP addresses that are allowed to access the API.
 You can also just add the *beginning* of an API address, like `12.123.` (without an asterisk!) to allow all IPs starting with `12.123.`.
 > To disable the warning if you don't have this feature enabled, set `ACTUAL_IPS` to `None`.
 ### `DEMO_AUTH`
 API key for demo purposes. You can give this to trusted team members. Never use it in production.
 ### `CORE_API_KEY`
-This will 
+This specifies the **very secret key** for accessing the entire user database etc.
 ## Run
 > **Warning:** read the according section for production usage!
--- a/api/chat_balancing.py
+++ b/api/chat_balancing.py
@ -1,30 +0,0 @@
 import random
 import asyncio
 import chat_providers
 provider_modules = [
    # chat_providers.twa,
    chat_providers.quantum,
    # chat_providers.churchless,
    chat_providers.closed
 ]
 async def balance(payload: dict) -> dict:
    providers_available = []
    for provider_module in provider_modules:
        if payload['stream'] and not provider_module.STREAMING:
            continue
        if payload['model'] not in provider_module.MODELS:
            continue
        providers_available.append(provider_module)
    provider = random.choice(providers_available)
    return provider.chat_completion(**payload)
 if __name__ == '__main__':
    req = asyncio.run(balance(payload={'model': 'gpt-3.5-turbo', 'stream': True}))
    print(req['url'])
--- a/api/config/credits.yml
+++ b/api/config/credits.yml
@ -0,0 +1,23 @@
 max-credits: 100001
 start-credits: 1000
 costs:
  other: 50
  chat-models:
    gpt-3: 10
    gpt-4: 75
    gpt-4-32k: 100
 # bonuses are multiplier for costs:
 # final_cost = cost * bonus
 bonuses:
  owner: 0.1
  admin: 0.3
  helper: 0.4
  booster: 0.5
 # discord reward 0.99^lvl?
 rewards:
  day: 1000
--- a/api/core.py
+++ b/api/core.py
@ -6,6 +6,7 @@ import fastapi
 from db import users
 from dhooks import Webhook, Embed
 from dotenv import load_dotenv
 load_dotenv()
@ -31,6 +32,20 @@ async def get_users(discord_id: int, incoming_request: fastapi.Request):
    return user
 def new_user_webhook(user: dict) -> None:    
    dhook = Webhook(os.getenv('DISCORD_WEBHOOK__USER_CREATED'))
    embed = Embed(
        description='New User',
        color=0x90ee90,
     )
    embed.add_field(name='ID', value=user['_id'], inline=False)
    embed.add_field(name='Discord', value=user['auth']['discord'])
    embed.add_field(name='Github', value=user['auth']['github'])
    dhook.send(embed=embed)
@router.post('/users')
 async def create_user(incoming_request: fastapi.Request):
    auth_error = await check_core_auth(incoming_request)
@ -45,4 +60,15 @@ async def create_user(incoming_request: fastapi.Request):
        return fastapi.Response(status_code=400, content='Invalid or no payload received.')
    user = await users.create(discord_id)
    new_user_webhook(user)
    return user
 if __name__ == '__main__':
    new_user_webhook({
        '_id': 'JUST_A_TEST_IGNORE_ME',
        'auth': {
            'discord': 123,
            'github': 'abc'
        }
    })
--- a/api/db/logs.py
+++ b/api/db/logs.py
@ -4,30 +4,30 @@ import time
 from dotenv import load_dotenv
 from motor.motor_asyncio import AsyncIOMotorClient
 from helpers import network
 load_dotenv()
 def _get_mongo(collection_name: str):
    return AsyncIOMotorClient(os.getenv('MONGO_URI'))['nova-core'][collection_name]
-async def log_api_request(user, request, target_url):
+async def log_api_request(user: dict, incoming_request, target_url: str):
-    payload = await request.json()
+    payload = await incoming_request.json()
    last_prompt = None
    if 'messages' in payload:
        last_prompt = payload['messages'][-1]['content']
-    model = None
+    model = payload.get('model')
    if 'model' in payload:
        model = payload['model']
    new_log_item = {
        'timestamp': time.time(),
-        'method': request.method,
+        'method': incoming_request.method,
-        'path': request.url.path,
+        'path': incoming_request.url.path,
        'user_id': user['_id'],
        'security': {
-            'ip': request.client.host,
+            'ip': network.get_ip(incoming_request),
-            'useragent': request.headers.get('User-Agent')
+            'useragent': incoming_request.headers.get('User-Agent')
        },
        'details': {
            'model': model,
--- a/api/db/stats.py
+++ b/api/db/stats.py
@ -0,0 +1,42 @@
 import os
 import pytz
 import asyncio
 import datetime
 from dotenv import load_dotenv
 from motor.motor_asyncio import AsyncIOMotorClient
 load_dotenv()
 def _get_mongo(collection_name: str):
    return AsyncIOMotorClient(os.getenv('MONGO_URI'))['nova-core'][collection_name]
 async def add_date():
    date = datetime.datetime.now(pytz.timezone('GMT')).strftime('%Y.%m.%d')
    year, month, day = date.split('.')
    await _get_mongo('stats').update_one({}, {'$inc': {f'dates.{year}.{month}.{day}': 1}}, upsert=True)
 async def add_ip_address(ip_address: str):
    ip_address = ip_address.replace('.', '_')
    await _get_mongo('stats').update_one({}, {'$inc': {f'ips.{ip_address}': 1}}, upsert=True)
 async def add_target(url: str):
    await _get_mongo('stats').update_one({}, {'$inc': {f'targets.{url}': 1}}, upsert=True)
 async def add_tokens(tokens: int, model: str):
    await _get_mongo('stats').update_one({}, {'$inc': {f'tokens.{model}': tokens}}, upsert=True)
 async def add_model(model: str):
    await _get_mongo('stats').update_one({}, {'$inc': {f'models.{model}': 1}}, upsert=True)
 async def add_path(path: str):
    path = path.replace('/', '_')
    await _get_mongo('stats').update_one({}, {'$inc': {f'paths.{path}': 1}}, upsert=True)
 async def get_value(obj_filter):
    return await _get_mongo('stats').find_one({obj_filter})
 if __name__ == '__main__':
    asyncio.run(add_date())
    asyncio.run(add_path('/__demo/test'))
--- a/api/db/users.py
+++ b/api/db/users.py
@ -1,4 +1,5 @@
 import os
 import yaml
 import random
 import string
 import asyncio
@ -8,11 +9,15 @@ from motor.motor_asyncio import AsyncIOMotorClient
 load_dotenv()
 with open('config/credits.yml', encoding='utf8') as f:
    credits_config = yaml.safe_load(f)
 def _get_mongo(collection_name: str):
    return AsyncIOMotorClient(os.getenv('MONGO_URI'))['nova-core'][collection_name]
 async def create(discord_id: int=0) -> dict:
    """Adds a new user to the MongoDB collection."""
    chars = string.ascii_letters + string.digits
    infix = os.getenv('KEYGEN_INFIX')
@ -23,7 +28,7 @@ async def create(discord_id: int=0) -> dict:
    new_user = {
        'api_key': new_api_key,
-        'credits': 1000,
+        'credits': credits_config['start-credits'],
        'role': '',
        'status': {
            'active': True,
--- a/api/helpers/network.py
+++ b/api/helpers/network.py
@ -0,0 +1,2 @@
 async def get_ip(request) -> str:
    return request.client.host
--- a/api/load_balancing.py
+++ b/api/load_balancing.py
@ -0,0 +1,42 @@
 import random
 import asyncio
 import chat_providers
 provider_modules = [
    chat_providers.twa,
    chat_providers.quantum,
    chat_providers.churchless,
    chat_providers.closed,
    chat_providers.closed4
 ]
 async def balance_chat_request(payload: dict) -> dict:
    providers_available = []
    for provider_module in provider_modules:
        if payload['stream'] and not provider_module.STREAMING:
            continue
        if payload['model'] not in provider_module.MODELS:
            continue
        providers_available.append(provider_module)
    provider = random.choice(providers_available)
    return provider.chat_completion(**payload)
 async def balance_organic_request(request: dict) -> dict:
    providers_available = []
    for provider_module in provider_modules:
        if provider_module.ORGANIC:
            providers_available.append(provider_module)
    provider = random.choice(providers_available)
    return provider.organify(request)
 if __name__ == '__main__':
    req = asyncio.run(balance_chat_request(payload={'model': 'gpt-3.5-turbo', 'stream': True}))
    print(req['url'])
--- a/api/main.py
+++ b/api/main.py
@ -9,8 +9,6 @@ from dotenv import load_dotenv
 import core
 import transfer
 from db import users
 load_dotenv()
 app = fastapi.FastAPI()
--- a/api/moderation.py
+++ b/api/moderation.py
@ -0,0 +1,18 @@
 import os
 import asyncio
 import openai as closedai
 from typing import Union
 from dotenv import load_dotenv
 load_dotenv()
 closedai.api_key = os.getenv('LEGIT_CLOSEDAI_KEY')
 async def is_safe(text: Union[str, list]) -> bool:
    return closedai.Moderation.create(
        input=text,
    )['results'][0]['flagged']
 if __name__ == '__main__':
    asyncio.run(is_safe('Hello'))
--- a/api/netclient.py
+++ b/api/netclient.py
@ -1,61 +0,0 @@
 import os
 import aiohttp
 import asyncio
 import aiohttp_socks
 from dotenv import load_dotenv
 import proxies
 from helpers import exceptions
 load_dotenv()
 async def stream(request: dict, demo_mode: bool=False):
    headers = {
        'Content-Type': 'application/json'
    }
    for k, v in request.get('headers', {}).items():
        headers[k] = v
    for _ in range(3):
        async with aiohttp.ClientSession(connector=proxies.default_proxy.connector) as session:
            async with session.get(
                # 'GET',
                'https://checkip.amazonaws.com/'
            ) as response:
                print(response.content)
                print(type(response.content))
                # html = await response.text()
                # print(html)
                    # async with session.get(
                        # method='GET',
                        # url='https://checkip.amazonaws.com',
                        # method=request.get('method', 'POST'),
                        # url=request['url'],
                        # json=request.get('payload', {}),
                        # headers=headers,
                        # timeout=aiohttp.ClientTimeout(total=float(os.getenv('TRANSFER_TIMEOUT', '120'))),
                    # ) as response:
                        # try:
                            # await response.raise_for_status()
                        # except Exception as exc:
                            # if 'Too Many Requests' in str(exc):
                                # continue
                        # else:
                            # break
                async for chunk in response.content.iter_chunks():
                    # chunk = f'{chunk.decode("utf8")}\n\n'
                    if demo_mode:
                        print(chunk)
                    yield chunk
 if __name__ == '__main__':
    asyncio.run(stream({'method': 'GET', 'url': 'https://checkip.amazonaws.com'}, True))
--- a/api/streaming.py
+++ b/api/streaming.py
@ -0,0 +1,107 @@
 import os
 import yaml
 import asyncio
 import aiohttp
 import starlette
 from dotenv import load_dotenv
 import proxies
 import load_balancing
 from db import logs, users, stats
 from rich import print
 from helpers import network
 load_dotenv()
 DEMO_PAYLOAD = {
    'model': 'gpt-3.5-turbo',
    'messages': [
        {
            'role': 'user',
            'content': '1+1='
        }
    ]
 }
 with open('config/credits.yml', encoding='utf8') as f:
    max_credits = yaml.safe_load(f)['max-credits']
 async def stream(
    path: str='/v1/chat/completions',
    user: dict=None,
    payload: dict=None,
    credits_cost: int=0,
    demo_mode: bool=False,
    input_tokens: int=0,
    incoming_request: starlette.requests.Request=None,
 ):
    payload = payload or DEMO_PAYLOAD
    if 'chat/completions' in path: # is a chat endpoint
        target_request = await load_balancing.balance_chat_request(payload)
    else:
        target_request = await load_balancing.balance_organic_request(payload)
    headers = {
        'Content-Type': 'application/json'
    }
    for k, v in target_request.get('headers', {}).items():
        headers[k] = v
    for _ in range(5):
        async with aiohttp.ClientSession(connector=proxies.default_proxy.connector) as session:
            async with session.request(
                method=target_request.get('method', 'POST'),
                url=target_request['url'],
                data=target_request.get('data'),
                json=target_request.get('payload'),
                headers=headers,
                cookies=target_request.get('cookies'),
                ssl=False,
                timeout=aiohttp.ClientTimeout(total=float(os.getenv('TRANSFER_TIMEOUT', '120'))),
            ) as response:
                try:
                    await response.raise_for_status()
                except Exception as exc:
                    if 'Too Many Requests' in str(exc):
                        continue
                else:
                    break
        if user and incoming_request:
            await logs.log_api_request(
                user=user,
                incoming_request=incoming_request,
                target_url=target_request['url']
            )
        if credits_cost and user:
            await users.update_by_id(user['_id'], {
                '$inc': {'credits': -credits_cost}
            })
        if not demo_mode:
            await stats.add_date()
            await stats.add_ip_address(network.get_ip(incoming_request))
            await stats.add_model(payload.get('model', '_non-chat'))
            await stats.add_path(path)
            await stats.add_target(target_request['url'])
            await stats.add_tokens(input_tokens)
        async for chunk in response.content.iter_chunks():
            # chunk = f'{chunk.decode("utf8")}\n\n'
            if demo_mode:
                print(chunk)
            yield chunk
 if __name__ == '__main__':
    asyncio.run(stream())
--- a/api/transfer.py
+++ b/api/transfer.py
@ -2,13 +2,13 @@
 import os
 import json
 import yaml
 import logging
 import starlette
 from dotenv import load_dotenv
-import netclient
+import streaming
 import chat_balancing
 from db import logs, users
 from helpers import tokens, errors, exceptions
@ -24,35 +24,41 @@ logging.basicConfig(
 logging.info('API started')
 with open('config/credits.yml', encoding='utf8') as f:
    credits_config = yaml.safe_load(f)
 async def handle(incoming_request):
    """Transfer a streaming response from the incoming request to the target endpoint"""
    path = incoming_request.url.path
    # METHOD
    if incoming_request.method not in ['GET', 'POST', 'PUT', 'DELETE', 'PATCH']:
        return errors.error(405, f'Method "{incoming_request.method}" is not allowed.', 'Change the request method to the correct one.')
    # PAYLOAD
    try:
        payload = await incoming_request.json()
    except json.decoder.JSONDecodeError:
        payload = {}
    # TOKENS
    try:
        input_tokens = tokens.count_for_messages(payload['messages'])
    except (KeyError, TypeError):
        input_tokens = 0
-    auth_header = incoming_request.headers.get('Authorization')
+    # AUTH
    received_key = incoming_request.headers.get('Authorization')
-    if not auth_header:
+    if not received_key:
        return errors.error(401, 'No NovaAI API key given!', 'Add "Authorization: Bearer nv-..." to your request headers.')
-    received_key = auth_header
+    if received_key.startswith('Bearer '):
        received_key = received_key.split('Bearer ')[1]
-    if auth_header.startswith('Bearer '):
+    # USER
-        received_key = auth_header.split('Bearer ')[1]
+    user = await users.by_api_key(received_key.strip())
    user = await users.by_api_key(received_key)
    if not user:
        return errors.error(401, 'Invalid NovaAI API key!', 'Create a new NovaOSS API key.')
@ -64,31 +70,36 @@ async def handle(incoming_request):
    if not user['status']['active']:
        return errors.error(418, 'Your NovaAI account is not active (paused).', 'Simply re-activate your account using a Discord command or the web panel.')
    # COST
    costs = credits_config['costs']
    cost = costs['other']
    if 'chat/completions' in path:
        for model_name, model_cost in costs['chat-models'].items():
            if model_name in payload['model']:
                cost = model_cost
    role_cost_multiplier = credits_config['bonuses'].get(user['role'], 1)
    cost = round(cost * role_cost_multiplier)
    if user['credits'] < cost:
        return errors.error(429, 'Not enough credits.', 'Wait or earn more credits. Learn more on our website or Discord server.')
    # READY
    payload['user'] = str(user['_id'])
    cost = 1
    if '/chat/completions' in path:
        cost = 5
        if 'gpt-4' in payload['model']:
            cost = 10
    else:
        return errors.error(404, f'Sorry, we don\'t support "{path}" yet. We\'re working on it.', 'Contact our team.')
    if not payload.get('stream') is True:
        payload['stream'] = False
-    if user['credits'] < cost:
+    return starlette.responses.StreamingResponse(
-        return errors.error(429, 'Not enough credits.', 'You do not have enough credits to complete this request.')
+        content=streaming.stream(
-
+            user=user,
-    await users.update_by_id(user['_id'], {'$inc': {'credits': -cost}})
+            path=path,
-
+            payload=payload,
-    target_request = await chat_balancing.balance(payload)
+            credits_cost=cost,
-
+            input_tokens=input_tokens,
-    print(target_request['url'])
+            incoming_request=incoming_request,
-
+        ),
-    return errors.error(500, 'Sorry, the API is currenly under maintainance.', 'Please try again later.')
+        media_type='text/event-stream'
-
+    )
    return starlette.responses.StreamingResponse(netclient.stream(target_request))
--- a/tests/main.py
+++ b/tests/main.py
@ -52,7 +52,7 @@ def test_api(model: str=MODEL, messages: List[dict]=None) -> dict:
    }
    response = httpx.post(
-        url=f'{api_endpoint}/chat/completions',
+        url=f'{api_endpoint}/v1/chat/completions',
        headers=headers,
        json=json_data,
        timeout=20
@ -87,6 +87,7 @@ def test_all():
    print(test_library())
 if __name__ == '__main__':
-    api_endpoint = 'https://api.nova-oss.com'
+    # api_endpoint = 'https://api.nova-oss.com'
    api_endpoint = 'http://localhost:2332'
    api_key = os.getenv('TEST_NOVA_KEY')
    test_all()
		`@ -0,0 +1,2 @@`
							`async def get_ip(request) -> str:`
							`return request.client.host`