Added more documentation

This commit is contained in:
nsde 2023-08-12 17:49:31 +02:00
parent 23d463fad8
commit a7bd57c5a8
14 changed files with 136 additions and 55 deletions

3
.gitignore vendored
View file

@ -1,8 +1,5 @@
last_update.txt last_update.txt
!api/providers/__main__.py
!api/providers/helpers/utils.py
*.log.json *.log.json
/logs /logs
/log /log

View file

@ -63,14 +63,3 @@ async def create_user(incoming_request: fastapi.Request):
await new_user_webhook(user) await new_user_webhook(user)
return user return user
if __name__ == '__main__':
# new_user_webhook({
# '_id': 'JUST_A_TEST_IGNORE_ME',
# 'auth': {
# 'discord': 123,
# 'github': 'abc'
# }
# })
pass

View file

@ -12,12 +12,16 @@ class CompletionStop:
"""End of a chat""" """End of a chat"""
async def create_chat_id() -> str: async def create_chat_id() -> str:
"""Generates a random chat ID"""
chars = string.ascii_letters + string.digits chars = string.ascii_letters + string.digits
chat_id = ''.join(random.choices(chars, k=32)) chat_id = ''.join(random.choices(chars, k=32))
return f'chatcmpl-{chat_id}' return f'chatcmpl-{chat_id}'
async def create_chat_chunk(chat_id: str, model: str, content=None) -> dict: async def create_chat_chunk(chat_id: str, model: str, content=None) -> dict:
"""Creates a new chat chunk"""
content = content or {} content = content or {}
delta = {} delta = {}

View file

@ -2,6 +2,8 @@ import json
import starlette import starlette
async def error(code: int, message: str, tip: str) -> starlette.responses.Response: async def error(code: int, message: str, tip: str) -> starlette.responses.Response:
"""Returns a starlette response JSON with the given error code, message and tip."""
info = {'error': { info = {'error': {
'code': code, 'code': code,
'message': message, 'message': message,
@ -13,6 +15,8 @@ async def error(code: int, message: str, tip: str) -> starlette.responses.Respon
return starlette.responses.Response(status_code=code, content=json.dumps(info)) return starlette.responses.Response(status_code=code, content=json.dumps(info))
async def yield_error(code: int, message: str, tip: str) -> str: async def yield_error(code: int, message: str, tip: str) -> str:
"""Returns a dumped JSON response with the given error code, message and tip."""
return json.dumps({ return json.dumps({
'code': code, 'code': code,
'message': message, 'message': message,

View file

@ -1,2 +0,0 @@
class Retry(Exception):
"""The server should retry the request."""

View file

@ -2,6 +2,8 @@ import base64
import asyncio import asyncio
async def get_ip(request) -> str: async def get_ip(request) -> str:
"""Get the IP address of the incoming request."""
xff = None xff = None
if request.headers.get('x-forwarded-for'): if request.headers.get('x-forwarded-for'):
xff, *_ = request.headers['x-forwarded-for'].split(', ') xff, *_ = request.headers['x-forwarded-for'].split(', ')
@ -17,6 +19,8 @@ async def get_ip(request) -> str:
return detected_ip return detected_ip
async def add_proxy_auth_to_headers(username: str, password: str, headers: dict) -> dict: async def add_proxy_auth_to_headers(username: str, password: str, headers: dict) -> dict:
"""Add proxy authentication to the headers. This is useful if the proxy authentication doesn't work as it should."""
proxy_auth = base64.b64encode(f'{username}:{password}'.encode()).decode() proxy_auth = base64.b64encode(f'{username}:{password}'.encode()).decode()
headers['Proxy-Authorization'] = f'Basic {proxy_auth}' headers['Proxy-Authorization'] = f'Basic {proxy_auth}'
return headers return headers

View file

@ -25,13 +25,13 @@ async def count_for_messages(messages: list, model: str='gpt-3.5-turbo-0613') ->
tokens_per_name = -1 # if there's a name, the role is omitted tokens_per_name = -1 # if there's a name, the role is omitted
elif 'gpt-3.5-turbo' in model: elif 'gpt-3.5-turbo' in model:
return num_tokens_from_messages(messages, model='gpt-3.5-turbo-0613') return count_for_messages(messages, model='gpt-3.5-turbo-0613')
elif 'gpt-4' in model: elif 'gpt-4' in model:
return num_tokens_from_messages(messages, model='gpt-4-0613') return count_for_messages(messages, model='gpt-4-0613')
else: else:
raise NotImplementedError(f"""num_tokens_from_messages() is not implemented for model {model}. raise NotImplementedError(f"""count_for_messages() is not implemented for model {model}.
See https://github.com/openai/openai-python/blob/main/chatml.md See https://github.com/openai/openai-python/blob/main/chatml.md
for information on how messages are converted to tokens.""") for information on how messages are converted to tokens.""")

View file

@ -10,7 +10,8 @@ async def _get_module_name(module) -> str:
return name return name
async def balance_chat_request(payload: dict) -> dict: async def balance_chat_request(payload: dict) -> dict:
"""Load balance the chat completion request between chat providers.""" """Load balance the chat completion request between chat providers.
"""
providers_available = [] providers_available = []
@ -35,7 +36,9 @@ async def balance_chat_request(payload: dict) -> dict:
return target return target
async def balance_organic_request(request: dict) -> dict: async def balance_organic_request(request: dict) -> dict:
"""Load balnace to non-chat completion request between other "organic" providers which respond in the desired format already.""" """Load balnace to non-chat completion request between other "organic" providers which respond in the desired format already.
Organic providers are used for non-chat completions, such as moderation and other paths.
"""
providers_available = [] providers_available = []

View file

@ -1,3 +1,5 @@
"""This module contains functions for checking if a message violates the moderation policy."""
import asyncio import asyncio
import aiohttp import aiohttp
@ -5,7 +7,16 @@ import proxies
import provider_auth import provider_auth
import load_balancing import load_balancing
async def is_policy_violated(inp) -> bool: from typing import Union
async def is_policy_violated(inp: Union[str, list]) -> bool:
"""Check if a message violates the moderation policy.
You can either pass a list of messages consisting of dicts with "role" and "content", as used in the API parameter,
or just a simple string.
Returns True if the message violates the policy, False otherwise.
"""
text = inp text = inp
if isinstance(inp, list): if isinstance(inp, list):

View file

@ -1,6 +1,14 @@
"""This module contains functions for authenticating with providers."""
import asyncio import asyncio
async def invalidate_key(provider_and_key): async def invalidate_key(provider_and_key: str) -> none:
"""Invalidates a key stored in the secret/ folder by storing it in the associated .invalid.txt file.
The schmea in which <provider_and_key> should be passed is:
<provider_name><key>, e.g.
closed4>sk-...
"""
if not provider_and_key: if not provider_and_key:
return return

View file

@ -12,8 +12,14 @@ from dotenv import load_dotenv
load_dotenv() load_dotenv()
USE_PROXY_LIST = os.getenv('USE_PROXY_LIST', 'False').lower() == 'true'
class Proxy: class Proxy:
"""Represents a proxy. The type can be either http, https, socks4 or socks5.""" """Represents a proxy. The type can be either http, https, socks4 or socks5.
You can also pass a url, which will be parsed into the other attributes.
URL format:
[type]://[username:password@]host:port
"""
def __init__(self, def __init__(self,
url: str=None, url: str=None,
@ -36,7 +42,7 @@ class Proxy:
self.proxy_type = proxy_type self.proxy_type = proxy_type
self.host_or_ip = host_or_ip self.host_or_ip = host_or_ip
self.ip_address = socket.gethostbyname(self.host_or_ip) #if host_or_ip.replace('.', '').isdigit() else host_or_ip self.ip_address = socket.gethostbyname(self.host_or_ip) # get ip address from host
self.host = self.host_or_ip self.host = self.host_or_ip
self.port = port self.port = port
self.username = username self.username = username
@ -54,6 +60,8 @@ class Proxy:
@property @property
def connector(self): def connector(self):
"""Returns an aiohttp_socks.ProxyConnector object. Which can be used in aiohttp.ClientSession."""
proxy_types = { proxy_types = {
'http': aiohttp_socks.ProxyType.HTTP, 'http': aiohttp_socks.ProxyType.HTTP,
'https': aiohttp_socks.ProxyType.HTTP, 'https': aiohttp_socks.ProxyType.HTTP,
@ -65,11 +73,13 @@ class Proxy:
proxy_type=proxy_types[self.proxy_type], proxy_type=proxy_types[self.proxy_type],
host=self.ip_address, host=self.ip_address,
port=self.port, port=self.port,
rdns=False, rdns=False, # remote DNS
username=self.username, username=self.username,
password=self.password password=self.password
) )
# load proxies from files
proxies_in_files = [] proxies_in_files = []
try: try:
@ -84,27 +94,19 @@ try:
except FileNotFoundError: except FileNotFoundError:
pass pass
class ProxyChain: # Proxy lists support
class ProxyLists:
def __init__(self): def __init__(self):
random_proxy = random.choice(proxies_in_files) random_proxy = random.choice(proxies_in_files)
self.get_random = Proxy(url=random_proxy) self.get_random = Proxy(url=random_proxy)
self.connector = aiohttp_socks.ChainProxyConnector.from_urls(proxies_in_files) self.connector = aiohttp_socks.ChainProxyConnector.from_urls(proxies_in_files)
try: # ================================================================================================================================ #
default_chain = ProxyChain()
random_proxy = ProxyChain().get_random
except IndexError:
pass
default_proxy = Proxy(
proxy_type=os.getenv('PROXY_TYPE', 'http'),
host_or_ip=os.getenv('PROXY_HOST', '127.0.0.1'),
port=int(os.getenv('PROXY_PORT', '8080')),
username=os.getenv('PROXY_USER'),
password=os.getenv('PROXY_PASS')
)
# Proxy tests
# Can be useful if you want to troubleshoot your proxies
def test_httpx_workaround(): def test_httpx_workaround():
import httpx import httpx
@ -153,6 +155,22 @@ async def text_httpx_socks():
res = await client.get('https://checkip.amazonaws.com') res = await client.get('https://checkip.amazonaws.com')
return res.text return res.text
# ================================================================================================================================ #
def get_proxy() -> Proxy:
"""Returns a Proxy object. The proxy is either from the proxy list or from the environment variables.
"""
if USE_PROXY_LIST:
return ProxyLists().get_random
return Proxy(
proxy_type=os.getenv('PROXY_TYPE', 'http'),
host_or_ip=os.getenv('PROXY_HOST', '127.0.0.1'),
port=int(os.getenv('PROXY_PORT', '8080')),
username=os.getenv('PROXY_USER'),
password=os.getenv('PROXY_PASS')
)
if __name__ == '__main__': if __name__ == '__main__':
# print(test_httpx()) # print(test_httpx())
# print(test_requests()) # print(test_requests())

View file

@ -1,3 +1,5 @@
"""This module contains the streaming logic for the API."""
import os import os
import json import json
import dhooks import dhooks
@ -33,7 +35,6 @@ async def stream(
user: dict=None, user: dict=None,
payload: dict=None, payload: dict=None,
credits_cost: int=0, credits_cost: int=0,
demo_mode: bool=False,
input_tokens: int=0, input_tokens: int=0,
incoming_request: starlette.requests.Request=None, incoming_request: starlette.requests.Request=None,
): ):
@ -44,6 +45,7 @@ async def stream(
is_chat = True is_chat = True
model = payload['model'] model = payload['model']
# Chat completions always have the same beginning
if is_chat and is_stream: if is_chat and is_stream:
chat_id = await chat.create_chat_id() chat_id = await chat.create_chat_id()
@ -66,15 +68,22 @@ async def stream(
'error': 'No JSON response could be received' 'error': 'No JSON response could be received'
} }
# Try to get a response from the API
for _ in range(5): for _ in range(5):
headers = { headers = {
'Content-Type': 'application/json' 'Content-Type': 'application/json'
} }
# Load balancing
# If the request is a chat completion, then we need to load balance between chat providers
# If the request is an organic request, then we need to load balance between organic providers
try: try:
if is_chat: if is_chat:
target_request = await load_balancing.balance_chat_request(payload) target_request = await load_balancing.balance_chat_request(payload)
else: else:
# "organic" means that it's not using a reverse engineered front-end, but rather ClosedAI's API directly
# churchless.tech is an example of an organic provider, because it redirects the request to ClosedAI.
target_request = await load_balancing.balance_organic_request({ target_request = await load_balancing.balance_organic_request({
'method': incoming_request.method, 'method': incoming_request.method,
'path': path, 'path': path,
@ -83,9 +92,10 @@ async def stream(
'cookies': incoming_request.cookies 'cookies': incoming_request.cookies
}) })
except ValueError as exc: except ValueError as exc:
# Error load balancing? Send a webhook to the admins
webhook = dhooks.Webhook(os.getenv('DISCORD_WEBHOOK__API_ISSUE')) webhook = dhooks.Webhook(os.getenv('DISCORD_WEBHOOK__API_ISSUE'))
webhook.send(content=f'API Issue: **`{exc}`**\nhttps://i.imgflip.com/7uv122.jpg') webhook.send(content=f'API Issue: **`{exc}`**\nhttps://i.imgflip.com/7uv122.jpg')
error = await errors.yield_error( error = await errors.yield_error(
500, 500,
'Sorry, the API has no working keys anymore.', 'Sorry, the API has no working keys anymore.',
@ -100,7 +110,9 @@ async def stream(
if target_request['method'] == 'GET' and not payload: if target_request['method'] == 'GET' and not payload:
target_request['payload'] = None target_request['payload'] = None
async with aiohttp.ClientSession(connector=proxies.default_proxy.connector) as session: # We haven't done any requests as of right now, everything until now was just preparation
# Here, we process the request
async with aiohttp.ClientSession(connector=proxies.get_proxy().connector) as session:
try: try:
async with session.request( async with session.request(
method=target_request.get('method', 'POST'), method=target_request.get('method', 'POST'),
@ -116,9 +128,11 @@ async def stream(
timeout=aiohttp.ClientTimeout(total=float(os.getenv('TRANSFER_TIMEOUT', '120'))), timeout=aiohttp.ClientTimeout(total=float(os.getenv('TRANSFER_TIMEOUT', '120'))),
) as response: ) as response:
# if the answer is JSON
if response.content_type == 'application/json': if response.content_type == 'application/json':
data = await response.json() data = await response.json()
# Invalidate the key if it's not working
if data.get('code') == 'invalid_api_key': if data.get('code') == 'invalid_api_key':
await provider_auth.invalidate_key(target_request.get('provider_auth')) await provider_auth.invalidate_key(target_request.get('provider_auth'))
continue continue
@ -126,37 +140,40 @@ async def stream(
if response.ok: if response.ok:
json_response = data json_response = data
# if the answer is a stream
if is_stream: if is_stream:
try: try:
response.raise_for_status() response.raise_for_status()
except Exception as exc: except Exception as exc:
# Rate limit? Balance again
if 'Too Many Requests' in str(exc): if 'Too Many Requests' in str(exc):
continue continue
try: try:
# process the response chunks
async for chunk in response.content.iter_any(): async for chunk in response.content.iter_any():
send = False send = False
chunk = f'{chunk.decode("utf8")}\n\n' chunk = f'{chunk.decode("utf8")}\n\n'
chunk = chunk.replace(os.getenv('MAGIC_WORD', 'novaOSScheckKeyword'), payload['model'])
chunk = chunk.replace(os.getenv('MAGIC_USER_WORD', 'novaOSSuserKeyword'), str(user['_id']))
if is_chat and '{' in chunk: if is_chat and '{' in chunk:
# parse the JSON
data = json.loads(chunk.split('data: ')[1]) data = json.loads(chunk.split('data: ')[1])
chunk = chunk.replace(data['id'], chat_id) chunk = chunk.replace(data['id'], chat_id)
send = True send = True
# create a custom chunk if we're using specific providers
if target_request['module'] == 'twa' and data.get('text'): if target_request['module'] == 'twa' and data.get('text'):
chunk = await chat.create_chat_chunk( chunk = await chat.create_chat_chunk(
chat_id=chat_id, chat_id=chat_id,
model=model, model=model,
content=['text'] content=['text']
) )
if not data['choices'][0]['delta']:
send = False # don't send empty/unnecessary messages
if (not data['choices'][0]['delta']) or data['choices'][0]['delta'] == {'role': 'assistant'}:
if data['choices'][0]['delta'] == {'role': 'assistant'}:
send = False send = False
# send the chunk
if send and chunk.strip(): if send and chunk.strip():
final_chunk = chunk.strip().replace('data: [DONE]', '') + '\n\n' final_chunk = chunk.strip().replace('data: [DONE]', '') + '\n\n'
yield final_chunk yield final_chunk
@ -174,9 +191,10 @@ async def stream(
break break
except ProxyError as exc: except ProxyError as exc:
print('proxy error') print('[!] Proxy error:', exc)
continue continue
# Chat completions always have the same ending
if is_chat and is_stream: if is_chat and is_stream:
chunk = await chat.create_chat_chunk( chunk = await chat.create_chat_chunk(
chat_id=chat_id, chat_id=chat_id,
@ -186,10 +204,11 @@ async def stream(
yield chunk yield chunk
yield 'data: [DONE]\n\n' yield 'data: [DONE]\n\n'
# If the response is JSON, then we need to yield it like this
if not is_stream and json_response: if not is_stream and json_response:
yield json.dumps(json_response) yield json.dumps(json_response)
# DONE ========================================================= # DONE WITH REQUEST, NOW LOGGING ETC.
if user and incoming_request: if user and incoming_request:
await logs.log_api_request( await logs.log_api_request(

View file

@ -1,4 +1,4 @@
"""Module for transferring requests to ClosedAI API""" """Does quite a few checks and prepares the incoming request for the target endpoint, so it can be streamed"""
import json import json
import yaml import yaml

View file

@ -36,6 +36,9 @@ Set up a MongoDB database and set `MONGO_URI` to the MongoDB database connection
- `PROXY_USER` (optional) - `PROXY_USER` (optional)
- `PROXY_PASS` (optional) - `PROXY_PASS` (optional)
Want to use a proxy list? See the according section!
Keep in mind to set `USE_PROXY_LIST` to `True`! Otherwise, the proxy list won't be used.
### `ACTUAL_IPS` (optional) ### `ACTUAL_IPS` (optional)
This is a security measure to make sure a proxy, VPN, Tor or any other IP hiding service is used by the host when accessing "Closed"AI's API. This is a security measure to make sure a proxy, VPN, Tor or any other IP hiding service is used by the host when accessing "Closed"AI's API.
It is a space separated list of IP addresses that are allowed to access the API. It is a space separated list of IP addresses that are allowed to access the API.
@ -49,13 +52,36 @@ You can also just add the *beginning* of an API address, like `12.123.` (without
`CORE_API_KEY` specifies the **very secret key** for which need to access the entire user database etc. `CORE_API_KEY` specifies the **very secret key** for which need to access the entire user database etc.
`TEST_NOVA_KEY` is the API key the which is used in tests. It should be one with tons of credits. `TEST_NOVA_KEY` is the API key the which is used in tests. It should be one with tons of credits.
## Webhooks ### Webhooks
`DISCORD_WEBHOOK__USER_CREATED` is the Discord webhook URL for when a user is created. `DISCORD_WEBHOOK__USER_CREATED` is the Discord webhook URL for when a user is created.
`DISCORD_WEBHOOK__API_ISSUE` is the Discord webhook URL for when an API issue occurs. `DISCORD_WEBHOOK__API_ISSUE` is the Discord webhook URL for when an API issue occurs.
## Other ### Other
`KEYGEN_INFIX` can be almost any string (avoid spaces or special characters) - this string will be put in the middle of every NovaAI API key which is generated. This is useful for identifying the source of the key using e.g. RegEx. `KEYGEN_INFIX` can be almost any string (avoid spaces or special characters) - this string will be put in the middle of every NovaAI API key which is generated. This is useful for identifying the source of the key using e.g. RegEx.
## Proxy Lists
To use proxy lists, navigate to `api/secret/proxies/` and create the following files:
- `http.txt`
- `socks4.txt`
- `socks5.txt`
Then, paste your proxies in the following format:
```
[username:password@]host:port
```
e.g.
```
1.2.3.4:8080
user:pass@127.0.0.1:1337
```
You can use comments just like in Python.
**Important:** to use the proxy lists, you need to change the `USE_PROXY_LIST` environment variable to `True`!
## Run ## Run
> **Warning:** read the according section for production usage! > **Warning:** read the according section for production usage!