nova-api/api/streaming.py

import os
import yaml
import json
import asyncio
import aiohttp
import starlette

from rich import print
from dotenv import load_dotenv
from python_socks._errors import ProxyError

import proxies
import load_balancing

from db import logs, users, stats
from helpers import network, chat

load_dotenv()

DEMO_PAYLOAD = {
    'model': 'gpt-3.5-turbo',
    'messages': [
        {
            'role': 'user',
            'content': '1+1='
        }
    ]
}

with open('config/credits.yml', encoding='utf8') as f:
    max_credits = yaml.safe_load(f)['max-credits']

async def stream(
    path: str='/v1/chat/completions',
    user: dict=None,
    payload: dict=None,
    credits_cost: int=0,
    demo_mode: bool=False,
    input_tokens: int=0,
    incoming_request: starlette.requests.Request=None,
):

    payload = payload or DEMO_PAYLOAD
    is_chat = False

    if 'chat/completions' in path:
        is_chat = True
        chat_id = await chat.create_chat_id()
        model = payload['model']

        yield chat.create_chat_chunk(
            chat_id=chat_id,
            model=model,
            content=chat.CompletionStart
        )

        yield chat.create_chat_chunk(
            chat_id=chat_id,
            model=model,
            content=None
        )

    for _ in range(5):
        headers = {
            'Content-Type': 'application/json'
        }

        if is_chat:
            target_request = await load_balancing.balance_chat_request(payload)
        else:
            target_request = await load_balancing.balance_organic_request({
                'path': path,
                'payload': payload,
                'headers': headers
            })

        for k, v in target_request.get('headers', {}).items():
            headers[k] = v

        async with aiohttp.ClientSession(connector=proxies.default_proxy.connector) as session:

            try:
                async with session.request(
                    method=target_request.get('method', 'POST'),
                    url=target_request['url'],

                    data=target_request.get('data'),
                    json=target_request.get('payload'),

                    headers=headers,
                    cookies=target_request.get('cookies'),

                    ssl=False,

                    timeout=aiohttp.ClientTimeout(total=float(os.getenv('TRANSFER_TIMEOUT', '120'))),
                ) as response:

                    try:
                        response.raise_for_status()
                    except Exception as exc:
                        if 'Too Many Requests' in str(exc):
                            print(429)
                            continue

                    if user and incoming_request:
                        await logs.log_api_request(
                            user=user,
                            incoming_request=incoming_request,
                            target_url=target_request['url']
                        )

                    if credits_cost and user:
                        await users.update_by_id(user['_id'], {
                            '$inc': {'credits': -credits_cost}
                        })


                    try:
                        async for chunk in response.content.iter_any():
                            chunk = f'{chunk.decode("utf8")}\n\n'

                            if chunk.strip():
                                if is_chat:
                                    if target_request['module'] == 'twa':
                                        data = json.loads(chunk.split('data: ')[1])

                                        if data.get('text'):
                                            chunk = chat.create_chat_chunk(
                                                chat_id=chat_id,
                                                model=model,
                                                content=['text']
                                            )
                                yield chunk

                    except Exception as exc:
                        if 'Connection closed' in str(exc):
                            print('connection closed')
                            continue

                    if not demo_mode:
                        ip_address = await network.get_ip(incoming_request)

                        await stats.add_date()
                        await stats.add_ip_address(ip_address)
                        await stats.add_path(path)
                        await stats.add_target(target_request['url'])

                        if is_chat:
                            await stats.add_model(model)
                            await stats.add_tokens(input_tokens, model)

                    break

            except ProxyError:
                print('proxy error')
                continue

                print(3)
    if is_chat:
        chat_chunk = chat.create_chat_chunk(
            chat_id=chat_id,
            model=model,
            content=chat.CompletionStop
        )
        data = json.dumps(chat_chunk)

        yield 'data: [DONE]\n\n'

if __name__ == '__main__':
    asyncio.run(stream())
some stuff idfk 2023-08-04 03:30:56 +02:00			`import os`
			`import yaml`
proxies have issues 2023-08-04 17:29:49 +02:00			`import json`
some stuff idfk 2023-08-04 03:30:56 +02:00			`import asyncio`
			`import aiohttp`
			`import starlette`

proxies have issues 2023-08-04 17:29:49 +02:00			`from rich import print`
some stuff idfk 2023-08-04 03:30:56 +02:00			`from dotenv import load_dotenv`
some thingies 2023-08-05 02:30:42 +02:00			`from python_socks._errors import ProxyError`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`import proxies`
			`import load_balancing`

			`from db import logs, users, stats`
proxies have issues 2023-08-04 17:29:49 +02:00			`from helpers import network, chat`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`load_dotenv()`

			`DEMO_PAYLOAD = {`
			`'model': 'gpt-3.5-turbo',`
			`'messages': [`
			`{`
			`'role': 'user',`
			`'content': '1+1='`
			`}`
			`]`
			`}`

			`with open('config/credits.yml', encoding='utf8') as f:`
			`max_credits = yaml.safe_load(f)['max-credits']`

			`async def stream(`
			`path: str='/v1/chat/completions',`
			`user: dict=None,`
			`payload: dict=None,`
			`credits_cost: int=0,`
			`demo_mode: bool=False,`
			`input_tokens: int=0,`
			`incoming_request: starlette.requests.Request=None,`
			`):`
some thingies 2023-08-05 02:30:42 +02:00
some stuff idfk 2023-08-04 03:30:56 +02:00			`payload = payload or DEMO_PAYLOAD`
proxies have issues 2023-08-04 17:29:49 +02:00			`is_chat = False`
some stuff idfk 2023-08-04 03:30:56 +02:00
proxies have issues 2023-08-04 17:29:49 +02:00			`if 'chat/completions' in path:`
			`is_chat = True`
			`chat_id = await chat.create_chat_id()`
			`model = payload['model']`
some stuff idfk 2023-08-04 03:30:56 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`yield chat.create_chat_chunk(`
proxies have issues 2023-08-04 17:29:49 +02:00			`chat_id=chat_id,`
			`model=model,`
			`content=chat.CompletionStart`
			`)`
some stuff idfk 2023-08-04 03:30:56 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`yield chat.create_chat_chunk(`
			`chat_id=chat_id,`
			`model=model,`
			`content=None`
			`)`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`for _ in range(5):`
proxies have issues 2023-08-04 17:29:49 +02:00			`headers = {`
			`'Content-Type': 'application/json'`
			`}`

some thingies 2023-08-05 02:30:42 +02:00			`if is_chat:`
			`target_request = await load_balancing.balance_chat_request(payload)`
			`else:`
			`target_request = await load_balancing.balance_organic_request({`
			`'path': path,`
			`'payload': payload,`
			`'headers': headers`
			`})`

proxies have issues 2023-08-04 17:29:49 +02:00			`for k, v in target_request.get('headers', {}).items():`
			`headers[k] = v`

some thingies 2023-08-05 02:30:42 +02:00			`async with aiohttp.ClientSession(connector=proxies.default_proxy.connector) as session:`

			`try:`
			`async with session.request(`
			`method=target_request.get('method', 'POST'),`
			`url=target_request['url'],`

			`data=target_request.get('data'),`
			`json=target_request.get('payload'),`

			`headers=headers,`
			`cookies=target_request.get('cookies'),`

			`ssl=False,`

			`timeout=aiohttp.ClientTimeout(total=float(os.getenv('TRANSFER_TIMEOUT', '120'))),`
			`) as response:`
some stuff idfk 2023-08-04 03:30:56 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`try:`
			`response.raise_for_status()`
			`except Exception as exc:`
			`if 'Too Many Requests' in str(exc):`
			`print(429)`
			`continue`
some stuff idfk 2023-08-04 03:30:56 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`if user and incoming_request:`
			`await logs.log_api_request(`
			`user=user,`
			`incoming_request=incoming_request,`
			`target_url=target_request['url']`
			`)`
some stuff idfk 2023-08-04 03:30:56 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`if credits_cost and user:`
			`await users.update_by_id(user['_id'], {`
			`'$inc': {'credits': -credits_cost}`
			`})`
some stuff idfk 2023-08-04 03:30:56 +02:00
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`try:`
			`async for chunk in response.content.iter_any():`
			`chunk = f'{chunk.decode("utf8")}\n\n'`
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`if chunk.strip():`
			`if is_chat:`
			`if target_request['module'] == 'twa':`
			`data = json.loads(chunk.split('data: ')[1])`
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`if data.get('text'):`
			`chunk = chat.create_chat_chunk(`
			`chat_id=chat_id,`
			`model=model,`
			`content=['text']`
			`)`
			`yield chunk`
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`except Exception as exc:`
			`if 'Connection closed' in str(exc):`
			`print('connection closed')`
			`continue`
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`if not demo_mode:`
			`ip_address = await network.get_ip(incoming_request)`
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`await stats.add_date()`
			`await stats.add_ip_address(ip_address)`
			`await stats.add_path(path)`
			`await stats.add_target(target_request['url'])`
proxies have issues 2023-08-04 17:29:49 +02:00
			`if is_chat:`
some thingies 2023-08-05 02:30:42 +02:00			`await stats.add_model(model)`
			`await stats.add_tokens(input_tokens, model)`
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`break`
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`except ProxyError:`
			`print('proxy error')`
			`continue`
proxies have issues 2023-08-04 17:29:49 +02:00
some thingies 2023-08-05 02:30:42 +02:00			`print(3)`
proxies have issues 2023-08-04 17:29:49 +02:00			`if is_chat:`
			`chat_chunk = chat.create_chat_chunk(`
			`chat_id=chat_id,`
			`model=model,`
			`content=chat.CompletionStop`
			`)`
			`data = json.dumps(chat_chunk)`

some thingies 2023-08-05 02:30:42 +02:00			`yield 'data: [DONE]\n\n'`
some stuff idfk 2023-08-04 03:30:56 +02:00
			`if __name__ == '__main__':`
			`asyncio.run(stream())`