nova-api/checks/client.py

"""Tests the API."""

import os
import time
import json
import httpx
import openai
import asyncio
import traceback

from rich import print
from typing import List
from dotenv import load_dotenv
from pydantic import BaseModel

# Load environment variables via python-dotenv before any of them are read
# below (CHECKS_ENDPOINT here, NOVA_KEY further down the file).
load_dotenv()

# Chat model name constant. NOTE(review): not referenced by any check in the
# visible part of this file; the checks hard-code their model names.
MODEL = 'gpt-3.5-turbo'

# Prompt shared by the chat completion checks. They assert that the string
# "1337" appears in the model's reply.
MESSAGES = [
    {
        'role': 'user',
        'content': 'Just respond with the number "1337", nothing else.'
    }
]

# Base URL of the API under test, including the "/v1" prefix. Can be
# overridden with the CHECKS_ENDPOINT environment variable.
api_endpoint = os.getenv('CHECKS_ENDPOINT', 'http://localhost:2332/v1')
# Alternative local endpoint, presumably kept for switching manually:
# api_endpoint = 'http://localhost:2333/v1'

async def _response_base_check(response: httpx.Response) -> None:
    """Raise a ``ConnectionError`` if *response* has an HTTP error status.

    Args:
        response: The response returned by one of the check requests.

    Raises:
        ConnectionError: If ``response.raise_for_status()`` raises
            ``httpx.HTTPStatusError``. The message contains the decoded JSON
            body, or the raw body text when the body is not valid JSON. The
            original ``HTTPStatusError`` is chained as the cause.
    """
    try:
        response.raise_for_status()
    except httpx.HTTPStatusError as exc:
        # An error body is not guaranteed to be JSON (e.g. an HTML error
        # page). Decoding it blindly would raise a decode error here and hide
        # the actual HTTP failure, so fall back to the raw text.
        try:
            details = response.json()
        except ValueError:
            details = response.text

        raise ConnectionError(f'API returned an error: {details}') from exc

async def test_server():
    """Ping the API root and return how long the round trip took.

    The root URL is the configured endpoint with "/v1" removed. The server
    must answer with a JSON body whose ``ping`` field equals ``"pong"``.

    Returns:
        Elapsed seconds (``time.perf_counter`` difference) for the check.

    Raises:
        ConnectionError: If the connection cannot be established, or if the
            server answers with an HTTP error status.
        AssertionError: If the ``ping`` field is not ``"pong"``.
    """
    started_at = time.perf_counter()
    root_url = api_endpoint.replace("/v1", "")

    try:
        async with httpx.AsyncClient() as http:
            reply = await http.get(url=root_url, timeout=3)
            await _response_base_check(reply)

        ping_value = reply.json()['ping']
        assert ping_value == 'pong', 'The API did not return a correct response.'
    except httpx.ConnectError as exc:
        raise ConnectionError(f'API is not running on port {api_endpoint}.') from exc

    return time.perf_counter() - started_at

async def test_chat_non_stream_gpt4() -> float:
    """Check a non-streamed chat completion against the ``gpt-4`` model.

    Sends the shared ``MESSAGES`` prompt and expects "1337" somewhere in the
    content of the first choice.

    Returns:
        Elapsed seconds from just before the request until the reply has
        been validated.

    Raises:
        ConnectionError: If the API answers with an HTTP error status.
        AssertionError: If "1337" is missing from the reply.
    """
    payload = dict(model='gpt-4', messages=MESSAGES, stream=False)
    completions_url = f'{api_endpoint}/chat/completions'

    started_at = time.perf_counter()

    async with httpx.AsyncClient() as http:
        reply = await http.post(
            url=completions_url,
            headers=HEADERS,
            json=payload,
            timeout=10,
        )
        await _response_base_check(reply)

    answer = reply.json()['choices'][0]['message']['content']
    assert '1337' in answer, 'The API did not return a correct response.'

    return time.perf_counter() - started_at

def _stream_text_from_sse(body: str) -> str:
    """Concatenate the ``delta.content`` pieces of a streamed chat response.

    Args:
        body: The complete response text, made of events separated by blank
            lines, each carrying a ``data: `` prefixed JSON payload.

    Returns:
        The text assembled from every event up to, but not including, the
        ``[DONE]`` marker. Events without a text delta are skipped.

    Raises:
        json.JSONDecodeError: If a non-empty payload is not valid JSON.
    """
    prefix = 'data: '
    pieces = []

    # Accept CRLF-delimited events as well; raw newlines cannot occur inside
    # a JSON payload, so this only affects the delimiters.
    for event in body.replace('\r\n', '\n').split('\n\n'):
        payload = event.strip()

        # Strip the marker only where it is a prefix, so that a reply whose
        # text happens to contain "data: " is left intact.
        if payload.startswith(prefix):
            payload = payload[len(prefix):].strip()

        if payload == '[DONE]':
            # End of stream: ignore anything that follows.
            break

        if not payload:
            continue

        try:
            content = json.loads(payload)['choices'][0]['delta']['content']
        except (KeyError, IndexError):
            # Events without choices or without a content delta (such as a
            # role-only or finish event) carry no text.
            continue

        if content:
            pieces.append(content)

    return ''.join(pieces)


async def test_chat_stream_gpt3() -> float:
    """Tests the text stream endpoint with the GPT-3.5-Turbo model.

    Sends the shared ``MESSAGES`` prompt with ``stream`` enabled, reassembles
    the streamed text and expects "1337" somewhere in it.

    Returns:
        Elapsed seconds from just before the request until the reply has
        been validated.

    Raises:
        ConnectionError: If the API answers with an HTTP error status.
        AssertionError: If "1337" is missing from the assembled text.
    """

    json_data = {
        'model': 'gpt-3.5-turbo',
        'messages': MESSAGES,
        'stream': True,
    }

    request_start = time.perf_counter()

    async with httpx.AsyncClient() as client:
        response = await client.post(
            url=f'{api_endpoint}/chat/completions',
            headers=HEADERS,
            json=json_data,
            timeout=10,
        )
        await _response_base_check(response)

    # Join the text chunks before parsing so that an event split across two
    # chunks is still decoded as a whole.
    # NOTE(review): as before, the body is iterated after the client context
    # has exited; this relies on client.post() having already read the
    # response - confirm against the httpx documentation.
    body = ''.join([part async for part in response.aiter_text()])
    resulting_text = _stream_text_from_sse(body)

    assert '1337' in resulting_text, 'The API did not return a correct response.'

    return time.perf_counter() - request_start

async def test_image_generation() -> float:
    """Check the image generation endpoint.

    Requests a single 1024x1024 image and expects the first result to carry
    a ``url`` that contains "://".

    Returns:
        Elapsed seconds from just before the request until the reply has
        been validated.

    Raises:
        ConnectionError: If the API answers with an HTTP error status.
        AssertionError: If the returned ``url`` does not contain "://".
    """
    payload = dict(
        prompt='a nice sunset with a samurai standing in the middle',
        n=1,
        size='1024x1024',
    )
    generations_url = f'{api_endpoint}/images/generations'

    started_at = time.perf_counter()

    async with httpx.AsyncClient() as http:
        reply = await http.post(
            url=generations_url,
            headers=HEADERS,
            json=payload,
            timeout=10,
        )
        await _response_base_check(reply)

    image_url = reply.json()['data'][0]['url']
    assert '://' in image_url

    return time.perf_counter() - started_at

class StepByStepAIResponse(BaseModel):
    """Demo response structure for the function calling test.

    The schema of this model is sent as the ``parameters`` of the
    ``get_answer_for_user_query`` function in ``test_function_calling``,
    which then checks that the returned arguments contain a truthy ``title``
    and ``steps``.
    """
    # Title of the answer.
    title: str
    # The answer itself, as a list of strings (one entry per step).
    steps: List[str]

async def test_function_calling():
    """Check that a forced function call returns usable arguments.

    Asks ``gpt-3.5-turbo-0613`` to call ``get_answer_for_user_query``, whose
    parameters follow the ``StepByStepAIResponse`` schema. The decoded
    arguments are printed and must contain a truthy ``title`` and ``steps``.

    Returns:
        Elapsed seconds from just before the request until the reply has
        been validated.

    Raises:
        ConnectionError: If the API answers with an HTTP error status.
        AssertionError: If ``title`` or ``steps`` is missing or empty.
    """
    function_name = 'get_answer_for_user_query'
    function_spec = {
        'name': function_name,
        'description': 'Get user answer in series of steps',
        'parameters': StepByStepAIResponse.schema(),
    }
    payload = {
        'stream': False,
        'model': 'gpt-3.5-turbo-0613',
        'messages': [
            {'role': 'user', 'content': 'Explain how to assemble a PC'},
        ],
        'functions': [function_spec],
        'function_call': {'name': function_name},
    }

    started_at = time.perf_counter()

    async with httpx.AsyncClient() as http:
        reply = await http.post(
            url=f'{api_endpoint}/chat/completions',
            headers=HEADERS,
            json=payload,
            timeout=15,
        )
        await _response_base_check(reply)

    message = reply.json()['choices'][0]['message']
    output = json.loads(message['function_call']['arguments'])
    print(output)

    assert output.get('title') and output.get('steps'), 'The API did not return a correct response.'

    return time.perf_counter() - started_at

async def test_models():
    """Check that the models endpoint lists ``gpt-3.5-turbo``.

    Returns:
        Elapsed seconds from just before the request until the listing has
        been validated.

    Raises:
        ConnectionError: If the API answers with an HTTP error status.
        AssertionError: If ``gpt-3.5-turbo`` is not among the listed ids.
    """
    started_at = time.perf_counter()

    async with httpx.AsyncClient() as http:
        reply = await http.get(
            url=f'{api_endpoint}/models',
            headers=HEADERS,
            timeout=3,
        )
        await _response_base_check(reply)
        listing = reply.json()

    # Collect the id of every listed model.
    model_ids = []
    for entry in listing['data']:
        model_ids.append(entry['id'])

    assert 'gpt-3.5-turbo' in model_ids, 'The model gpt-3.5-turbo is not present in the models endpoint.'

    return time.perf_counter() - started_at

# ==========================================================================================

async def demo():
    """Wait for the API server to come up, then run the chat checks.

    ``test_server`` is polled up to 30 times, one second apart. Connection
    failures during that phase are treated as "not started yet" instead of
    aborting on the first attempt. Once the server answers, the non-streamed
    and streamed chat checks run in order and their timings are printed.

    Any failure is printed with its traceback and the process exits with
    status 500.
    """

    try:
        last_error = None

        for _ in range(30):
            try:
                if await test_server():
                    break
            except (ConnectionError, httpx.TransportError) as exc:
                # test_server raises instead of returning a falsy value, so
                # the failure has to be caught here for the retry to happen.
                last_error = exc

            print('Waiting until API Server is started up...')
            # Non-blocking sleep: time.sleep() would stall the event loop.
            await asyncio.sleep(1)
        else:
            # Chain the last failure so its details still reach the traceback.
            raise ConnectionError('API Server is not running.') from last_error

        for func in [test_chat_non_stream_gpt4, test_chat_stream_gpt3]:
            print(f'[*] {func.__name__}')
            result = await func()
            print(f'[+] {func.__name__} - {result}')

    except Exception as exc:
        print('[red]Error: ' + str(exc))
        traceback.print_exc()
        # Same exit status as before, without relying on the exit() helper
        # that the site module injects.
        raise SystemExit(500)

# Point the openai module at the API under test and authenticate with the
# key from the NOVA_KEY environment variable. os.environ[...] raises KeyError
# when NOVA_KEY is unset, so this module then fails while being loaded.
openai.api_base = api_endpoint
openai.api_key = os.environ['NOVA_KEY']

# Headers sent by every check that passes `headers=HEADERS`. Defined after
# the checks, which works because they only read it when called.
HEADERS = {
    'Content-Type': 'application/json',
    'Authorization': 'Bearer ' + openai.api_key
}

# Run the checks when this file is executed as a script.
if __name__ == '__main__':
    asyncio.run(demo())
git finally works 2023-06-23 02:18:28 +02:00			`"""Tests the API."""`

Works for BetterGPT 2023-07-19 23:51:28 +02:00			`import os`
hopefully final please work 2023-08-20 12:46:20 +02:00			`import time`
Fixed function calling 2023-09-14 18:18:19 +02:00			`import json`
Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00			`import httpx`
			`import openai`
			`import asyncio`
			`import traceback`
git finally works 2023-06-23 02:18:28 +02:00
Small improvements 2023-08-17 16:47:54 +02:00			`from rich import print`
Works for BetterGPT 2023-07-19 23:51:28 +02:00			`from typing import List`
			`from dotenv import load_dotenv`
Fixed function calling 2023-09-14 18:18:19 +02:00			`from pydantic import BaseModel`
Works for BetterGPT 2023-07-19 23:51:28 +02:00
			`load_dotenv()`
git finally works 2023-06-23 02:18:28 +02:00
			`MODEL = 'gpt-3.5-turbo'`
Re-added rate limiting, fixed a bunch of issues 2023-08-17 13:11:35 +02:00
git finally works 2023-06-23 02:18:28 +02:00			`MESSAGES = [`
			`{`
			`'role': 'user',`
Fixed checks 2023-09-14 22:37:29 +02:00			`'content': 'Just respond with the number "1337", nothing else.'`
Added load balancer, MongoDB, improved proxy streaming support, more error messages, entire new world order 2023-08-03 01:46:49 +02:00			`}`
git finally works 2023-06-23 02:18:28 +02:00			`]`
Works for BetterGPT 2023-07-19 23:51:28 +02:00
Resolved some issues 2023-08-24 14:57:36 +02:00			`api_endpoint = os.getenv('CHECKS_ENDPOINT', 'http://localhost:2332/v1')`
Added azure endpoints 2023-10-06 23:05:38 +02:00			`# api_endpoint = 'http://localhost:2333/v1'`
git finally works 2023-06-23 02:18:28 +02:00
Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00			`async def _response_base_check(response: httpx.Response) -> None:`
			`try:`
			`response.raise_for_status()`
			`except httpx.HTTPStatusError as exc:`
			`raise ConnectionError(f'API returned an error: {response.json()}') from exc`

Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00			`async def test_server():`
Works for BetterGPT 2023-07-19 23:51:28 +02:00			`"""Tests if the API server is running."""`
git finally works 2023-06-23 02:18:28 +02:00
			`try:`
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`request_start = time.perf_counter()`
			`async with httpx.AsyncClient() as client:`
			`response = await client.get(`
			`url=f'{api_endpoint.replace("/v1", "")}',`
			`timeout=3`
			`)`
Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00			`await _response_base_check(response)`
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00
			`assert response.json()['ping'] == 'pong', 'The API did not return a correct response.'`
git finally works 2023-06-23 02:18:28 +02:00			`except httpx.ConnectError as exc:`
Works for BetterGPT 2023-07-19 23:51:28 +02:00			`raise ConnectionError(f'API is not running on port {api_endpoint}.') from exc`
git finally works 2023-06-23 02:18:28 +02:00
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`else:`
			`return time.perf_counter() - request_start`

Fixed function calling 2023-09-14 18:18:19 +02:00			`async def test_chat_non_stream_gpt4() -> float:`
			`"""Tests non-streamed chat completions with the GPT-4 model."""`
git finally works 2023-06-23 02:18:28 +02:00
			`json_data = {`
Fixed function calling 2023-09-14 18:18:19 +02:00			`'model': 'gpt-4',`
			`'messages': MESSAGES,`
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`'stream': False`
git finally works 2023-06-23 02:18:28 +02:00			`}`

Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`request_start = time.perf_counter()`

			`async with httpx.AsyncClient() as client:`
			`response = await client.post(`
			`url=f'{api_endpoint}/chat/completions',`
			`headers=HEADERS,`
			`json=json_data,`
			`timeout=10,`
			`)`
Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00			`await _response_base_check(response)`
git finally works 2023-06-23 02:18:28 +02:00
Fixed checks 2023-09-14 22:37:29 +02:00			`assert '1337' in response.json()['choices'][0]['message']['content'], 'The API did not return a correct response.'`
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`return time.perf_counter() - request_start`
git finally works 2023-06-23 02:18:28 +02:00
Fixed function calling 2023-09-14 18:18:19 +02:00			`async def test_chat_stream_gpt3() -> float:`
			`"""Tests the text stream endpoint with the GPT-3.5-Turbo model."""`

			`json_data = {`
			`'model': 'gpt-3.5-turbo',`
			`'messages': MESSAGES,`
			`'stream': True,`
			`}`

			`request_start = time.perf_counter()`

			`async with httpx.AsyncClient() as client:`
			`response = await client.post(`
			`url=f'{api_endpoint}/chat/completions',`
			`headers=HEADERS,`
			`json=json_data,`
			`timeout=10,`
			`)`
Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00			`await _response_base_check(response)`
Fixed function calling 2023-09-14 18:18:19 +02:00
Fixed checks 2023-09-14 22:37:29 +02:00			`chunks = []`
			`resulting_text = ''`

			`async for chunk in response.aiter_text():`
			`for subchunk in chunk.split('\n\n'):`
			`chunk = subchunk.replace('data: ', '').strip()`

			`if chunk == '[DONE]':`
			`break`

			`if chunk:`
			`chunks.append(json.loads(chunk))`

			`try:`
			`resulting_text += json.loads(chunk)['choices'][0]['delta']['content']`
			`except KeyError:`
			`pass`

			`assert '1337' in resulting_text, 'The API did not return a correct response.'`

Fixed function calling 2023-09-14 18:18:19 +02:00			`return time.perf_counter() - request_start`

			`async def test_image_generation() -> float:`
Small moderation timeout improvements, added SDXL check 2023-08-28 13:47:13 +02:00			`"""Tests the image generation endpoint with the SDXL model."""`

			`json_data = {`
			`'prompt': 'a nice sunset with a samurai standing in the middle',`
			`'n': 1,`
			`'size': '1024x1024'`
			`}`
git finally works 2023-06-23 02:18:28 +02:00
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`request_start = time.perf_counter()`
git finally works 2023-06-23 02:18:28 +02:00
Small moderation timeout improvements, added SDXL check 2023-08-28 13:47:13 +02:00			`async with httpx.AsyncClient() as client:`
			`response = await client.post(`
			`url=f'{api_endpoint}/images/generations',`
			`headers=HEADERS,`
			`json=json_data,`
			`timeout=10,`
			`)`
Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00			`await _response_base_check(response)`
Small moderation timeout improvements, added SDXL check 2023-08-28 13:47:13 +02:00
			`assert '://' in response.json()['data'][0]['url']`
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`return time.perf_counter() - request_start`
Removed unused proxy tests and fixed moderation proxy 2023-08-13 00:59:54 +02:00
Fixed function calling 2023-09-14 18:18:19 +02:00			`class StepByStepAIResponse(BaseModel):`
			`"""Demo response structure for the function calling test."""`
			`title: str`
			`steps: List[str]`

			`async def test_function_calling():`
			`"""Tests function calling functionality with newer GPT models."""`

			`json_data = {`
			`'stream': False,`
			`'model': 'gpt-3.5-turbo-0613',`
			`'messages': [`
			`{"role": "user", "content": "Explain how to assemble a PC"}`
			`],`
			`'functions': [`
			`{`
			`'name': 'get_answer_for_user_query',`
			`'description': 'Get user answer in series of steps',`
			`'parameters': StepByStepAIResponse.schema()`
			`}`
			`],`
			`'function_call': {'name': 'get_answer_for_user_query'}`
			`}`

			`request_start = time.perf_counter()`

			`async with httpx.AsyncClient() as client:`
			`response = await client.post(`
			`url=f'{api_endpoint}/chat/completions',`
			`headers=HEADERS,`
			`json=json_data,`
Added key validation by API-key instead of IP Added rate limited keys getting logged in a database 2023-09-23 21:41:48 +02:00			`timeout=15,`
Fixed function calling 2023-09-14 18:18:19 +02:00			`)`
Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00			`await _response_base_check(response)`
Fixed function calling 2023-09-14 18:18:19 +02:00
			`res = response.json()`
			`output = json.loads(res['choices'][0]['message']['function_call']['arguments'])`
			`print(output)`

			`assert output.get('title') and output.get('steps'), 'The API did not return a correct response.'`
			`return time.perf_counter() - request_start`

Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`async def test_models():`
			`"""Tests the models endpoint."""`
git finally works 2023-06-23 02:18:28 +02:00
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`request_start = time.perf_counter()`
			`async with httpx.AsyncClient() as client:`
			`response = await client.get(`
			`url=f'{api_endpoint}/models',`
			`headers=HEADERS,`
			`timeout=3`
			`)`
Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00			`await _response_base_check(response)`
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`res = response.json()`
sleep deprivation caused me to be not productive today 2023-08-06 00:43:36 +02:00
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`all_models = [model['id'] for model in res['data']]`

			`assert 'gpt-3.5-turbo' in all_models, 'The model gpt-3.5-turbo is not present in the models endpoint.'`
			`return time.perf_counter() - request_start`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00
Slight improvements/fixes 2023-08-15 13:55:12 +02:00			`# ==========================================================================================`

Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`async def demo():`
git finally works 2023-06-23 02:18:28 +02:00			`"""Runs all tests."""`
Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00
making tests properly handle exceptions 2023-08-20 13:23:48 +02:00			`try:`
Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00			`for _ in range(30):`
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`if await test_server():`
Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00			`break`
git finally works 2023-06-23 02:18:28 +02:00
Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00			`print('Waiting until API Server is started up...')`
			`time.sleep(1)`
			`else:`
			`raise ConnectionError('API Server is not running.')`
updating tests to add tests back since they were removed for some reason? 2023-08-13 17:16:33 +02:00
Improved errors, checking and fixed ratelimit retrying 2023-10-05 14:17:53 +02:00			`for func in [test_chat_non_stream_gpt4, test_chat_stream_gpt3]:`
			`print(f'[*] {func.__name__}')`
			`result = await func()`
			`print(f'[+] {func.__name__} - {result}')`
Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00
			`except Exception as exc:`
			`print('[red]Error: ' + str(exc))`
			`traceback.print_exc()`
making tests properly handle exceptions 2023-08-20 13:23:48 +02:00			`exit(500)`
some thingies 2023-08-05 02:30:42 +02:00
Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00			`openai.api_base = api_endpoint`
			`openai.api_key = os.environ['NOVA_KEY']`
some thingies 2023-08-05 02:30:42 +02:00
Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00			`HEADERS = {`
			`'Content-Type': 'application/json',`
			`'Authorization': 'Bearer ' + openai.api_key`
			`}`
Added /v1/models and fixed key invalidation 2023-08-09 11:15:49 +02:00
Made code more robust (dotenv) and working on tests 2023-08-21 20:58:05 +02:00			`if __name__ == '__main__':`
Auto-trigger - Production server started 2023-08-23 23:27:09 +02:00			`asyncio.run(demo())`