Skip to content

Commit

Permalink
add otel load test
Browse files Browse the repository at this point in the history
  • Loading branch information
ishaan-jaff committed Sep 12, 2024
1 parent e7b0472 commit 850b5db
Showing 1 changed file with 108 additions and 0 deletions.
108 changes: 108 additions & 0 deletions tests/load_tests/test_otel_load_test.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,108 @@
import sys

import os

sys.path.insert(0, os.path.abspath("../.."))

import asyncio
import litellm
from litellm._logging import verbose_logger
import logging
import time
import pytest


def test_otel_logging_async():
# this tests time added to make otel logging calls, vs just acompletion calls
try:

os.environ["OTEL_EXPORTER"] = "otlp_http"
os.environ["OTEL_ENDPOINT"] = "http://0.0.0.0:8090/traces"
os.environ["OTEL_HEADERS"] = "Authorization=K0BSwd"

# Make 5 calls with an empty success_callback
litellm.success_callback = []
litellm.callbacks = []
litellm._async_success_callback = []
litellm._async_failure_callback = []
litellm._async_failure_callback = []
litellm.failure_callback = []
start_time_empty_callback = asyncio.run(make_async_calls())
print("done with no callback test")

print("starting otel test")
# Make 5 calls with success_callback set to "otel"
litellm.callbacks = ["otel"]
start_time_otel = asyncio.run(make_async_calls())
print("done with otel test")

# Compare the time for both scenarios
print(f"Time taken with success_callback='otel': {start_time_otel}")
print(f"Time taken with empty success_callback: {start_time_empty_callback}")

# Calculate the percentage difference
percentage_diff = (
abs(start_time_otel - start_time_empty_callback)
/ start_time_empty_callback
* 100
)

# Assert that the difference is not more than 10%
assert (
percentage_diff < 10
), f"Performance difference of {percentage_diff:.2f}% exceeds 10% threshold"

print(f"Performance difference: {percentage_diff:.2f}%")

except litellm.Timeout as e:
pass
except Exception as e:
pytest.fail(f"An exception occurred - {e}")


async def make_async_calls(metadata=None, **completion_kwargs):
total_start_time = asyncio.get_event_loop().time()
tasks = []

async def create_and_run_task():
task = create_async_task(**completion_kwargs)
response = await task
print(f"Response: {response}")

for _ in range(3): # Run for 10 seconds
# Create 100 tasks
tasks = []
for _ in range(100):
tasks.append(asyncio.create_task(create_and_run_task()))

# Wait for any remaining tasks to complete
await asyncio.gather(*tasks)

await asyncio.sleep(1)

# Calculate the total time taken
total_time = asyncio.get_event_loop().time() - total_start_time

return total_time


def create_async_task(**completion_kwargs):
"""
Creates an async task for the litellm.acompletion function.
This is just the task, but it is not run here.
To run the task it must be awaited or used in other asyncio coroutine execution functions like asyncio.gather.
Any kwargs passed to this function will be passed to the litellm.acompletion function.
By default a standard set of arguments are used for the litellm.acompletion function.
"""
completion_args = {
"model": "openai/chatgpt-v-2",
"api_version": "2024-02-01",
"messages": [{"role": "user", "content": "This is a test" * 100}],
"max_tokens": 5,
"temperature": 0.7,
"timeout": 5,
"user": "langfuse_latency_test_user",
"mock_response": "Mock response",
}
completion_args.update(completion_kwargs)
return asyncio.create_task(litellm.acompletion(**completion_args))

0 comments on commit 850b5db

Please sign in to comment.