Spaces:

DesertWolf
/

test3

Paused

App Files Files Community

test3 / tests /test_litellm /test_main.py

DesertWolf

Upload folder using huggingface_hub

447ebeb verified 6 months ago

raw

history blame contribute delete

14.1 kB

	import json
	import os
	import sys

	import httpx
	import pytest
	import respx
	from fastapi.testclient import TestClient

	sys.path.insert(
	0, os.path.abspath("../..")
	) # Puts the directory two levels above the current working directory first on the import path

	import urllib.parse
	from unittest.mock import MagicMock, patch

	import litellm


	@pytest.fixture(autouse=True)
	def add_api_keys_to_env(monkeypatch):
	    """Seed placeholder provider credentials into the environment for every test.

	    All values are fake and are set through ``monkeypatch.setenv``.
	    """
	    fake_credentials = (
	        ("ANTHROPIC_API_KEY", "sk-ant-api03-1234567890"),
	        ("OPENAI_API_KEY", "sk-openai-api03-1234567890"),
	        ("AWS_ACCESS_KEY_ID", "my-fake-aws-access-key-id"),
	        ("AWS_SECRET_ACCESS_KEY", "my-fake-aws-secret-access-key"),
	        ("AWS_REGION", "us-east-1"),
	    )
	    for env_name, env_value in fake_credentials:
	        monkeypatch.setenv(env_name, env_value)


	@pytest.fixture
	def openai_api_response():
	    """Return a dict shaped like an OpenAI chat-completion payload.

	    The single choice holds an assistant message with empty content and no
	    tool calls; the usage section reports 121 prompt and 1 completion tokens.
	    """
	    assistant_message = {
	        "content": "",
	        "refusal": None,
	        "role": "assistant",
	        "audio": None,
	        "function_call": None,
	        "tool_calls": None,
	    }
	    token_usage = {
	        "completion_tokens": 1,
	        "prompt_tokens": 121,
	        "total_tokens": 122,
	        "completion_tokens_details": {
	            "accepted_prediction_tokens": 0,
	            "audio_tokens": 0,
	            "reasoning_tokens": 0,
	            "rejected_prediction_tokens": 0,
	        },
	        "prompt_tokens_details": {"audio_tokens": 0, "cached_tokens": 0},
	    }
	    return {
	        "id": "chatcmpl-B0W3vmiM78Xkgx7kI7dr7PC949DMS",
	        "choices": [
	            {
	                "finish_reason": "stop",
	                "index": 0,
	                "logprobs": None,
	                "message": assistant_message,
	            }
	        ],
	        "created": 1739462947,
	        "model": "gpt-4o-mini-2024-07-18",
	        "object": "chat.completion",
	        "service_tier": "default",
	        "system_fingerprint": "fp_bd83329f63",
	        "usage": token_usage,
	    }


	def test_completion_missing_role(openai_api_response):
	    """Call ``litellm.completion`` with a message that has no ``role`` key.

	    The second message carries only ``content`` and ``tool_calls``. The test
	    passes when the patched OpenAI raw-response ``create`` is invoked exactly
	    once.
	    """
	    from openai import OpenAI

	    from litellm.types.utils import ModelResponse

	    client = OpenAI(api_key="test_api_key")

	    fake_raw = MagicMock()
	    fake_raw.headers = {
	        "x-request-id": "123",
	        "openai-organization": "org-123",
	        "x-ratelimit-limit-requests": "100",
	        "x-ratelimit-remaining-requests": "99",
	    }
	    fake_raw.parse.return_value = ModelResponse(**openai_api_response)

	    print(f"openai_api_response: {openai_api_response}")

	    # (call id, JSON-encoded arguments) for each tool call, in index order.
	    tool_call_specs = [
	        ("call_m0vFJjQmTH1McvaHBPR2YFwY", '{"input": "dksjsdkjdhskdjshdskhjkhlk"}'),
	        ("call_Vw6RaqV2n5aaANXEdp5pYxo2", '{"input": "jkljlkjlkjlkjlk"}'),
	        ("call_hBIKwldUEGlNh6NlSXil62K4", '{"input": "jkjlkjlkjlkj;lj"}'),
	    ]
	    tool_calls = [
	        {
	            "id": call_id,
	            "function": {"arguments": arguments, "name": "tool_name"},
	            "type": "function",
	            "index": position,
	        }
	        for position, (call_id, arguments) in enumerate(tool_call_specs)
	    ]
	    conversation = [
	        {"role": "user", "content": "Hey"},
	        # Deliberately no "role" key on this message.
	        {"content": "", "tool_calls": tool_calls},
	    ]

	    raw_endpoint = client.chat.completions.with_raw_response
	    with patch.object(raw_endpoint, "create", fake_raw) as mock_create:
	        litellm.completion(
	            model="gpt-4o-mini",
	            messages=conversation,
	            client=client,
	        )

	        mock_create.assert_called_once()


	@pytest.mark.parametrize(
	    "model",
	    [
	        "gemini/gemini-1.5-flash",
	        "bedrock/anthropic.claude-3-5-sonnet-20240620-v1:0",
	        "bedrock/invoke/anthropic.claude-3-5-sonnet-20240620-v1:0",
	        "anthropic/claude-3-5-sonnet",
	    ],
	)
	@pytest.mark.parametrize("sync_mode", [True, False])
	@pytest.mark.asyncio
	async def test_url_with_format_param(model, sync_mode, monkeypatch):
	    """Check that an explicit image ``format`` is what gets sent to the provider.

	    The image URL ends in ``.jpg`` but the message declares ``image/png``. The
	    request body captured from the mocked ``post`` must contain ``png`` and
	    must not contain ``jpeg``.
	    """
	    from litellm import acompletion, completion
	    from litellm.llms.custom_httpx.http_handler import AsyncHTTPHandler, HTTPHandler

	    if sync_mode:
	        client = HTTPHandler()
	    else:
	        client = AsyncHTTPHandler()

	    args = {
	        "model": model,
	        "messages": [
	            {
	                "role": "user",
	                "content": [
	                    {
	                        "type": "image_url",
	                        "image_url": {
	                            "url": "https://upload.wikimedia.org/wikipedia/commons/thumb/d/dd/Gfp-wisconsin-madison-the-nature-boardwalk.jpg/2560px-Gfp-wisconsin-madison-the-nature-boardwalk.jpg",
	                            "format": "image/png",
	                        },
	                    },
	                    {"type": "text", "text": "Describe this image"},
	                ],
	            }
	        ],
	    }
	    with patch.object(client, "post", new=MagicMock()) as mock_client:
	        try:
	            if sync_mode:
	                response = completion(**args, client=client)
	            else:
	                response = await acompletion(**args, client=client)
	            print(response)
	        except Exception as e:
	            # Only the outgoing request matters here, so a failure after the
	            # mocked post is tolerated -- but report it (as the sibling tests
	            # do) so an assertion failure below can be diagnosed.
	            print(e)

	        mock_client.assert_called()

	        call_kwargs = mock_client.call_args.kwargs
	        print(call_kwargs)

	        # The body is passed either pre-serialized as "data" or as a "json" object.
	        if "data" in call_kwargs:
	            json_str = call_kwargs["data"]
	        else:
	            json_str = json.dumps(call_kwargs["json"])

	        if isinstance(json_str, bytes):
	            json_str = json_str.decode("utf-8")

	        print(f"type of json_str: {type(json_str)}")
	        assert "png" in json_str
	        assert "jpeg" not in json_str


	@pytest.mark.parametrize("model", ["gpt-4o-mini"])
	@pytest.mark.parametrize("sync_mode", [True, False])
	@pytest.mark.asyncio
	async def test_url_with_format_param_openai(model, sync_mode):
	    """Check that the image ``format`` hint is not forwarded to OpenAI.

	    The keyword arguments captured from the patched raw-response ``create``
	    are serialized to JSON and must not contain the word ``format``.
	    """
	    from openai import AsyncOpenAI, OpenAI

	    from litellm import acompletion, completion

	    client = OpenAI() if sync_mode else AsyncOpenAI()

	    image_part = {
	        "type": "image_url",
	        "image_url": {
	            "url": "https://upload.wikimedia.org/wikipedia/commons/thumb/d/dd/Gfp-wisconsin-madison-the-nature-boardwalk.jpg/2560px-Gfp-wisconsin-madison-the-nature-boardwalk.jpg",
	            "format": "image/png",
	        },
	    }
	    text_part = {"type": "text", "text": "Describe this image"}
	    request_kwargs = {
	        "model": model,
	        "messages": [{"role": "user", "content": [image_part, text_part]}],
	    }

	    raw_endpoint = client.chat.completions.with_raw_response
	    with patch.object(raw_endpoint, "create") as mock_client:
	        try:
	            if sync_mode:
	                response = completion(**request_kwargs, client=client)
	            else:
	                response = await acompletion(**request_kwargs, client=client)
	            print(response)
	        except Exception as e:
	            print(e)

	        mock_client.assert_called()

	        sent_kwargs = mock_client.call_args.kwargs
	        print(sent_kwargs)

	        serialized = json.dumps(sent_kwargs)

	        assert "format" not in serialized


	def test_bedrock_latency_optimized_inference():
	    """Check that ``performanceConfig`` reaches the Bedrock request body.

	    The body passed as ``data`` to the mocked ``post`` is decoded and must
	    carry ``performanceConfig.latency == "optimized"``.
	    """
	    from litellm.llms.custom_httpx.http_handler import HTTPHandler

	    client = HTTPHandler()
	    completion_kwargs = {
	        "model": "bedrock/anthropic.claude-3-5-sonnet-20240620-v1:0",
	        "messages": [{"role": "user", "content": "Hello, how are you?"}],
	        "performanceConfig": {"latency": "optimized"},
	        "client": client,
	    }
	    with patch.object(client, "post") as mock_post:
	        try:
	            litellm.completion(**completion_kwargs)
	        except Exception as e:
	            print(e)

	        mock_post.assert_called_once()
	        sent_body = json.loads(mock_post.call_args.kwargs["data"])
	        assert sent_body["performanceConfig"]["latency"] == "optimized"


	@pytest.fixture(autouse=True)
	def set_openrouter_api_key():
	    """Set a fake ``OPENROUTER_API_KEY`` for each test, then restore the old state.

	    After the test, the variable is reset to its previous value, or removed if
	    it was not set beforehand.
	    """
	    env_name = "OPENROUTER_API_KEY"
	    original_api_key = os.environ.get(env_name)
	    os.environ[env_name] = "fake-key-for-testing"
	    yield
	    if original_api_key is not None:
	        os.environ[env_name] = original_api_key
	    else:
	        # pop() with a default instead of del: the test itself may already
	        # have removed the variable, and teardown must not raise KeyError.
	        os.environ.pop(env_name, None)


	@pytest.mark.asyncio
	async def test_extra_body_with_fallback(
	    respx_mock: respx.MockRouter, set_openrouter_api_key
	):
	    """
	    test regression for https://github.com/BerriAI/litellm/issues/8425.

	    This was perhaps a wider issue with the acompletion function not passing kwargs such as extra_body correctly when fallbacks are specified.
	    """

	    # Set up test parameters
	    model = "openrouter/deepseek/deepseek-chat"
	    messages = [{"role": "user", "content": "Hello, world!"}]
	    extra_body = {
	        "provider": {
	            "order": ["DeepSeek"],
	            "allow_fallbacks": False,
	            "require_parameters": True,
	        }
	    }
	    fallbacks = [{"model": "openrouter/google/gemini-flash-1.5-8b"}]

	    respx_mock.post("https://openrouter.ai/api/v1/chat/completions").respond(
	        json={
	            "id": "chatcmpl-123",
	            "object": "chat.completion",
	            "created": 1677652288,
	            "model": model,
	            "choices": [
	                {
	                    "index": 0,
	                    "message": {
	                        "role": "assistant",
	                        "content": "Hello from mocked response!",
	                    },
	                    "finish_reason": "stop",
	                }
	            ],
	            "usage": {"prompt_tokens": 9, "completion_tokens": 12, "total_tokens": 21},
	        }
	    )

	    # Since this uses respx, the aiohttp transport has to be disabled. The
	    # flag is module-global, so it is overridden only for the duration of the
	    # call and restored afterwards instead of leaking into later tests.
	    with patch.object(litellm, "disable_aiohttp_transport", True):
	        response = await litellm.acompletion(
	            model=model,
	            messages=messages,
	            extra_body=extra_body,
	            fallbacks=fallbacks,
	            api_key="fake-openrouter-api-key",
	        )

	    # Get the request from the mock
	    request: httpx.Request = respx_mock.calls[0].request
	    request_body = json.loads(request.read())

	    # Verify basic parameters
	    assert request_body["model"] == "deepseek/deepseek-chat"
	    assert request_body["messages"] == messages

	    # Verify the extra_body parameters remain under the provider key
	    assert request_body["provider"]["order"] == ["DeepSeek"]
	    assert request_body["provider"]["allow_fallbacks"] is False
	    assert request_body["provider"]["require_parameters"] is True

	    # Verify the response
	    assert response is not None
	    assert response.choices[0].message.content == "Hello from mocked response!"


	@pytest.mark.parametrize("env_base", ["OPENAI_BASE_URL", "OPENAI_API_BASE"])
	@pytest.mark.asyncio
	async def test_openai_env_base(
	    respx_mock: respx.MockRouter, env_base, openai_api_response, monkeypatch
	):
	    """Check that OpenAI base-URL env variables are honored.

	    Runs once per variable name, including the legacy ``OPENAI_API_BASE``. The
	    mocked route is registered only under the configured base URL, and the
	    test asserts that the mocked reply comes back.
	    """
	    # Since this uses respx, the aiohttp transport has to be disabled. Going
	    # through monkeypatch restores the module-global flag after the test
	    # instead of leaking it into later tests.
	    monkeypatch.setattr(litellm, "disable_aiohttp_transport", True)

	    expected_base_url = "http://localhost:12345/v1"

	    # Assign the environment variable based on env_base, and use a fake API key.
	    monkeypatch.setenv(env_base, expected_base_url)
	    monkeypatch.setenv("OPENAI_API_KEY", "fake_openai_api_key")

	    model = "gpt-4o"
	    messages = [{"role": "user", "content": "Hello, how are you?"}]

	    respx_mock.post(f"{expected_base_url}/chat/completions").respond(
	        json={
	            "id": "chatcmpl-123",
	            "object": "chat.completion",
	            "created": 1677652288,
	            "model": model,
	            "choices": [
	                {
	                    "index": 0,
	                    "message": {
	                        "role": "assistant",
	                        "content": "Hello from mocked response!",
	                    },
	                    "finish_reason": "stop",
	                }
	            ],
	            "usage": {"prompt_tokens": 9, "completion_tokens": 12, "total_tokens": 21},
	        }
	    )

	    response = await litellm.acompletion(model=model, messages=messages)

	    # verify we had a response
	    assert response.choices[0].message.content == "Hello from mocked response!"


	def build_database_url(username, password, host, dbname):
	    """Build a ``postgresql://`` URL with percent-encoded credentials and db name.

	    Args:
	        username: Database user; percent-encoded.
	        password: Database password; percent-encoded.
	        host: Host (optionally ``host:port``); inserted unchanged.
	        dbname: Database name; percent-encoded.

	    Returns:
	        A string of the form ``postgresql://user:password@host/dbname``.
	    """
	    # quote(..., safe="") rather than quote_plus: quote_plus turns a space into
	    # "+", which is form encoding. In the userinfo and path parts of a URI a
	    # "+" is a literal plus sign, so a space must become "%20".
	    username_enc = urllib.parse.quote(username, safe="")
	    password_enc = urllib.parse.quote(password, safe="")
	    dbname_enc = urllib.parse.quote(dbname, safe="")
	    return f"postgresql://{username_enc}:{password_enc}@{host}/{dbname_enc}"


	def test_build_database_url():
	    """Check that ``@``, ``:`` and ``/`` in the credentials and db name are percent-encoded."""
	    expected = "postgresql://user%40name:p%40ss%3Aword@localhost/db%2Fname"
	    actual = build_database_url(
	        "user@name",
	        "p@ss:word",
	        "localhost",
	        "db/name",
	    )
	    assert actual == expected


	def test_bedrock_llama():
	    """Check the raw prompt built for a Bedrock-invoke Llama model.

	    A single user message ``"hi"`` must be rendered into the ``prompt`` field
	    of the raw request body using the ``<|...|>`` header tokens asserted below.
	    """
	    litellm._turn_on_debug()
	    from litellm.types.utils import CallTypes
	    from litellm.utils import return_raw_request

	    model = "bedrock/invoke/us.meta.llama4-scout-17b-instruct-v1:0"

	    request = return_raw_request(
	        endpoint=CallTypes.completion,
	        kwargs={
	            "model": model,
	            "messages": [
	                {"role": "user", "content": "hi"},
	            ],
	        },
	    )
	    print(request)

	    # The special tokens are plain "<|...|>". A backslash before each pipe
	    # would be kept literally by Python and the comparison could never match.
	    assert (
	        request["raw_request_body"]["prompt"]
	        == "<|begin_of_text|><|start_header_id|>user<|end_header_id|>\n\nhi<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n"
	    )