Skip to content

Commit

Permalink
fix(anthropic.py): support async claude 3 tool calling + streaming
Browse files Browse the repository at this point in the history
  • Loading branch information
krrishdholakia committed Mar 23, 2024
1 parent 2e284a0 commit 42a7588
Show file tree
Hide file tree
Showing 2 changed files with 80 additions and 3 deletions.
28 changes: 25 additions & 3 deletions litellm/llms/anthropic.py
Original file line number Diff line number Diff line change
Expand Up @@ -301,7 +301,7 @@ def completion(
)
streaming_choice.delta = delta_obj
streaming_model_response.choices = [streaming_choice]
completion_stream = model_response_iterator(
completion_stream = ModelResponseIterator(
model_response=streaming_model_response
)
print_verbose(
Expand Down Expand Up @@ -330,8 +330,30 @@ def completion(
return model_response


def model_response_iterator(model_response):
    """Generator that yields the given ``model_response`` exactly once."""
    # A single-element tuple keeps this a generator with one yield point.
    for single_response in (model_response,):
        yield single_response
class ModelResponseIterator:
    """One-shot iterator over a single, already-built model response.

    Implements both the synchronous (``__iter__`` / ``__next__``) and the
    asynchronous (``__aiter__`` / ``__anext__``) iterator protocols. The
    wrapped response is handed out once; afterwards the iterator is
    exhausted. Both protocols share the same ``is_done`` flag, so consuming
    the response through one protocol also exhausts the other.
    """

    def __init__(self, model_response):
        # ``is_done`` flips to True as soon as the response has been returned.
        self.is_done = False
        self.model_response = model_response

    # Sync iterator
    def __iter__(self):
        return self

    def __next__(self):
        """Return the wrapped response on the first call, then stop."""
        if not self.is_done:
            self.is_done = True
            return self.model_response
        raise StopIteration

    # Async iterator
    def __aiter__(self):
        return self

    async def __anext__(self):
        """Async counterpart of ``__next__``; same one-shot behaviour."""
        if not self.is_done:
            self.is_done = True
            return self.model_response
        raise StopAsyncIteration


def embedding():
Expand Down
55 changes: 55 additions & 0 deletions litellm/tests/test_streaming.py
Original file line number Diff line number Diff line change
Expand Up @@ -2089,3 +2089,58 @@ def test_completion_claude_3_function_call_with_streaming():
# raise Exception("it worked!")
except Exception as e:
pytest.fail(f"Error occurred: {e}")


@pytest.mark.asyncio
async def test_acompletion_claude_3_function_call_with_streaming():
    """Stream an async Claude 3 tool-calling completion and check its chunks.

    Calls ``acompletion`` with ``stream=True`` and a single weather tool,
    then iterates the response with ``async for``:

    * chunk 0 must carry tool-call arguments as a non-None ``str`` and is
      passed to ``validate_first_streaming_function_calling_chunk``;
    * chunk 1 is passed to ``validate_second_streaming_function_calling_chunk``;
    * any later chunk with a ``finish_reason`` is passed to
      ``validate_final_streaming_function_calling_chunk``.

    Any exception, including a failed assertion, is reported through
    ``pytest.fail``.
    """
    litellm.set_verbose = True

    # Tool definition, assembled from the inside out.
    weather_parameters = {
        "type": "object",
        "properties": {
            "location": {
                "type": "string",
                "description": "The city and state, e.g. San Francisco, CA",
            },
            "unit": {"type": "string", "enum": ["celsius", "fahrenheit"]},
        },
        "required": ["location"],
    }
    weather_function = {
        "name": "get_current_weather",
        "description": "Get the current weather in a given location",
        "parameters": weather_parameters,
    }
    tools = [{"type": "function", "function": weather_function}]
    messages = [{"role": "user", "content": "What's the weather like in Boston today?"}]

    try:
        # No max_tokens is passed on purpose: test without max tokens.
        response = await acompletion(
            model="claude-3-opus-20240229",
            messages=messages,
            tools=tools,
            tool_choice="auto",
            stream=True,
        )
        print(f"response: {response}")

        chunk_index = 0
        async for chunk in response:
            if chunk_index == 0:
                first_arguments = (
                    chunk.choices[0].delta.tool_calls[0].function.arguments
                )
                assert first_arguments is not None
                assert isinstance(first_arguments, str)
                validate_first_streaming_function_calling_chunk(chunk=chunk)
            elif chunk_index == 1:
                validate_second_streaming_function_calling_chunk(chunk=chunk)
            elif chunk.choices[0].finish_reason is not None:  # last chunk
                validate_final_streaming_function_calling_chunk(chunk=chunk)
            chunk_index += 1
    except Exception as e:
        pytest.fail(f"Error occurred: {e}")

0 comments on commit 42a7588

Please sign in to comment.