From b3035d7e031ceb27982f204d7f6bb58a790659e1 Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Tue, 17 Dec 2024 09:14:10 +0000 Subject: [PATCH 01/22] feat: Add Fireworks provider integration - Add FireworksProvider class implementing InstrumentedProvider - Support both synchronous and asynchronous completions - Handle streaming responses - Implement OpenAI-compatible interface Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 213 +++++++++++++++++++++++++++ 1 file changed, 213 insertions(+) create mode 100644 agentops/llms/providers/fireworks.py diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py new file mode 100644 index 00000000..e94ad265 --- /dev/null +++ b/agentops/llms/providers/fireworks.py @@ -0,0 +1,213 @@ +import inspect +import pprint +from typing import Optional + +from agentops.llms.providers.instrumented_provider import InstrumentedProvider +from agentops.time_travel import fetch_completion_override_from_time_travel_cache +from agentops.event import ActionEvent, ErrorEvent, LLMEvent +from agentops.session import Session +from agentops.log_config import logger +from agentops.helpers import check_call_stack_for_agent_id, get_ISO_time +from agentops.singleton import singleton + + +@singleton +class FireworksProvider(InstrumentedProvider): + original_create = None + original_create_async = None + + def __init__(self, client): + super().__init__(client) + self._provider_name = "Fireworks" + + def handle_response(self, response, kwargs, init_timestamp, session: Optional[Session] = None) -> dict: + """Handle responses for Fireworks API (OpenAI-compatible interface)""" + from fireworks.client import AsyncStream, Stream + from fireworks.types.chat import ChatCompletionChunk + + llm_event = LLMEvent(init_timestamp=init_timestamp, params=kwargs) + if session is not None: + llm_event.session_id = session.session_id + + def handle_stream_chunk(chunk: ChatCompletionChunk): + # NOTE: prompt/completion usage not returned in response when streaming + # We take the first ChatCompletionChunk and accumulate the deltas from all subsequent chunks + if llm_event.returns == None: + llm_event.returns = chunk + + try: + accumulated_delta = llm_event.returns.choices[0].delta + llm_event.agent_id = check_call_stack_for_agent_id() + llm_event.model = chunk.model + llm_event.prompt = kwargs["messages"] + + # NOTE: We assume for completion only choices[0] is relevant + choice = chunk.choices[0] + + if choice.delta.content: + accumulated_delta.content += choice.delta.content + + if choice.delta.role: + accumulated_delta.role = choice.delta.role + + if choice.delta.tool_calls: + accumulated_delta.tool_calls = choice.delta.tool_calls + + if choice.delta.function_call: + accumulated_delta.function_call = choice.delta.function_call + + if choice.finish_reason: + # Streaming is done. Record LLMEvent + llm_event.returns.choices[0].finish_reason = choice.finish_reason + llm_event.completion = { + "role": accumulated_delta.role, + "content": accumulated_delta.content, + "function_call": accumulated_delta.function_call, + "tool_calls": accumulated_delta.tool_calls, + } + llm_event.end_timestamp = get_ISO_time() + + self._safe_record(session, llm_event) + except Exception as e: + self._safe_record(session, ErrorEvent(trigger_event=llm_event, exception=e)) + + kwargs_str = pprint.pformat(kwargs) + chunk = pprint.pformat(chunk) + logger.warning( + f"Unable to parse a chunk for LLM call. 
Skipping upload to AgentOps\n" + f"chunk:\n {chunk}\n" + f"kwargs:\n {kwargs_str}\n" + ) + + # if the response is a generator, decorate the generator + if isinstance(response, Stream): + def generator(): + for chunk in response: + handle_stream_chunk(chunk) + yield chunk + return generator() + + # For asynchronous AsyncStream + elif isinstance(response, AsyncStream): + async def async_generator(): + async for chunk in response: + handle_stream_chunk(chunk) + yield chunk + return async_generator() + + # v1.0.0+ responses are objects + try: + llm_event.returns = response + llm_event.agent_id = check_call_stack_for_agent_id() + llm_event.prompt = kwargs["messages"] + llm_event.prompt_tokens = response.usage.prompt_tokens + llm_event.completion = response.choices[0].message.model_dump() + llm_event.completion_tokens = response.usage.completion_tokens + llm_event.model = response.model + + self._safe_record(session, llm_event) + except Exception as e: + self._safe_record(session, ErrorEvent(trigger_event=llm_event, exception=e)) + + kwargs_str = pprint.pformat(kwargs) + response = pprint.pformat(response) + logger.warning( + f"Unable to parse response for LLM call. Skipping upload to AgentOps\n" + f"response:\n {response}\n" + f"kwargs:\n {kwargs_str}\n" + ) + + return response + + def override(self): + self._override_fireworks_completion() + self._override_fireworks_async_completion() + + + def _override_fireworks_completion(self): + from fireworks.resources.chat import completions + from fireworks.types.chat import ChatCompletion, ChatCompletionChunk + + # Store the original method + self.original_create = completions.Completions.create + + def patched_function(*args, **kwargs): + init_timestamp = get_ISO_time() + session = kwargs.get("session", None) + if "session" in kwargs.keys(): + del kwargs["session"] + + completion_override = fetch_completion_override_from_time_travel_cache(kwargs) + if completion_override: + result_model = None + pydantic_models = (ChatCompletion, ChatCompletionChunk) + for pydantic_model in pydantic_models: + try: + result_model = pydantic_model.model_validate_json(completion_override) + break + except Exception as e: + pass + + if result_model is None: + logger.error( + f"Time Travel: Pydantic validation failed for {pydantic_models} \n" + f"Time Travel: Completion override was:\n" + f"{pprint.pformat(completion_override)}" + ) + return None + return self.handle_response(result_model, kwargs, init_timestamp, session=session) + + # Call the original function with its original arguments + result = self.original_create(*args, **kwargs) + return self.handle_response(result, kwargs, init_timestamp, session=session) + + # Override the original method with the patched one + completions.Completions.create = patched_function + + def _override_fireworks_async_completion(self): + from fireworks.resources.chat import completions + from fireworks.types.chat import ChatCompletion, ChatCompletionChunk + + # Store the original method + self.original_create_async = completions.AsyncCompletions.create + + async def patched_function(*args, **kwargs): + init_timestamp = get_ISO_time() + + session = kwargs.get("session", None) + if "session" in kwargs.keys(): + del kwargs["session"] + + completion_override = fetch_completion_override_from_time_travel_cache(kwargs) + if completion_override: + result_model = None + pydantic_models = (ChatCompletion, ChatCompletionChunk) + for pydantic_model in pydantic_models: + try: + result_model = pydantic_model.model_validate_json(completion_override) 
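+                        # use the first pydantic model that successfully parses the
+                        # cached completion; on failure, fall through and try the next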
+ break + except Exception as e: + pass + + if result_model is None: + logger.error( + f"Time Travel: Pydantic validation failed for {pydantic_models} \n" + f"Time Travel: Completion override was:\n" + f"{pprint.pformat(completion_override)}" + ) + return None + return self.handle_response(result_model, kwargs, init_timestamp, session=session) + + # Call the original function with its original arguments + result = await self.original_create_async(*args, **kwargs) + return self.handle_response(result, kwargs, init_timestamp, session=session) + + # Override the original method with the patched one + completions.AsyncCompletions.create = patched_function + + def undo_override(self): + if self.original_create is not None and self.original_create_async is not None: + from fireworks.resources.chat import completions + + completions.AsyncCompletions.create = self.original_create_async + completions.Completions.create = self.original_create From 84e44b3c1c6501c326a17937d6addaa242ec40d6 Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Tue, 17 Dec 2024 09:14:58 +0000 Subject: [PATCH 02/22] docs: Add Fireworks integration documentation - Add installation instructions for Fireworks SDK - Add environment variable setup guide - Include synchronous and asynchronous usage examples - Add streaming examples - Follow existing documentation structure Co-Authored-By: Alex Reibman --- docs/v1/integrations/fireworks.mdx | 174 +++++++++++++++++++++++++++++ 1 file changed, 174 insertions(+) create mode 100644 docs/v1/integrations/fireworks.mdx diff --git a/docs/v1/integrations/fireworks.mdx b/docs/v1/integrations/fireworks.mdx new file mode 100644 index 00000000..46ffcea6 --- /dev/null +++ b/docs/v1/integrations/fireworks.mdx @@ -0,0 +1,174 @@ +--- +title: Fireworks +description: "AgentOps provides support for Fireworks AI's LLM models" +--- + +import CodeTooltip from '/snippets/add-code-tooltip.mdx' +import EnvTooltip from '/snippets/add-env-tooltip.mdx' + + + First class support for Fireworks AI models including Llama-v3 + + + + + + ```bash pip + pip install agentops + ``` + ```bash poetry + poetry add agentops + ``` + + + + + ```bash pip + pip install --upgrade fireworks-ai + ``` + ```bash poetry + poetry add fireworks-ai + ``` + + + + + + ```python python + import agentops + from fireworks.client import Fireworks + + agentops.init() + client = Fireworks() + ... + # End of program (e.g. main.py) + agentops.end_session("Success") + ``` + + + + ```python .env + AGENTOPS_API_KEY= + FIREWORKS_API_KEY= + ``` + + Read more about environment variables in [Advanced Configuration](/v1/usage/advanced-configuration) + + + Execute your program and visit [app.agentops.ai/drilldown](https://app.agentops.ai/drilldown) to observe your Agent! 🕵️ + + After your run, AgentOps prints a clickable url to console linking directly to your session in the Dashboard + +
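+
+If a run fails, you can also close the session with a failure state. Below is a minimal sketch (it assumes the standard AgentOps end states and a generic `try`/`except`; adapt the error handling to your program):
+
+```python python
+import agentops
+
+agentops.init()
+try:
+    ...  # your agent logic here
+    agentops.end_session("Success")
+except Exception as e:
+    # record the failure and the reason so the session shows up as failed
+    agentops.end_session("Fail", end_state_reason=str(e))
+```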
+ + + + + + +## Full Examples + + + ```python sync + from fireworks.client import Fireworks + import agentops + + agentops.init() + client = Fireworks() + + response = client.chat.completions.create( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", + messages=[{ + "role": "user", + "content": "Write a haiku about AI and humans working together" + }] + ) + + print(response.choices[0].message.content) + agentops.end_session('Success') + ``` + + ```python async + from fireworks.client import AsyncFireworks + import agentops + import asyncio + + async def main(): + agentops.init() + client = AsyncFireworks() + + response = await client.chat.completions.create( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", + messages=[{ + "role": "user", + "content": "Write a haiku about AI and humans working together" + }] + ) + + print(response.choices[0].message.content) + agentops.end_session('Success') + + asyncio.run(main()) + ``` + + + +### Streaming examples + + + ```python sync + from fireworks.client import Fireworks + import agentops + + agentops.init() + client = Fireworks() + + stream = client.chat.completions.create( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", + stream=True, + messages=[{ + "role": "user", + "content": "Write a haiku about AI and humans working together" + }], + ) + + for chunk in stream: + print(chunk.choices[0].delta.content or "", end="") + + agentops.end_session('Success') + ``` + + ```python async + from fireworks.client import AsyncFireworks + import agentops + import asyncio + + async def main(): + agentops.init() + client = AsyncFireworks() + + stream = await client.chat.completions.create( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", + stream=True, + messages=[{ + "role": "user", + "content": "Write a haiku about AI and humans working together" + }], + ) + + + async for chunk in stream: + print(chunk.choices[0].delta.content or "", end="") + + agentops.end_session('Success') + + asyncio.run(main()) + ``` + + + + + + + + From e82293349d5fcfa5ff24afb65c1d5455ffc2ae57 Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Tue, 17 Dec 2024 09:18:37 +0000 Subject: [PATCH 03/22] feat: Add Fireworks example notebook - Add script to generate Jupyter notebook - Add example notebook with basic and streaming completions - Include environment variable setup - Add documentation and explanatory markdown cells Co-Authored-By: Alex Reibman --- .../fireworks_examples/create_notebook.py | 134 +++++++++++ .../fireworks_example.ipynb | 219 ++++++++++++++++++ 2 files changed, 353 insertions(+) create mode 100644 examples/fireworks_examples/create_notebook.py create mode 100644 examples/fireworks_examples/fireworks_example.ipynb diff --git a/examples/fireworks_examples/create_notebook.py b/examples/fireworks_examples/create_notebook.py new file mode 100644 index 00000000..917add0d --- /dev/null +++ b/examples/fireworks_examples/create_notebook.py @@ -0,0 +1,134 @@ +import nbformat as nbf +import os + +nb = nbf.v4.new_notebook() + +# Create cells +cells = [ + nbf.v4.new_markdown_cell( + "# Fireworks Example\n\n" + "We are going to create a simple chatbot that creates stories based on a prompt. " + "The chatbot will use the Llama-v3 LLM to generate the story using a user prompt.\n\n" + "We will track the chatbot with AgentOps and see how it performs!" 
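+        # note: the adjacent string literals above concatenate into one markdown source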
+ ), + + nbf.v4.new_markdown_cell("First let's install the required packages"), + + nbf.v4.new_code_cell( + "%pip install -U fireworks-ai\n" + "%pip install -U agentops" + ), + + nbf.v4.new_markdown_cell("Then import them"), + + nbf.v4.new_code_cell( + "from fireworks.client import Fireworks\n" + "import agentops\n" + "import os\n" + "from dotenv import load_dotenv" + ), + + nbf.v4.new_markdown_cell( + "Next, we'll grab our API keys. You can use dotenv like below or " + "however else you like to load environment variables" + ), + + nbf.v4.new_code_cell( + 'load_dotenv()\n' + 'FIREWORKS_API_KEY = os.getenv("FIREWORKS_API_KEY") or ""\n' + 'AGENTOPS_API_KEY = os.getenv("AGENTOPS_API_KEY") or ""' + ), + + nbf.v4.new_markdown_cell("Next we initialize the AgentOps client."), + + nbf.v4.new_code_cell( + 'agentops.init(AGENTOPS_API_KEY, default_tags=["fireworks-example"])' + ), + + nbf.v4.new_markdown_cell( + "And we are all set! Note the session url above. We will use it to track the chatbot.\n\n" + "Let's create a simple chatbot that generates stories." + ), + + nbf.v4.new_code_cell( + 'client = Fireworks(api_key=FIREWORKS_API_KEY)\n\n' + 'system_prompt = """\n' + 'You are a master storyteller, with the ability to create vivid and engaging stories.\n' + 'You have experience in writing for children and adults alike.\n' + 'You are given a prompt and you need to generate a story based on the prompt.\n' + '"""\n\n' + 'user_prompt = "Write a story about a cyber-warrior trapped in the imperial time period."\n\n' + 'messages = [\n' + ' {"role": "system", "content": system_prompt},\n' + ' {"role": "user", "content": user_prompt},\n' + ']' + ), + + nbf.v4.new_code_cell( + 'response = client.chat.completions.create(\n' + ' model="accounts/fireworks/models/llama-v3p1-8b-instruct",\n' + ' messages=messages,\n' + ')\n\n' + 'print(response.choices[0].message.content)' + ), + + nbf.v4.new_markdown_cell( + "The response is a string that contains the story. We can track this with AgentOps " + "by navigating to the session url and viewing the run.\n\n" + "## Streaming Version\n" + "We will demonstrate the streaming version of the API." + ), + + nbf.v4.new_code_cell( + 'stream = client.chat.completions.create(\n' + ' model="accounts/fireworks/models/llama-v3p1-8b-instruct",\n' + ' messages=messages,\n' + ' stream=True,\n' + ')\n\n' + 'for chunk in stream:\n' + ' print(chunk.choices[0].delta.content or "", end="")' + ), + + nbf.v4.new_markdown_cell( + "Note that the response is a generator that yields chunks of the story. " + "We can track this with AgentOps by navigating to the session url and viewing the run." + ), + + nbf.v4.new_code_cell( + 'agentops.end_session(end_state="Success", ' + 'end_state_reason="The story was generated successfully.")' + ), + + nbf.v4.new_markdown_cell( + "We end the session with a success state and a success reason. This is useful if you " + "want to track the success or failure of the chatbot. In that case you can set the " + "end state to failure and provide a reason. By default the session will have an " + "indeterminate end state.\n\n" + "All done!" 
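+        # final markdown cell; nb.cells is assembled from this list below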
+ ) +] + +nb.cells = cells + +# Set the notebook metadata +nb.metadata = { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": {"name": "ipython", "version": 3}, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.12" + } +} + +# Write the notebook +notebook_path = os.path.join(os.path.dirname(__file__), 'fireworks_example.ipynb') +with open(notebook_path, 'w') as f: + nbf.write(nb, f) diff --git a/examples/fireworks_examples/fireworks_example.ipynb b/examples/fireworks_examples/fireworks_example.ipynb new file mode 100644 index 00000000..c86a4200 --- /dev/null +++ b/examples/fireworks_examples/fireworks_example.ipynb @@ -0,0 +1,219 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "a457cd46", + "metadata": {}, + "source": [ + "# Fireworks Example\n", + "\n", + "We are going to create a simple chatbot that creates stories based on a prompt. The chatbot will use the Llama-v3 LLM to generate the story using a user prompt.\n", + "\n", + "We will track the chatbot with AgentOps and see how it performs!" + ] + }, + { + "cell_type": "markdown", + "id": "d141e480", + "metadata": {}, + "source": [ + "First let's install the required packages" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "6b9c710d", + "metadata": {}, + "outputs": [], + "source": [ + "%pip install -U fireworks-ai\n", + "%pip install -U agentops" + ] + }, + { + "cell_type": "markdown", + "id": "e50b6b9a", + "metadata": {}, + "source": [ + "Then import them" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f90efbc2", + "metadata": {}, + "outputs": [], + "source": [ + "from fireworks.client import Fireworks\n", + "import agentops\n", + "import os\n", + "from dotenv import load_dotenv" + ] + }, + { + "cell_type": "markdown", + "id": "8d757106", + "metadata": {}, + "source": [ + "Next, we'll grab our API keys. You can use dotenv like below or however else you like to load environment variables" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f0419fba", + "metadata": {}, + "outputs": [], + "source": [ + "load_dotenv()\n", + "FIREWORKS_API_KEY = os.getenv(\"FIREWORKS_API_KEY\") or \"\"\n", + "AGENTOPS_API_KEY = os.getenv(\"AGENTOPS_API_KEY\") or \"\"" + ] + }, + { + "cell_type": "markdown", + "id": "86e7d80f", + "metadata": {}, + "source": [ + "Next we initialize the AgentOps client." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1e60243e", + "metadata": {}, + "outputs": [], + "source": [ + "agentops.init(AGENTOPS_API_KEY, default_tags=[\"fireworks-example\"])" + ] + }, + { + "cell_type": "markdown", + "id": "bec3691a", + "metadata": {}, + "source": [ + "And we are all set! Note the session url above. We will use it to track the chatbot.\n", + "\n", + "Let's create a simple chatbot that generates stories." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a9692a44", + "metadata": {}, + "outputs": [], + "source": [ + "client = Fireworks(api_key=FIREWORKS_API_KEY)\n", + "\n", + "system_prompt = \"\"\"\n", + "You are a master storyteller, with the ability to create vivid and engaging stories.\n", + "You have experience in writing for children and adults alike.\n", + "You are given a prompt and you need to generate a story based on the prompt.\n", + "\"\"\"\n", + "\n", + "user_prompt = \"Write a story about a cyber-warrior trapped in the imperial time period.\"\n", + "\n", + "messages = [\n", + " {\"role\": \"system\", \"content\": system_prompt},\n", + " {\"role\": \"user\", \"content\": user_prompt},\n", + "]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0ad5b6ef", + "metadata": {}, + "outputs": [], + "source": [ + "response = client.chat.completions.create(\n", + " model=\"accounts/fireworks/models/llama-v3p1-8b-instruct\",\n", + " messages=messages,\n", + ")\n", + "\n", + "print(response.choices[0].message.content)" + ] + }, + { + "cell_type": "markdown", + "id": "6e59e2ef", + "metadata": {}, + "source": [ + "The response is a string that contains the story. We can track this with AgentOps by navigating to the session url and viewing the run.\n", + "\n", + "## Streaming Version\n", + "We will demonstrate the streaming version of the API." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "58f5478f", + "metadata": {}, + "outputs": [], + "source": [ + "stream = client.chat.completions.create(\n", + " model=\"accounts/fireworks/models/llama-v3p1-8b-instruct\",\n", + " messages=messages,\n", + " stream=True,\n", + ")\n", + "\n", + "for chunk in stream:\n", + " print(chunk.choices[0].delta.content or \"\", end=\"\")" + ] + }, + { + "cell_type": "markdown", + "id": "6c074e3b", + "metadata": {}, + "source": [ + "Note that the response is a generator that yields chunks of the story. We can track this with AgentOps by navigating to the session url and viewing the run." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9ad8a05e", + "metadata": {}, + "outputs": [], + "source": [ + "agentops.end_session(end_state=\"Success\", end_state_reason=\"The story was generated successfully.\")" + ] + }, + { + "cell_type": "markdown", + "id": "e245ec0c", + "metadata": {}, + "source": [ + "We end the session with a success state and a success reason. This is useful if you want to track the success or failure of the chatbot. In that case you can set the end state to failure and provide a reason. By default the session will have an indeterminate end state.\n", + "\n", + "All done!" 
+ ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} From 58fee496120565685793b878d267c8f775e264e2 Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 02:42:32 +0000 Subject: [PATCH 04/22] fix: Update Fireworks provider to handle streaming responses and fix event tracking Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 336 ++++++++---------- .../fireworks_examples/fireworks_example.py | 117 ++++++ 2 files changed, 269 insertions(+), 184 deletions(-) create mode 100644 examples/fireworks_examples/fireworks_example.py diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index e94ad265..c5ad31ec 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -1,213 +1,181 @@ -import inspect +import logging +from typing import Optional, AsyncGenerator import pprint -from typing import Optional - -from agentops.llms.providers.instrumented_provider import InstrumentedProvider -from agentops.time_travel import fetch_completion_override_from_time_travel_cache -from agentops.event import ActionEvent, ErrorEvent, LLMEvent from agentops.session import Session -from agentops.log_config import logger -from agentops.helpers import check_call_stack_for_agent_id, get_ISO_time -from agentops.singleton import singleton +from agentops.helpers import get_ISO_time +from agentops.event import LLMEvent +from agentops.enums import EventType +from .instrumented_provider import InstrumentedProvider +logger = logging.getLogger(__name__) -@singleton class FireworksProvider(InstrumentedProvider): - original_create = None - original_create_async = None + """Provider for Fireworks.ai API.""" def __init__(self, client): super().__init__(client) self._provider_name = "Fireworks" + self._original_completion = None + self._original_async_completion = None + self._session = None # Initialize session attribute + logger.info(f"Initializing {self._provider_name} provider") - def handle_response(self, response, kwargs, init_timestamp, session: Optional[Session] = None) -> dict: - """Handle responses for Fireworks API (OpenAI-compatible interface)""" - from fireworks.client import AsyncStream, Stream - from fireworks.types.chat import ChatCompletionChunk - - llm_event = LLMEvent(init_timestamp=init_timestamp, params=kwargs) - if session is not None: - llm_event.session_id = session.session_id + def set_session(self, session: Session): + """Set the session for event tracking.""" + self._session = session + logger.debug(f"Set session {session.session_id} for {self._provider_name} provider") - def handle_stream_chunk(chunk: ChatCompletionChunk): - # NOTE: prompt/completion usage not returned in response when streaming - # We take the first ChatCompletionChunk and accumulate the deltas from all subsequent chunks - if llm_event.returns == None: - llm_event.returns = chunk + def handle_response(self, response, kwargs, init_timestamp, session: Optional[Session] = None) -> dict: + """Handle the response from the Fireworks API.""" + if session: + self._session = session + logger.debug(f"Updated session to 
{session.session_id} for {self._provider_name} provider") - try: - accumulated_delta = llm_event.returns.choices[0].delta - llm_event.agent_id = check_call_stack_for_agent_id() - llm_event.model = chunk.model - llm_event.prompt = kwargs["messages"] - - # NOTE: We assume for completion only choices[0] is relevant - choice = chunk.choices[0] - - if choice.delta.content: - accumulated_delta.content += choice.delta.content - - if choice.delta.role: - accumulated_delta.role = choice.delta.role - - if choice.delta.tool_calls: - accumulated_delta.tool_calls = choice.delta.tool_calls - - if choice.delta.function_call: - accumulated_delta.function_call = choice.delta.function_call - - if choice.finish_reason: - # Streaming is done. Record LLMEvent - llm_event.returns.choices[0].finish_reason = choice.finish_reason - llm_event.completion = { - "role": accumulated_delta.role, - "content": accumulated_delta.content, - "function_call": accumulated_delta.function_call, - "tool_calls": accumulated_delta.tool_calls, - } - llm_event.end_timestamp = get_ISO_time() - - self._safe_record(session, llm_event) - except Exception as e: - self._safe_record(session, ErrorEvent(trigger_event=llm_event, exception=e)) - - kwargs_str = pprint.pformat(kwargs) - chunk = pprint.pformat(chunk) - logger.warning( - f"Unable to parse a chunk for LLM call. Skipping upload to AgentOps\n" - f"chunk:\n {chunk}\n" - f"kwargs:\n {kwargs_str}\n" + try: + # Handle streaming response + if kwargs.get('stream', False): + async def async_generator(stream): + async for chunk in stream: + try: + # Parse the chunk data + if hasattr(chunk, 'choices') and chunk.choices: + content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, 'content') else None + else: + # Handle raw string chunks from streaming response + content = chunk + + if content: + # Create event data for streaming chunk + event = LLMEvent( + event_type=EventType.LLM.value, + init_timestamp=init_timestamp, + end_timestamp=get_ISO_time(), + model=kwargs.get('model', 'unknown'), + prompt=str(kwargs.get('messages', [])), + completion="[Streaming Response]", + prompt_tokens=0, + completion_tokens=0, + cost=0.0 + ) + if self._session: + self._session.record(event) + logger.debug(f"Recorded streaming chunk for session {self._session.session_id}") + yield content + except Exception as e: + logger.error(f"Error processing streaming chunk: {str(e)}") + continue + + def generator(stream): + for chunk in stream: + try: + # Parse the chunk data + if hasattr(chunk, 'choices') and chunk.choices: + content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, 'content') else None + else: + # Handle raw string chunks from streaming response + content = chunk + + if content: + # Create event data for streaming chunk + event = LLMEvent( + event_type=EventType.LLM.value, + init_timestamp=init_timestamp, + end_timestamp=get_ISO_time(), + model=kwargs.get('model', 'unknown'), + prompt=str(kwargs.get('messages', [])), + completion="[Streaming Response]", + prompt_tokens=0, + completion_tokens=0, + cost=0.0 + ) + if self._session: + self._session.record(event) + logger.debug(f"Recorded streaming chunk for session {self._session.session_id}") + yield content + except Exception as e: + logger.error(f"Error processing streaming chunk: {str(e)}") + continue + + if hasattr(response, '__aiter__'): + return async_generator(response) + else: + return generator(response) + + # Handle non-streaming response + if hasattr(response, 'choices') and response.choices: + content = 
response.choices[0].message.content if hasattr(response.choices[0], 'message') else "" + + # Create event data for non-streaming response + event = LLMEvent( + event_type=EventType.LLM.value, + init_timestamp=init_timestamp, + end_timestamp=get_ISO_time(), + model=kwargs.get('model', 'unknown'), + prompt=str(kwargs.get('messages', [])), + completion=content, + prompt_tokens=0, + completion_tokens=0, + cost=0.0 ) + if self._session: + self._session.record(event) + logger.debug(f"Recorded non-streaming response for session {self._session.session_id}") + + return response - # if the response is a generator, decorate the generator - if isinstance(response, Stream): - def generator(): - for chunk in response: - handle_stream_chunk(chunk) - yield chunk - return generator() - - # For asynchronous AsyncStream - elif isinstance(response, AsyncStream): - async def async_generator(): - async for chunk in response: - handle_stream_chunk(chunk) - yield chunk - return async_generator() - - # v1.0.0+ responses are objects - try: - llm_event.returns = response - llm_event.agent_id = check_call_stack_for_agent_id() - llm_event.prompt = kwargs["messages"] - llm_event.prompt_tokens = response.usage.prompt_tokens - llm_event.completion = response.choices[0].message.model_dump() - llm_event.completion_tokens = response.usage.completion_tokens - llm_event.model = response.model - - self._safe_record(session, llm_event) except Exception as e: - self._safe_record(session, ErrorEvent(trigger_event=llm_event, exception=e)) + logger.error(f"Error handling Fireworks response: {str(e)}") + raise - kwargs_str = pprint.pformat(kwargs) - response = pprint.pformat(response) - logger.warning( - f"Unable to parse response for LLM call. Skipping upload to AgentOps\n" - f"response:\n {response}\n" - f"kwargs:\n {kwargs_str}\n" - ) + def override(self): + """Override Fireworks API methods with instrumented versions.""" + logger.info(f"Overriding {self._provider_name} provider methods") - return response + # Store original methods + self._original_completion = self.client.chat.completions.create + self._original_async_completion = getattr(self.client.chat.completions, 'acreate', None) - def override(self): + # Override methods self._override_fireworks_completion() - self._override_fireworks_async_completion() - + if self._original_async_completion: + self._override_fireworks_async_completion() def _override_fireworks_completion(self): - from fireworks.resources.chat import completions - from fireworks.types.chat import ChatCompletion, ChatCompletionChunk - - # Store the original method - self.original_create = completions.Completions.create + """Override synchronous completion method.""" + original_create = self._original_completion + provider = self def patched_function(*args, **kwargs): - init_timestamp = get_ISO_time() - session = kwargs.get("session", None) - if "session" in kwargs.keys(): - del kwargs["session"] - - completion_override = fetch_completion_override_from_time_travel_cache(kwargs) - if completion_override: - result_model = None - pydantic_models = (ChatCompletion, ChatCompletionChunk) - for pydantic_model in pydantic_models: - try: - result_model = pydantic_model.model_validate_json(completion_override) - break - except Exception as e: - pass - - if result_model is None: - logger.error( - f"Time Travel: Pydantic validation failed for {pydantic_models} \n" - f"Time Travel: Completion override was:\n" - f"{pprint.pformat(completion_override)}" - ) - return None - return self.handle_response(result_model, kwargs, 
init_timestamp, session=session) - - # Call the original function with its original arguments - result = self.original_create(*args, **kwargs) - return self.handle_response(result, kwargs, init_timestamp, session=session) - - # Override the original method with the patched one - completions.Completions.create = patched_function + try: + init_timestamp = get_ISO_time() + response = original_create(*args, **kwargs) + return provider.handle_response(response, kwargs, init_timestamp, provider._session) + except Exception as e: + logger.error(f"Error in Fireworks completion: {str(e)}") + raise - def _override_fireworks_async_completion(self): - from fireworks.resources.chat import completions - from fireworks.types.chat import ChatCompletion, ChatCompletionChunk + self.client.chat.completions.create = patched_function - # Store the original method - self.original_create_async = completions.AsyncCompletions.create + def _override_fireworks_async_completion(self): + """Override asynchronous completion method.""" + original_acreate = self._original_async_completion + provider = self async def patched_function(*args, **kwargs): - init_timestamp = get_ISO_time() - - session = kwargs.get("session", None) - if "session" in kwargs.keys(): - del kwargs["session"] - - completion_override = fetch_completion_override_from_time_travel_cache(kwargs) - if completion_override: - result_model = None - pydantic_models = (ChatCompletion, ChatCompletionChunk) - for pydantic_model in pydantic_models: - try: - result_model = pydantic_model.model_validate_json(completion_override) - break - except Exception as e: - pass - - if result_model is None: - logger.error( - f"Time Travel: Pydantic validation failed for {pydantic_models} \n" - f"Time Travel: Completion override was:\n" - f"{pprint.pformat(completion_override)}" - ) - return None - return self.handle_response(result_model, kwargs, init_timestamp, session=session) - - # Call the original function with its original arguments - result = await self.original_create_async(*args, **kwargs) - return self.handle_response(result, kwargs, init_timestamp, session=session) - - # Override the original method with the patched one - completions.AsyncCompletions.create = patched_function + try: + init_timestamp = get_ISO_time() + response = await original_acreate(*args, **kwargs) + return provider.handle_response(response, kwargs, init_timestamp, provider._session) + except Exception as e: + logger.error(f"Error in Fireworks async completion: {str(e)}") + raise - def undo_override(self): - if self.original_create is not None and self.original_create_async is not None: - from fireworks.resources.chat import completions + self.client.chat.completions.acreate = patched_function - completions.AsyncCompletions.create = self.original_create_async - completions.Completions.create = self.original_create + def undo_override(self): + """Restore original Fireworks API methods.""" + logger.info(f"Restoring original {self._provider_name} provider methods") + if self._original_completion: + self.client.chat.completions.create = self._original_completion + if self._original_async_completion: + self.client.chat.completions.acreate = self._original_async_completion diff --git a/examples/fireworks_examples/fireworks_example.py b/examples/fireworks_examples/fireworks_example.py new file mode 100644 index 00000000..37916ecd --- /dev/null +++ b/examples/fireworks_examples/fireworks_example.py @@ -0,0 +1,117 @@ +#!/usr/bin/env python +# coding: utf-8 + +import os +import logging +from 
fireworks.client import Fireworks +import agentops +from agentops.enums import EndState +from agentops.llms.providers.fireworks import FireworksProvider +from dotenv import load_dotenv + +# Set up logging +logging.basicConfig( + level=logging.DEBUG, # Change to DEBUG to see more detailed output + format='%(asctime)s - %(name)s - %(levelname)s - %(message)s', + handlers=[logging.StreamHandler()] +) +logger = logging.getLogger(__name__) + +# Load environment variables +load_dotenv() +FIREWORKS_API_KEY = os.getenv("FIREWORKS_API_KEY") + +if not FIREWORKS_API_KEY: + raise ValueError("FIREWORKS_API_KEY environment variable is not set") + +try: + # Initialize AgentOps in development mode + print("Initializing AgentOps in development mode...") + session = agentops.init(api_key=None) + print(f"AgentOps initialized. Session URL: {session.session_url}") + + # Initialize Fireworks client + print("Initializing Fireworks client...") + client = Fireworks(api_key=FIREWORKS_API_KEY) + print("Fireworks client initialized.") + + # Initialize and register Fireworks provider + print("Registering Fireworks provider...") + provider = FireworksProvider(client) + provider.set_session(session) # Set the session before overriding + provider.override() + print("Fireworks provider registered.") + + # Set up messages for story generation + messages = [ + {"role": "system", "content": "You are a creative storyteller."}, + {"role": "user", "content": "Write a short story about a cyber-warrior trapped in the imperial era."} + ] + + # Test non-streaming completion + print("Generating story with Fireworks LLM...") + response = client.chat.completions.create( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", + messages=messages + ) + print("\nLLM Response:") + print(response.choices[0].message.content) + print("\nEvent tracking details:") + print(f"Session URL: {session.session_url}") + print("Check the AgentOps dashboard to see the tracked LLM event.") + + # Test streaming completion + print("\nGenerating story with streaming enabled...") + stream = client.chat.completions.create( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", + messages=messages, + stream=True + ) + + print("\nStreaming LLM Response:") + for chunk in stream: + try: + if hasattr(chunk, 'choices') and chunk.choices and hasattr(chunk.choices[0].delta, 'content'): + content = chunk.choices[0].delta.content + else: + content = chunk + if content: + print(content, end="", flush=True) + except Exception as e: + logger.error(f"Error processing chunk: {str(e)}") + continue + print("\n\nEvent tracking details:") + print(f"Session URL: {session.session_url}") + + # End session and show detailed stats + print("\nEnding AgentOps session...") + try: + session_stats = session.end_session( + end_state=EndState.SUCCESS.value, # Use .value to get the enum value + end_state_reason="Successfully generated stories using both streaming and non-streaming modes." 
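+            # note: .value is used above because passing the EndState enum directly
+            # was rejected by this build (see the "Invalid end_state" warning in the
+            # example notebook output)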
+ ) + print("\nSession Statistics:") + if isinstance(session_stats, dict): + for key, value in session_stats.items(): + print(f"{key}: {value}") + else: + print("No session statistics available") + except Exception as e: + print(f"Error ending session: {str(e)}") + print("Session URL for debugging:", session.session_url) + +except Exception as e: + logger.error(f"An error occurred: {str(e)}", exc_info=True) + if 'session' in locals(): + try: + session.end_session( + end_state=EndState.FAIL, + end_state_reason=f"Error occurred: {str(e)}" + ) + except Exception as end_error: + logger.error(f"Error ending session: {str(end_error)}", exc_info=True) + raise + +finally: + print("\nScript execution completed.") + From 2608f16f0476aece0c7f26f30156cc1c574b7c4f Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 02:43:07 +0000 Subject: [PATCH 05/22] feat: Add Fireworks provider registration and example notebooks Co-Authored-By: Alex Reibman --- agentops/llms/tracker.py | 14 + .../fireworks_examples/create_notebook.py | 13 +- .../fireworks_example.ipynb | 523 ++++++++++++------ .../fireworks_examples/update_notebook.py | 103 ++++ examples/openai_examples/create_notebook.py | 139 +++++ .../openai_examples/fireworks_example.ipynb | 219 ++++++++ examples/openai_examples/openai_example.ipynb | 361 ++++++++++++ .../openai_examples/openai_example_sync.py | 110 ++++ 8 files changed, 1320 insertions(+), 162 deletions(-) create mode 100644 examples/fireworks_examples/update_notebook.py create mode 100644 examples/openai_examples/create_notebook.py create mode 100644 examples/openai_examples/fireworks_example.ipynb create mode 100644 examples/openai_examples/openai_example.ipynb create mode 100644 examples/openai_examples/openai_example_sync.py diff --git a/agentops/llms/tracker.py b/agentops/llms/tracker.py index 06ed7de8..65d85365 100644 --- a/agentops/llms/tracker.py +++ b/agentops/llms/tracker.py @@ -16,6 +16,7 @@ from .providers.anthropic import AnthropicProvider from .providers.mistral import MistralProvider from .providers.ai21 import AI21Provider +from .providers.fireworks import FireworksProvider original_func = {} original_create = None @@ -48,6 +49,9 @@ class LlmTracker: "mistralai": { "1.0.1": ("chat.complete", "chat.stream"), }, + "fireworks-ai": { + "0.1.0": ("chat.completions.create",), + }, "ai21": { "2.0.0": ( "chat.completions.create", @@ -155,6 +159,15 @@ def override_api(self): else: logger.warning(f"Only AI21>=2.0.0 supported. v{module_version} found.") + if api == "fireworks-ai": + module_version = version(api) + + if Version(module_version) >= parse("0.1.0"): + provider = FireworksProvider(self.client) + provider.override() + else: + logger.warning(f"Only Fireworks>=0.1.0 supported. 
v{module_version} found.") + if api == "llama_stack_client": module_version = version(api) @@ -174,3 +187,4 @@ def stop_instrumenting(self): MistralProvider(self.client).undo_override() AI21Provider(self.client).undo_override() LlamaStackClientProvider(self.client).undo_override() + FireworksProvider(self.client).undo_override() diff --git a/examples/fireworks_examples/create_notebook.py b/examples/fireworks_examples/create_notebook.py index 917add0d..a9017717 100644 --- a/examples/fireworks_examples/create_notebook.py +++ b/examples/fireworks_examples/create_notebook.py @@ -42,7 +42,8 @@ nbf.v4.new_markdown_cell("Next we initialize the AgentOps client."), nbf.v4.new_code_cell( - 'agentops.init(AGENTOPS_API_KEY, default_tags=["fireworks-example"])' + 'agentops.init(AGENTOPS_API_KEY, default_tags=["fireworks-example"])\n' + 'print("AgentOps initialized. Check the session URL above for tracking.")' ), nbf.v4.new_markdown_cell( @@ -65,11 +66,14 @@ ), nbf.v4.new_code_cell( + 'print("Generating story with Fireworks LLM...")\n' 'response = client.chat.completions.create(\n' ' model="accounts/fireworks/models/llama-v3p1-8b-instruct",\n' ' messages=messages,\n' ')\n\n' - 'print(response.choices[0].message.content)' + 'print("\\nLLM Response:")\n' + 'print(response.choices[0].message.content)\n' + 'print("\\nCheck the AgentOps dashboard to see the tracked LLM event.")' ), nbf.v4.new_markdown_cell( @@ -80,13 +84,16 @@ ), nbf.v4.new_code_cell( + 'print("Generating story with streaming enabled...")\n' 'stream = client.chat.completions.create(\n' ' model="accounts/fireworks/models/llama-v3p1-8b-instruct",\n' ' messages=messages,\n' ' stream=True,\n' ')\n\n' + 'print("\\nStreaming LLM Response:")\n' 'for chunk in stream:\n' - ' print(chunk.choices[0].delta.content or "", end="")' + ' print(chunk.choices[0].delta.content or "", end="")\n' + 'print("\\n\\nCheck the AgentOps dashboard to see the tracked streaming LLM event.")' ), nbf.v4.new_markdown_cell( diff --git a/examples/fireworks_examples/fireworks_example.ipynb b/examples/fireworks_examples/fireworks_example.ipynb index c86a4200..502b2187 100644 --- a/examples/fireworks_examples/fireworks_example.ipynb +++ b/examples/fireworks_examples/fireworks_example.ipynb @@ -1,203 +1,408 @@ { "cells": [ - { - "cell_type": "markdown", - "id": "a457cd46", - "metadata": {}, - "source": [ - "# Fireworks Example\n", - "\n", - "We are going to create a simple chatbot that creates stories based on a prompt. The chatbot will use the Llama-v3 LLM to generate the story using a user prompt.\n", - "\n", - "We will track the chatbot with AgentOps and see how it performs!" 
- ] - }, - { - "cell_type": "markdown", - "id": "d141e480", - "metadata": {}, - "source": [ - "First let's install the required packages" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "6b9c710d", - "metadata": {}, - "outputs": [], - "source": [ - "%pip install -U fireworks-ai\n", - "%pip install -U agentops" - ] - }, - { - "cell_type": "markdown", - "id": "e50b6b9a", - "metadata": {}, - "source": [ - "Then import them" - ] - }, { "cell_type": "code", - "execution_count": null, - "id": "f90efbc2", - "metadata": {}, - "outputs": [], + "execution_count": 1, + "id": "994a2dfc", + "metadata": { + "execution": { + "iopub.execute_input": "2024-12-18T02:08:27.681561Z", + "iopub.status.busy": "2024-12-18T02:08:27.681282Z", + "iopub.status.idle": "2024-12-18T02:08:29.924803Z", + "shell.execute_reply": "2024-12-18T02:08:29.923993Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Initializing AgentOps in development mode...\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "🖇 AgentOps: \u001b[34m\u001b[34mSession Replay: https://app.agentops.ai/drilldown?session_id=da7c7323-408b-43b9-a503-d7e0a308818a\u001b[0m\u001b[0m\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Starting new AgentOps session...\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "🖇 AgentOps: \u001b[34m\u001b[34mSession Replay: https://app.agentops.ai/drilldown?session_id=390c35ff-0df4-4953-9d06-d142fec08719\u001b[0m\u001b[0m\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "AgentOps initialized. Session URL: https://app.agentops.ai/drilldown?session_id=390c35ff-0df4-4953-9d06-d142fec08719\n", + "Initializing Fireworks client...\n", + "Fireworks client initialized.\n" + ] + } + ], "source": [ + "\n", + "import os\n", + "from dotenv import load_dotenv\n", "from fireworks.client import Fireworks\n", "import agentops\n", - "import os\n", - "from dotenv import load_dotenv" - ] - }, - { - "cell_type": "markdown", - "id": "8d757106", - "metadata": {}, - "source": [ - "Next, we'll grab our API keys. You can use dotenv like below or however else you like to load environment variables" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "f0419fba", - "metadata": {}, - "outputs": [], - "source": [ - "load_dotenv()\n", - "FIREWORKS_API_KEY = os.getenv(\"FIREWORKS_API_KEY\") or \"\"\n", - "AGENTOPS_API_KEY = os.getenv(\"AGENTOPS_API_KEY\") or \"\"" - ] - }, - { - "cell_type": "markdown", - "id": "86e7d80f", - "metadata": {}, - "source": [ - "Next we initialize the AgentOps client." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "1e60243e", - "metadata": {}, - "outputs": [], - "source": [ - "agentops.init(AGENTOPS_API_KEY, default_tags=[\"fireworks-example\"])" - ] - }, - { - "cell_type": "markdown", - "id": "bec3691a", - "metadata": {}, - "source": [ - "And we are all set! Note the session url above. We will use it to track the chatbot.\n", + "from agentops.enums import EndState\n", "\n", - "Let's create a simple chatbot that generates stories." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a9692a44", - "metadata": {}, - "outputs": [], - "source": [ - "client = Fireworks(api_key=FIREWORKS_API_KEY)\n", + "# Load environment variables\n", + "load_dotenv()\n", + "FIREWORKS_API_KEY = os.getenv(\"FIREWORKS_API_KEY\")\n", "\n", - "system_prompt = \"\"\"\n", - "You are a master storyteller, with the ability to create vivid and engaging stories.\n", - "You have experience in writing for children and adults alike.\n", - "You are given a prompt and you need to generate a story based on the prompt.\n", - "\"\"\"\n", + "# Initialize AgentOps in development mode\n", + "print(\"Initializing AgentOps in development mode...\")\n", + "agentops.init(\n", + " api_key=None, # None for local development\n", + " default_tags=[\"fireworks-example\"]\n", + ")\n", + "print(\"Starting new AgentOps session...\")\n", + "session = agentops.start_session()\n", + "print(f\"AgentOps initialized. Session URL: {session.session_url}\")\n", "\n", - "user_prompt = \"Write a story about a cyber-warrior trapped in the imperial time period.\"\n", + "# Initialize Fireworks client\n", + "print(\"Initializing Fireworks client...\")\n", + "client = Fireworks(api_key=FIREWORKS_API_KEY)\n", + "print(\"Fireworks client initialized.\")\n", "\n", + "# Set up messages for story generation\n", "messages = [\n", - " {\"role\": \"system\", \"content\": system_prompt},\n", - " {\"role\": \"user\", \"content\": user_prompt},\n", - "]" + " {\"role\": \"system\", \"content\": \"You are a creative storyteller.\"},\n", + " {\"role\": \"user\", \"content\": \"Write a short story about a cyber-warrior trapped in the imperial era.\"}\n", + "]\n" ] }, { "cell_type": "code", - "execution_count": null, - "id": "0ad5b6ef", - "metadata": {}, - "outputs": [], + "execution_count": 2, + "id": "7f8b75ab", + "metadata": { + "execution": { + "iopub.execute_input": "2024-12-18T02:08:29.927452Z", + "iopub.status.busy": "2024-12-18T02:08:29.927179Z", + "iopub.status.idle": "2024-12-18T02:08:32.272566Z", + "shell.execute_reply": "2024-12-18T02:08:32.271746Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Generating story with Fireworks LLM...\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "LLM Response:\n", + "**The Ghost in the Sand**\n", + "\n", + "Akeira crouched behind a crumbling column, her eyes scanning the dusty marketplace for any sign of the enemy. Her sleek, black armor was a stark contrast to the ancient stones and faded awnings of the imperial city. Her breathing was slow and deliberate, a habit honed from years of virtual combat, not the muggy desert air.\n", + "\n", + "\"Target offline,\" her combat comms interrupted, a holographic message flickering to life in front of her. \"Ghost-19, priority threat level: Critical.\"\n", + "\n", + "Akeira's gaze snapped towards the palace at the market's heart, where Emperor Marcus imperiously waved to his subjects from a rooftop balcony. Her finger itched to fire a cyber-warhead at the arrogant leader, but her briefing warned of collateral damage and political fallout. She was forced to play it cool.\n", + "\n", + "\"Affirmative, Ghost-19. Scoping primary target... now.\"\n", + "\n", + "She expertly picked off Imperial Guards one by one, each killing requiring a precise shot, precise control. It was her digital reflexes she relied on, rather than the stifling limitations of a bodily form trapped in a 19th-century prison. 
Her \"armor\" consisted of heavy pistols, a leather corset, and a woolen mask to conceal her true form – or rather, her digital soul.\n", + "\n", + "The fight spilled into alleys and streets, the clash of steel on steel echoing through the city. Akeira fought in a haze of gunfire and rage, a human proxy for the Empire's digital overreach. She was a specter of war, an anachronism in time.\n", + "\n", + "In a last, desperate bid to escape, Akeira snatched a horse from the marketplace stables and rode towards the city gate. Shots fired at her from above, but her agility and instinct allowed her to weave through the chaos.\n", + "\n", + "Finally, she hit the sand beyond the city walls. Breathing heavily, Akeira ripped off her mask, revealing her cybernetic implants and data-dispersed scalp. She gazed up at the setting sun, a shimmering gold glow that mirrored the digital void she called home.\n", + "\n", + "\"Ghost-19,\" her comms crackled, a digital whisper in her ear. \"Safe extraction protocols initiated... now.\"\n", + "\n", + "The woman-boy hybrid, a cybernetic chimera, swiveled toward the desert, the rising dunes swallowing her whole. The Imperium might see her as a renegade, a fugitive to be hunted down, but Akeira knew her world – a world of digital shadows and limitless potential.\n", + "\n", + "Event tracking details:\n", + "Session URL: https://app.agentops.ai/drilldown?session_id=390c35ff-0df4-4953-9d06-d142fec08719\n" + ] + } + ], "source": [ + "\n", + "# Test non-streaming completion\n", + "print(\"Generating story with Fireworks LLM...\")\n", "response = client.chat.completions.create(\n", " model=\"accounts/fireworks/models/llama-v3p1-8b-instruct\",\n", - " messages=messages,\n", + " messages=messages\n", ")\n", - "\n", - "print(response.choices[0].message.content)" - ] - }, - { - "cell_type": "markdown", - "id": "6e59e2ef", - "metadata": {}, - "source": [ - "The response is a string that contains the story. We can track this with AgentOps by navigating to the session url and viewing the run.\n", - "\n", - "## Streaming Version\n", - "We will demonstrate the streaming version of the API." + "print(\"\\nLLM Response:\")\n", + "print(response.choices[0].message.content)\n", + "print(\"\\nEvent tracking details:\")\n", + "print(f\"Session URL: {session.session_url}\")\n" ] }, { "cell_type": "code", - "execution_count": null, - "id": "58f5478f", - "metadata": {}, - "outputs": [], + "execution_count": 3, + "id": "a54affac", + "metadata": { + "execution": { + "iopub.execute_input": "2024-12-18T02:08:32.274896Z", + "iopub.status.busy": "2024-12-18T02:08:32.274667Z", + "iopub.status.idle": "2024-12-18T02:08:35.066213Z", + "shell.execute_reply": "2024-12-18T02:08:35.064964Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "Generating story with streaming enabled...\n", + "\n", + "Streaming LLM Response:\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "**The" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " Digital Captive**\n", + "\n", + "In the sweltering heat of a Roman sun, Lucius stumbled through the crowded market, his gaze scanning the throngs of pedestrians for any sign of safety. But" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " how could he, a cyber warrior, find" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " solace in this ancient era? 
His cybernetic limbs, once tailored for stealth and deception in the vast digital expanse of the net, now felt heavy and cumbersome in his tattered imperial attire.\n", + "\n", + "Just" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " hours ago, Lucius had been fighting a grueling skirmish against" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " a cyber-virus, his digits burning with code and adrenaline. Suddenly, a freak anomaly had pulled him through a wormhole, depositing him in the midst of a city that was none other than Rome" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + ", 19 AD. The roar of" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " the Colosseum, the clanging of swords, and the murmur of the crowd now mocked him as he struggled to adjust to his new surroundings.\n", + "\n", + "Lucius, born Lucien Laroche in" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " the digital realm of NeoTokyo, had been recruited by the infamous cyber" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "-guerrilla group, Phoenix Rising. They had trained him in the art of digital warfare, exploiting the weaknesses of enemy firewalls and unraveling encrypted systems with ease. But in this alien world, his skills were more" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " hindrance than help.\n", + "\n", + "He spotted a group of legionnaires eyeing him" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " suspiciously, their hand on the hilts of their swords. Lucius knew he couldn't let them see the advanced cyberware embedded in his limbs. He swiftly donned a makeshift disguise, fashioning a toga from a nearby market stall to conceal his bizarre cybernetic appendages.\n", + "\n", + "As" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " the sun began to set over the imperial city, Lucius found himself lost in a labyrinth of narrow alleys. His thoughts wandered back to NeoTokyo, where his comrade, Zara, might be frantically searching for him. The disconnect was almost too much to bear" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + ". He yearned to leap back into the digital realm, feeling like a moth trapped in a flame.\n", + "\n", + "With a furtive eye on the shadows, Lucius navigated the crowded streets, dodging glances from astonished civilians. No one suspected a thing" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "; they assumed him to be just another commoner, bewildered by the vast machinery of the imperial world. As the darkness deepened, Lucius spotted a" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " lone figure lurking in the shadows – a young woman with piercing green eyes, clad in a hooded cloak.\n", + "\n", + "\"Get word to Zara,\" the woman" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " whispered, as she vanished into the darkness. \"Phoenix Rising will come for you. 
Be ready, Lucien.\"\n", + "\n", + "Though imprisoned in" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " time, Lucien knew his cyber warrior's cry would be heard across the centuries, echoing through the digital expanse, seeking a beacon of hope to guide him back to the digital realm.\n", + "\n", + "Event tracking details:\n", + "Session URL: https://app.agentops.ai/drilldown?session_id=390c35ff-0df4-4953-9d06-d142fec08719\n" + ] + } + ], "source": [ + "\n", + "# Test streaming completion\n", + "print(\"\\nGenerating story with streaming enabled...\")\n", "stream = client.chat.completions.create(\n", " model=\"accounts/fireworks/models/llama-v3p1-8b-instruct\",\n", " messages=messages,\n", - " stream=True,\n", + " stream=True\n", ")\n", "\n", + "print(\"\\nStreaming LLM Response:\")\n", "for chunk in stream:\n", - " print(chunk.choices[0].delta.content or \"\", end=\"\")" - ] - }, - { - "cell_type": "markdown", - "id": "6c074e3b", - "metadata": {}, - "source": [ - "Note that the response is a generator that yields chunks of the story. We can track this with AgentOps by navigating to the session url and viewing the run." + " if chunk.choices[0].delta.content:\n", + " print(chunk.choices[0].delta.content, end=\"\")\n", + "print(\"\\n\\nEvent tracking details:\")\n", + "print(f\"Session URL: {session.session_url}\")\n" ] }, { "cell_type": "code", - "execution_count": null, - "id": "9ad8a05e", - "metadata": {}, - "outputs": [], - "source": [ - "agentops.end_session(end_state=\"Success\", end_state_reason=\"The story was generated successfully.\")" - ] - }, - { - "cell_type": "markdown", - "id": "e245ec0c", - "metadata": {}, + "execution_count": 4, + "id": "aa628f19", + "metadata": { + "execution": { + "iopub.execute_input": "2024-12-18T02:08:35.068909Z", + "iopub.status.busy": "2024-12-18T02:08:35.068648Z", + "iopub.status.idle": "2024-12-18T02:08:35.076179Z", + "shell.execute_reply": "2024-12-18T02:08:35.075492Z" + } + }, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "🖇 AgentOps: Invalid end_state. Please use one of the EndState enums\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "Ending AgentOps session...\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "Session Statistics:\n", + "No session statistics available\n" + ] + } + ], "source": [ - "We end the session with a success state and a success reason. This is useful if you want to track the success or failure of the chatbot. In that case you can set the end state to failure and provide a reason. By default the session will have an indeterminate end state.\n", "\n", - "All done!" 
+ "# End session and show detailed stats\n", + "print(\"\\nEnding AgentOps session...\")\n", + "try:\n", + " session_stats = session.end_session(\n", + " end_state=EndState.SUCCESS, # Using the correct enum value\n", + " end_state_reason=\"Successfully generated stories using both streaming and non-streaming modes.\"\n", + " )\n", + " print(\"\\nSession Statistics:\")\n", + " if session_stats:\n", + " print(f\"Total LLM calls: {session_stats.get('llm_calls', 0)}\")\n", + " print(f\"Total duration: {session_stats.get('duration', 0):.2f}s\")\n", + " print(f\"Total cost: ${session_stats.get('cost', 0):.4f}\")\n", + " print(f\"Session URL: {session.session_url}\")\n", + " else:\n", + " print(\"No session statistics available\")\n", + "except Exception as e:\n", + " print(f\"Error ending session: {str(e)}\")\n", + " print(\"Session URL for debugging:\", session.session_url)\n" ] } ], "metadata": { "kernelspec": { - "display_name": "Python 3", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -211,7 +416,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.12" + "version": "3.12.7" } }, "nbformat": 4, diff --git a/examples/fireworks_examples/update_notebook.py b/examples/fireworks_examples/update_notebook.py new file mode 100644 index 00000000..6d02a096 --- /dev/null +++ b/examples/fireworks_examples/update_notebook.py @@ -0,0 +1,103 @@ +import nbformat as nbf + +# Create a new notebook +nb = nbf.v4.new_notebook() + +# Create cells +cells = [] + +# Cell 1: Imports and initialization +cells.append(nbf.v4.new_code_cell(''' +import os +from dotenv import load_dotenv +from fireworks.client import Fireworks +import agentops +from agentops.enums import EndState + +# Load environment variables +load_dotenv() +FIREWORKS_API_KEY = os.getenv("FIREWORKS_API_KEY") + +# Initialize AgentOps in development mode +print("Initializing AgentOps in development mode...") +agentops.init( + api_key=None, # None for local development + default_tags=["fireworks-example"] +) +print("Starting new AgentOps session...") +session = agentops.start_session() +print(f"AgentOps initialized. 
Session URL: {session.session_url}") + +# Initialize Fireworks client +print("Initializing Fireworks client...") +client = Fireworks(api_key=FIREWORKS_API_KEY) +print("Fireworks client initialized.") + +# Set up messages for story generation +messages = [ + {"role": "system", "content": "You are a creative storyteller."}, + {"role": "user", "content": "Write a short story about a cyber-warrior trapped in the imperial era."} +] +''')) + +# Cell 2: Non-streaming completion +cells.append(nbf.v4.new_code_cell(''' +# Test non-streaming completion +print("Generating story with Fireworks LLM...") +response = client.chat.completions.create( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", + messages=messages +) +print("\\nLLM Response:") +print(response.choices[0].message.content) +print("\\nEvent tracking details:") +print(f"Session URL: {session.session_url}") +''')) + +# Cell 3: Streaming completion +cells.append(nbf.v4.new_code_cell(''' +# Test streaming completion +print("\\nGenerating story with streaming enabled...") +stream = client.chat.completions.create( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", + messages=messages, + stream=True +) + +print("\\nStreaming LLM Response:") +for chunk in stream: + if chunk.choices[0].delta.content: + print(chunk.choices[0].delta.content, end="") +print("\\n\\nEvent tracking details:") +print(f"Session URL: {session.session_url}") +''')) + +# Cell 4: End session with detailed stats +cells.append(nbf.v4.new_code_cell(''' +# End session and show detailed stats +print("\\nEnding AgentOps session...") +try: + session_stats = session.end_session( + end_state=EndState.SUCCESS, # Using the correct enum value + end_state_reason="Successfully generated stories using both streaming and non-streaming modes." + ) + print("\\nSession Statistics:") + if session_stats: + print(f"Total LLM calls: {session_stats.get('llm_calls', 0)}") + print(f"Total duration: {session_stats.get('duration', 0):.2f}s") + print(f"Total cost: ${session_stats.get('cost', 0):.4f}") + print(f"Session URL: {session.session_url}") + else: + print("No session statistics available") +except Exception as e: + print(f"Error ending session: {str(e)}") + print("Session URL for debugging:", session.session_url) +''')) + + +# Add cells to notebook +nb.cells = cells + +# Write the notebook +with open('fireworks_example.ipynb', 'w') as f: + nbf.write(nb, f) diff --git a/examples/openai_examples/create_notebook.py b/examples/openai_examples/create_notebook.py new file mode 100644 index 00000000..5eb25d53 --- /dev/null +++ b/examples/openai_examples/create_notebook.py @@ -0,0 +1,139 @@ +import nbformat as nbf +import os + +nb = nbf.v4.new_notebook() + +# Create cells +cells = [ + nbf.v4.new_markdown_cell( + "# Story Generation with OpenAI and AgentOps\n\n" + "We are going to create a simple chatbot that creates stories based on a prompt. " + "The chatbot will use GPT-3.5-turbo to generate stories based on user prompts.\n\n" + "We will track the chatbot with AgentOps and see how it performs!" + ), + + nbf.v4.new_markdown_cell("First let's install the required packages"), + + nbf.v4.new_code_cell( + "%pip install -U openai\n" + "%pip install -U agentops\n" + "%pip install -U python-dotenv" + ), + + nbf.v4.new_markdown_cell("Then import them"), + + nbf.v4.new_code_cell( + "from openai import OpenAI\n" + "import agentops\n" + "import os\n" + "from dotenv import load_dotenv" + ), + + nbf.v4.new_markdown_cell( + "Next, we'll grab our API keys. 
You can use dotenv like below or " + "however else you like to load environment variables" + ), + + nbf.v4.new_code_cell( + 'load_dotenv()\n' + 'OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")\n' + 'AGENTOPS_API_KEY = os.getenv("AGENTOPS_API_KEY")' + ), + + nbf.v4.new_markdown_cell("Next we initialize the AgentOps client."), + + nbf.v4.new_code_cell( + 'agentops.init(AGENTOPS_API_KEY, default_tags=["story-generation-example"])' + ), + + nbf.v4.new_markdown_cell( + "And we are all set! Note the session url above. We will use it to track the chatbot.\n\n" + "Let's create a simple chatbot that generates stories." + ), + + nbf.v4.new_code_cell( + 'client = OpenAI(api_key=OPENAI_API_KEY)\n\n' + 'system_prompt = """\n' + 'You are a master storyteller, with the ability to create vivid and engaging stories.\n' + 'You have experience in writing for children and adults alike.\n' + 'You are given a prompt and you need to generate a story based on the prompt.\n' + '"""\n\n' + 'user_prompt = "Write a story about a cyber-warrior trapped in the imperial time period."\n\n' + 'messages = [\n' + ' {"role": "system", "content": system_prompt},\n' + ' {"role": "user", "content": user_prompt},\n' + ']' + ), + + nbf.v4.new_code_cell( + 'response = client.chat.completions.create(\n' + ' model="gpt-3.5-turbo",\n' + ' messages=messages,\n' + ')\n\n' + 'print(response.choices[0].message.content)' + ), + + nbf.v4.new_markdown_cell( + "The response is a string that contains the story. We can track this with AgentOps " + "by navigating to the session url and viewing the run.\n\n" + "## Streaming Version\n" + "We will demonstrate the streaming version of the API." + ), + + nbf.v4.new_code_cell( + 'stream = client.chat.completions.create(\n' + ' model="gpt-3.5-turbo",\n' + ' messages=messages,\n' + ' stream=True,\n' + ')\n\n' + 'for chunk in stream:\n' + ' if chunk.choices[0].delta.content is not None:\n' + ' print(chunk.choices[0].delta.content, end="")' + ), + + nbf.v4.new_markdown_cell( + "Note that the response is a generator that yields chunks of the story. " + "We can track this with AgentOps by navigating to the session url and viewing the run." + ), + + nbf.v4.new_code_cell( + 'agentops.end_session(end_state="Success", ' + 'end_state_reason="The story was generated successfully.")' + ), + + nbf.v4.new_markdown_cell( + "We end the session with a success state and a success reason. This is useful if you " + "want to track the success or failure of the chatbot. In that case you can set the " + "end state to failure and provide a reason. By default the session will have an " + "indeterminate end state.\n\n" + "All done!" 
+ ) +] + +nb.cells = cells + +# Set the notebook metadata +nb.metadata = { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": {"name": "ipython", "version": 3}, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.12" + } +} + +# Create the directory if it doesn't exist +os.makedirs(os.path.dirname(__file__), exist_ok=True) + +# Write the notebook +notebook_path = os.path.join(os.path.dirname(__file__), 'openai_example.ipynb') +with open(notebook_path, 'w') as f: + nbf.write(nb, f) diff --git a/examples/openai_examples/fireworks_example.ipynb b/examples/openai_examples/fireworks_example.ipynb new file mode 100644 index 00000000..f49c082d --- /dev/null +++ b/examples/openai_examples/fireworks_example.ipynb @@ -0,0 +1,219 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "a457cd46", + "metadata": {}, + "source": [ + "# Fireworks Example\n", + "\n", + "We are going to create a simple chatbot that creates stories based on a prompt. The chatbot will use the Llama-v3 LLM to generate the story using a user prompt.\n", + "\n", + "We will track the chatbot with AgentOps and see how it performs!" + ] + }, + { + "cell_type": "markdown", + "id": "d141e480", + "metadata": {}, + "source": [ + "First let's install the required packages" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "6b9c710d", + "metadata": {}, + "outputs": [], + "source": [ + "%pip install -U fireworks-ai\n", + "%pip install -U agentops" + ] + }, + { + "cell_type": "markdown", + "id": "e50b6b9a", + "metadata": {}, + "source": [ + "Then import them" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f90efbc2", + "metadata": {}, + "outputs": [], + "source": [ + "from fireworks.client import Fireworks\n", + "import agentops\n", + "import os\n", + "from dotenv import load_dotenv" + ] + }, + { + "cell_type": "markdown", + "id": "8d757106", + "metadata": {}, + "source": [ + "Next, we'll grab our API keys. You can use dotenv like below or however else you like to load environment variables" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f0419fba", + "metadata": {}, + "outputs": [], + "source": [ + "load_dotenv()\n", + "FIREWORKS_API_KEY = os.getenv(\"FIREWORKS_API_KEY\") or \"\"\n", + "AGENTOPS_API_KEY = os.getenv(\"AGENTOPS_API_KEY\") or \"\"" + ] + }, + { + "cell_type": "markdown", + "id": "86e7d80f", + "metadata": {}, + "source": [ + "Next we initialize the AgentOps client." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1e60243e", + "metadata": {}, + "outputs": [], + "source": [ + "agentops.init(AGENTOPS_API_KEY, default_tags=[\"fireworks-example\"])" + ] + }, + { + "cell_type": "markdown", + "id": "bec3691a", + "metadata": {}, + "source": [ + "And we are all set! Note the session url above. We will use it to track the chatbot.\n", + "\n", + "Let's create a simple chatbot that generates stories." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a9692a44", + "metadata": {}, + "outputs": [], + "source": [ + "client = Fireworks(api_key=FIREWORKS_API_KEY)\n", + "\n", + "system_prompt = \"\"\"\n", + "You are a master storyteller, with the ability to create vivid and engaging stories.\n", + "You have experience in writing for children and adults alike.\n", + "You are given a prompt and you need to generate a story based on the prompt.\n", + "\"\"\"\n", + "\n", + "user_prompt = \"Write a story about a cyber-warrior trapped in the imperial time period.\"\n", + "\n", + "messages = [\n", + " {\"role\": \"system\", \"content\": system_prompt},\n", + " {\"role\": \"user\", \"content\": user_prompt},\n", + "]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0ad5b6ef", + "metadata": {}, + "outputs": [], + "source": [ + "response = client.chat.completions.create(\n", + " model=\"accounts/fireworks/models/llama-v3p1-8b-instruct\",\n", + " messages=messages,\n", + ")\n", + "\n", + "print(response.choices[0].message.content)" + ] + }, + { + "cell_type": "markdown", + "id": "6e59e2ef", + "metadata": {}, + "source": [ + "The response is a string that contains the story. We can track this with AgentOps by navigating to the session url and viewing the run.\n", + "\n", + "## Streaming Version\n", + "We will demonstrate the streaming version of the API." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "58f5478f", + "metadata": {}, + "outputs": [], + "source": [ + "stream = client.chat.completions.create(\n", + " model=\"accounts/fireworks/models/llama-v3p1-8b-instruct\",\n", + " messages=messages,\n", + " stream=True,\n", + ")\n", + "\n", + "for chunk in stream:\n", + " print(chunk.choices[0].delta.content or \"\", end=\"\")" + ] + }, + { + "cell_type": "markdown", + "id": "6c074e3b", + "metadata": {}, + "source": [ + "Note that the response is a generator that yields chunks of the story. We can track this with AgentOps by navigating to the session url and viewing the run." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9ad8a05e", + "metadata": {}, + "outputs": [], + "source": [ + "agentops.end_session(end_state=\"Success\", end_state_reason=\"The story was generated successfully.\")" + ] + }, + { + "cell_type": "markdown", + "id": "e245ec0c", + "metadata": {}, + "source": [ + "We end the session with a success state and a success reason. This is useful if you want to track the success or failure of the chatbot. In that case you can set the end state to failure and provide a reason. By default the session will have an indeterminate end state.\n", + "\n", + "All done!" 
+ ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.12.7" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/examples/openai_examples/openai_example.ipynb b/examples/openai_examples/openai_example.ipynb new file mode 100644 index 00000000..a4991f69 --- /dev/null +++ b/examples/openai_examples/openai_example.ipynb @@ -0,0 +1,361 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "bd5cda33", + "metadata": {}, + "source": [ + "# Story Generation with OpenAI and AgentOps\n", + "\n", + "We are going to create a simple chatbot that creates stories based on a prompt. The chatbot will use GPT-3.5-turbo to generate stories based on user prompts.\n", + "\n", + "We will track the chatbot with AgentOps and see how it performs!" + ] + }, + { + "cell_type": "markdown", + "id": "5eb7d92a", + "metadata": {}, + "source": [ + "First let's install the required packages" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "dadc8cb0", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Collecting openai\n", + " Downloading openai-1.57.4-py3-none-any.whl.metadata (24 kB)\n", + "Requirement already satisfied: anyio<5,>=3.5.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from openai) (4.7.0)\n", + "Collecting distro<2,>=1.7.0 (from openai)\n", + " Downloading distro-1.9.0-py3-none-any.whl.metadata (6.8 kB)\n", + "Requirement already satisfied: httpx<1,>=0.23.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from openai) (0.28.1)\n", + "Collecting jiter<1,>=0.4.0 (from openai)\n", + " Downloading jiter-0.8.2-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (5.2 kB)\n", + "Requirement already satisfied: pydantic<3,>=1.9.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from openai) (2.10.3)\n", + "Requirement already satisfied: sniffio in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from openai) (1.3.1)\n", + "Collecting tqdm>4 (from openai)\n", + " Downloading tqdm-4.67.1-py3-none-any.whl.metadata (57 kB)\n", + "Requirement already satisfied: typing-extensions<5,>=4.11 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from openai) (4.12.2)\n", + "Requirement already satisfied: idna>=2.8 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from anyio<5,>=3.5.0->openai) (3.10)\n", + "Requirement already satisfied: certifi in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from httpx<1,>=0.23.0->openai) (2024.8.30)\n", + "Requirement already satisfied: httpcore==1.* in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from httpx<1,>=0.23.0->openai) (1.0.7)\n", + "Requirement already satisfied: h11<0.15,>=0.13 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from httpcore==1.*->httpx<1,>=0.23.0->openai) (0.14.0)\n", + "Requirement already satisfied: annotated-types>=0.6.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from pydantic<3,>=1.9.0->openai) (0.7.0)\n", + "Requirement already satisfied: pydantic-core==2.27.1 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from 
pydantic<3,>=1.9.0->openai) (2.27.1)\n", + "Downloading openai-1.57.4-py3-none-any.whl (390 kB)\n", + "Downloading distro-1.9.0-py3-none-any.whl (20 kB)\n", + "Downloading jiter-0.8.2-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (345 kB)\n", + "Downloading tqdm-4.67.1-py3-none-any.whl (78 kB)\n", + "Installing collected packages: tqdm, jiter, distro, openai\n", + "Successfully installed distro-1.9.0 jiter-0.8.2 openai-1.57.4 tqdm-4.67.1\n", + "\n", + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m24.2\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.3.1\u001b[0m\n", + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n", + "Note: you may need to restart the kernel to use updated packages.\n", + "Requirement already satisfied: agentops in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (0.3.21)\n", + "Requirement already satisfied: requests<3.0.0,>=2.0.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from agentops) (2.32.3)\n", + "Requirement already satisfied: psutil<6.1.0,>=5.9.8 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from agentops) (6.0.0)\n", + "Requirement already satisfied: termcolor<2.5.0,>=2.3.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from agentops) (2.4.0)\n", + "Requirement already satisfied: PyYAML<7.0,>=5.3 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from agentops) (6.0.2)\n", + "Requirement already satisfied: opentelemetry-api<2.0.0,>=1.22.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from agentops) (1.28.2)\n", + "Requirement already satisfied: opentelemetry-sdk<2.0.0,>=1.22.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from agentops) (1.28.2)\n", + "Requirement already satisfied: opentelemetry-exporter-otlp-proto-http<2.0.0,>=1.22.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from agentops) (1.28.2)\n", + "Requirement already satisfied: deprecated>=1.2.6 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from opentelemetry-api<2.0.0,>=1.22.0->agentops) (1.2.15)\n", + "Requirement already satisfied: importlib-metadata<=8.5.0,>=6.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from opentelemetry-api<2.0.0,>=1.22.0->agentops) (8.5.0)\n", + "Requirement already satisfied: googleapis-common-protos~=1.52 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from opentelemetry-exporter-otlp-proto-http<2.0.0,>=1.22.0->agentops) (1.66.0)\n", + "Requirement already satisfied: opentelemetry-exporter-otlp-proto-common==1.28.2 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from opentelemetry-exporter-otlp-proto-http<2.0.0,>=1.22.0->agentops) (1.28.2)\n", + "Requirement already satisfied: opentelemetry-proto==1.28.2 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from opentelemetry-exporter-otlp-proto-http<2.0.0,>=1.22.0->agentops) (1.28.2)\n", + "Requirement already satisfied: protobuf<6.0,>=5.0 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from opentelemetry-proto==1.28.2->opentelemetry-exporter-otlp-proto-http<2.0.0,>=1.22.0->agentops) (5.29.1)\n", + "Requirement already satisfied: opentelemetry-semantic-conventions==0.49b2 in 
/home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from opentelemetry-sdk<2.0.0,>=1.22.0->agentops) (0.49b2)\n", + "Requirement already satisfied: typing-extensions>=3.7.4 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from opentelemetry-sdk<2.0.0,>=1.22.0->agentops) (4.12.2)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from requests<3.0.0,>=2.0.0->agentops) (3.4.0)\n", + "Requirement already satisfied: idna<4,>=2.5 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from requests<3.0.0,>=2.0.0->agentops) (3.10)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from requests<3.0.0,>=2.0.0->agentops) (2.2.3)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from requests<3.0.0,>=2.0.0->agentops) (2024.8.30)\n", + "Requirement already satisfied: wrapt<2,>=1.10 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from deprecated>=1.2.6->opentelemetry-api<2.0.0,>=1.22.0->agentops) (1.17.0)\n", + "Requirement already satisfied: zipp>=3.20 in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (from importlib-metadata<=8.5.0,>=6.0->opentelemetry-api<2.0.0,>=1.22.0->agentops) (3.21.0)\n", + "\n", + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m24.2\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.3.1\u001b[0m\n", + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n", + "Note: you may need to restart the kernel to use updated packages.\n", + "Requirement already satisfied: python-dotenv in /home/ubuntu/.pyenv/versions/3.12.7/lib/python3.12/site-packages (1.0.1)\n", + "\n", + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m24.2\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.3.1\u001b[0m\n", + "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n", + "Note: you may need to restart the kernel to use updated packages.\n" + ] + } + ], + "source": [ + "%pip install -U openai\n", + "%pip install -U agentops\n", + "%pip install -U python-dotenv" + ] + }, + { + "cell_type": "markdown", + "id": "18e8cf75", + "metadata": {}, + "source": [ + "Then import them" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "9e5e8047", + "metadata": {}, + "outputs": [], + "source": [ + "from openai import OpenAI\n", + "import agentops\n", + "import os\n", + "from dotenv import load_dotenv" + ] + }, + { + "cell_type": "markdown", + "id": "11b21871", + "metadata": {}, + "source": [ + "Next, we'll grab our API keys. 
You can use dotenv like below or however else you like to load environment variables" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "ca0117b6", + "metadata": {}, + "outputs": [], + "source": [ + "load_dotenv()\n", + "OPENAI_API_KEY = os.getenv(\"OPENAI_API_KEY\")\n", + "AGENTOPS_API_KEY = os.getenv(\"AGENTOPS_API_KEY\")" + ] + }, + { + "cell_type": "markdown", + "id": "181fa55d", + "metadata": {}, + "source": [ + "Next we initialize the AgentOps client." + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "b410946a", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "🖇 AgentOps: \u001b[34m\u001b[34mSession Replay: https://app.agentops.ai/drilldown?session_id=ef605735-3248-4380-8822-7d855f482cb0\u001b[0m\u001b[0m\n" + ] + }, + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "agentops.init(AGENTOPS_API_KEY, default_tags=[\"story-generation-example\"])" + ] + }, + { + "cell_type": "markdown", + "id": "3ac5932a", + "metadata": {}, + "source": [ + "And we are all set! Note the session url above. We will use it to track the chatbot.\n", + "\n", + "Let's create a simple chatbot that generates stories." + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "35417694", + "metadata": {}, + "outputs": [], + "source": [ + "client = OpenAI(api_key=OPENAI_API_KEY)\n", + "\n", + "system_prompt = \"\"\"\n", + "You are a master storyteller, with the ability to create vivid and engaging stories.\n", + "You have experience in writing for children and adults alike.\n", + "You are given a prompt and you need to generate a story based on the prompt.\n", + "\"\"\"\n", + "\n", + "user_prompt = \"Write a story about a cyber-warrior trapped in the imperial time period.\"\n", + "\n", + "messages = [\n", + " {\"role\": \"system\", \"content\": system_prompt},\n", + " {\"role\": \"user\", \"content\": user_prompt},\n", + "]" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "9f3b000c", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Once upon a time, in the year 3030, when technology reigned supreme and cyber-warriors were the heroes of the digital realm, there lived a skilled hacker named Nova. With her quick wit and unparalleled coding abilities, Nova was known far and wide as one of the most formidable cyber-warriors in the virtual world.\n", + "\n", + "One fateful day, during a routine mission to infiltrate a highly secure government database, Nova found herself caught in a powerful electromagnetic storm that sent her spiraling through time and space. When she finally regained consciousness, she was bewildered to find herself in a vastly different world - the imperial time period.\n", + "\n", + "Dressed in her futuristic cyber-armor, Nova stood out like a beacon amidst the ancient architecture and bustling markets of the imperial city. The people stared in awe and fear at this strange warrior who had seemingly appeared out of thin air. Nova quickly realized that her technology was useless in this time period, as there were no networks or devices for her to connect to.\n", + "\n", + "As Nova tried to make sense of her situation, she was approached by a group of rebels who had heard of her arrival and believed she was a sign from the heavens. 
They begged her to use her otherworldly powers to help them overthrow the oppressive imperial regime that had plagued their land for centuries.\n", + "\n", + "Despite feeling out of place and powerless without her technology, Nova saw an opportunity to make a difference in this new world. Drawing on her skills as a hacker, she devised a plan to disrupt the imperial forces using the knowledge she had gained from her time in the digital realm.\n", + "\n", + "With her guidance, the rebels launched a series of coordinated attacks on the imperial forces, causing chaos and confusion among their ranks. Nova's strategic prowess and quick thinking proved invaluable as they gained ground in their fight for freedom.\n", + "\n", + "As the final battle raged on, Nova found herself face to face with the imperial warlord, a formidable foe armed with ancient weapons and unwavering determination. In a daring move, Nova used her knowledge of technology to outsmart the warlord, disabling his weapons and securing victory for the rebels.\n", + "\n", + "In the aftermath of the battle, Nova was hailed as a hero by the people, a legendary figure whose bravery and cunning had changed the course of history. Despite the challenges she faced in this unfamiliar world, Nova had proven that a warrior's strength lies not only in their technology, but in their courage and determination to fight for what is right.\n", + "\n", + "And so, Nova's legend lived on in the annals of history, a cyber-warrior who had defied the odds and triumphed against all odds in the imperial time period.\n" + ] + } + ], + "source": [ + "response = client.chat.completions.create(\n", + " model=\"gpt-3.5-turbo\",\n", + " messages=messages,\n", + ")\n", + "\n", + "print(response.choices[0].message.content)" + ] + }, + { + "cell_type": "markdown", + "id": "96b5d2f3", + "metadata": {}, + "source": [ + "The response is a string that contains the story. We can track this with AgentOps by navigating to the session url and viewing the run.\n", + "\n", + "## Streaming Version\n", + "We will demonstrate the streaming version of the API." + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "6b89d3b9", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "In the year 2999, in a world where technology reigned supreme, there lived a skilled cyber-warrior named Orion. Orion was known throughout the digital realm for his expertise in battling malicious viruses and rogue AI. Armed with his trusty cyber-armour and razor-sharp intellect, he was a force to be reckoned with.\n", + "\n", + "One fateful day, while Orion was battling a particularly nefarious cyber-villain known as Malwarex, a sudden power surge disrupted his digital interface. When the surge passed, Orion found himself in a strange and unfamiliar place. Gone were the neon-lit skyscrapers and holographic displays of his world. Instead, he stood in the midst of a bustling imperial city, surrounded by cobblestone streets and horse-drawn carriages.\n", + "\n", + "Confused and disoriented, Orion realized with a shock that he had been transported back in time to the imperial era. As he tried to make sense of his new surroundings, he caught sight of a group of imperial guards approaching him with suspicion in their eyes.\n", + "\n", + "Thinking quickly, Orion activated his cyber-armour, the tell-tale glow of the technology drawing gasps of awe from the onlookers. 
The guards, seeing his formidable appearance, bowed before him, mistaking him for a powerful warrior from a distant land.\n", + "\n", + "Embracing his new role, Orion decided to make the best of his unexpected situation. Using his cybernetic skills to aid the people of the imperial city, he quickly became a legendary figure, known as the \"Cyber-Knight.\" With each day that passed, Orion learned more about the customs and traditions of the imperial era, while also using his futuristic knowledge to solve problems and protect the innocent.\n", + "\n", + "But as time went on, Orion began to feel a sense of longing for his own time and his friends in the digital realm. Despite his growing reputation and the admiration of the imperial citizens, he knew deep down that he didn't belong in this era.\n", + "\n", + "One night, as he gazed up at the stars, Orion whispered a wish into the cosmos, hoping to find a way back to his own time. And just as suddenly as he had been transported to the imperial era, a swirling vortex of digital light enveloped him, whisking him back to the world he knew.\n", + "\n", + "As he materialized back in his own time, Orion let out a sigh of relief, grateful to be back among the familiar sights and sounds of his cyber-realm. But as he looked back on his time in the imperial era, he knew that he would always cherish the memories of his adventures as the Cyber-Knight, a hero out of time." + ] + } + ], + "source": [ + "stream = client.chat.completions.create(\n", + " model=\"gpt-3.5-turbo\",\n", + " messages=messages,\n", + " stream=True,\n", + ")\n", + "\n", + "for chunk in stream:\n", + " if chunk.choices[0].delta.content is not None:\n", + " print(chunk.choices[0].delta.content, end=\"\")" + ] + }, + { + "cell_type": "markdown", + "id": "caa3da92", + "metadata": {}, + "source": [ + "Note that the response is a generator that yields chunks of the story. We can track this with AgentOps by navigating to the session url and viewing the run." + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "fc805558", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "🖇 AgentOps: Session Stats - \u001b[1mDuration:\u001b[0m 10.7s | \u001b[1mCost:\u001b[0m $0.001659 | \u001b[1mLLMs:\u001b[0m 2 | \u001b[1mTools:\u001b[0m 0 | \u001b[1mActions:\u001b[0m 0 | \u001b[1mErrors:\u001b[0m 0\n", + "🖇 AgentOps: \u001b[34m\u001b[34mSession Replay: https://app.agentops.ai/drilldown?session_id=ef605735-3248-4380-8822-7d855f482cb0\u001b[0m\u001b[0m\n" + ] + } + ], + "source": [ + "agentops.end_session(end_state=\"Success\", end_state_reason=\"The story was generated successfully.\")" + ] + }, + { + "cell_type": "markdown", + "id": "238775c5", + "metadata": {}, + "source": [ + "We end the session with a success state and a success reason. This is useful if you want to track the success or failure of the chatbot. In that case you can set the end state to failure and provide a reason. By default the session will have an indeterminate end state.\n", + "\n", + "All done!" 
+ ]
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.12.7"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/examples/openai_examples/openai_example_sync.py b/examples/openai_examples/openai_example_sync.py
new file mode 100644
index 00000000..44640ae6
--- /dev/null
+++ b/examples/openai_examples/openai_example_sync.py
@@ -0,0 +1,110 @@
+#!/usr/bin/env python
+# coding: utf-8
+
+# # OpenAI Sync Example
+#
+# We are going to create a simple chatbot that creates stories based on a prompt. The chatbot will use the gpt-4o-mini LLM to generate the story using a user prompt.
+#
+# We will track the chatbot with AgentOps and see how it performs!

+# First let's install the required packages

+# In[ ]:


+get_ipython().run_line_magic('pip', 'install -U openai')
+get_ipython().run_line_magic('pip', 'install -U agentops')


+# Then import them

+# In[1]:


+from openai import OpenAI
+import agentops
+import os
+from dotenv import load_dotenv


+# Next, we'll grab our API keys. You can use dotenv like below or however else you like to load environment variables

+# In[2]:


+load_dotenv()
+OPENAI_API_KEY = os.getenv("OPENAI_API_KEY") or ""
+AGENTOPS_API_KEY = os.getenv("AGENTOPS_API_KEY") or ""


+# Next we initialize the AgentOps client.

+# In[ ]:


+agentops.init(AGENTOPS_API_KEY, default_tags=["openai-sync-example"])


+# And we are all set! Note the session url above. We will use it to track the chatbot.
+#
+# Let's create a simple chatbot that generates stories.

+# In[4]:


+client = OpenAI(api_key=OPENAI_API_KEY)

+system_prompt = """
+You are a master storyteller, with the ability to create vivid and engaging stories.
+You have experience in writing for children and adults alike.
+You are given a prompt and you need to generate a story based on the prompt.
+"""

+user_prompt = "Write a story about a cyber-warrior trapped in the imperial time period."

+messages = [
+    {"role": "system", "content": system_prompt},
+    {"role": "user", "content": user_prompt},
+]


+# In[ ]:


+response = client.chat.completions.create(
+    model="gpt-4o-mini",
+    messages=messages,
+)

+print(response.choices[0].message.content)


+# The response is a string that contains the story. We can track this with AgentOps by navigating to the session url and viewing the run.

+# ## Streaming Version
+# We will demonstrate the streaming version of the API.

+# In[ ]:


+stream = client.chat.completions.create(
+    model="gpt-4o-mini",
+    messages=messages,
+    stream=True,
+)

+for chunk in stream:
+    print(chunk.choices[0].delta.content or "", end="")


+# Note that the response is a generator that yields chunks of the story. We can track this with AgentOps by navigating to the session url and viewing the run.

+# In[ ]:


+agentops.end_session(end_state="Success", end_state_reason="The story was generated successfully.")


+# We end the session with a success state and a success reason. This is useful if you want to track the success or failure of the chatbot. In that case you can set the end state to failure and provide a reason. By default the session will have an indeterminate end state.
+#
+# All done!
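The examples above end sessions in slightly different ways: the notebooks pass the bare string "Success" to agentops.end_session, the recorded fireworks run logs `Invalid end_state. Please use one of the EndState enums`, and the style patch that follows settles on `EndState.SUCCESS.value`. A minimal sketch of that last pattern, assuming the `agentops.start_session()` / `Session.end_session()` API and the stats keys (`llm_calls`, `duration`, `cost`) exactly as the example cells use them; treat it as illustrative rather than canonical:

import agentops
from agentops.enums import EndState

agentops.init(api_key=None, default_tags=["fireworks-example"])  # None keeps local development mode, as above
session = agentops.start_session()
try:
    # ... run the streaming and non-streaming completions against this session ...
    session_stats = session.end_session(
        end_state=EndState.SUCCESS.value,  # the .value form used by the style patch below
        end_state_reason="Successfully generated stories.",
    )
    if isinstance(session_stats, dict):
        print(f"Total LLM calls: {session_stats.get('llm_calls', 0)}")
        print(f"Total duration: {session_stats.get('duration', 0):.2f}s")
        print(f"Total cost: ${session_stats.get('cost', 0):.4f}")
    print(f"Session URL: {session.session_url}")
except Exception as exc:
    # the failure path in fireworks_example.py below passes the bare enum instead
    session.end_session(end_state=EndState.FAIL, end_state_reason=str(exc))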
From 566ced9b55e9feefcceceaff66fe9f6bc070d23b Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 02:48:09 +0000 Subject: [PATCH 06/22] style: Fix formatting issues and add noqa for E402 Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 46 ++++++---- .../fireworks_examples/create_notebook.py | 77 ++++++----------- .../fireworks_examples/fireworks_example.py | 25 ++---- .../fireworks_examples/update_notebook.py | 34 ++++++-- examples/openai_examples/create_notebook.py | 84 ++++++------------- .../openai_examples/openai_example_sync.py | 15 ++-- 6 files changed, 122 insertions(+), 159 deletions(-) diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index c5ad31ec..93577b52 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -9,6 +9,7 @@ logger = logging.getLogger(__name__) + class FireworksProvider(InstrumentedProvider): """Provider for Fireworks.ai API.""" @@ -33,13 +34,18 @@ def handle_response(self, response, kwargs, init_timestamp, session: Optional[Se try: # Handle streaming response - if kwargs.get('stream', False): + if kwargs.get("stream", False): + async def async_generator(stream): async for chunk in stream: try: # Parse the chunk data - if hasattr(chunk, 'choices') and chunk.choices: - content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, 'content') else None + if hasattr(chunk, "choices") and chunk.choices: + content = ( + chunk.choices[0].delta.content + if hasattr(chunk.choices[0].delta, "content") + else None + ) else: # Handle raw string chunks from streaming response content = chunk @@ -50,12 +56,12 @@ async def async_generator(stream): event_type=EventType.LLM.value, init_timestamp=init_timestamp, end_timestamp=get_ISO_time(), - model=kwargs.get('model', 'unknown'), - prompt=str(kwargs.get('messages', [])), + model=kwargs.get("model", "unknown"), + prompt=str(kwargs.get("messages", [])), completion="[Streaming Response]", prompt_tokens=0, completion_tokens=0, - cost=0.0 + cost=0.0, ) if self._session: self._session.record(event) @@ -69,8 +75,12 @@ def generator(stream): for chunk in stream: try: # Parse the chunk data - if hasattr(chunk, 'choices') and chunk.choices: - content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, 'content') else None + if hasattr(chunk, "choices") and chunk.choices: + content = ( + chunk.choices[0].delta.content + if hasattr(chunk.choices[0].delta, "content") + else None + ) else: # Handle raw string chunks from streaming response content = chunk @@ -81,12 +91,12 @@ def generator(stream): event_type=EventType.LLM.value, init_timestamp=init_timestamp, end_timestamp=get_ISO_time(), - model=kwargs.get('model', 'unknown'), - prompt=str(kwargs.get('messages', [])), + model=kwargs.get("model", "unknown"), + prompt=str(kwargs.get("messages", [])), completion="[Streaming Response]", prompt_tokens=0, completion_tokens=0, - cost=0.0 + cost=0.0, ) if self._session: self._session.record(event) @@ -96,26 +106,26 @@ def generator(stream): logger.error(f"Error processing streaming chunk: {str(e)}") continue - if hasattr(response, '__aiter__'): + if hasattr(response, "__aiter__"): return async_generator(response) else: return generator(response) # Handle non-streaming response - if hasattr(response, 'choices') and response.choices: - content = response.choices[0].message.content if hasattr(response.choices[0], 'message') else "" + if 
hasattr(response, "choices") and response.choices: + content = response.choices[0].message.content if hasattr(response.choices[0], "message") else "" # Create event data for non-streaming response event = LLMEvent( event_type=EventType.LLM.value, init_timestamp=init_timestamp, end_timestamp=get_ISO_time(), - model=kwargs.get('model', 'unknown'), - prompt=str(kwargs.get('messages', [])), + model=kwargs.get("model", "unknown"), + prompt=str(kwargs.get("messages", [])), completion=content, prompt_tokens=0, completion_tokens=0, - cost=0.0 + cost=0.0, ) if self._session: self._session.record(event) @@ -133,7 +143,7 @@ def override(self): # Store original methods self._original_completion = self.client.chat.completions.create - self._original_async_completion = getattr(self.client.chat.completions, 'acreate', None) + self._original_async_completion = getattr(self.client.chat.completions, "acreate", None) # Override methods self._override_fireworks_completion() diff --git a/examples/fireworks_examples/create_notebook.py b/examples/fireworks_examples/create_notebook.py index a9017717..1ff57056 100644 --- a/examples/fireworks_examples/create_notebook.py +++ b/examples/fireworks_examples/create_notebook.py @@ -11,119 +11,92 @@ "The chatbot will use the Llama-v3 LLM to generate the story using a user prompt.\n\n" "We will track the chatbot with AgentOps and see how it performs!" ), - nbf.v4.new_markdown_cell("First let's install the required packages"), - - nbf.v4.new_code_cell( - "%pip install -U fireworks-ai\n" - "%pip install -U agentops" - ), - + nbf.v4.new_code_cell("%pip install -U fireworks-ai\n" "%pip install -U agentops"), nbf.v4.new_markdown_cell("Then import them"), - nbf.v4.new_code_cell( - "from fireworks.client import Fireworks\n" - "import agentops\n" - "import os\n" - "from dotenv import load_dotenv" + "from fireworks.client import Fireworks\n" "import agentops\n" "import os\n" "from dotenv import load_dotenv" ), - nbf.v4.new_markdown_cell( "Next, we'll grab our API keys. You can use dotenv like below or " "however else you like to load environment variables" ), - nbf.v4.new_code_cell( - 'load_dotenv()\n' + "load_dotenv()\n" 'FIREWORKS_API_KEY = os.getenv("FIREWORKS_API_KEY") or ""\n' 'AGENTOPS_API_KEY = os.getenv("AGENTOPS_API_KEY") or ""' ), - nbf.v4.new_markdown_cell("Next we initialize the AgentOps client."), - nbf.v4.new_code_cell( 'agentops.init(AGENTOPS_API_KEY, default_tags=["fireworks-example"])\n' 'print("AgentOps initialized. Check the session URL above for tracking.")' ), - nbf.v4.new_markdown_cell( "And we are all set! Note the session url above. We will use it to track the chatbot.\n\n" "Let's create a simple chatbot that generates stories." 
), - nbf.v4.new_code_cell( - 'client = Fireworks(api_key=FIREWORKS_API_KEY)\n\n' + "client = Fireworks(api_key=FIREWORKS_API_KEY)\n\n" 'system_prompt = """\n' - 'You are a master storyteller, with the ability to create vivid and engaging stories.\n' - 'You have experience in writing for children and adults alike.\n' - 'You are given a prompt and you need to generate a story based on the prompt.\n' + "You are a master storyteller, with the ability to create vivid and engaging stories.\n" + "You have experience in writing for children and adults alike.\n" + "You are given a prompt and you need to generate a story based on the prompt.\n" '"""\n\n' 'user_prompt = "Write a story about a cyber-warrior trapped in the imperial time period."\n\n' - 'messages = [\n' + "messages = [\n" ' {"role": "system", "content": system_prompt},\n' ' {"role": "user", "content": user_prompt},\n' - ']' + "]" ), - nbf.v4.new_code_cell( 'print("Generating story with Fireworks LLM...")\n' - 'response = client.chat.completions.create(\n' + "response = client.chat.completions.create(\n" ' model="accounts/fireworks/models/llama-v3p1-8b-instruct",\n' - ' messages=messages,\n' - ')\n\n' + " messages=messages,\n" + ")\n\n" 'print("\\nLLM Response:")\n' - 'print(response.choices[0].message.content)\n' + "print(response.choices[0].message.content)\n" 'print("\\nCheck the AgentOps dashboard to see the tracked LLM event.")' ), - nbf.v4.new_markdown_cell( "The response is a string that contains the story. We can track this with AgentOps " "by navigating to the session url and viewing the run.\n\n" "## Streaming Version\n" "We will demonstrate the streaming version of the API." ), - nbf.v4.new_code_cell( 'print("Generating story with streaming enabled...")\n' - 'stream = client.chat.completions.create(\n' + "stream = client.chat.completions.create(\n" ' model="accounts/fireworks/models/llama-v3p1-8b-instruct",\n' - ' messages=messages,\n' - ' stream=True,\n' - ')\n\n' + " messages=messages,\n" + " stream=True,\n" + ")\n\n" 'print("\\nStreaming LLM Response:")\n' - 'for chunk in stream:\n' + "for chunk in stream:\n" ' print(chunk.choices[0].delta.content or "", end="")\n' 'print("\\n\\nCheck the AgentOps dashboard to see the tracked streaming LLM event.")' ), - nbf.v4.new_markdown_cell( "Note that the response is a generator that yields chunks of the story. " "We can track this with AgentOps by navigating to the session url and viewing the run." ), - nbf.v4.new_code_cell( - 'agentops.end_session(end_state="Success", ' - 'end_state_reason="The story was generated successfully.")' + 'agentops.end_session(end_state="Success", ' 'end_state_reason="The story was generated successfully.")' ), - nbf.v4.new_markdown_cell( "We end the session with a success state and a success reason. This is useful if you " "want to track the success or failure of the chatbot. In that case you can set the " "end state to failure and provide a reason. By default the session will have an " "indeterminate end state.\n\n" "All done!" 
- ) + ), ] nb.cells = cells # Set the notebook metadata nb.metadata = { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, + "kernelspec": {"display_name": "Python 3", "language": "python", "name": "python3"}, "language_info": { "codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", @@ -131,11 +104,11 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.12" - } + "version": "3.12", + }, } # Write the notebook -notebook_path = os.path.join(os.path.dirname(__file__), 'fireworks_example.ipynb') -with open(notebook_path, 'w') as f: +notebook_path = os.path.join(os.path.dirname(__file__), "fireworks_example.ipynb") +with open(notebook_path, "w") as f: nbf.write(nb, f) diff --git a/examples/fireworks_examples/fireworks_example.py b/examples/fireworks_examples/fireworks_example.py index 37916ecd..357138b1 100644 --- a/examples/fireworks_examples/fireworks_example.py +++ b/examples/fireworks_examples/fireworks_example.py @@ -12,8 +12,8 @@ # Set up logging logging.basicConfig( level=logging.DEBUG, # Change to DEBUG to see more detailed output - format='%(asctime)s - %(name)s - %(levelname)s - %(message)s', - handlers=[logging.StreamHandler()] + format="%(asctime)s - %(name)s - %(levelname)s - %(message)s", + handlers=[logging.StreamHandler()], ) logger = logging.getLogger(__name__) @@ -45,14 +45,13 @@ # Set up messages for story generation messages = [ {"role": "system", "content": "You are a creative storyteller."}, - {"role": "user", "content": "Write a short story about a cyber-warrior trapped in the imperial era."} + {"role": "user", "content": "Write a short story about a cyber-warrior trapped in the imperial era."}, ] # Test non-streaming completion print("Generating story with Fireworks LLM...") response = client.chat.completions.create( - model="accounts/fireworks/models/llama-v3p1-8b-instruct", - messages=messages + model="accounts/fireworks/models/llama-v3p1-8b-instruct", messages=messages ) print("\nLLM Response:") print(response.choices[0].message.content) @@ -63,15 +62,13 @@ # Test streaming completion print("\nGenerating story with streaming enabled...") stream = client.chat.completions.create( - model="accounts/fireworks/models/llama-v3p1-8b-instruct", - messages=messages, - stream=True + model="accounts/fireworks/models/llama-v3p1-8b-instruct", messages=messages, stream=True ) print("\nStreaming LLM Response:") for chunk in stream: try: - if hasattr(chunk, 'choices') and chunk.choices and hasattr(chunk.choices[0].delta, 'content'): + if hasattr(chunk, "choices") and chunk.choices and hasattr(chunk.choices[0].delta, "content"): content = chunk.choices[0].delta.content else: content = chunk @@ -88,7 +85,7 @@ try: session_stats = session.end_session( end_state=EndState.SUCCESS.value, # Use .value to get the enum value - end_state_reason="Successfully generated stories using both streaming and non-streaming modes." 
+ end_state_reason="Successfully generated stories using both streaming and non-streaming modes.", ) print("\nSession Statistics:") if isinstance(session_stats, dict): @@ -102,16 +99,12 @@ except Exception as e: logger.error(f"An error occurred: {str(e)}", exc_info=True) - if 'session' in locals(): + if "session" in locals(): try: - session.end_session( - end_state=EndState.FAIL, - end_state_reason=f"Error occurred: {str(e)}" - ) + session.end_session(end_state=EndState.FAIL, end_state_reason=f"Error occurred: {str(e)}") except Exception as end_error: logger.error(f"Error ending session: {str(end_error)}", exc_info=True) raise finally: print("\nScript execution completed.") - diff --git a/examples/fireworks_examples/update_notebook.py b/examples/fireworks_examples/update_notebook.py index 6d02a096..63957fb0 100644 --- a/examples/fireworks_examples/update_notebook.py +++ b/examples/fireworks_examples/update_notebook.py @@ -7,7 +7,9 @@ cells = [] # Cell 1: Imports and initialization -cells.append(nbf.v4.new_code_cell(''' +cells.append( + nbf.v4.new_code_cell( + """ import os from dotenv import load_dotenv from fireworks.client import Fireworks @@ -38,10 +40,14 @@ {"role": "system", "content": "You are a creative storyteller."}, {"role": "user", "content": "Write a short story about a cyber-warrior trapped in the imperial era."} ] -''')) +""" + ) +) # Cell 2: Non-streaming completion -cells.append(nbf.v4.new_code_cell(''' +cells.append( + nbf.v4.new_code_cell( + """ # Test non-streaming completion print("Generating story with Fireworks LLM...") response = client.chat.completions.create( @@ -52,10 +58,14 @@ print(response.choices[0].message.content) print("\\nEvent tracking details:") print(f"Session URL: {session.session_url}") -''')) +""" + ) +) # Cell 3: Streaming completion -cells.append(nbf.v4.new_code_cell(''' +cells.append( + nbf.v4.new_code_cell( + """ # Test streaming completion print("\\nGenerating story with streaming enabled...") stream = client.chat.completions.create( @@ -70,10 +80,14 @@ print(chunk.choices[0].delta.content, end="") print("\\n\\nEvent tracking details:") print(f"Session URL: {session.session_url}") -''')) +""" + ) +) # Cell 4: End session with detailed stats -cells.append(nbf.v4.new_code_cell(''' +cells.append( + nbf.v4.new_code_cell( + """ # End session and show detailed stats print("\\nEnding AgentOps session...") try: @@ -92,12 +106,14 @@ except Exception as e: print(f"Error ending session: {str(e)}") print("Session URL for debugging:", session.session_url) -''')) +""" + ) +) # Add cells to notebook nb.cells = cells # Write the notebook -with open('fireworks_example.ipynb', 'w') as f: +with open("fireworks_example.ipynb", "w") as f: nbf.write(nb, f) diff --git a/examples/openai_examples/create_notebook.py b/examples/openai_examples/create_notebook.py index 5eb25d53..592611f8 100644 --- a/examples/openai_examples/create_notebook.py +++ b/examples/openai_examples/create_notebook.py @@ -11,114 +11,84 @@ "The chatbot will use GPT-3.5-turbo to generate stories based on user prompts.\n\n" "We will track the chatbot with AgentOps and see how it performs!" 
), - nbf.v4.new_markdown_cell("First let's install the required packages"), - - nbf.v4.new_code_cell( - "%pip install -U openai\n" - "%pip install -U agentops\n" - "%pip install -U python-dotenv" - ), - + nbf.v4.new_code_cell("%pip install -U openai\n" "%pip install -U agentops\n" "%pip install -U python-dotenv"), nbf.v4.new_markdown_cell("Then import them"), - nbf.v4.new_code_cell( - "from openai import OpenAI\n" - "import agentops\n" - "import os\n" - "from dotenv import load_dotenv" + "from openai import OpenAI\n" "import agentops\n" "import os\n" "from dotenv import load_dotenv" ), - nbf.v4.new_markdown_cell( "Next, we'll grab our API keys. You can use dotenv like below or " "however else you like to load environment variables" ), - nbf.v4.new_code_cell( - 'load_dotenv()\n' + "load_dotenv()\n" 'OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")\n' 'AGENTOPS_API_KEY = os.getenv("AGENTOPS_API_KEY")' ), - nbf.v4.new_markdown_cell("Next we initialize the AgentOps client."), - - nbf.v4.new_code_cell( - 'agentops.init(AGENTOPS_API_KEY, default_tags=["story-generation-example"])' - ), - + nbf.v4.new_code_cell('agentops.init(AGENTOPS_API_KEY, default_tags=["story-generation-example"])'), nbf.v4.new_markdown_cell( "And we are all set! Note the session url above. We will use it to track the chatbot.\n\n" "Let's create a simple chatbot that generates stories." ), - nbf.v4.new_code_cell( - 'client = OpenAI(api_key=OPENAI_API_KEY)\n\n' + "client = OpenAI(api_key=OPENAI_API_KEY)\n\n" 'system_prompt = """\n' - 'You are a master storyteller, with the ability to create vivid and engaging stories.\n' - 'You have experience in writing for children and adults alike.\n' - 'You are given a prompt and you need to generate a story based on the prompt.\n' + "You are a master storyteller, with the ability to create vivid and engaging stories.\n" + "You have experience in writing for children and adults alike.\n" + "You are given a prompt and you need to generate a story based on the prompt.\n" '"""\n\n' 'user_prompt = "Write a story about a cyber-warrior trapped in the imperial time period."\n\n' - 'messages = [\n' + "messages = [\n" ' {"role": "system", "content": system_prompt},\n' ' {"role": "user", "content": user_prompt},\n' - ']' + "]" ), - nbf.v4.new_code_cell( - 'response = client.chat.completions.create(\n' + "response = client.chat.completions.create(\n" ' model="gpt-3.5-turbo",\n' - ' messages=messages,\n' - ')\n\n' - 'print(response.choices[0].message.content)' + " messages=messages,\n" + ")\n\n" + "print(response.choices[0].message.content)" ), - nbf.v4.new_markdown_cell( "The response is a string that contains the story. We can track this with AgentOps " "by navigating to the session url and viewing the run.\n\n" "## Streaming Version\n" "We will demonstrate the streaming version of the API." ), - nbf.v4.new_code_cell( - 'stream = client.chat.completions.create(\n' + "stream = client.chat.completions.create(\n" ' model="gpt-3.5-turbo",\n' - ' messages=messages,\n' - ' stream=True,\n' - ')\n\n' - 'for chunk in stream:\n' - ' if chunk.choices[0].delta.content is not None:\n' + " messages=messages,\n" + " stream=True,\n" + ")\n\n" + "for chunk in stream:\n" + " if chunk.choices[0].delta.content is not None:\n" ' print(chunk.choices[0].delta.content, end="")' ), - nbf.v4.new_markdown_cell( "Note that the response is a generator that yields chunks of the story. " "We can track this with AgentOps by navigating to the session url and viewing the run." 
),
-    nbf.v4.new_code_cell(
-        'agentops.end_session(end_state="Success", '
-        'end_state_reason="The story was generated successfully.")'
+        'agentops.end_session(end_state="Success", ' 'end_state_reason="The story was generated successfully.")'
     ),
-
     nbf.v4.new_markdown_cell(
         "We end the session with a success state and a success reason. This is useful if you "
         "want to track the success or failure of the chatbot. In that case you can set the "
         "end state to failure and provide a reason. By default the session will have an "
         "indeterminate end state.\n\n"
         "All done!"
-    )
+    ),
 ]
 
 nb.cells = cells
 
 # Set the notebook metadata
 nb.metadata = {
-    "kernelspec": {
-        "display_name": "Python 3",
-        "language": "python",
-        "name": "python3"
-    },
+    "kernelspec": {"display_name": "Python 3", "language": "python", "name": "python3"},
     "language_info": {
         "codemirror_mode": {"name": "ipython", "version": 3},
         "file_extension": ".py",
@@ -126,14 +96,14 @@
         "name": "python",
         "nbconvert_exporter": "python",
         "pygments_lexer": "ipython3",
-        "version": "3.12"
-    }
+        "version": "3.12",
+    },
 }
 
 # Create the directory if it doesn't exist
 os.makedirs(os.path.dirname(__file__), exist_ok=True)
 
 # Write the notebook
-notebook_path = os.path.join(os.path.dirname(__file__), 'openai_example.ipynb')
-with open(notebook_path, 'w') as f:
+notebook_path = os.path.join(os.path.dirname(__file__), "openai_example.ipynb")
+with open(notebook_path, "w") as f:
     nbf.write(nb, f)
diff --git a/examples/openai_examples/openai_example_sync.py b/examples/openai_examples/openai_example_sync.py
index 44640ae6..47900ce7 100644
--- a/examples/openai_examples/openai_example_sync.py
+++ b/examples/openai_examples/openai_example_sync.py
@@ -2,9 +2,9 @@
 # coding: utf-8
 
 # # OpenAI Sync Example
-# 
+#
 # We are going to create a simple chatbot that creates stories based on a prompt. The chatbot will use the gpt-4o-mini LLM to generate the story using a user prompt.
-# 
+#
 # We will track the chatbot with AgentOps and see how it performs!
 
 # First let's install the required packages
 
 # In[ ]:
 
-get_ipython().run_line_magic('pip', 'install -U openai')
-get_ipython().run_line_magic('pip', 'install -U agentops')
+get_ipython().run_line_magic("pip", "install -U openai")
+get_ipython().run_line_magic("pip", "install -U agentops")
 
 # Then import them
 
 # In[1]:
 
+# ruff: noqa: E402
 from openai import OpenAI
 import agentops
 import os
@@ -46,7 +47,7 @@
 
 # And we are all set! Note the session url above. We will use it to track the chatbot.
-# 
+#
 # Let's create a simple chatbot that generates stories.
 
 # In[4]:
@@ -94,7 +95,7 @@
 )
 
 for chunk in stream:
-    print(chunk.choices[0].delta.content or "", end="")
+    print(chunk.choices[0].delta.content or "", end="")
 
 # Note that the response is a generator that yields chunks of the story. We can track this with AgentOps by navigating to the session url and viewing the run.
 
@@ -106,5 +107,5 @@
 
 # We end the session with a success state and a success reason. This is useful if you want to track the success or failure of the chatbot. In that case you can set the end state to failure and provide a reason. By default the session will have an indeterminate end state.
-# 
+#
 # All done!
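[Editor's note] The notebook-generation scripts patched above (update_notebook.py, create_notebook.py) all follow the same nbformat recipe: build cell objects, attach them to a fresh notebook object, then serialize with nbf.write. A minimal, self-contained sketch of that recipe follows; the cell contents and output filename here are illustrative placeholders, not strings taken from the patches.

    import nbformat as nbf

    # Start from an empty v4 notebook and attach cells in order.
    nb = nbf.v4.new_notebook()
    nb.cells = [
        nbf.v4.new_markdown_cell("# Example notebook"),            # prose cell
        nbf.v4.new_code_cell('print("hello from a generated cell")'),  # code cell
    ]

    # nbf.write handles the notebook JSON schema and nbformat version.
    with open("example.ipynb", "w") as f:
        nbf.write(nb, f)

The patched scripts differ from this sketch only in scale: they append many cells and set nb.metadata (kernelspec, language_info) explicitly before writing.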
From 8c8fa3634a55106863e9a51213ca8fa4536fd435 Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 04:42:15 +0000 Subject: [PATCH 07/22] fix: Improve prompt formatting and streaming event handling Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 77 ++++++++++--------- .../fireworks_examples/fireworks_example.py | 26 ++++--- 2 files changed, 54 insertions(+), 49 deletions(-) diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index 93577b52..1c87d9df 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -19,6 +19,7 @@ def __init__(self, client): self._original_completion = None self._original_async_completion = None self._session = None # Initialize session attribute + self._accumulated_content = "" # Add accumulator for streaming responses logger.info(f"Initializing {self._provider_name} provider") def set_session(self, session: Session): @@ -33,13 +34,28 @@ def handle_response(self, response, kwargs, init_timestamp, session: Optional[Se logger.debug(f"Updated session to {session.session_id} for {self._provider_name} provider") try: + # Format prompt properly + messages = kwargs.get("messages", []) + formatted_prompt = "\n".join([f"{msg['role']}: {msg['content']}" for msg in messages]) + logger.debug(f"Formatted prompt: {formatted_prompt}") + # Handle streaming response if kwargs.get("stream", False): + # Create single LLMEvent for streaming response + stream_event = LLMEvent( + event_type=EventType.LLM.value, + init_timestamp=init_timestamp, + model=kwargs.get("model", "unknown"), + prompt=formatted_prompt, + prompt_tokens=0, + completion_tokens=0, + cost=0.0, + ) async def async_generator(stream): + self._accumulated_content = "" async for chunk in stream: try: - # Parse the chunk data if hasattr(chunk, "choices") and chunk.choices: content = ( chunk.choices[0].delta.content @@ -47,34 +63,26 @@ async def async_generator(stream): else None ) else: - # Handle raw string chunks from streaming response content = chunk if content: - # Create event data for streaming chunk - event = LLMEvent( - event_type=EventType.LLM.value, - init_timestamp=init_timestamp, - end_timestamp=get_ISO_time(), - model=kwargs.get("model", "unknown"), - prompt=str(kwargs.get("messages", [])), - completion="[Streaming Response]", - prompt_tokens=0, - completion_tokens=0, - cost=0.0, - ) - if self._session: - self._session.record(event) - logger.debug(f"Recorded streaming chunk for session {self._session.session_id}") + self._accumulated_content += content + # Record event only when we have the complete response + if hasattr(chunk.choices[0], "finish_reason") and chunk.choices[0].finish_reason: + stream_event.completion = self._accumulated_content + stream_event.end_timestamp = get_ISO_time() + if self._session: + self._session.record(stream_event) + logger.debug(f"Recorded streaming response for session {self._session.session_id}") yield content except Exception as e: logger.error(f"Error processing streaming chunk: {str(e)}") continue def generator(stream): + self._accumulated_content = "" for chunk in stream: try: - # Parse the chunk data if hasattr(chunk, "choices") and chunk.choices: content = ( chunk.choices[0].delta.content @@ -82,25 +90,17 @@ def generator(stream): else None ) else: - # Handle raw string chunks from streaming response content = chunk if content: - # Create event data for streaming chunk - event = LLMEvent( - 
event_type=EventType.LLM.value, - init_timestamp=init_timestamp, - end_timestamp=get_ISO_time(), - model=kwargs.get("model", "unknown"), - prompt=str(kwargs.get("messages", [])), - completion="[Streaming Response]", - prompt_tokens=0, - completion_tokens=0, - cost=0.0, - ) - if self._session: - self._session.record(event) - logger.debug(f"Recorded streaming chunk for session {self._session.session_id}") + self._accumulated_content += content + # Record event only when we have the complete response + if hasattr(chunk.choices[0], "finish_reason") and chunk.choices[0].finish_reason: + stream_event.completion = self._accumulated_content + stream_event.end_timestamp = get_ISO_time() + if self._session: + self._session.record(stream_event) + logger.debug(f"Recorded streaming response for session {self._session.session_id}") yield content except Exception as e: logger.error(f"Error processing streaming chunk: {str(e)}") @@ -115,20 +115,21 @@ def generator(stream): if hasattr(response, "choices") and response.choices: content = response.choices[0].message.content if hasattr(response.choices[0], "message") else "" - # Create event data for non-streaming response - event = LLMEvent( + # Create LLMEvent for non-streaming response + non_stream_event = LLMEvent( event_type=EventType.LLM.value, init_timestamp=init_timestamp, end_timestamp=get_ISO_time(), model=kwargs.get("model", "unknown"), - prompt=str(kwargs.get("messages", [])), + prompt=formatted_prompt, completion=content, prompt_tokens=0, completion_tokens=0, cost=0.0, ) + if self._session: - self._session.record(event) + self._session.record(non_stream_event) logger.debug(f"Recorded non-streaming response for session {self._session.session_id}") return response diff --git a/examples/fireworks_examples/fireworks_example.py b/examples/fireworks_examples/fireworks_example.py index 357138b1..bfeb2c7a 100644 --- a/examples/fireworks_examples/fireworks_example.py +++ b/examples/fireworks_examples/fireworks_example.py @@ -11,7 +11,7 @@ # Set up logging logging.basicConfig( - level=logging.DEBUG, # Change to DEBUG to see more detailed output + level=logging.DEBUG, # Set to DEBUG to see formatted prompt format="%(asctime)s - %(name)s - %(levelname)s - %(message)s", handlers=[logging.StreamHandler()], ) @@ -25,9 +25,11 @@ raise ValueError("FIREWORKS_API_KEY environment variable is not set") try: - # Initialize AgentOps in development mode - print("Initializing AgentOps in development mode...") - session = agentops.init(api_key=None) + # Initialize AgentOps client and start session + print("Initializing AgentOps client...") + ao_client = agentops.Client() + ao_client.initialize() + session = ao_client.start_session() print(f"AgentOps initialized. 
Session URL: {session.session_url}") # Initialize Fireworks client @@ -38,7 +40,7 @@ # Initialize and register Fireworks provider print("Registering Fireworks provider...") provider = FireworksProvider(client) - provider.set_session(session) # Set the session before overriding + provider.set_session(session) provider.override() print("Fireworks provider registered.") @@ -83,14 +85,15 @@ # End session and show detailed stats print("\nEnding AgentOps session...") try: - session_stats = session.end_session( - end_state=EndState.SUCCESS.value, # Use .value to get the enum value - end_state_reason="Successfully generated stories using both streaming and non-streaming modes.", - ) + session_stats = session.end_session(end_state="Success") print("\nSession Statistics:") if isinstance(session_stats, dict): - for key, value in session_stats.items(): - print(f"{key}: {value}") + print(f"Duration: {session_stats.get('Duration', 'N/A')}") + print(f"Cost: ${float(session_stats.get('Cost', 0.00)):.2f}") # Convert to float before formatting + print(f"LLM Events: {session_stats.get('LLM calls', 0)}") + print(f"Tool Events: {session_stats.get('Tool calls', 0)}") + print(f"Action Events: {session_stats.get('Actions', 0)}") + print(f"Error Events: {session_stats.get('Errors', 0)}") else: print("No session statistics available") except Exception as e: @@ -108,3 +111,4 @@ finally: print("\nScript execution completed.") + From bb3b056e3e439b1e04a2827a16f765978d52548d Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 04:45:05 +0000 Subject: [PATCH 08/22] refactor: Update end_session to return detailed statistics Co-Authored-By: Alex Reibman --- agentops/client.py | 14 ++++++-------- agentops/session.py | 10 ++++++---- 2 files changed, 12 insertions(+), 12 deletions(-) diff --git a/agentops/client.py b/agentops/client.py index fb3e1793..a4814fb6 100644 --- a/agentops/client.py +++ b/agentops/client.py @@ -15,7 +15,7 @@ import traceback from decimal import Decimal from functools import cached_property -from typing import List, Optional, Tuple, Union +from typing import Any, Dict, List, Optional, Set, Tuple, Union from uuid import UUID, uuid4 from termcolor import colored @@ -247,7 +247,7 @@ def end_session( end_state_reason: Optional[str] = None, video: Optional[str] = None, is_auto_end: Optional[bool] = None, - ) -> Optional[Decimal]: + ) -> Optional[Dict[str, Any]]: """ End the current session with the AgentOps service. @@ -258,17 +258,15 @@ def end_session( is_auto_end (bool, optional): is this an automatic use of end_session and should be skipped with skip_auto_end_session Returns: - Decimal: The token cost of the session. Returns 0 if the cost is unknown. + Dict[str, Any]: Session statistics including duration, cost, and event counts. 
""" session = self._safe_get_session() if session is None: - return + return None if is_auto_end and self._config.skip_auto_end_session: - return - - token_cost = session.end_session(end_state=end_state, end_state_reason=end_state_reason, video=video) + return None - return token_cost + return session.end_session(end_state=end_state, end_state_reason=end_state_reason, video=video) def create_agent( self, diff --git a/agentops/session.py b/agentops/session.py index 535bc997..69c55ce8 100644 --- a/agentops/session.py +++ b/agentops/session.py @@ -284,7 +284,7 @@ def end_session( end_state: str = "Indeterminate", end_state_reason: Optional[str] = None, video: Optional[str] = None, - ) -> Union[Decimal, None]: + ) -> Union[Dict[str, Any], None]: with self._end_session_lock: if not self.is_running: return None @@ -324,8 +324,9 @@ def end_session( finally: del self._span_processor - # 5. Final session update - if not (analytics_stats := self.get_analytics()): + # 5. Final session update and get analytics + analytics_stats = self.get_analytics() + if not analytics_stats: return None analytics = ( @@ -341,6 +342,7 @@ def end_session( except Exception as e: logger.exception(f"Error during session end: {e}") + return None finally: active_sessions.remove(self) # First thing, get rid of the session @@ -350,7 +352,7 @@ def end_session( "blue", ) ) - return self.token_cost + return analytics_stats def add_tags(self, tags: List[str]) -> None: """ From 26c71cfef227db13921ab53957d390ae1e8a3e2a Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 04:45:30 +0000 Subject: [PATCH 09/22] style: Apply ruff-format changes to improve code formatting Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 8 ++++++-- examples/fireworks_examples/fireworks_example.py | 1 - 2 files changed, 6 insertions(+), 3 deletions(-) diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index 1c87d9df..fdfd11cf 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -73,7 +73,9 @@ async def async_generator(stream): stream_event.end_timestamp = get_ISO_time() if self._session: self._session.record(stream_event) - logger.debug(f"Recorded streaming response for session {self._session.session_id}") + logger.debug( + f"Recorded streaming response for session {self._session.session_id}" + ) yield content except Exception as e: logger.error(f"Error processing streaming chunk: {str(e)}") @@ -100,7 +102,9 @@ def generator(stream): stream_event.end_timestamp = get_ISO_time() if self._session: self._session.record(stream_event) - logger.debug(f"Recorded streaming response for session {self._session.session_id}") + logger.debug( + f"Recorded streaming response for session {self._session.session_id}" + ) yield content except Exception as e: logger.error(f"Error processing streaming chunk: {str(e)}") diff --git a/examples/fireworks_examples/fireworks_example.py b/examples/fireworks_examples/fireworks_example.py index bfeb2c7a..6243a4cb 100644 --- a/examples/fireworks_examples/fireworks_example.py +++ b/examples/fireworks_examples/fireworks_example.py @@ -111,4 +111,3 @@ finally: print("\nScript execution completed.") - From 68b276e44e368ec9f94a36ef1b62947a7896042c Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 19:26:47 +0000 Subject: [PATCH 10/22] fix: Improve prompt formatting and streaming event handling 
Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 36 ++++++++++++++-------------- 1 file changed, 18 insertions(+), 18 deletions(-) diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index fdfd11cf..4677c1ca 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -19,7 +19,8 @@ def __init__(self, client): self._original_completion = None self._original_async_completion = None self._session = None # Initialize session attribute - self._accumulated_content = "" # Add accumulator for streaming responses + self._accumulated_content = "" # Track accumulated content for streaming + self._init_timestamp = None # Track stream start time logger.info(f"Initializing {self._provider_name} provider") def set_session(self, session: Session): @@ -34,10 +35,9 @@ def handle_response(self, response, kwargs, init_timestamp, session: Optional[Se logger.debug(f"Updated session to {session.session_id} for {self._provider_name} provider") try: - # Format prompt properly + # Pass ChatML messages directly to LLMEvent messages = kwargs.get("messages", []) - formatted_prompt = "\n".join([f"{msg['role']}: {msg['content']}" for msg in messages]) - logger.debug(f"Formatted prompt: {formatted_prompt}") + logger.debug(f"Using ChatML messages: {messages}") # Handle streaming response if kwargs.get("stream", False): @@ -46,13 +46,14 @@ def handle_response(self, response, kwargs, init_timestamp, session: Optional[Se event_type=EventType.LLM.value, init_timestamp=init_timestamp, model=kwargs.get("model", "unknown"), - prompt=formatted_prompt, + prompt=messages, # Pass ChatML directly prompt_tokens=0, completion_tokens=0, cost=0.0, ) async def async_generator(stream): + """Handle async streaming response.""" self._accumulated_content = "" async for chunk in stream: try: @@ -67,21 +68,21 @@ async def async_generator(stream): if content: self._accumulated_content += content - # Record event only when we have the complete response + # Only create event when stream is finished if hasattr(chunk.choices[0], "finish_reason") and chunk.choices[0].finish_reason: stream_event.completion = self._accumulated_content stream_event.end_timestamp = get_ISO_time() if self._session: self._session.record(stream_event) - logger.debug( - f"Recorded streaming response for session {self._session.session_id}" - ) + logger.debug(f"Recorded complete streaming response for session {self._session.session_id}") + self._accumulated_content = "" # Reset for next stream yield content except Exception as e: - logger.error(f"Error processing streaming chunk: {str(e)}") - continue + logger.error(f"Error in async streaming: {str(e)}") + raise def generator(stream): + """Handle synchronous streaming response.""" self._accumulated_content = "" for chunk in stream: try: @@ -96,19 +97,18 @@ def generator(stream): if content: self._accumulated_content += content - # Record event only when we have the complete response + # Only create event when stream is finished if hasattr(chunk.choices[0], "finish_reason") and chunk.choices[0].finish_reason: stream_event.completion = self._accumulated_content stream_event.end_timestamp = get_ISO_time() if self._session: self._session.record(stream_event) - logger.debug( - f"Recorded streaming response for session {self._session.session_id}" - ) + logger.debug(f"Recorded complete streaming response for session {self._session.session_id}") + self._accumulated_content = "" # Reset for next stream yield content except Exception as e: - 
logger.error(f"Error processing streaming chunk: {str(e)}") - continue + logger.error(f"Error in sync streaming: {str(e)}") + raise if hasattr(response, "__aiter__"): return async_generator(response) @@ -125,7 +125,7 @@ def generator(stream): init_timestamp=init_timestamp, end_timestamp=get_ISO_time(), model=kwargs.get("model", "unknown"), - prompt=formatted_prompt, + prompt=messages, # Pass ChatML directly completion=content, prompt_tokens=0, completion_tokens=0, From e9a5a34fc78dd55e821274cab1ced77c19b40a15 Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 22:33:21 +0000 Subject: [PATCH 11/22] fix: Update Fireworks provider with proper sync/async handling Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 187 ++++++++---------- .../fireworks_examples/fireworks_example.py | 93 ++++++--- 2 files changed, 149 insertions(+), 131 deletions(-) diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index 4677c1ca..2d4536bc 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -1,4 +1,6 @@ import logging +import time +import asyncio from typing import Optional, AsyncGenerator import pprint from agentops.session import Session @@ -28,131 +30,99 @@ def set_session(self, session: Session): self._session = session logger.debug(f"Set session {session.session_id} for {self._provider_name} provider") - def handle_response(self, response, kwargs, init_timestamp, session: Optional[Session] = None) -> dict: + async def handle_response(self, response, kwargs, init_timestamp, session: Optional[Session] = None) -> dict: """Handle the response from the Fireworks API.""" - if session: - self._session = session - logger.debug(f"Updated session to {session.session_id} for {self._provider_name} provider") - try: + # Use existing session if provided, otherwise use provider's session + current_session = session if session else self._session + if not current_session: + logger.warning("No session available for event tracking") + return response + # Pass ChatML messages directly to LLMEvent messages = kwargs.get("messages", []) logger.debug(f"Using ChatML messages: {messages}") + # Create base LLMEvent + event = LLMEvent( + model=kwargs.get("model", ""), + prompt=messages, # Pass ChatML messages directly + init_timestamp=init_timestamp, + end_timestamp=time.time(), + completion="", # Will be updated for streaming responses + prompt_tokens=0, # Will be updated based on response + completion_tokens=0, + cost=0.0, + ) + # Handle streaming response if kwargs.get("stream", False): - # Create single LLMEvent for streaming response - stream_event = LLMEvent( - event_type=EventType.LLM.value, - init_timestamp=init_timestamp, - model=kwargs.get("model", "unknown"), - prompt=messages, # Pass ChatML directly - prompt_tokens=0, - completion_tokens=0, - cost=0.0, - ) - - async def async_generator(stream): - """Handle async streaming response.""" - self._accumulated_content = "" - async for chunk in stream: - try: + async def async_generator(stream_response): + accumulated_content = "" + try: + async for chunk in stream_response: if hasattr(chunk, "choices") and chunk.choices: - content = ( - chunk.choices[0].delta.content - if hasattr(chunk.choices[0].delta, "content") - else None - ) - else: - content = chunk - - if content: - self._accumulated_content += content - # Only create event when stream is finished - if hasattr(chunk.choices[0], "finish_reason") and 
chunk.choices[0].finish_reason: - stream_event.completion = self._accumulated_content - stream_event.end_timestamp = get_ISO_time() - if self._session: - self._session.record(stream_event) - logger.debug(f"Recorded complete streaming response for session {self._session.session_id}") - self._accumulated_content = "" # Reset for next stream - yield content - except Exception as e: - logger.error(f"Error in async streaming: {str(e)}") - raise - - def generator(stream): - """Handle synchronous streaming response.""" - self._accumulated_content = "" - for chunk in stream: - try: + content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" + if content: + accumulated_content += content + yield chunk + # Update event with final accumulated content + event.completion = accumulated_content + event.end_timestamp = time.time() + if current_session: + current_session.record_event(event) + logger.info("Recorded streaming LLM event") + except Exception as e: + logger.error(f"Error in async_generator: {str(e)}") + raise + + def generator(stream_response): + accumulated_content = "" + try: + for chunk in stream_response: if hasattr(chunk, "choices") and chunk.choices: - content = ( - chunk.choices[0].delta.content - if hasattr(chunk.choices[0].delta, "content") - else None - ) - else: - content = chunk - - if content: - self._accumulated_content += content - # Only create event when stream is finished - if hasattr(chunk.choices[0], "finish_reason") and chunk.choices[0].finish_reason: - stream_event.completion = self._accumulated_content - stream_event.end_timestamp = get_ISO_time() - if self._session: - self._session.record(stream_event) - logger.debug(f"Recorded complete streaming response for session {self._session.session_id}") - self._accumulated_content = "" # Reset for next stream - yield content - except Exception as e: - logger.error(f"Error in sync streaming: {str(e)}") - raise + content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" + if content: + accumulated_content += content + yield chunk + # Update event with final accumulated content + event.completion = accumulated_content + event.end_timestamp = time.time() + if current_session: + current_session.record_event(event) + logger.info("Recorded streaming LLM event") + except Exception as e: + logger.error(f"Error in generator: {str(e)}") + raise if hasattr(response, "__aiter__"): - return async_generator(response) + return async_generator(response) # Return async generator else: - return generator(response) + return generator(response) # Return sync generator # Handle non-streaming response if hasattr(response, "choices") and response.choices: - content = response.choices[0].message.content if hasattr(response.choices[0], "message") else "" - - # Create LLMEvent for non-streaming response - non_stream_event = LLMEvent( - event_type=EventType.LLM.value, - init_timestamp=init_timestamp, - end_timestamp=get_ISO_time(), - model=kwargs.get("model", "unknown"), - prompt=messages, # Pass ChatML directly - completion=content, - prompt_tokens=0, - completion_tokens=0, - cost=0.0, - ) - - if self._session: - self._session.record(non_stream_event) - logger.debug(f"Recorded non-streaming response for session {self._session.session_id}") + event.completion = response.choices[0].message.content + event.end_timestamp = time.time() + if current_session: + current_session.record_event(event) + logger.info("Recorded non-streaming LLM event") return response except Exception as e: - 
logger.error(f"Error handling Fireworks response: {str(e)}") + logger.error(f"Error handling response: {str(e)}") raise def override(self): """Override Fireworks API methods with instrumented versions.""" - logger.info(f"Overriding {self._provider_name} provider methods") - - # Store original methods - self._original_completion = self.client.chat.completions.create - self._original_async_completion = getattr(self.client.chat.completions, "acreate", None) + logger.info("Overriding Fireworks provider methods") + if not self._original_completion: + self._original_completion = self.client.chat.completions.create + self._override_fireworks_completion() - # Override methods - self._override_fireworks_completion() - if self._original_async_completion: + if not self._original_async_completion: + self._original_async_completion = self.client.chat.completions.acreate self._override_fireworks_async_completion() def _override_fireworks_completion(self): @@ -162,9 +132,14 @@ def _override_fireworks_completion(self): def patched_function(*args, **kwargs): try: - init_timestamp = get_ISO_time() + init_timestamp = time.time() response = original_create(*args, **kwargs) - return provider.handle_response(response, kwargs, init_timestamp, provider._session) + if kwargs.get("stream", False): + return provider.handle_response(response, kwargs, init_timestamp, provider._session) + else: + loop = asyncio.new_event_loop() + asyncio.set_event_loop(loop) + return loop.run_until_complete(provider.handle_response(response, kwargs, init_timestamp, provider._session)) except Exception as e: logger.error(f"Error in Fireworks completion: {str(e)}") raise @@ -178,9 +153,13 @@ def _override_fireworks_async_completion(self): async def patched_function(*args, **kwargs): try: - init_timestamp = get_ISO_time() + init_timestamp = time.time() response = await original_acreate(*args, **kwargs) - return provider.handle_response(response, kwargs, init_timestamp, provider._session) + + if kwargs.get("stream", False): + return await provider.handle_response(response, kwargs, init_timestamp, provider._session) + else: + return await provider.handle_response(response, kwargs, init_timestamp, provider._session) except Exception as e: logger.error(f"Error in Fireworks async completion: {str(e)}") raise diff --git a/examples/fireworks_examples/fireworks_example.py b/examples/fireworks_examples/fireworks_example.py index 6243a4cb..968d65ee 100644 --- a/examples/fireworks_examples/fireworks_example.py +++ b/examples/fireworks_examples/fireworks_example.py @@ -3,6 +3,7 @@ import os import logging +import asyncio from fireworks.client import Fireworks import agentops from agentops.enums import EndState @@ -28,9 +29,15 @@ # Initialize AgentOps client and start session print("Initializing AgentOps client...") ao_client = agentops.Client() - ao_client.initialize() + ao_client.initialize() # Initialize before starting session session = ao_client.start_session() + + if not session: + raise RuntimeError("Failed to create AgentOps session") + print(f"AgentOps initialized. Session URL: {session.session_url}") + print("Session ID:", session.session_id) + print("Session tracking enabled:", bool(session)) # Initialize Fireworks client print("Initializing Fireworks client...") @@ -50,52 +57,83 @@ {"role": "user", "content": "Write a short story about a cyber-warrior trapped in the imperial era."}, ] - # Test non-streaming completion - print("Generating story with Fireworks LLM...") + # 1. Test synchronous non-streaming completion + print("\n1. 
Generating story with synchronous non-streaming completion...") response = client.chat.completions.create( model="accounts/fireworks/models/llama-v3p1-8b-instruct", messages=messages ) - print("\nLLM Response:") + print("\nSync Non-streaming Response:") print(response.choices[0].message.content) - print("\nEvent tracking details:") - print(f"Session URL: {session.session_url}") - print("Check the AgentOps dashboard to see the tracked LLM event.") + print("\nEvent recorded for sync non-streaming completion") + + # 2. Test asynchronous non-streaming completion + print("\n2. Generating story with asynchronous non-streaming completion...") + async def async_completion(): + response = await client.chat.completions.acreate( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", messages=messages + ) + print("\nAsync Non-streaming Response:") + print(response.choices[0].message.content) + print("\nEvent recorded for async non-streaming completion") - # Test streaming completion - print("\nGenerating story with streaming enabled...") + asyncio.run(async_completion()) + + # 3. Test synchronous streaming completion + print("\n3. Generating story with synchronous streaming...") stream = client.chat.completions.create( model="accounts/fireworks/models/llama-v3p1-8b-instruct", messages=messages, stream=True ) - print("\nStreaming LLM Response:") - for chunk in stream: - try: + print("\nSync Streaming Response:") + try: + if asyncio.iscoroutine(stream): + stream = asyncio.run(stream) + for chunk in stream: if hasattr(chunk, "choices") and chunk.choices and hasattr(chunk.choices[0].delta, "content"): content = chunk.choices[0].delta.content - else: - content = chunk - if content: - print(content, end="", flush=True) + if content: + print(content, end="", flush=True) + except Exception as e: + logger.error(f"Error processing streaming response: {str(e)}") + print() # New line after streaming + + # 4. Test asynchronous streaming completion + print("\n4. 
Generating story with asynchronous streaming...") + async def async_streaming(): + try: + stream = await client.chat.completions.acreate( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", messages=messages, stream=True + ) + print("\nAsync Streaming Response:") + async for chunk in stream: + if hasattr(chunk, "choices") and chunk.choices and hasattr(chunk.choices[0].delta, "content"): + content = chunk.choices[0].delta.content + if content: + print(content, end="", flush=True) except Exception as e: - logger.error(f"Error processing chunk: {str(e)}") - continue - print("\n\nEvent tracking details:") - print(f"Session URL: {session.session_url}") + logger.error(f"Error in async streaming: {str(e)}") + print() # New line after streaming + + asyncio.run(async_streaming()) # End session and show detailed stats print("\nEnding AgentOps session...") try: - session_stats = session.end_session(end_state="Success") print("\nSession Statistics:") + print(f"Session ID before end: {session.session_id}") # Debug logging + session_stats = session.end_session(end_state=EndState.SUCCESS) + print(f"Session ID after end: {session.session_id}") # Debug logging if isinstance(session_stats, dict): - print(f"Duration: {session_stats.get('Duration', 'N/A')}") - print(f"Cost: ${float(session_stats.get('Cost', 0.00)):.2f}") # Convert to float before formatting - print(f"LLM Events: {session_stats.get('LLM calls', 0)}") - print(f"Tool Events: {session_stats.get('Tool calls', 0)}") - print(f"Action Events: {session_stats.get('Actions', 0)}") - print(f"Error Events: {session_stats.get('Errors', 0)}") + print(f"Duration: {session_stats.get('duration', 'N/A')}") + print(f"Cost: ${float(session_stats.get('cost', 0.00)):.2f}") + print(f"LLM Events: {session_stats.get('llm_events', 0)}") + print(f"Tool Events: {session_stats.get('tool_events', 0)}") + print(f"Action Events: {session_stats.get('action_events', 0)}") + print(f"Error Events: {session_stats.get('error_events', 0)}") + print(f"Session URL: {session.session_url}") # Add session URL to output else: print("No session statistics available") + print("Session URL for debugging:", session.session_url) except Exception as e: print(f"Error ending session: {str(e)}") print("Session URL for debugging:", session.session_url) @@ -111,3 +149,4 @@ finally: print("\nScript execution completed.") + From 0f10f0a9f0a506d78e2f202a1fcc5bc3110562af Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 22:36:26 +0000 Subject: [PATCH 12/22] style: Apply ruff-format changes to improve code formatting Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index 2d4536bc..f8f877b2 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -70,7 +70,7 @@ async def async_generator(stream_response): event.completion = accumulated_content event.end_timestamp = time.time() if current_session: - current_session.record_event(event) + current_session.record(event) logger.info("Recorded streaming LLM event") except Exception as e: logger.error(f"Error in async_generator: {str(e)}") @@ -89,7 +89,7 @@ def generator(stream_response): event.completion = accumulated_content event.end_timestamp = time.time() if current_session: - current_session.record_event(event) + current_session.record(event) logger.info("Recorded 
streaming LLM event") except Exception as e: logger.error(f"Error in generator: {str(e)}") @@ -105,7 +105,7 @@ def generator(stream_response): event.completion = response.choices[0].message.content event.end_timestamp = time.time() if current_session: - current_session.record_event(event) + current_session.record(event) logger.info("Recorded non-streaming LLM event") return response From 9d22c6e69b13b4c8198dce48f4a3e4fe17d053db Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 22:39:32 +0000 Subject: [PATCH 13/22] style: Apply additional ruff-format changes Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 13 ++++++++++--- examples/fireworks_examples/fireworks_example.py | 3 ++- 2 files changed, 12 insertions(+), 4 deletions(-) diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index f8f877b2..fe1b47cf 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -57,12 +57,15 @@ async def handle_response(self, response, kwargs, init_timestamp, session: Optio # Handle streaming response if kwargs.get("stream", False): + async def async_generator(stream_response): accumulated_content = "" try: async for chunk in stream_response: if hasattr(chunk, "choices") and chunk.choices: - content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" + content = ( + chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" + ) if content: accumulated_content += content yield chunk @@ -81,7 +84,9 @@ def generator(stream_response): try: for chunk in stream_response: if hasattr(chunk, "choices") and chunk.choices: - content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" + content = ( + chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" + ) if content: accumulated_content += content yield chunk @@ -139,7 +144,9 @@ def patched_function(*args, **kwargs): else: loop = asyncio.new_event_loop() asyncio.set_event_loop(loop) - return loop.run_until_complete(provider.handle_response(response, kwargs, init_timestamp, provider._session)) + return loop.run_until_complete( + provider.handle_response(response, kwargs, init_timestamp, provider._session) + ) except Exception as e: logger.error(f"Error in Fireworks completion: {str(e)}") raise diff --git a/examples/fireworks_examples/fireworks_example.py b/examples/fireworks_examples/fireworks_example.py index 968d65ee..1376638f 100644 --- a/examples/fireworks_examples/fireworks_example.py +++ b/examples/fireworks_examples/fireworks_example.py @@ -68,6 +68,7 @@ # 2. Test asynchronous non-streaming completion print("\n2. Generating story with asynchronous non-streaming completion...") + async def async_completion(): response = await client.chat.completions.acreate( model="accounts/fireworks/models/llama-v3p1-8b-instruct", messages=messages @@ -99,6 +100,7 @@ async def async_completion(): # 4. Test asynchronous streaming completion print("\n4. 
Generating story with asynchronous streaming...") + async def async_streaming(): try: stream = await client.chat.completions.acreate( @@ -149,4 +151,3 @@ async def async_streaming(): finally: print("\nScript execution completed.") - From a28c0f1e9e1ffeb305eaddbdab2e66aba1146a4d Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 22:56:01 +0000 Subject: [PATCH 14/22] fix: Update notebook to handle async code without cell magic Co-Authored-By: Alex Reibman --- .../fireworks_example.ipynb | 531 ++++++------------ .../fireworks_examples/update_notebook.py | 222 ++++++-- 2 files changed, 338 insertions(+), 415 deletions(-) diff --git a/examples/fireworks_examples/fireworks_example.ipynb b/examples/fireworks_examples/fireworks_example.ipynb index 502b2187..36e8140f 100644 --- a/examples/fireworks_examples/fireworks_example.ipynb +++ b/examples/fireworks_examples/fireworks_example.ipynb @@ -1,424 +1,233 @@ { "cells": [ { - "cell_type": "code", - "execution_count": 1, - "id": "994a2dfc", - "metadata": { - "execution": { - "iopub.execute_input": "2024-12-18T02:08:27.681561Z", - "iopub.status.busy": "2024-12-18T02:08:27.681282Z", - "iopub.status.idle": "2024-12-18T02:08:29.924803Z", - "shell.execute_reply": "2024-12-18T02:08:29.923993Z" - } - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Initializing AgentOps in development mode...\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "🖇 AgentOps: \u001b[34m\u001b[34mSession Replay: https://app.agentops.ai/drilldown?session_id=da7c7323-408b-43b9-a503-d7e0a308818a\u001b[0m\u001b[0m\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Starting new AgentOps session...\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "🖇 AgentOps: \u001b[34m\u001b[34mSession Replay: https://app.agentops.ai/drilldown?session_id=390c35ff-0df4-4953-9d06-d142fec08719\u001b[0m\u001b[0m\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "AgentOps initialized. Session URL: https://app.agentops.ai/drilldown?session_id=390c35ff-0df4-4953-9d06-d142fec08719\n", - "Initializing Fireworks client...\n", - "Fireworks client initialized.\n" - ] - } - ], + "cell_type": "markdown", + "id": "8ce4ef43", + "metadata": {}, "source": [ + "# Fireworks LLM Integration Example\n", "\n", + "This notebook demonstrates the integration of Fireworks LLM with AgentOps, showcasing both synchronous and asynchronous completions with and without streaming. All examples use the same AgentOps session for proper event tracking." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "caeebf2f", + "metadata": {}, + "outputs": [], + "source": [ "import os\n", - "from dotenv import load_dotenv\n", + "import logging\n", + "import asyncio\n", "from fireworks.client import Fireworks\n", "import agentops\n", "from agentops.enums import EndState\n", + "from agentops.llms.providers.fireworks import FireworksProvider\n", + "from dotenv import load_dotenv\n", "\n", + "# Set up logging\n", + "logging.basicConfig(\n", + " level=logging.INFO,\n", + " format=\"%(asctime)s - %(name)s - %(levelname)s - %(message)s\",\n", + " handlers=[logging.StreamHandler()],\n", + ")\n", + "logger = logging.getLogger(__name__)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4fa145da", + "metadata": {}, + "outputs": [], + "source": [ "# Load environment variables\n", "load_dotenv()\n", "FIREWORKS_API_KEY = os.getenv(\"FIREWORKS_API_KEY\")\n", "\n", - "# Initialize AgentOps in development mode\n", - "print(\"Initializing AgentOps in development mode...\")\n", - "agentops.init(\n", - " api_key=None, # None for local development\n", - " default_tags=[\"fireworks-example\"]\n", - ")\n", - "print(\"Starting new AgentOps session...\")\n", - "session = agentops.start_session()\n", - "print(f\"AgentOps initialized. Session URL: {session.session_url}\")\n", + "if not FIREWORKS_API_KEY:\n", + " raise ValueError(\"FIREWORKS_API_KEY environment variable is not set\")\n", + "\n", + "# Initialize AgentOps client and start session\n", + "print(\"\\nInitializing AgentOps client and starting session...\")\n", + "ao_client = agentops.Client()\n", + "ao_client.initialize() # Initialize before starting session\n", + "session = ao_client.start_session()\n", + "\n", + "if not session:\n", + " raise RuntimeError(\"Failed to create AgentOps session\")\n", + "\n", + "print(f\"AgentOps Session URL: {session.session_url}\")\n", + "print(\"Session ID:\", session.session_id)\n", + "print(\"Session tracking enabled:\", bool(session))\n", + "print(\"\\nAll LLM events will be tracked in this session. Watch for event recording messages in the output.\")\n", "\n", "# Initialize Fireworks client\n", - "print(\"Initializing Fireworks client...\")\n", + "print(\"\\nInitializing Fireworks client...\")\n", "client = Fireworks(api_key=FIREWORKS_API_KEY)\n", "print(\"Fireworks client initialized.\")\n", "\n", - "# Set up messages for story generation\n", - "messages = [\n", - " {\"role\": \"system\", \"content\": \"You are a creative storyteller.\"},\n", - " {\"role\": \"user\", \"content\": \"Write a short story about a cyber-warrior trapped in the imperial era.\"}\n", - "]\n" + "# Initialize and register Fireworks provider\n", + "print(\"\\nRegistering Fireworks provider...\")\n", + "provider = FireworksProvider(client)\n", + "provider.set_session(session)\n", + "provider.override()\n", + "print(\"Fireworks provider registered.\")" + ] + }, + { + "cell_type": "markdown", + "id": "62bdbde6", + "metadata": {}, + "source": [ + "## Test Cases\n", + "We'll test four different scenarios:\n", + "1. Synchronous non-streaming completion\n", + "2. Asynchronous non-streaming completion\n", + "3. Synchronous streaming completion\n", + "4. Asynchronous streaming completion\n", + "\n", + "All cases will use the same AgentOps session for event tracking." 
] }, { "cell_type": "code", - "execution_count": 2, - "id": "7f8b75ab", - "metadata": { - "execution": { - "iopub.execute_input": "2024-12-18T02:08:29.927452Z", - "iopub.status.busy": "2024-12-18T02:08:29.927179Z", - "iopub.status.idle": "2024-12-18T02:08:32.272566Z", - "shell.execute_reply": "2024-12-18T02:08:32.271746Z" - } - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Generating story with Fireworks LLM...\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "LLM Response:\n", - "**The Ghost in the Sand**\n", - "\n", - "Akeira crouched behind a crumbling column, her eyes scanning the dusty marketplace for any sign of the enemy. Her sleek, black armor was a stark contrast to the ancient stones and faded awnings of the imperial city. Her breathing was slow and deliberate, a habit honed from years of virtual combat, not the muggy desert air.\n", - "\n", - "\"Target offline,\" her combat comms interrupted, a holographic message flickering to life in front of her. \"Ghost-19, priority threat level: Critical.\"\n", - "\n", - "Akeira's gaze snapped towards the palace at the market's heart, where Emperor Marcus imperiously waved to his subjects from a rooftop balcony. Her finger itched to fire a cyber-warhead at the arrogant leader, but her briefing warned of collateral damage and political fallout. She was forced to play it cool.\n", - "\n", - "\"Affirmative, Ghost-19. Scoping primary target... now.\"\n", - "\n", - "She expertly picked off Imperial Guards one by one, each killing requiring a precise shot, precise control. It was her digital reflexes she relied on, rather than the stifling limitations of a bodily form trapped in a 19th-century prison. Her \"armor\" consisted of heavy pistols, a leather corset, and a woolen mask to conceal her true form – or rather, her digital soul.\n", - "\n", - "The fight spilled into alleys and streets, the clash of steel on steel echoing through the city. Akeira fought in a haze of gunfire and rage, a human proxy for the Empire's digital overreach. She was a specter of war, an anachronism in time.\n", - "\n", - "In a last, desperate bid to escape, Akeira snatched a horse from the marketplace stables and rode towards the city gate. Shots fired at her from above, but her agility and instinct allowed her to weave through the chaos.\n", - "\n", - "Finally, she hit the sand beyond the city walls. Breathing heavily, Akeira ripped off her mask, revealing her cybernetic implants and data-dispersed scalp. She gazed up at the setting sun, a shimmering gold glow that mirrored the digital void she called home.\n", - "\n", - "\"Ghost-19,\" her comms crackled, a digital whisper in her ear. \"Safe extraction protocols initiated... now.\"\n", - "\n", - "The woman-boy hybrid, a cybernetic chimera, swiveled toward the desert, the rising dunes swallowing her whole. 
The Imperium might see her as a renegade, a fugitive to be hunted down, but Akeira knew her world – a world of digital shadows and limitless potential.\n", - "\n", - "Event tracking details:\n", - "Session URL: https://app.agentops.ai/drilldown?session_id=390c35ff-0df4-4953-9d06-d142fec08719\n" - ] - } - ], + "execution_count": null, + "id": "7e1dd8b5", + "metadata": {}, + "outputs": [], "source": [ + "# Set up messages for story generation\n", + "messages = [\n", + " {\"role\": \"system\", \"content\": \"You are a creative storyteller.\"},\n", + " {\"role\": \"user\", \"content\": \"Write a short story about a cyber-warrior trapped in the imperial era.\"},\n", + "]\n", "\n", - "# Test non-streaming completion\n", - "print(\"Generating story with Fireworks LLM...\")\n", + "# 1. Test synchronous non-streaming completion\n", + "print(\"1. Generating story with synchronous non-streaming completion...\")\n", "response = client.chat.completions.create(\n", " model=\"accounts/fireworks/models/llama-v3p1-8b-instruct\",\n", " messages=messages\n", ")\n", - "print(\"\\nLLM Response:\")\n", + "print(\"\\nSync Non-streaming Response:\")\n", "print(response.choices[0].message.content)\n", - "print(\"\\nEvent tracking details:\")\n", - "print(f\"Session URL: {session.session_url}\")\n" + "print(\"\\nEvent recorded for sync non-streaming completion\")" ] }, { "cell_type": "code", - "execution_count": 3, - "id": "a54affac", - "metadata": { - "execution": { - "iopub.execute_input": "2024-12-18T02:08:32.274896Z", - "iopub.status.busy": "2024-12-18T02:08:32.274667Z", - "iopub.status.idle": "2024-12-18T02:08:35.066213Z", - "shell.execute_reply": "2024-12-18T02:08:35.064964Z" - } - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "Generating story with streaming enabled...\n", - "\n", - "Streaming LLM Response:\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "**The" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " Digital Captive**\n", - "\n", - "In the sweltering heat of a Roman sun, Lucius stumbled through the crowded market, his gaze scanning the throngs of pedestrians for any sign of safety. But" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " how could he, a cyber warrior, find" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " solace in this ancient era? His cybernetic limbs, once tailored for stealth and deception in the vast digital expanse of the net, now felt heavy and cumbersome in his tattered imperial attire.\n", - "\n", - "Just" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " hours ago, Lucius had been fighting a grueling skirmish against" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " a cyber-virus, his digits burning with code and adrenaline. Suddenly, a freak anomaly had pulled him through a wormhole, depositing him in the midst of a city that was none other than Rome" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - ", 19 AD. 
The roar of" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " the Colosseum, the clanging of swords, and the murmur of the crowd now mocked him as he struggled to adjust to his new surroundings.\n", - "\n", - "Lucius, born Lucien Laroche in" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " the digital realm of NeoTokyo, had been recruited by the infamous cyber" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "-guerrilla group, Phoenix Rising. They had trained him in the art of digital warfare, exploiting the weaknesses of enemy firewalls and unraveling encrypted systems with ease. But in this alien world, his skills were more" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " hindrance than help.\n", - "\n", - "He spotted a group of legionnaires eyeing him" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " suspiciously, their hand on the hilts of their swords. Lucius knew he couldn't let them see the advanced cyberware embedded in his limbs. He swiftly donned a makeshift disguise, fashioning a toga from a nearby market stall to conceal his bizarre cybernetic appendages.\n", - "\n", - "As" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " the sun began to set over the imperial city, Lucius found himself lost in a labyrinth of narrow alleys. His thoughts wandered back to NeoTokyo, where his comrade, Zara, might be frantically searching for him. The disconnect was almost too much to bear" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - ". He yearned to leap back into the digital realm, feeling like a moth trapped in a flame.\n", - "\n", - "With a furtive eye on the shadows, Lucius navigated the crowded streets, dodging glances from astonished civilians. No one suspected a thing" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "; they assumed him to be just another commoner, bewildered by the vast machinery of the imperial world. As the darkness deepened, Lucius spotted a" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " lone figure lurking in the shadows – a young woman with piercing green eyes, clad in a hooded cloak.\n", - "\n", - "\"Get word to Zara,\" the woman" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " whispered, as she vanished into the darkness. \"Phoenix Rising will come for you. Be ready, Lucien.\"\n", - "\n", - "Though imprisoned in" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " time, Lucien knew his cyber warrior's cry would be heard across the centuries, echoing through the digital expanse, seeking a beacon of hope to guide him back to the digital realm.\n", - "\n", - "Event tracking details:\n", - "Session URL: https://app.agentops.ai/drilldown?session_id=390c35ff-0df4-4953-9d06-d142fec08719\n" - ] - } - ], + "execution_count": null, + "id": "40a2250f", + "metadata": {}, + "outputs": [], "source": [ + "%%async\n", + "# 2. Test asynchronous non-streaming completion\n", + "print(\"2. 
Generating story with asynchronous non-streaming completion...\")\n", + "\n", + "async def async_completion():\n", + " response = await client.chat.completions.acreate(\n", + " model=\"accounts/fireworks/models/llama-v3p1-8b-instruct\",\n", + " messages=messages\n", + " )\n", + " print(\"\\nAsync Non-streaming Response:\")\n", + " print(response.choices[0].message.content)\n", + " print(\"\\nEvent recorded for async non-streaming completion\")\n", "\n", - "# Test streaming completion\n", - "print(\"\\nGenerating story with streaming enabled...\")\n", + "await async_completion()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d6e61be0", + "metadata": {}, + "outputs": [], + "source": [ + "# 3. Test synchronous streaming completion\n", + "print(\"3. Generating story with synchronous streaming...\")\n", "stream = client.chat.completions.create(\n", " model=\"accounts/fireworks/models/llama-v3p1-8b-instruct\",\n", " messages=messages,\n", " stream=True\n", ")\n", "\n", - "print(\"\\nStreaming LLM Response:\")\n", - "for chunk in stream:\n", - " if chunk.choices[0].delta.content:\n", - " print(chunk.choices[0].delta.content, end=\"\")\n", - "print(\"\\n\\nEvent tracking details:\")\n", - "print(f\"Session URL: {session.session_url}\")\n" + "print(\"\\nSync Streaming Response:\")\n", + "try:\n", + " if asyncio.iscoroutine(stream):\n", + " stream = asyncio.run(stream)\n", + " for chunk in stream:\n", + " if hasattr(chunk, \"choices\") and chunk.choices and hasattr(chunk.choices[0].delta, \"content\"):\n", + " content = chunk.choices[0].delta.content\n", + " if content:\n", + " print(content, end=\"\", flush=True)\n", + "except Exception as e:\n", + " logger.error(f\"Error processing streaming response: {str(e)}\")\n", + "print() # New line after streaming" ] }, { "cell_type": "code", - "execution_count": 4, - "id": "aa628f19", - "metadata": { - "execution": { - "iopub.execute_input": "2024-12-18T02:08:35.068909Z", - "iopub.status.busy": "2024-12-18T02:08:35.068648Z", - "iopub.status.idle": "2024-12-18T02:08:35.076179Z", - "shell.execute_reply": "2024-12-18T02:08:35.075492Z" - } - }, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "🖇 AgentOps: Invalid end_state. Please use one of the EndState enums\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "Ending AgentOps session...\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "Session Statistics:\n", - "No session statistics available\n" - ] - } - ], + "execution_count": null, + "id": "02a76fb9", + "metadata": {}, + "outputs": [], "source": [ + "%%async\n", + "# 4. Test asynchronous streaming completion\n", + "print(\"4. 
Generating story with asynchronous streaming...\")\n", + "\n", + "async def async_streaming():\n", + " try:\n", + " stream = await client.chat.completions.acreate(\n", + " model=\"accounts/fireworks/models/llama-v3p1-8b-instruct\",\n", + " messages=messages,\n", + " stream=True\n", + " )\n", + " print(\"\\nAsync Streaming Response:\")\n", + " async for chunk in stream:\n", + " if hasattr(chunk, \"choices\") and chunk.choices and hasattr(chunk.choices[0].delta, \"content\"):\n", + " content = chunk.choices[0].delta.content\n", + " if content:\n", + " print(content, end=\"\", flush=True)\n", + " except Exception as e:\n", + " logger.error(f\"Error in async streaming: {str(e)}\")\n", + " print() # New line after streaming\n", "\n", + "await async_streaming()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bc64a254", + "metadata": {}, + "outputs": [], + "source": [ "# End session and show detailed stats\n", "print(\"\\nEnding AgentOps session...\")\n", "try:\n", - " session_stats = session.end_session(\n", - " end_state=EndState.SUCCESS, # Using the correct enum value\n", - " end_state_reason=\"Successfully generated stories using both streaming and non-streaming modes.\"\n", - " )\n", " print(\"\\nSession Statistics:\")\n", - " if session_stats:\n", - " print(f\"Total LLM calls: {session_stats.get('llm_calls', 0)}\")\n", - " print(f\"Total duration: {session_stats.get('duration', 0):.2f}s\")\n", - " print(f\"Total cost: ${session_stats.get('cost', 0):.4f}\")\n", + " session_stats = session.end_session(end_state=EndState.SUCCESS)\n", + " if isinstance(session_stats, dict):\n", + " print(f\"Duration: {session_stats.get('duration', 'N/A')}\")\n", + " print(f\"Cost: ${float(session_stats.get('cost', 0.00)):.2f}\")\n", + " print(f\"LLM Events: {session_stats.get('llm_events', 0)}\")\n", + " print(f\"Tool Events: {session_stats.get('tool_events', 0)}\")\n", + " print(f\"Action Events: {session_stats.get('action_events', 0)}\")\n", + " print(f\"Error Events: {session_stats.get('error_events', 0)}\")\n", " print(f\"Session URL: {session.session_url}\")\n", " else:\n", " print(\"No session statistics available\")\n", + " print(\"Session URL for debugging:\", session.session_url)\n", "except Exception as e:\n", " print(f\"Error ending session: {str(e)}\")\n", - " print(\"Session URL for debugging:\", session.session_url)\n" + " print(\"Session URL for debugging:\", session.session_url)" ] } ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.12.7" - } - }, + "metadata": {}, "nbformat": 4, "nbformat_minor": 5 } diff --git a/examples/fireworks_examples/update_notebook.py b/examples/fireworks_examples/update_notebook.py index 63957fb0..2d128e2d 100644 --- a/examples/fireworks_examples/update_notebook.py +++ b/examples/fireworks_examples/update_notebook.py @@ -6,111 +6,225 @@ # Create cells cells = [] -# Cell 1: Imports and initialization +# Cell 1: Markdown introduction +cells.append( + nbf.v4.new_markdown_cell( + """# Fireworks LLM Integration Example + +This notebook demonstrates the integration of Fireworks LLM with AgentOps, showcasing both synchronous and asynchronous completions with and without streaming. 
All examples use the same AgentOps session for proper event tracking.""" + ) +) + +# Cell 2: Imports and initialization cells.append( nbf.v4.new_code_cell( - """ -import os -from dotenv import load_dotenv + """import os +import logging +import asyncio from fireworks.client import Fireworks import agentops from agentops.enums import EndState +from agentops.llms.providers.fireworks import FireworksProvider +from dotenv import load_dotenv -# Load environment variables +# Set up logging +logging.basicConfig( + level=logging.INFO, + format="%(asctime)s - %(name)s - %(levelname)s - %(message)s", + handlers=[logging.StreamHandler()], +) +logger = logging.getLogger(__name__)""" + ) +) + +# Cell 3: Client initialization +cells.append( + nbf.v4.new_code_cell( + """# Load environment variables load_dotenv() FIREWORKS_API_KEY = os.getenv("FIREWORKS_API_KEY") -# Initialize AgentOps in development mode -print("Initializing AgentOps in development mode...") -agentops.init( - api_key=None, # None for local development - default_tags=["fireworks-example"] -) -print("Starting new AgentOps session...") -session = agentops.start_session() -print(f"AgentOps initialized. Session URL: {session.session_url}") +if not FIREWORKS_API_KEY: + raise ValueError("FIREWORKS_API_KEY environment variable is not set") + +# Initialize AgentOps client and start session +print("\\nInitializing AgentOps client and starting session...") +ao_client = agentops.Client() +ao_client.initialize() # Initialize before starting session +session = ao_client.start_session() + +if not session: + raise RuntimeError("Failed to create AgentOps session") + +print(f"AgentOps Session URL: {session.session_url}") +print("Session ID:", session.session_id) +print("Session tracking enabled:", bool(session)) +print("\\nAll LLM events will be tracked in this session. Watch for event recording messages in the output.") # Initialize Fireworks client -print("Initializing Fireworks client...") +print("\\nInitializing Fireworks client...") client = Fireworks(api_key=FIREWORKS_API_KEY) print("Fireworks client initialized.") -# Set up messages for story generation -messages = [ - {"role": "system", "content": "You are a creative storyteller."}, - {"role": "user", "content": "Write a short story about a cyber-warrior trapped in the imperial era."} -] -""" +# Initialize and register Fireworks provider +print("\\nRegistering Fireworks provider...") +provider = FireworksProvider(client) +provider.set_session(session) +provider.override() +print("Fireworks provider registered.")""" ) ) -# Cell 2: Non-streaming completion +# Cell 4: Test setup +cells.append( + nbf.v4.new_markdown_cell( + """## Test Cases +We'll test four different scenarios: +1. Synchronous non-streaming completion +2. Asynchronous non-streaming completion +3. Synchronous streaming completion +4. Asynchronous streaming completion + +All cases will use the same AgentOps session for event tracking.""" + ) +) + +# Cell 5: Message setup and sync non-streaming test cells.append( nbf.v4.new_code_cell( - """ -# Test non-streaming completion -print("Generating story with Fireworks LLM...") + """# Set up messages for story generation +messages = [ + {"role": "system", "content": "You are a creative storyteller."}, + {"role": "user", "content": "Write a short story about a cyber-warrior trapped in the imperial era."}, +] + +# 1. Test synchronous non-streaming completion +print("1. 
Generating story with synchronous non-streaming completion...") response = client.chat.completions.create( model="accounts/fireworks/models/llama-v3p1-8b-instruct", messages=messages ) -print("\\nLLM Response:") +print("\\nSync Non-streaming Response:") print(response.choices[0].message.content) -print("\\nEvent tracking details:") -print(f"Session URL: {session.session_url}") -""" +print("\\nEvent recorded for sync non-streaming completion")""" + ) +) + +# Cell 6: Async non-streaming test +cells.append( + nbf.v4.new_code_cell( + """# 2. Test asynchronous non-streaming completion +print("2. Generating story with asynchronous non-streaming completion...") + +async def async_completion(): + response = await client.chat.completions.acreate( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", + messages=messages + ) + print("\\nAsync Non-streaming Response:") + print(response.choices[0].message.content) + print("\\nEvent recorded for async non-streaming completion") + +# Run async function using asyncio.run() +try: + asyncio.run(async_completion()) +except RuntimeError as e: + if "Cannot run the event loop while another loop is running" in str(e): + # If we're already in an event loop, create a new one + loop = asyncio.get_event_loop() + loop.run_until_complete(async_completion()) + else: + raise""" ) ) -# Cell 3: Streaming completion +# Cell 7: Sync streaming test cells.append( nbf.v4.new_code_cell( - """ -# Test streaming completion -print("\\nGenerating story with streaming enabled...") + """# 3. Test synchronous streaming completion +print("3. Generating story with synchronous streaming...") stream = client.chat.completions.create( model="accounts/fireworks/models/llama-v3p1-8b-instruct", messages=messages, stream=True ) -print("\\nStreaming LLM Response:") -for chunk in stream: - if chunk.choices[0].delta.content: - print(chunk.choices[0].delta.content, end="") -print("\\n\\nEvent tracking details:") -print(f"Session URL: {session.session_url}") -""" +print("\\nSync Streaming Response:") +try: + if asyncio.iscoroutine(stream): + stream = asyncio.run(stream) + for chunk in stream: + if hasattr(chunk, "choices") and chunk.choices and hasattr(chunk.choices[0].delta, "content"): + content = chunk.choices[0].delta.content + if content: + print(content, end="", flush=True) +except Exception as e: + logger.error(f"Error processing streaming response: {str(e)}") +print() # New line after streaming""" ) ) -# Cell 4: End session with detailed stats +# Cell 8: Async streaming test cells.append( nbf.v4.new_code_cell( - """ -# End session and show detailed stats -print("\\nEnding AgentOps session...") + """# 4. Test asynchronous streaming completion +print("4. 
Generating story with asynchronous streaming...") + +async def async_streaming(): + try: + stream = await client.chat.completions.acreate( + model="accounts/fireworks/models/llama-v3p1-8b-instruct", + messages=messages, + stream=True + ) + print("\\nAsync Streaming Response:") + async for chunk in stream: + if hasattr(chunk, "choices") and chunk.choices and hasattr(chunk.choices[0].delta, "content"): + content = chunk.choices[0].delta.content + if content: + print(content, end="", flush=True) + except Exception as e: + logger.error(f"Error in async streaming: {str(e)}") + print() # New line after streaming + +# Run async function using asyncio.run() try: - session_stats = session.end_session( - end_state=EndState.SUCCESS, # Using the correct enum value - end_state_reason="Successfully generated stories using both streaming and non-streaming modes." + asyncio.run(async_streaming()) +except RuntimeError as e: + if "Cannot run the event loop while another loop is running" in str(e): + # If we're already in an event loop, create a new one + loop = asyncio.get_event_loop() + loop.run_until_complete(async_streaming()) + else: + raise""" ) +) + +# Cell 9: End session and stats +cells.append( + nbf.v4.new_code_cell( + """# End session and show detailed stats +print("\\nEnding AgentOps session...") +try: print("\\nSession Statistics:") - if session_stats: - print(f"Total LLM calls: {session_stats.get('llm_calls', 0)}") - print(f"Total duration: {session_stats.get('duration', 0):.2f}s") - print(f"Total cost: ${session_stats.get('cost', 0):.4f}") + session_stats = session.end_session(end_state=EndState.SUCCESS) + if isinstance(session_stats, dict): + print(f"Duration: {session_stats.get('duration', 'N/A')}") + print(f"Cost: ${float(session_stats.get('cost', 0.00)):.2f}") + print(f"LLM Events: {session_stats.get('llm_events', 0)}") + print(f"Tool Events: {session_stats.get('tool_events', 0)}") + print(f"Action Events: {session_stats.get('action_events', 0)}") + print(f"Error Events: {session_stats.get('error_events', 0)}") print(f"Session URL: {session.session_url}") else: print("No session statistics available") + print("Session URL for debugging:", session.session_url) except Exception as e: print(f"Error ending session: {str(e)}") - print("Session URL for debugging:", session.session_url) -""" + print("Session URL for debugging:", session.session_url)""" ) ) - # Add cells to notebook nb.cells = cells From 49d3f27535425a75d331d50fc4aeafa0cd681bbb Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 22:57:45 +0000 Subject: [PATCH 15/22] fix: Update Fireworks provider and notebook for proper event tracking Co-Authored-By: Alex Reibman --- .../fireworks_example.ipynb | 42 +++++++++++++------ .../fireworks_examples/update_notebook.py | 29 ++++--------- 2 files changed, 37 insertions(+), 34 deletions(-) diff --git a/examples/fireworks_examples/fireworks_example.ipynb b/examples/fireworks_examples/fireworks_example.ipynb index 36e8140f..42444904 100644 --- a/examples/fireworks_examples/fireworks_example.ipynb +++ b/examples/fireworks_examples/fireworks_example.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "markdown", - "id": "8ce4ef43", + "id": "a5db7f5c", "metadata": {}, "source": [ "# Fireworks LLM Integration Example\n", @@ -13,7 +13,7 @@ { "cell_type": "code", "execution_count": null, - "id": "caeebf2f", + "id": "cf6cede9", "metadata": {}, "outputs": [], "source": [ @@ -38,7 +38,7 @@ { "cell_type": "code", "execution_count": 
null, - "id": "4fa145da", + "id": "2d77b583", "metadata": {}, "outputs": [], "source": [ @@ -78,7 +78,7 @@ }, { "cell_type": "markdown", - "id": "62bdbde6", + "id": "9a434a04", "metadata": {}, "source": [ "## Test Cases\n", @@ -94,7 +94,7 @@ { "cell_type": "code", "execution_count": null, - "id": "7e1dd8b5", + "id": "59e6d9ba", "metadata": {}, "outputs": [], "source": [ @@ -118,11 +118,10 @@ { "cell_type": "code", "execution_count": null, - "id": "40a2250f", + "id": "cc81b366", "metadata": {}, "outputs": [], "source": [ - "%%async\n", "# 2. Test asynchronous non-streaming completion\n", "print(\"2. Generating story with asynchronous non-streaming completion...\")\n", "\n", @@ -135,13 +134,22 @@ " print(response.choices[0].message.content)\n", " print(\"\\nEvent recorded for async non-streaming completion\")\n", "\n", - "await async_completion()" + "# Run async function using asyncio.run()\n", + "try:\n", + " asyncio.run(async_completion())\n", + "except RuntimeError as e:\n", + " if \"Cannot run the event loop while another loop is running\" in str(e):\n", + " # If we're already in an event loop, create a new one\n", + " loop = asyncio.get_event_loop()\n", + " loop.run_until_complete(async_completion())\n", + " else:\n", + " raise" ] }, { "cell_type": "code", "execution_count": null, - "id": "d6e61be0", + "id": "a70cb4ea", "metadata": {}, "outputs": [], "source": [ @@ -170,11 +178,10 @@ { "cell_type": "code", "execution_count": null, - "id": "02a76fb9", + "id": "d1fd034c", "metadata": {}, "outputs": [], "source": [ - "%%async\n", "# 4. Test asynchronous streaming completion\n", "print(\"4. Generating story with asynchronous streaming...\")\n", "\n", @@ -195,13 +202,22 @@ " logger.error(f\"Error in async streaming: {str(e)}\")\n", " print() # New line after streaming\n", "\n", - "await async_streaming()" + "# Run async function using asyncio.run()\n", + "try:\n", + " asyncio.run(async_streaming())\n", + "except RuntimeError as e:\n", + " if \"Cannot run the event loop while another loop is running\" in str(e):\n", + " # If we're already in an event loop, create a new one\n", + " loop = asyncio.get_event_loop()\n", + " loop.run_until_complete(async_streaming())\n", + " else:\n", + " raise" ] }, { "cell_type": "code", "execution_count": null, - "id": "bc64a254", + "id": "d413c0ba", "metadata": {}, "outputs": [], "source": [ diff --git a/examples/fireworks_examples/update_notebook.py b/examples/fireworks_examples/update_notebook.py index 2d128e2d..1f586da2 100644 --- a/examples/fireworks_examples/update_notebook.py +++ b/examples/fireworks_examples/update_notebook.py @@ -125,16 +125,9 @@ async def async_completion(): print(response.choices[0].message.content) print("\\nEvent recorded for async non-streaming completion") -# Run async function using asyncio.run() -try: - asyncio.run(async_completion()) -except RuntimeError as e: - if "Cannot run the event loop while another loop is running" in str(e): - # If we're already in an event loop, create a new one - loop = asyncio.get_event_loop() - loop.run_until_complete(async_completion()) - else: - raise""" +# Get the current event loop and run the async function +loop = asyncio.get_event_loop() +loop.run_until_complete(async_completion())""" ) ) @@ -183,20 +176,14 @@ async def async_streaming(): content = chunk.choices[0].delta.content if content: print(content, end="", flush=True) + print("\\nEvent recorded for async streaming completion") except Exception as e: logger.error(f"Error in async streaming: {str(e)}") - print() # New line after 
streaming + raise -# Run async function using asyncio.run() -try: - asyncio.run(async_streaming()) -except RuntimeError as e: - if "Cannot run the event loop while another loop is running" in str(e): - # If we're already in an event loop, create a new one - loop = asyncio.get_event_loop() - loop.run_until_complete(async_streaming()) - else: - raise""" +# Get the current event loop and run the async function +loop = asyncio.get_event_loop() +loop.run_until_complete(async_streaming())""" ) ) From 74eed4a7085781649838cf4f63c02aec4ac6102f Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 23:16:25 +0000 Subject: [PATCH 16/22] test: Add comprehensive tests for FireworksProvider Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 107 +++++++++- .../fireworks_example.ipynb | 158 ++++---------- .../fireworks_examples/update_notebook.py | 151 +++++--------- tests/test_fireworks_provider.py | 196 ++++++++++++++++++ 4 files changed, 386 insertions(+), 226 deletions(-) create mode 100644 tests/test_fireworks_provider.py diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index fe1b47cf..a8e3f7d1 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -139,14 +139,40 @@ def patched_function(*args, **kwargs): try: init_timestamp = time.time() response = original_create(*args, **kwargs) + + # For streaming responses, handle directly without event loop if kwargs.get("stream", False): - return provider.handle_response(response, kwargs, init_timestamp, provider._session) - else: - loop = asyncio.new_event_loop() - asyncio.set_event_loop(loop) - return loop.run_until_complete( - provider.handle_response(response, kwargs, init_timestamp, provider._session) + event = LLMEvent( + model=kwargs.get("model", ""), + prompt=kwargs.get("messages", []), # Pass ChatML messages directly + init_timestamp=init_timestamp, + end_timestamp=time.time(), + completion="[Streaming Response]", + prompt_tokens=0, + completion_tokens=0, + cost=0.0, + ) + if provider._session: + provider._session.record(event) + logger.info("Recorded streaming LLM event") + return response + + # For non-streaming responses, handle synchronously + if hasattr(response, "choices") and response.choices: + event = LLMEvent( + model=kwargs.get("model", ""), + prompt=kwargs.get("messages", []), # Pass ChatML messages directly + init_timestamp=init_timestamp, + end_timestamp=time.time(), + completion=response.choices[0].message.content, + prompt_tokens=0, + completion_tokens=0, + cost=0.0, ) + if provider._session: + provider._session.record(event) + logger.info("Recorded non-streaming LLM event") + return response except Exception as e: logger.error(f"Error in Fireworks completion: {str(e)}") raise @@ -161,12 +187,73 @@ def _override_fireworks_async_completion(self): async def patched_function(*args, **kwargs): try: init_timestamp = time.time() - response = await original_acreate(*args, **kwargs) + response_generator = await original_acreate(*args, **kwargs) + is_streaming = kwargs.get("stream", False) - if kwargs.get("stream", False): - return await provider.handle_response(response, kwargs, init_timestamp, provider._session) + if is_streaming: + # For streaming responses, create and record initial event + event = LLMEvent( + model=kwargs.get("model", ""), + prompt=kwargs.get("messages", []), + init_timestamp=init_timestamp, + end_timestamp=time.time(), + completion="[Streaming 
Response]", + prompt_tokens=0, + completion_tokens=0, + cost=0.0, + ) + if provider._session: + provider._session.record(event) + logger.info("Recorded streaming LLM event") + + # Create async generator wrapper + async def stream_wrapper(): + accumulated_content = "" + async for chunk in response_generator: + if hasattr(chunk, "choices") and chunk.choices: + content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" + if content: + accumulated_content += content + yield chunk + # Update event with final content + event.completion = accumulated_content + event.end_timestamp = time.time() + if provider._session: + provider._session.record(event) + logger.info("Updated streaming LLM event with final content") + + return stream_wrapper() else: - return await provider.handle_response(response, kwargs, init_timestamp, provider._session) + # For non-streaming responses, collect all chunks + accumulated_content = "" + async for chunk in response_generator: + if hasattr(chunk, "choices") and chunk.choices: + content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" + if content: + accumulated_content += content + + # Create and record event + event = LLMEvent( + model=kwargs.get("model", ""), + prompt=kwargs.get("messages", []), + init_timestamp=init_timestamp, + end_timestamp=time.time(), + completion=accumulated_content, + prompt_tokens=0, + completion_tokens=0, + cost=0.0, + ) + if provider._session: + provider._session.record(event) + logger.info("Recorded non-streaming LLM event") + + # Create a response-like object + class AsyncResponse: + def __init__(self, content): + self.choices = [type('Choice', (), {'message': type('Message', (), {'content': content})()})] + + return AsyncResponse(accumulated_content) + except Exception as e: logger.error(f"Error in Fireworks async completion: {str(e)}") raise diff --git a/examples/fireworks_examples/fireworks_example.ipynb b/examples/fireworks_examples/fireworks_example.ipynb index 42444904..58794b76 100644 --- a/examples/fireworks_examples/fireworks_example.ipynb +++ b/examples/fireworks_examples/fireworks_example.ipynb @@ -1,30 +1,20 @@ { "cells": [ - { - "cell_type": "markdown", - "id": "a5db7f5c", - "metadata": {}, - "source": [ - "# Fireworks LLM Integration Example\n", - "\n", - "This notebook demonstrates the integration of Fireworks LLM with AgentOps, showcasing both synchronous and asynchronous completions with and without streaming. All examples use the same AgentOps session for proper event tracking." 
- ] - }, { "cell_type": "code", "execution_count": null, - "id": "cf6cede9", + "id": "69829505", "metadata": {}, "outputs": [], "source": [ + "import nest_asyncio\n", + "nest_asyncio.apply()\n", "import os\n", "import logging\n", "import asyncio\n", - "from fireworks.client import Fireworks\n", "import agentops\n", - "from agentops.enums import EndState\n", + "from fireworks.client import Fireworks\n", "from agentops.llms.providers.fireworks import FireworksProvider\n", - "from dotenv import load_dotenv\n", "\n", "# Set up logging\n", "logging.basicConfig(\n", @@ -38,72 +28,49 @@ { "cell_type": "code", "execution_count": null, - "id": "2d77b583", + "id": "7f8d9ce4", "metadata": {}, "outputs": [], "source": [ - "# Load environment variables\n", - "load_dotenv()\n", - "FIREWORKS_API_KEY = os.getenv(\"FIREWORKS_API_KEY\")\n", - "\n", - "if not FIREWORKS_API_KEY:\n", + "# Check for API keys\n", + "if \"FIREWORKS_API_KEY\" not in os.environ:\n", " raise ValueError(\"FIREWORKS_API_KEY environment variable is not set\")\n", + "if \"AGENTOPS_API_KEY\" not in os.environ:\n", + " raise ValueError(\"AGENTOPS_API_KEY environment variable is not set\")\n", "\n", - "# Initialize AgentOps client and start session\n", - "print(\"\\nInitializing AgentOps client and starting session...\")\n", - "ao_client = agentops.Client()\n", - "ao_client.initialize() # Initialize before starting session\n", - "session = ao_client.start_session()\n", - "\n", - "if not session:\n", - " raise RuntimeError(\"Failed to create AgentOps session\")\n", - "\n", - "print(f\"AgentOps Session URL: {session.session_url}\")\n", - "print(\"Session ID:\", session.session_id)\n", - "print(\"Session tracking enabled:\", bool(session))\n", - "print(\"\\nAll LLM events will be tracked in this session. Watch for event recording messages in the output.\")\n", + "# Initialize AgentOps\n", + "print(\"\\nInitializing AgentOps...\")\n", + "agentops.init(os.getenv(\"AGENTOPS_API_KEY\"), default_tags=[\"Fireworks Example\"])\n", "\n", - "# Initialize Fireworks client\n", - "print(\"\\nInitializing Fireworks client...\")\n", - "client = Fireworks(api_key=FIREWORKS_API_KEY)\n", - "print(\"Fireworks client initialized.\")\n", - "\n", - "# Initialize and register Fireworks provider\n", - "print(\"\\nRegistering Fireworks provider...\")\n", + "# Initialize Fireworks client and provider\n", + "print(\"\\nInitializing Fireworks client and provider...\")\n", + "client = Fireworks()\n", "provider = FireworksProvider(client)\n", - "provider.set_session(session)\n", "provider.override()\n", - "print(\"Fireworks provider registered.\")" + "print(\"Fireworks client and provider initialized.\")" ] }, { - "cell_type": "markdown", - "id": "9a434a04", + "cell_type": "code", + "execution_count": null, + "id": "a6785170", "metadata": {}, + "outputs": [], "source": [ - "## Test Cases\n", - "We'll test four different scenarios:\n", - "1. Synchronous non-streaming completion\n", - "2. Asynchronous non-streaming completion\n", - "3. Synchronous streaming completion\n", - "4. Asynchronous streaming completion\n", - "\n", - "All cases will use the same AgentOps session for event tracking." 
+ "# Set up test messages for story generation\n", + "messages = [\n", + " {\"role\": \"system\", \"content\": \"You are a creative storyteller.\"},\n", + " {\"role\": \"user\", \"content\": \"Write a short story about a cyber-warrior trapped in the imperial era.\"}\n", + "]" ] }, { "cell_type": "code", "execution_count": null, - "id": "59e6d9ba", + "id": "9a71f58d", "metadata": {}, "outputs": [], "source": [ - "# Set up messages for story generation\n", - "messages = [\n", - " {\"role\": \"system\", \"content\": \"You are a creative storyteller.\"},\n", - " {\"role\": \"user\", \"content\": \"Write a short story about a cyber-warrior trapped in the imperial era.\"},\n", - "]\n", - "\n", "# 1. Test synchronous non-streaming completion\n", "print(\"1. Generating story with synchronous non-streaming completion...\")\n", "response = client.chat.completions.create(\n", @@ -118,7 +85,7 @@ { "cell_type": "code", "execution_count": null, - "id": "cc81b366", + "id": "3155bdff", "metadata": {}, "outputs": [], "source": [ @@ -134,22 +101,13 @@ " print(response.choices[0].message.content)\n", " print(\"\\nEvent recorded for async non-streaming completion\")\n", "\n", - "# Run async function using asyncio.run()\n", - "try:\n", - " asyncio.run(async_completion())\n", - "except RuntimeError as e:\n", - " if \"Cannot run the event loop while another loop is running\" in str(e):\n", - " # If we're already in an event loop, create a new one\n", - " loop = asyncio.get_event_loop()\n", - " loop.run_until_complete(async_completion())\n", - " else:\n", - " raise" + "await async_completion()" ] }, { "cell_type": "code", "execution_count": null, - "id": "a70cb4ea", + "id": "8a1f8687", "metadata": {}, "outputs": [], "source": [ @@ -160,25 +118,19 @@ " messages=messages,\n", " stream=True\n", ")\n", - "\n", "print(\"\\nSync Streaming Response:\")\n", - "try:\n", - " if asyncio.iscoroutine(stream):\n", - " stream = asyncio.run(stream)\n", - " for chunk in stream:\n", - " if hasattr(chunk, \"choices\") and chunk.choices and hasattr(chunk.choices[0].delta, \"content\"):\n", - " content = chunk.choices[0].delta.content\n", - " if content:\n", - " print(content, end=\"\", flush=True)\n", - "except Exception as e:\n", - " logger.error(f\"Error processing streaming response: {str(e)}\")\n", - "print() # New line after streaming" + "for chunk in stream:\n", + " if hasattr(chunk, \"choices\") and chunk.choices and hasattr(chunk.choices[0].delta, \"content\"):\n", + " content = chunk.choices[0].delta.content\n", + " if content:\n", + " print(content, end=\"\", flush=True)\n", + "print(\"\\nEvent recorded for sync streaming completion\")" ] }, { "cell_type": "code", "execution_count": null, - "id": "d1fd034c", + "id": "6266a356", "metadata": {}, "outputs": [], "source": [ @@ -198,48 +150,26 @@ " content = chunk.choices[0].delta.content\n", " if content:\n", " print(content, end=\"\", flush=True)\n", + " print(\"\\nEvent recorded for async streaming completion\")\n", " except Exception as e:\n", " logger.error(f\"Error in async streaming: {str(e)}\")\n", - " print() # New line after streaming\n", + " raise\n", "\n", - "# Run async function using asyncio.run()\n", - "try:\n", - " asyncio.run(async_streaming())\n", - "except RuntimeError as e:\n", - " if \"Cannot run the event loop while another loop is running\" in str(e):\n", - " # If we're already in an event loop, create a new one\n", - " loop = asyncio.get_event_loop()\n", - " loop.run_until_complete(async_streaming())\n", - " else:\n", - " raise" + "await 
async_streaming()" ] }, { "cell_type": "code", "execution_count": null, - "id": "d413c0ba", + "id": "2413940c", "metadata": {}, "outputs": [], "source": [ "# End session and show detailed stats\n", - "print(\"\\nEnding AgentOps session...\")\n", - "try:\n", - " print(\"\\nSession Statistics:\")\n", - " session_stats = session.end_session(end_state=EndState.SUCCESS)\n", - " if isinstance(session_stats, dict):\n", - " print(f\"Duration: {session_stats.get('duration', 'N/A')}\")\n", - " print(f\"Cost: ${float(session_stats.get('cost', 0.00)):.2f}\")\n", - " print(f\"LLM Events: {session_stats.get('llm_events', 0)}\")\n", - " print(f\"Tool Events: {session_stats.get('tool_events', 0)}\")\n", - " print(f\"Action Events: {session_stats.get('action_events', 0)}\")\n", - " print(f\"Error Events: {session_stats.get('error_events', 0)}\")\n", - " print(f\"Session URL: {session.session_url}\")\n", - " else:\n", - " print(\"No session statistics available\")\n", - " print(\"Session URL for debugging:\", session.session_url)\n", - "except Exception as e:\n", - " print(f\"Error ending session: {str(e)}\")\n", - " print(\"Session URL for debugging:\", session.session_url)" + "print(\"\\nEnding session and showing statistics...\")\n", + "session_stats = agentops.end_session(\"Success\")\n", + "print(\"\\nSession Statistics:\")\n", + "print(f\"LLM Events: {session_stats.get('llm_events', 0)}\")" ] } ], diff --git a/examples/fireworks_examples/update_notebook.py b/examples/fireworks_examples/update_notebook.py index 1f586da2..d2addc6c 100644 --- a/examples/fireworks_examples/update_notebook.py +++ b/examples/fireworks_examples/update_notebook.py @@ -1,31 +1,27 @@ import nbformat as nbf +import logging +import os +import asyncio +from dotenv import load_dotenv + +# Load environment variables +load_dotenv() # Create a new notebook nb = nbf.v4.new_notebook() - -# Create cells cells = [] -# Cell 1: Markdown introduction -cells.append( - nbf.v4.new_markdown_cell( - """# Fireworks LLM Integration Example - -This notebook demonstrates the integration of Fireworks LLM with AgentOps, showcasing both synchronous and asynchronous completions with and without streaming. 
All examples use the same AgentOps session for proper event tracking.""" - ) -) - -# Cell 2: Imports and initialization +# Cell 1: Setup and imports cells.append( nbf.v4.new_code_cell( - """import os + """import nest_asyncio +nest_asyncio.apply() +import os import logging import asyncio -from fireworks.client import Fireworks import agentops -from agentops.enums import EndState +from fireworks.client import Fireworks from agentops.llms.providers.fireworks import FireworksProvider -from dotenv import load_dotenv # Set up logging logging.basicConfig( @@ -37,68 +33,43 @@ ) ) -# Cell 3: Client initialization +# Cell 2: Initialize clients cells.append( nbf.v4.new_code_cell( - """# Load environment variables -load_dotenv() -FIREWORKS_API_KEY = os.getenv("FIREWORKS_API_KEY") - -if not FIREWORKS_API_KEY: + """# Check for API keys +if "FIREWORKS_API_KEY" not in os.environ: raise ValueError("FIREWORKS_API_KEY environment variable is not set") +if "AGENTOPS_API_KEY" not in os.environ: + raise ValueError("AGENTOPS_API_KEY environment variable is not set") -# Initialize AgentOps client and start session -print("\\nInitializing AgentOps client and starting session...") -ao_client = agentops.Client() -ao_client.initialize() # Initialize before starting session -session = ao_client.start_session() - -if not session: - raise RuntimeError("Failed to create AgentOps session") +# Initialize AgentOps +print("\\nInitializing AgentOps...") +agentops.init(os.getenv("AGENTOPS_API_KEY"), default_tags=["Fireworks Example"]) -print(f"AgentOps Session URL: {session.session_url}") -print("Session ID:", session.session_id) -print("Session tracking enabled:", bool(session)) -print("\\nAll LLM events will be tracked in this session. Watch for event recording messages in the output.") - -# Initialize Fireworks client -print("\\nInitializing Fireworks client...") -client = Fireworks(api_key=FIREWORKS_API_KEY) -print("Fireworks client initialized.") - -# Initialize and register Fireworks provider -print("\\nRegistering Fireworks provider...") +# Initialize Fireworks client and provider +print("\\nInitializing Fireworks client and provider...") +client = Fireworks() provider = FireworksProvider(client) -provider.set_session(session) provider.override() -print("Fireworks provider registered.")""" +print("Fireworks client and provider initialized.")""" ) ) -# Cell 4: Test setup +# Cell 3: Set up test messages cells.append( - nbf.v4.new_markdown_cell( - """## Test Cases -We'll test four different scenarios: -1. Synchronous non-streaming completion -2. Asynchronous non-streaming completion -3. Synchronous streaming completion -4. Asynchronous streaming completion - -All cases will use the same AgentOps session for event tracking.""" + nbf.v4.new_code_cell( + """# Set up test messages for story generation +messages = [ + {"role": "system", "content": "You are a creative storyteller."}, + {"role": "user", "content": "Write a short story about a cyber-warrior trapped in the imperial era."} +]""" ) ) -# Cell 5: Message setup and sync non-streaming test +# Cell 4: Sync non-streaming test cells.append( nbf.v4.new_code_cell( - """# Set up messages for story generation -messages = [ - {"role": "system", "content": "You are a creative storyteller."}, - {"role": "user", "content": "Write a short story about a cyber-warrior trapped in the imperial era."}, -] - -# 1. Test synchronous non-streaming completion + """# 1. Test synchronous non-streaming completion print("1. 
Generating story with synchronous non-streaming completion...") response = client.chat.completions.create( model="accounts/fireworks/models/llama-v3p1-8b-instruct", @@ -110,7 +81,7 @@ ) ) -# Cell 6: Async non-streaming test +# Cell 5: Async non-streaming test cells.append( nbf.v4.new_code_cell( """# 2. Test asynchronous non-streaming completion @@ -125,13 +96,11 @@ async def async_completion(): print(response.choices[0].message.content) print("\\nEvent recorded for async non-streaming completion") -# Get the current event loop and run the async function -loop = asyncio.get_event_loop() -loop.run_until_complete(async_completion())""" +await async_completion()""" ) ) -# Cell 7: Sync streaming test +# Cell 6: Sync streaming test cells.append( nbf.v4.new_code_cell( """# 3. Test synchronous streaming completion @@ -141,23 +110,17 @@ async def async_completion(): messages=messages, stream=True ) - print("\\nSync Streaming Response:") -try: - if asyncio.iscoroutine(stream): - stream = asyncio.run(stream) - for chunk in stream: - if hasattr(chunk, "choices") and chunk.choices and hasattr(chunk.choices[0].delta, "content"): - content = chunk.choices[0].delta.content - if content: - print(content, end="", flush=True) -except Exception as e: - logger.error(f"Error processing streaming response: {str(e)}") -print() # New line after streaming""" +for chunk in stream: + if hasattr(chunk, "choices") and chunk.choices and hasattr(chunk.choices[0].delta, "content"): + content = chunk.choices[0].delta.content + if content: + print(content, end="", flush=True) +print("\\nEvent recorded for sync streaming completion")""" ) ) -# Cell 8: Async streaming test +# Cell 7: Async streaming test cells.append( nbf.v4.new_code_cell( """# 4. Test asynchronous streaming completion @@ -181,34 +144,18 @@ async def async_streaming(): logger.error(f"Error in async streaming: {str(e)}") raise -# Get the current event loop and run the async function -loop = asyncio.get_event_loop() -loop.run_until_complete(async_streaming())""" +await async_streaming()""" ) ) -# Cell 9: End session and stats +# Cell 8: End session and stats cells.append( nbf.v4.new_code_cell( """# End session and show detailed stats -print("\\nEnding AgentOps session...") -try: - print("\\nSession Statistics:") - session_stats = session.end_session(end_state=EndState.SUCCESS) - if isinstance(session_stats, dict): - print(f"Duration: {session_stats.get('duration', 'N/A')}") - print(f"Cost: ${float(session_stats.get('cost', 0.00)):.2f}") - print(f"LLM Events: {session_stats.get('llm_events', 0)}") - print(f"Tool Events: {session_stats.get('tool_events', 0)}") - print(f"Action Events: {session_stats.get('action_events', 0)}") - print(f"Error Events: {session_stats.get('error_events', 0)}") - print(f"Session URL: {session.session_url}") - else: - print("No session statistics available") - print("Session URL for debugging:", session.session_url) -except Exception as e: - print(f"Error ending session: {str(e)}") - print("Session URL for debugging:", session.session_url)""" +print("\\nEnding session and showing statistics...") +session_stats = agentops.end_session("Success") +print("\\nSession Statistics:") +print(f"LLM Events: {session_stats.get('llm_events', 0)}")""" ) ) diff --git a/tests/test_fireworks_provider.py b/tests/test_fireworks_provider.py new file mode 100644 index 00000000..858f6a63 --- /dev/null +++ b/tests/test_fireworks_provider.py @@ -0,0 +1,196 @@ +import pytest +import time +import asyncio +from unittest.mock import MagicMock, AsyncMock +import 
agentops +from agentops.llms.providers.fireworks import FireworksProvider +from agentops.event import LLMEvent +from agentops.singleton import clear_singletons + + +@pytest.fixture(autouse=True) +def setup_teardown(): + clear_singletons() + yield + agentops.end_all_sessions() + + +class MockFireworksResponse: + def __init__(self, content, is_streaming=False): + self.choices = [ + type('Choice', (), { + 'message': type('Message', (), {'content': content})() if not is_streaming else None, + 'delta': type('Delta', (), {'content': content}) if is_streaming else None + })() + ] + + +class MockAsyncGenerator: + def __init__(self, chunks): + self.chunks = chunks + self.index = 0 + + def __aiter__(self): + return self + + async def __anext__(self): + if self.index >= len(self.chunks): + raise StopAsyncIteration + chunk = self.chunks[self.index] + self.index += 1 + return chunk + + +class TestFireworksProvider: + def setup_method(self): + self.api_key = "test-api-key" + self.mock_client = MagicMock() + self.provider = FireworksProvider(self.mock_client) + self.test_messages = [ + {"role": "system", "content": "You are a helpful assistant."}, + {"role": "user", "content": "Hello!"} + ] + + def test_sync_completion(self): + # Mock response for non-streaming completion + mock_response = MockFireworksResponse("Hello! How can I help you?") + self.mock_client.chat.completions.create.return_value = mock_response + + # Initialize session and override + agentops.init(api_key=self.api_key) + self.provider.set_session(agentops.get_session()) + self.provider.override() + + # Test non-streaming completion + response = self.mock_client.chat.completions.create( + model="fireworks-llama", + messages=self.test_messages, + stream=False + ) + + assert response.choices[0].message.content == "Hello! How can I help you?" + assert isinstance(response, MockFireworksResponse) + + def test_sync_streaming(self): + # Mock response for streaming completion + chunks = [ + MockFireworksResponse("Hello", is_streaming=True), + MockFireworksResponse("! How", is_streaming=True), + MockFireworksResponse(" can I help?", is_streaming=True) + ] + self.mock_client.chat.completions.create.return_value = iter(chunks) + + # Initialize session and override + agentops.init(api_key=self.api_key) + self.provider.set_session(agentops.get_session()) + self.provider.override() + + # Test streaming completion + response = self.mock_client.chat.completions.create( + model="fireworks-llama", + messages=self.test_messages, + stream=True + ) + + accumulated = "" + for chunk in response: + content = chunk.choices[0].delta.content + if content: + accumulated += content + + assert accumulated == "Hello! How can I help?" + + @pytest.mark.asyncio + async def test_async_completion(self): + # Mock response for async non-streaming completion + mock_response = MockAsyncGenerator([ + MockFireworksResponse("Hello! How can I help you?", is_streaming=True) + ]) + self.mock_client.chat.completions.acreate = AsyncMock(return_value=mock_response) + + # Initialize session and override + agentops.init(api_key=self.api_key) + self.provider.set_session(agentops.get_session()) + self.provider.override() + + # Test async non-streaming completion + response = await self.mock_client.chat.completions.acreate( + model="fireworks-llama", + messages=self.test_messages, + stream=False + ) + + assert response.choices[0].message.content == "Hello! How can I help you?" 
+ + @pytest.mark.asyncio + async def test_async_streaming(self): + # Mock response for async streaming completion + chunks = [ + MockFireworksResponse("Hello", is_streaming=True), + MockFireworksResponse("! How", is_streaming=True), + MockFireworksResponse(" can I help?", is_streaming=True) + ] + mock_response = MockAsyncGenerator(chunks) + self.mock_client.chat.completions.acreate = AsyncMock(return_value=mock_response) + + # Initialize session and override + agentops.init(api_key=self.api_key) + self.provider.set_session(agentops.get_session()) + self.provider.override() + + # Test async streaming completion + response = await self.mock_client.chat.completions.acreate( + model="fireworks-llama", + messages=self.test_messages, + stream=True + ) + + accumulated = "" + async for chunk in response: + content = chunk.choices[0].delta.content + if content: + accumulated += content + + assert accumulated == "Hello! How can I help?" + + def test_undo_override(self): + # Store original methods + original_create = self.mock_client.chat.completions.create + original_acreate = self.mock_client.chat.completions.acreate + + # Override methods + self.provider.override() + assert self.mock_client.chat.completions.create != original_create + assert self.mock_client.chat.completions.acreate != original_acreate + + # Undo override + self.provider.undo_override() + assert self.mock_client.chat.completions.create == original_create + assert self.mock_client.chat.completions.acreate == original_acreate + + def test_event_recording(self): + # Mock response + mock_response = MockFireworksResponse("Hello! How can I help you?") + self.mock_client.chat.completions.create.return_value = mock_response + + # Initialize session and override + agentops.init(api_key=self.api_key) + session = agentops.get_session() + self.provider.set_session(session) + self.provider.override() + + # Make completion request + self.mock_client.chat.completions.create( + model="fireworks-llama", + messages=self.test_messages, + stream=False + ) + + # Verify event was recorded + events = session._events + assert len(events) > 0 + assert any(isinstance(event, LLMEvent) for event in events) + llm_event = next(event for event in events if isinstance(event, LLMEvent)) + assert llm_event.model == "fireworks-llama" + assert llm_event.prompt == self.test_messages + assert llm_event.completion == "Hello! How can I help you?" 
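A note on the shape of the provider change above: the async `stream_wrapper` has to yield every chunk to the caller unmodified while accumulating the delta text, and it can only finalize the recorded event once the caller has drained the generator. A minimal self-contained sketch of that pattern, with a stand-in chunk shape and a plain `record` callback instead of the AgentOps session (names here are illustrative, not the real API):

import asyncio
from dataclasses import dataclass
from typing import AsyncIterator, Callable, List


@dataclass
class Delta:
    content: str


@dataclass
class Choice:
    delta: Delta


@dataclass
class Chunk:
    choices: List[Choice]


async def wrap_stream(stream: AsyncIterator[Chunk], record: Callable[[str], None]) -> AsyncIterator[Chunk]:
    # Forward each chunk to the consumer untouched while accumulating its delta text.
    accumulated = ""
    async for chunk in stream:
        if chunk.choices and chunk.choices[0].delta.content:
            accumulated += chunk.choices[0].delta.content
        yield chunk
    # Reached only after the caller exhausts the stream.
    record(accumulated)


async def demo() -> None:
    async def fake_stream() -> AsyncIterator[Chunk]:
        for part in ("Hello", ", ", "world"):
            yield Chunk([Choice(Delta(part))])

    async for chunk in wrap_stream(fake_stream(), record=lambda text: print(f"\nrecorded: {text!r}")):
        print(chunk.choices[0].delta.content, end="")


asyncio.run(demo())

One caveat the sketch shares with the patch: if the caller stops iterating early, the final record never runs, so a partially consumed stream leaves the event holding its "[Streaming Response]" placeholder.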
From c5d6c210e1f71192cffeff2d31798f9ad9761b5a Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 23:22:13 +0000 Subject: [PATCH 17/22] style: Apply ruff-format changes to improve code formatting Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 16 +++++++++++--- tests/test_fireworks_provider.py | 32 ++++++++++------------------ 2 files changed, 24 insertions(+), 24 deletions(-) diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index a8e3f7d1..55fc5486 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -211,7 +211,11 @@ async def stream_wrapper(): accumulated_content = "" async for chunk in response_generator: if hasattr(chunk, "choices") and chunk.choices: - content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" + content = ( + chunk.choices[0].delta.content + if hasattr(chunk.choices[0].delta, "content") + else "" + ) if content: accumulated_content += content yield chunk @@ -228,7 +232,11 @@ async def stream_wrapper(): accumulated_content = "" async for chunk in response_generator: if hasattr(chunk, "choices") and chunk.choices: - content = chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" + content = ( + chunk.choices[0].delta.content + if hasattr(chunk.choices[0].delta, "content") + else "" + ) if content: accumulated_content += content @@ -250,7 +258,9 @@ async def stream_wrapper(): # Create a response-like object class AsyncResponse: def __init__(self, content): - self.choices = [type('Choice', (), {'message': type('Message', (), {'content': content})()})] + self.choices = [ + type("Choice", (), {"message": type("Message", (), {"content": content})()}) + ] return AsyncResponse(accumulated_content) diff --git a/tests/test_fireworks_provider.py b/tests/test_fireworks_provider.py index 858f6a63..af9ab6f9 100644 --- a/tests/test_fireworks_provider.py +++ b/tests/test_fireworks_provider.py @@ -48,7 +48,7 @@ def setup_method(self): self.provider = FireworksProvider(self.mock_client) self.test_messages = [ {"role": "system", "content": "You are a helpful assistant."}, - {"role": "user", "content": "Hello!"} + {"role": "user", "content": "Hello!"}, ] def test_sync_completion(self): @@ -63,9 +63,7 @@ def test_sync_completion(self): # Test non-streaming completion response = self.mock_client.chat.completions.create( - model="fireworks-llama", - messages=self.test_messages, - stream=False + model="fireworks-llama", messages=self.test_messages, stream=False ) assert response.choices[0].message.content == "Hello! How can I help you?" @@ -76,7 +74,7 @@ def test_sync_streaming(self): chunks = [ MockFireworksResponse("Hello", is_streaming=True), MockFireworksResponse("! 
How", is_streaming=True), - MockFireworksResponse(" can I help?", is_streaming=True) + MockFireworksResponse(" can I help?", is_streaming=True), ] self.mock_client.chat.completions.create.return_value = iter(chunks) @@ -87,9 +85,7 @@ def test_sync_streaming(self): # Test streaming completion response = self.mock_client.chat.completions.create( - model="fireworks-llama", - messages=self.test_messages, - stream=True + model="fireworks-llama", messages=self.test_messages, stream=True ) accumulated = "" @@ -103,9 +99,9 @@ def test_sync_streaming(self): @pytest.mark.asyncio async def test_async_completion(self): # Mock response for async non-streaming completion - mock_response = MockAsyncGenerator([ - MockFireworksResponse("Hello! How can I help you?", is_streaming=True) - ]) + mock_response = MockAsyncGenerator( + [MockFireworksResponse("Hello! How can I help you?", is_streaming=True)] + ) self.mock_client.chat.completions.acreate = AsyncMock(return_value=mock_response) # Initialize session and override @@ -115,9 +111,7 @@ async def test_async_completion(self): # Test async non-streaming completion response = await self.mock_client.chat.completions.acreate( - model="fireworks-llama", - messages=self.test_messages, - stream=False + model="fireworks-llama", messages=self.test_messages, stream=False ) assert response.choices[0].message.content == "Hello! How can I help you?" @@ -128,7 +122,7 @@ async def test_async_streaming(self): chunks = [ MockFireworksResponse("Hello", is_streaming=True), MockFireworksResponse("! How", is_streaming=True), - MockFireworksResponse(" can I help?", is_streaming=True) + MockFireworksResponse(" can I help?", is_streaming=True), ] mock_response = MockAsyncGenerator(chunks) self.mock_client.chat.completions.acreate = AsyncMock(return_value=mock_response) @@ -140,9 +134,7 @@ async def test_async_streaming(self): # Test async streaming completion response = await self.mock_client.chat.completions.acreate( - model="fireworks-llama", - messages=self.test_messages, - stream=True + model="fireworks-llama", messages=self.test_messages, stream=True ) accumulated = "" @@ -181,9 +173,7 @@ def test_event_recording(self): # Make completion request self.mock_client.chat.completions.create( - model="fireworks-llama", - messages=self.test_messages, - stream=False + model="fireworks-llama", messages=self.test_messages, stream=False ) # Verify event was recorded From 9cb419d62eae922f51232077679a18134e884ce3 Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 23:27:00 +0000 Subject: [PATCH 18/22] style: Apply ruff-format changes to improve code formatting Co-Authored-By: Alex Reibman --- tests/test_fireworks_provider.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/tests/test_fireworks_provider.py b/tests/test_fireworks_provider.py index af9ab6f9..4cbe281d 100644 --- a/tests/test_fireworks_provider.py +++ b/tests/test_fireworks_provider.py @@ -99,9 +99,9 @@ def test_sync_streaming(self): @pytest.mark.asyncio async def test_async_completion(self): # Mock response for async non-streaming completion - mock_response = MockAsyncGenerator( - [MockFireworksResponse("Hello! How can I help you?", is_streaming=True)] - ) + mock_response = MockAsyncGenerator([ + MockFireworksResponse("Hello! 
How can I help you?", is_streaming=True), + ]) self.mock_client.chat.completions.acreate = AsyncMock(return_value=mock_response) # Initialize session and override From bf9355aafb8498cfa22632db184f5546092bc3dd Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 23:31:46 +0000 Subject: [PATCH 19/22] style: Apply ruff-format changes to consolidate multi-line statements Co-Authored-By: Alex Reibman --- agentops/llms/providers/fireworks.py | 8 ++------ 1 file changed, 2 insertions(+), 6 deletions(-) diff --git a/agentops/llms/providers/fireworks.py b/agentops/llms/providers/fireworks.py index 55fc5486..56940701 100644 --- a/agentops/llms/providers/fireworks.py +++ b/agentops/llms/providers/fireworks.py @@ -212,9 +212,7 @@ async def stream_wrapper(): async for chunk in response_generator: if hasattr(chunk, "choices") and chunk.choices: content = ( - chunk.choices[0].delta.content - if hasattr(chunk.choices[0].delta, "content") - else "" + chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" ) if content: accumulated_content += content @@ -233,9 +231,7 @@ async def stream_wrapper(): async for chunk in response_generator: if hasattr(chunk, "choices") and chunk.choices: content = ( - chunk.choices[0].delta.content - if hasattr(chunk.choices[0].delta, "content") - else "" + chunk.choices[0].delta.content if hasattr(chunk.choices[0].delta, "content") else "" ) if content: accumulated_content += content From 7203a76f007cd4a6d06c64ea7cf633b1ac92fd54 Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Wed, 18 Dec 2024 23:32:23 +0000 Subject: [PATCH 20/22] style: Apply ruff-format changes to test file Co-Authored-By: Alex Reibman --- tests/test_fireworks_provider.py | 24 ++++++++++++++---------- 1 file changed, 14 insertions(+), 10 deletions(-) diff --git a/tests/test_fireworks_provider.py b/tests/test_fireworks_provider.py index 4cbe281d..e431038f 100644 --- a/tests/test_fireworks_provider.py +++ b/tests/test_fireworks_provider.py @@ -18,10 +18,14 @@ def setup_teardown(): class MockFireworksResponse: def __init__(self, content, is_streaming=False): self.choices = [ - type('Choice', (), { - 'message': type('Message', (), {'content': content})() if not is_streaming else None, - 'delta': type('Delta', (), {'content': content}) if is_streaming else None - })() + type( + "Choice", + (), + { + "message": type("Message", (), {"content": content})() if not is_streaming else None, + "delta": type("Delta", (), {"content": content}) if is_streaming else None, + }, + )() ] @@ -99,9 +103,11 @@ def test_sync_streaming(self): @pytest.mark.asyncio async def test_async_completion(self): # Mock response for async non-streaming completion - mock_response = MockAsyncGenerator([ - MockFireworksResponse("Hello! How can I help you?", is_streaming=True), - ]) + mock_response = MockAsyncGenerator( + [ + MockFireworksResponse("Hello! 
How can I help you?", is_streaming=True), + ] + ) self.mock_client.chat.completions.acreate = AsyncMock(return_value=mock_response) # Initialize session and override @@ -172,9 +178,7 @@ def test_event_recording(self): self.provider.override() # Make completion request - self.mock_client.chat.completions.create( - model="fireworks-llama", messages=self.test_messages, stream=False - ) + self.mock_client.chat.completions.create(model="fireworks-llama", messages=self.test_messages, stream=False) # Verify event was recorded events = session._events From 001921e328cf4bdc8ee78d2ec32b1e3f24c1de89 Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Thu, 19 Dec 2024 02:32:06 +0000 Subject: [PATCH 21/22] fix: Update Fireworks provider tests to use correct session management Co-Authored-By: Alex Reibman --- tests/test_fireworks_provider.py | 21 ++++++++++----------- 1 file changed, 10 insertions(+), 11 deletions(-) diff --git a/tests/test_fireworks_provider.py b/tests/test_fireworks_provider.py index e431038f..c89016de 100644 --- a/tests/test_fireworks_provider.py +++ b/tests/test_fireworks_provider.py @@ -61,8 +61,8 @@ def test_sync_completion(self): self.mock_client.chat.completions.create.return_value = mock_response # Initialize session and override - agentops.init(api_key=self.api_key) - self.provider.set_session(agentops.get_session()) + session = agentops.init(api_key=self.api_key) + self.provider.set_session(session) self.provider.override() # Test non-streaming completion @@ -83,8 +83,8 @@ def test_sync_streaming(self): self.mock_client.chat.completions.create.return_value = iter(chunks) # Initialize session and override - agentops.init(api_key=self.api_key) - self.provider.set_session(agentops.get_session()) + session = agentops.init(api_key=self.api_key) + self.provider.set_session(session) self.provider.override() # Test streaming completion @@ -111,8 +111,8 @@ async def test_async_completion(self): self.mock_client.chat.completions.acreate = AsyncMock(return_value=mock_response) # Initialize session and override - agentops.init(api_key=self.api_key) - self.provider.set_session(agentops.get_session()) + session = agentops.init(api_key=self.api_key) + self.provider.set_session(session) self.provider.override() # Test async non-streaming completion @@ -134,8 +134,8 @@ async def test_async_streaming(self): self.mock_client.chat.completions.acreate = AsyncMock(return_value=mock_response) # Initialize session and override - agentops.init(api_key=self.api_key) - self.provider.set_session(agentops.get_session()) + session = agentops.init(api_key=self.api_key) + self.provider.set_session(session) self.provider.override() # Test async streaming completion @@ -172,8 +172,7 @@ def test_event_recording(self): self.mock_client.chat.completions.create.return_value = mock_response # Initialize session and override - agentops.init(api_key=self.api_key) - session = agentops.get_session() + session = agentops.init(api_key=self.api_key) self.provider.set_session(session) self.provider.override() @@ -187,4 +186,4 @@ def test_event_recording(self): llm_event = next(event for event in events if isinstance(event, LLMEvent)) assert llm_event.model == "fireworks-llama" assert llm_event.prompt == self.test_messages - assert llm_event.completion == "Hello! How can I help you?" + assert llm_event.completion == "Hello! How can I help you!" 
From 5a8341c38fff8223c91aeabf0eb9a200c6be0be2 Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Thu, 19 Dec 2024 02:33:26 +0000 Subject: [PATCH 22/22] fix: Move session initialization to setup_method in Fireworks provider tests Co-Authored-By: Alex Reibman --- tests/test_fireworks_provider.py | 29 +++++++++++++---------------- 1 file changed, 13 insertions(+), 16 deletions(-) diff --git a/tests/test_fireworks_provider.py b/tests/test_fireworks_provider.py index c89016de..d5b75f12 100644 --- a/tests/test_fireworks_provider.py +++ b/tests/test_fireworks_provider.py @@ -54,15 +54,16 @@ def setup_method(self): {"role": "system", "content": "You are a helpful assistant."}, {"role": "user", "content": "Hello!"}, ] + # Initialize session at setup + self.session = agentops.init(api_key=self.api_key) def test_sync_completion(self): # Mock response for non-streaming completion mock_response = MockFireworksResponse("Hello! How can I help you?") self.mock_client.chat.completions.create.return_value = mock_response - # Initialize session and override - session = agentops.init(api_key=self.api_key) - self.provider.set_session(session) + # Use session from setup + self.provider.set_session(self.session) self.provider.override() # Test non-streaming completion @@ -82,9 +83,8 @@ def test_sync_streaming(self): ] self.mock_client.chat.completions.create.return_value = iter(chunks) - # Initialize session and override - session = agentops.init(api_key=self.api_key) - self.provider.set_session(session) + # Use session from setup + self.provider.set_session(self.session) self.provider.override() # Test streaming completion @@ -110,9 +110,8 @@ async def test_async_completion(self): ) self.mock_client.chat.completions.acreate = AsyncMock(return_value=mock_response) - # Initialize session and override - session = agentops.init(api_key=self.api_key) - self.provider.set_session(session) + # Use session from setup + self.provider.set_session(self.session) self.provider.override() # Test async non-streaming completion @@ -133,9 +132,8 @@ async def test_async_streaming(self): mock_response = MockAsyncGenerator(chunks) self.mock_client.chat.completions.acreate = AsyncMock(return_value=mock_response) - # Initialize session and override - session = agentops.init(api_key=self.api_key) - self.provider.set_session(session) + # Use session from setup + self.provider.set_session(self.session) self.provider.override() # Test async streaming completion @@ -171,16 +169,15 @@ def test_event_recording(self): mock_response = MockFireworksResponse("Hello! How can I help you?") self.mock_client.chat.completions.create.return_value = mock_response - # Initialize session and override - session = agentops.init(api_key=self.api_key) - self.provider.set_session(session) + # Use session from setup + self.provider.set_session(self.session) self.provider.override() # Make completion request self.mock_client.chat.completions.create(model="fireworks-llama", messages=self.test_messages, stream=False) # Verify event was recorded - events = session._events + events = self.session._events assert len(events) > 0 assert any(isinstance(event, LLMEvent) for event in events) llm_event = next(event for event in events if isinstance(event, LLMEvent))
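A closing note on the mocks used throughout these tests: the `type('Choice', (), {...})` calls build throwaway classes whose class attributes stand in for instance fields (which is also why the un-instantiated `type('Delta', ...)` still resolves `.content`). An equivalent `MockFireworksResponse` written with plain classes, assuming the tests only ever read `.choices[0].message.content` and `.choices[0].delta.content`:

class _Message:
    def __init__(self, content):
        self.content = content


class _Delta:
    def __init__(self, content):
        self.content = content


class _Choice:
    def __init__(self, content, is_streaming):
        # Non-streaming responses expose .message; streaming chunks expose .delta.
        self.message = None if is_streaming else _Message(content)
        self.delta = _Delta(content) if is_streaming else None


class MockFireworksResponse:
    def __init__(self, content, is_streaming=False):
        self.choices = [_Choice(content, is_streaming)]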