Repository: andrewyng/aisuite
Branch: main
Commit: 695242a836a0
Files: 208
Total size: 1.0 MB

Directory structure:
gitextract_z7uqp5wm/

├── .github/
│   └── workflows/
│       ├── black.yml
│       └── run_pytest.yml
├── .gitignore
├── .pre-commit-config.yaml
├── CONTRIBUTING.md
├── LICENSE
├── README.md
├── aisuite/
│   ├── __init__.py
│   ├── client.py
│   ├── design-notes/
│   │   └── asr-parameter-design-motivation.md
│   ├── framework/
│   │   ├── __init__.py
│   │   ├── asr_params.py
│   │   ├── chat_completion_response.py
│   │   ├── choice.py
│   │   ├── message.py
│   │   ├── parameter_mapper.py
│   │   └── provider_interface.py
│   ├── mcp/
│   │   ├── __init__.py
│   │   ├── client.py
│   │   ├── config.py
│   │   ├── schema_converter.py
│   │   └── tool_wrapper.py
│   ├── provider.py
│   ├── providers/
│   │   ├── __init__.py
│   │   ├── anthropic_provider.py
│   │   ├── aws_provider.py
│   │   ├── azure_provider.py
│   │   ├── cerebras_provider.py
│   │   ├── cohere_provider.py
│   │   ├── deepgram_provider.py
│   │   ├── deepseek_provider.py
│   │   ├── fireworks_provider.py
│   │   ├── google_provider.py
│   │   ├── groq_provider.py
│   │   ├── huggingface_provider.py
│   │   ├── inception_provider.py
│   │   ├── lmstudio_provider.py
│   │   ├── message_converter.py
│   │   ├── mistral_provider.py
│   │   ├── nebius_provider.py
│   │   ├── ollama_provider.py
│   │   ├── openai_provider.py
│   │   ├── sambanova_provider.py
│   │   ├── together_provider.py
│   │   ├── watsonx_provider.py
│   │   └── xai_provider.py
│   └── utils/
│       ├── tools.py
│       └── utils.py
├── aisuite-js/
│   ├── README.md
│   ├── examples/
│   │   ├── basic-usage.ts
│   │   ├── chat-app/
│   │   │   ├── .eslintrc.cjs
│   │   │   ├── .gitignore
│   │   │   ├── README.md
│   │   │   ├── index.html
│   │   │   ├── package.json
│   │   │   ├── postcss.config.js
│   │   │   ├── src/
│   │   │   │   ├── App.tsx
│   │   │   │   ├── components/
│   │   │   │   │   ├── ApiKeyModal.tsx
│   │   │   │   │   ├── ChatContainer.tsx
│   │   │   │   │   ├── ChatInput.tsx
│   │   │   │   │   ├── ChatMessage.tsx
│   │   │   │   │   ├── ModelSelector.tsx
│   │   │   │   │   └── ProviderSelector.tsx
│   │   │   │   ├── config/
│   │   │   │   │   └── llm-config.ts
│   │   │   │   ├── index.css
│   │   │   │   ├── main.tsx
│   │   │   │   ├── services/
│   │   │   │   │   └── aisuite-service.ts
│   │   │   │   ├── types/
│   │   │   │   │   └── chat.ts
│   │   │   │   └── utils/
│   │   │   │       └── cn.ts
│   │   │   ├── tailwind.config.js
│   │   │   ├── tsconfig.json
│   │   │   ├── tsconfig.node.json
│   │   │   └── vite.config.ts
│   │   ├── deepgram.ts
│   │   ├── groq.ts
│   │   ├── mistral.ts
│   │   ├── openai-asr.ts
│   │   ├── streaming.ts
│   │   ├── test-suite.ts
│   │   └── tool-calling.ts
│   ├── jest.config.ts
│   ├── package.json
│   ├── src/
│   │   ├── asr-providers/
│   │   │   ├── deepgram/
│   │   │   │   ├── adapters.ts
│   │   │   │   ├── index.ts
│   │   │   │   ├── provider.ts
│   │   │   │   └── types.ts
│   │   │   └── index.ts
│   │   ├── client.ts
│   │   ├── core/
│   │   │   ├── base-asr-provider.ts
│   │   │   ├── base-provider.ts
│   │   │   ├── errors.ts
│   │   │   └── model-parser.ts
│   │   ├── index.ts
│   │   ├── providers/
│   │   │   ├── anthropic/
│   │   │   │   ├── adapters.ts
│   │   │   │   ├── index.ts
│   │   │   │   ├── provider.ts
│   │   │   │   └── types.ts
│   │   │   ├── groq/
│   │   │   │   ├── adapters.ts
│   │   │   │   ├── index.ts
│   │   │   │   ├── provider.ts
│   │   │   │   └── types.ts
│   │   │   ├── index.ts
│   │   │   ├── mistral/
│   │   │   │   ├── adapters.ts
│   │   │   │   ├── index.ts
│   │   │   │   ├── provider.ts
│   │   │   │   └── types.ts
│   │   │   └── openai/
│   │   │       ├── adapters.ts
│   │   │       ├── index.ts
│   │   │       ├── provider.ts
│   │   │       └── types.ts
│   │   ├── types/
│   │   │   ├── chat.ts
│   │   │   ├── common.ts
│   │   │   ├── index.ts
│   │   │   ├── providers.ts
│   │   │   ├── tools.ts
│   │   │   └── transcription.ts
│   │   └── utils/
│   │       └── streaming.ts
│   ├── tests/
│   │   ├── client.test.ts
│   │   ├── providers/
│   │   │   ├── anthropic-provider.test.ts
│   │   │   ├── deepgram-provider.test.ts
│   │   │   ├── groq-provider.test.ts
│   │   │   ├── mistral-provider.test.ts
│   │   │   ├── openai-provider.test.ts
│   │   │   └── openai_asr_provider.test.ts
│   │   └── utils/
│   │       └── streaming.test.ts
│   └── tsconfig.json
├── examples/
│   ├── AISuiteDemo.ipynb
│   ├── DeepseekPost.ipynb
│   ├── QnA_with_pdf.ipynb
│   ├── agents/
│   │   ├── movie_buff_assistant.ipynb
│   │   ├── recipe_chef_assistant.ipynb
│   │   ├── snake_game_generator.ipynb
│   │   ├── stock_dashboard.html
│   │   ├── stock_market_dashboard.html
│   │   ├── stock_market_mini_tracker.ipynb
│   │   ├── stock_market_tracker.ipynb
│   │   └── world_weather_dashboard.ipynb
│   ├── aisuite_tool_abstraction.ipynb
│   ├── asr_example.ipynb
│   ├── chat-ui/
│   │   ├── .streamlit/
│   │   │   └── config.toml
│   │   ├── README.md
│   │   ├── chat.py
│   │   └── config.yaml
│   ├── client.ipynb
│   ├── llm_reasoning.ipynb
│   ├── mcp_config_dict_example.py
│   ├── mcp_http_example.py
│   ├── mcp_tools_example.ipynb
│   ├── simple_tool_calling.ipynb
│   └── tool_calling_abstraction.ipynb
├── guides/
│   ├── README.md
│   ├── anthropic.md
│   ├── aws.md
│   ├── azure.md
│   ├── cerebras.md
│   ├── cohere.md
│   ├── deepseek.md
│   ├── google.md
│   ├── groq.md
│   ├── huggingface.md
│   ├── lmstudio.md
│   ├── mistral.md
│   ├── nebius.md
│   ├── ollama.md
│   ├── openai.md
│   ├── sambanova.md
│   ├── watsonx.md
│   └── xai.md
├── pyproject.toml
└── tests/
    ├── __init__.py
    ├── client/
    │   ├── __init__.py
    │   ├── test_client.py
    │   └── test_prerelease.py
    ├── framework/
    │   ├── test_asr_models.py
    │   └── test_asr_params.py
    ├── mcp/
    │   ├── README.md
    │   ├── __init__.py
    │   ├── conftest.py
    │   ├── test_client.py
    │   ├── test_e2e.py
    │   ├── test_http_llm_e2e.py
    │   ├── test_http_transport.py
    │   └── test_llm_e2e.py
    ├── providers/
    │   ├── __init__.py
    │   ├── test_anthropic_converter.py
    │   ├── test_asr_parameter_passthrough.py
    │   ├── test_aws_converter.py
    │   ├── test_azure_provider.py
    │   ├── test_cerebras_provider.py
    │   ├── test_cohere_provider.py
    │   ├── test_deepgram_provider.py
    │   ├── test_deepseek_provider.py
    │   ├── test_google_converter.py
    │   ├── test_google_provider.py
    │   ├── test_groq_provider.py
    │   ├── test_huggingface_provider.py
    │   ├── test_inception_provider.py
    │   ├── test_lmstudio_provider.py
    │   ├── test_mistral_provider.py
    │   ├── test_nebius_provider.py
    │   ├── test_ollama_provider.py
    │   ├── test_openai_provider.py
    │   ├── test_sambanova_provider.py
    │   └── test_watsonx_provider.py
    ├── test_provider.py
    └── utils/
        ├── test_mcp_memory_integration.py
        ├── test_tool_manager.py
        └── test_tools_mcp_schema.py

================================================
FILE CONTENTS
================================================

================================================
FILE: .github/workflows/black.yml
================================================
# Checks on every push and pull request that the code base is formatted with Black.
name: Lint

on: [push, pull_request]

jobs:
  lint:
    runs-on: ubuntu-latest
    steps:
      # Same checkout major version as the pytest workflow in this repository.
      - uses: actions/checkout@v4
      - uses: psf/black@stable

================================================
FILE: .github/workflows/run_pytest.yml
================================================
# Runs the pytest suite (excluding tests marked "integration") on every push
# and pull request, once per Python version in the matrix below.
# The workflow is named "Tests" so it is distinguishable from the Black
# "Lint" workflow in the Actions UI; the job id is unchanged.
name: Tests

on: [push, pull_request]

jobs:
  build_and_test:
    runs-on: ubuntu-latest
    strategy:
      matrix:
        python-version: [ "3.10", "3.11", "3.12" ]
    steps:
      - uses: actions/checkout@v4
      - name: Set up Python ${{ matrix.python-version }}
        uses: actions/setup-python@v5
        with:
          python-version: ${{ matrix.python-version }}
      - name: Install dependencies
        # Installs every optional extra plus the "test" dependency group.
        run: |
          python -m pip install --upgrade pip
          pip install poetry
          poetry install --all-extras --with test
      - name: Test with pytest
        # -m "not integration" deselects tests carrying the "integration" marker.
        run: poetry run pytest -m "not integration"


================================================
FILE: .gitignore
================================================
# Python
__pycache__/
*.py[cod]
*$py.class
*.so
.Python
build/
develop-eggs/
dist/
downloads/
eggs/
.eggs/
lib/
lib64/
parts/
sdist/
var/
wheels/
*.egg-info/
.installed.cfg
*.egg
MANIFEST
.env
.venv
env/
venv/
ENV/
*.whl

# Node/TypeScript
node_modules/
npm-debug.log*
yarn-debug.log*
yarn-error.log*
.npm
.env.local
.env.*.local
dist/
coverage/
*.tsbuildinfo

# IDEs and editors
.idea/
.vscode/
*.swp
*.swo
.DS_Store
**/.DS_Store
*.sublime-workspace
*.sublime-project

# Jupyter Notebook
.ipynb_checkpoints
*/.ipynb_checkpoints/*

# Testing
.coverage
htmlcov/
.pytest_cache/
coverage/
.nyc_output/

# Cloud credentials
.google-adc

# Logs
logs
*.log

# Python version
.python-version


================================================
FILE: .pre-commit-config.yaml
================================================
repos:
  # Using this mirror lets us use mypyc-compiled black, which is about 2x faster
  - repo: https://github.com/psf/black-pre-commit-mirror
    rev: 24.4.2
    hooks:
      - id: black
        # It is recommended to specify the latest version of Python
        # supported by your project here, or alternatively use
        # pre-commit's default_language_version, see
        # https://pre-commit.com/#top_level-default_language_version
        language_version: python3.12


================================================
FILE: CONTRIBUTING.md
================================================
<!-- omit in toc -->
# Contributing to aisuite

First off, thanks for taking the time to contribute!

All types of contributions are encouraged and valued. See the [Table of Contents](#table-of-contents)
for different ways to help and details about how this project handles them. Please make sure to read
the relevant section before making your contribution. It will make it a lot easier for us maintainers
and smooth out the experience for all involved. The community looks forward to your contributions.

> And if you like the project, but just don't have time to contribute, that's fine. There are other easy
> ways to support the project and show your appreciation, which we would also be very happy about:
> - Star the project
> - Tweet about it
> - Refer to this project in your project's readme
> - Mention the project at local meetups and tell your friends/colleagues

<!-- omit in toc -->
## Table of Contents

- [I Have a Question](#i-have-a-question)
- [I Want To Contribute](#i-want-to-contribute)
  - [Reporting Bugs](#reporting-bugs)
  - [Suggesting Enhancements](#suggesting-enhancements)
  - [Your First Code Contribution](#your-first-code-contribution)
  - [Improving The Documentation](#improving-the-documentation)
- [Styleguides](#styleguides)
  - [Commit Messages](#commit-messages)


## I Have a Question

> If you want to ask a question, we assume that you have read the available
> [Documentation](https://github.com/andrewyng/aisuite/blob/main/README.md).

Before you ask a question, it is best to search for existing [Issues](https://github.com/andrewyng/aisuite/issues)
that might help you. If you find a relevant issue that already exists and still need clarification, please add your question to that existing issue. We also recommend reaching out to the community in the aisuite [Discord](https://discord.gg/T6Nvn8ExSb) server.

If you then still feel the need to ask a question and need clarification, we recommend the following:

- Open an [Issue](https://github.com/andrewyng/aisuite/issues/new).
- Provide as much context as you can about what you're running into.
- Provide project and platform versions (python, OS, etc.), depending on what seems relevant.

We (or someone in the community) will then take care of the issue as soon as possible.


## I Want To Contribute

> ### Legal Notice <!-- omit in toc -->
> When contributing to this project, you must agree that you have authored 100% of the content, that
> you have the necessary rights to the content and that the content you contribute may be provided
> under the project license.

### Reporting Bugs

<!-- omit in toc -->
#### Before Submitting a Bug Report

A good bug report shouldn't leave others needing to chase you up for more information. Therefore, we ask
you to investigate carefully, collect information and describe the issue in detail in your report. Please
complete the following steps in advance to help us fix any potential bug as fast as possible.

- Make sure that you are using the latest version.
- Determine if your bug is really a bug and not an error on your side e.g. using incompatible environment 
  components/versions (Make sure that you have read the [documentation](https://github.com/andrewyng/aisuite/blob/main/README.md).
  If you are looking for support, you might want to check [this section](#i-have-a-question)).
- To see if other users have experienced (and potentially already solved) the same issue you are having,
  check if there is not already a bug report existing for your bug or error in the [bug tracker](https://github.com/andrewyng/aisuite/issues?q=label%3Abug).
- Also make sure to search the internet (including Stack Overflow) to see if users outside of the GitHub
  community have discussed the issue.
- Collect information about the bug:
  - Stack trace (Traceback)
  - OS, Platform and Version (Windows, Linux, macOS, x86, ARM)
  - Version of the interpreter, compiler, SDK, runtime environment, package manager, depending on
    what seems relevant.
  - Possibly your input and the output
  - Can you reliably reproduce the issue? And can you also reproduce it with older versions?

<!-- omit in toc -->
#### How Do I Submit a Good Bug Report?

> You must never report security related issues, vulnerabilities or bugs including sensitive information to
> the issue tracker, or elsewhere in public. Instead sensitive bugs must be sent by email to <joaquin.dominguez@proton.me>.
<!-- You may add a PGP key to allow the messages to be sent encrypted as well. -->

We use GitHub issues to track bugs and errors. If you run into an issue with the project:

- Open an [Issue](https://github.com/andrewyng/aisuite/issues/new). (Since we can't be sure at
  this point whether it is a bug or not, we ask you not to talk about a bug yet and not to label the issue.)
- Explain the behavior you would expect and the actual behavior.
- Please provide as much context as possible and describe the *reproduction steps* that someone else can
  follow to recreate the issue on their own. This usually includes your code. For good bug reports you
  should isolate the problem and create a reduced test case.
- Provide the information you collected in the previous section.

Once it's filed:

- The project team will label the issue accordingly.
- A team member will try to reproduce the issue with your provided steps. If there are no reproduction 
  steps or no obvious way to reproduce the issue, the team will ask you for those steps and mark the
  issue as `needs-repro`. Bugs with the `needs-repro` tag will not be addressed until they are reproduced.
- If the team is able to reproduce the issue, it will be marked `needs-fix`, as well as possibly other
  tags (such as `critical`), and the issue will be left to be
  [implemented by someone](#your-first-code-contribution).

Please use the issue templates provided.


### Suggesting Enhancements

This section guides you through submitting an enhancement suggestion for aisuite,
**including completely new features and minor improvements to existing functionality**. Following these
guidelines will help maintainers and the community to understand your suggestion and find related suggestions.

<!-- omit in toc -->
#### Before Submitting an Enhancement

- Make sure that you are using the latest version.
- Read the [documentation](https://github.com/andrewyng/aisuite/blob/main/README.md) carefully
  and find out if the functionality is already covered, maybe by an individual configuration.
- Perform a [search](https://github.com/andrewyng/aisuite/issues) to see if the enhancement has
  already been suggested. If it has, add a comment to the existing issue instead of opening a new one.
- Find out whether your idea fits with the scope and aims of the project. It's up to you to make a strong
  case to convince the project's developers of the merits of this feature. Keep in mind that we want features that will be useful to the majority of our users and not just a small subset. If you're just targeting a minority of users, consider writing an add-on/plugin library.

<!-- omit in toc -->
#### How Do I Submit a Good Enhancement Suggestion?

Enhancement suggestions are tracked as [GitHub issues](https://github.com/andrewyng/aisuite/issues).

- Use a **clear and descriptive title** for the issue to identify the suggestion.
- Provide a **step-by-step description of the suggested enhancement** in as many details as possible.
- **Describe the current behavior** and **explain which behavior you expected to see instead** and why.
  At this point you can also tell which alternatives do not work for you.
- **Explain why this enhancement would be useful** to most aisuite users. You may also want to
  point out the other projects that solved it better and which could serve as inspiration.


### Your First Code Contribution

#### Pre-requisites

You should first [fork](https://docs.github.com/en/pull-requests/collaborating-with-pull-requests/working-with-forks/fork-a-repo)
the `aisuite` repository and then clone your forked repository:

```bash
git clone https://github.com/<YOUR_GITHUB_USER>/aisuite.git
```


Once in the cloned repository directory, make a branch on the forked repository with your username and
description of PR:
```bash
git checkout -B <username>/<description>
```

Please install the development and test dependencies:
```bash
poetry install --with dev,test
```

`aisuite` uses pre-commit to ensure the formatting is consistent:
```bash
pre-commit install
```

**Make suggested changes**

Afterwards, our suite of formatting tests will run automatically before each `git commit`. You can also
run these manually:
```bash
pre-commit run --all-files
```

If a formatting test fails, it will fix the modified code in place and abort the `git commit`. After looking
over the changes, you can `git add <modified files>` and then repeat the previous git commit command.

**Note**: a github workflow will check the files with the same formatter and reject the PR if it doesn't
pass, so please make sure it passes locally.


#### Testing
`aisuite` tracks unit tests. Pytest is used to execute said unit tests in `tests/`:

```bash
poetry run pytest tests
```

If your code changes implement a new function, please add a corresponding unit test under the `tests/` directory.

#### Contributing Workflow
We actively welcome your pull requests.

1. Create your new branch from main in your forked repo, with your username and a name describing the work
   you're completing e.g. user-123/add-feature-x.
2. If you've added code that should be tested, add tests. Ensure all tests pass. See the testing section
   for more information.
3. If you've changed APIs, update the documentation.
4. Make sure your code lints.


### Improving The Documentation
We welcome valuable contributions in the form of new documentation or revised documentation that provide
further clarity or accuracy. Each function should be clearly documented. Well-documented code is easier
to review and understand/extend.

## Styleguides
For code documentation, please follow the [Google styleguide](https://github.com/google/styleguide/blob/gh-pages/pyguide.md#38-comments-and-docstrings).


================================================
FILE: LICENSE
================================================
MIT License

Copyright (c) 2024 Andrew Ng

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and
associated documentation files (the "Software"), to deal in the Software without restriction, including
without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the
following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial
portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT
LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.


================================================
FILE: README.md
================================================
#  aisuite

[![PyPI](https://img.shields.io/pypi/v/aisuite)](https://pypi.org/project/aisuite/)
[![Code style: black](https://img.shields.io/badge/code%20style-black-000000.svg)](https://github.com/psf/black)

`aisuite` is a lightweight Python library that provides a **unified API for working with multiple Generative AI providers**.  
It offers a consistent interface for models from *OpenAI, Anthropic, Google, Hugging Face, AWS, Cohere, Mistral, Ollama*, and others—abstracting away SDK differences, authentication details, and parameter variations.  
Its design is modeled after OpenAI’s API style, making it instantly familiar and easy to adopt.

`aisuite` lets developers build and **run LLM-based or agentic applications across providers** with minimal setup.  
While it’s not a full-blown agents framework, it includes simple abstractions for creating standalone, lightweight agents.  
It’s designed for a low learning curve — so you can focus on building AI systems, not integrating APIs.

---

## Key Features

`aisuite` is designed to eliminate the complexity of working with multiple LLM providers while keeping your code simple and portable. Whether you're building a chatbot, an agentic application, or experimenting with different models, `aisuite` provides the abstractions you need without getting in your way.

* **Unified API for multiple model providers** – Write your code once and run it with any supported provider. Switch between OpenAI, Anthropic, Google, and others with a single parameter change.
* **Easy agentic app or agent creation** – Build multi-turn agentic applications using a single parameter `max_turns`. No need to manually manage tool execution loops.
* **Pass Tool calls easily** – Pass real Python functions instead of JSON specs; aisuite handles schema generation and execution automatically.
* **MCP tools** – Connect to MCP-based tools without writing boilerplate; aisuite handles connection, schema and execution seamlessly.
* **Modular and extensible provider architecture** – Add support for new providers with minimal code. The plugin-style architecture makes extensions straightforward.

---

## Installation

You can install just the base `aisuite` package, or install a provider's package along with `aisuite`.

Install just the base package without any provider SDKs:

```shell
pip install aisuite
```

Install aisuite with a specific provider (e.g., Anthropic):

```shell
pip install 'aisuite[anthropic]'
```

Install aisuite with all provider libraries:

```shell
pip install 'aisuite[all]'
```

## Setup

To get started, you will need API Keys for the providers you intend to use. You'll need to
install the provider-specific library either separately or when installing aisuite.

The API Keys can be set as environment variables, or can be passed as config to the aisuite Client constructor.
You can use tools like [`python-dotenv`](https://pypi.org/project/python-dotenv/) or [`direnv`](https://direnv.net/) to set the environment variables manually. Please take a look at the `examples` folder to see usage.

Here is a short example of using `aisuite` to generate chat completion responses from gpt-4o and claude-3-5-sonnet.

Set the API keys.

```shell
export OPENAI_API_KEY="your-openai-api-key"
export ANTHROPIC_API_KEY="your-anthropic-api-key"
```

Use the python client.

```python
import aisuite as ai
client = ai.Client()

models = ["openai:gpt-4o", "anthropic:claude-3-5-sonnet-20240620"]

messages = [
    {"role": "system", "content": "Respond in Pirate English."},
    {"role": "user", "content": "Tell me a joke."},
]

for model in models:
    response = client.chat.completions.create(
        model=model,
        messages=messages,
        temperature=0.75
    )
    print(response.choices[0].message.content)

```

Note that the model name in the create() call uses the format - `<provider>:<model-name>`.
`aisuite` will call the appropriate provider with the right parameters based on the provider value.
For a list of provider values, look at the `aisuite/providers/` directory. Each supported provider is implemented in a file named `<provider>_provider.py` in that directory. We welcome providers to add support to this library by adding an implementation file in this directory. Please see the section below for how to contribute.

For more examples, check out the `examples` directory where you will find several notebooks that you can run to experiment with the interface.

---

## Chat Completions

The chat API provides a high-level abstraction for model interactions. It supports all core parameters (`temperature`, `max_tokens`, `tools`, etc.) in a provider-agnostic way.

```python
response = client.chat.completions.create(
    model="google:gemini-pro",
    messages=[{"role": "user", "content": "Summarize this paragraph."}],
)
print(response.choices[0].message.content)
```

`aisuite` standardizes request and response structures so you can focus on logic rather than SDK differences.

---

## Tool Calling & Agentic apps

`aisuite` provides a simple abstraction for tool/function calling that works across supported providers. This is in addition to the regular abstraction of passing JSON spec of the tool to the `tools` parameter. The tool calling abstraction makes it easy to use tools with different LLMs without changing your code.

There are two ways to use tools with `aisuite`:

### 1. Manual Tool Handling

This is the default behavior when `max_turns` is not specified. In this mode, you have full control over the tool execution flow. You pass tools using the standard OpenAI JSON schema format, and `aisuite` returns the LLM's tool call requests in the response. You're then responsible for executing the tools, processing results, and sending them back to the model in subsequent requests.

This approach is useful when you need:
- Fine-grained control over tool execution logic
- Custom error handling or validation before executing tools
- The ability to selectively execute or skip certain tool calls
- Integration with existing tool execution pipelines

You can pass tools in the OpenAI tool format:

```python
def will_it_rain(location: str, time_of_day: str):
    """Check if it will rain in a location at a given time today.
    
    Args:
        location (str): Name of the city
        time_of_day (str): Time of the day in HH:MM format.
    """
    return "YES"

tools = [{
    "type": "function",
    "function": {
        "name": "will_it_rain",
        "description": "Check if it will rain in a location at a given time today",
        "parameters": {
            "type": "object",
            "properties": {
                "location": {
                    "type": "string",
                    "description": "Name of the city"
                },
                "time_of_day": {
                    "type": "string",
                    "description": "Time of the day in HH:MM format."
                }
            },
            "required": ["location", "time_of_day"]
        }
    }
}]

response = client.chat.completions.create(
    model="openai:gpt-4o",
    messages=messages,
    tools=tools
)
```

### 2. Automatic Tool Execution

When `max_turns` is specified, you can pass a list of callable Python functions as the `tools` parameter. `aisuite` will automatically handle the tool calling flow:

```python
def will_it_rain(location: str, time_of_day: str):
    """Check if it will rain in a location at a given time today.
    
    Args:
        location (str): Name of the city
        time_of_day (str): Time of the day in HH:MM format.
    """
    return "YES"

client = ai.Client()
messages = [{
    "role": "user",
    "content": "I live in San Francisco. Can you check for weather "
               "and plan an outdoor picnic for me at 2pm?"
}]

# Automatic tool execution with max_turns
response = client.chat.completions.create(
    model="openai:gpt-4o",
    messages=messages,
    tools=[will_it_rain],
    max_turns=2  # Maximum number of back-and-forth tool calls
)
print(response.choices[0].message.content)
```

When `max_turns` is specified, `aisuite` will:
1. Send your message to the LLM
2. Execute any tool calls the LLM requests
3. Send the tool results back to the LLM
4. Repeat until the conversation is complete or max_turns is reached

In addition to `response.choices[0].message`, the response includes the field `response.choices[0].intermediate_messages`, which contains the list of all messages, including the tool interactions. This can be used to continue the conversation with the model.
For more detailed examples of tool calling, check out the `examples/tool_calling_abstraction.ipynb` notebook.

### Model Context Protocol (MCP) Integration

`aisuite` natively supports **MCP**, a standard protocol that allows LLMs to securely call external tools and access data. You can connect to MCP servers—such as a filesystem or database—and expose their tools directly to your model.
Read more about MCP here - https://modelcontextprotocol.io/docs/getting-started/intro

Install aisuite with MCP support:

```shell
pip install 'aisuite[mcp]'
```

You'll also need an MCP server. For example, to use the filesystem server:

```shell
npm install -g @modelcontextprotocol/server-filesystem
```

There are two ways to use MCP tools with aisuite:

#### Option 1: Config Dict Format (Recommended for Simple Use Cases)

```python
import aisuite as ai

client = ai.Client()
response = client.chat.completions.create(
    model="openai:gpt-4o",
    messages=[{"role": "user", "content": "List the files in the current directory"}],
    tools=[{
        "type": "mcp",
        "name": "filesystem",
        "command": "npx",
        "args": ["-y", "@modelcontextprotocol/server-filesystem", "/path/to/directory"]
    }],
    max_turns=3
)

print(response.choices[0].message.content)
```

#### Option 2: Explicit MCPClient (Recommended for Advanced Use Cases)

```python
import aisuite as ai
from aisuite.mcp import MCPClient

# Create MCP client once, reuse across requests
mcp = MCPClient(
    command="npx",
    args=["-y", "@modelcontextprotocol/server-filesystem", "/path/to/directory"]
)

# Use with aisuite
client = ai.Client()
response = client.chat.completions.create(
    model="openai:gpt-4o",
    messages=[{"role": "user", "content": "List the files"}],
    tools=mcp.get_callable_tools(),
    max_turns=3
)

print(response.choices[0].message.content)
mcp.close()  # Clean up
```

For detailed usage (security filters, tool prefixing, and `MCPClient` management), see [docs/mcp-tools.md](docs/mcp-tools.md).
For detailed examples, see `examples/mcp_tools_example.ipynb`.

---

## Extending aisuite: Adding a Provider

New providers can be added by implementing a lightweight adapter. The system uses a naming convention for discovery:

| Element         | Convention                         |
| --------------- | ---------------------------------- |
| **Module file** | `<provider>_provider.py`           |
| **Class name**  | `<Provider>Provider` (capitalized) |

Example:

```python
# providers/openai_provider.py
class OpenaiProvider(BaseProvider):
    ...
```

This convention ensures consistency and enables automatic loading of new integrations.

---

## Contributing

Contributions are welcome. Please review the [Contributing Guide](https://github.com/andrewyng/aisuite/blob/main/CONTRIBUTING.md) and join our [Discord](https://discord.gg/T6Nvn8ExSb) for discussions.

---

## License

Released under the **MIT License** — free for commercial and non-commercial use.

---


================================================
FILE: aisuite/__init__.py
================================================
from .client import Client
from .framework.message import Message
from .utils.tools import Tools


================================================
FILE: aisuite/client.py
================================================
from .provider import ProviderFactory
import os
from .utils.tools import Tools
from typing import Union, BinaryIO, Optional, Any, Literal
from contextlib import ExitStack
from .framework.message import (
    TranscriptionResponse,
)
from .framework.asr_params import ParamValidator

# Import MCP utilities for config dict support
try:
    from .mcp.config import is_mcp_config
    from .mcp.client import MCPClient

    MCP_AVAILABLE = True
except ImportError:
    MCP_AVAILABLE = False


class Client:
    """
    Top-level aisuite client.

    Holds per-provider configuration, caches provider instances in
    ``self.providers`` and exposes the ``chat`` and ``audio`` API namespaces.
    """

    def __init__(
        self,
        provider_configs: Optional[dict] = None,
        extra_param_mode: Literal["strict", "warn", "permissive"] = "warn",
    ):
        """
        Initialize the client with provider configurations.
        Use the ProviderFactory to create provider instances.

        Args:
            provider_configs (dict, optional): A dictionary containing provider configurations.
                Each key should be a provider string (e.g., "google" or "aws-bedrock"),
                and the value should be a dictionary of configuration options for that provider.
                For example:
                {
                    "openai": {"api_key": "your_openai_api_key"},
                    "aws-bedrock": {
                        "aws_access_key": "your_aws_access_key",
                        "aws_secret_key": "your_aws_secret_key",
                        "aws_region": "us-west-2"
                    }
                }
                When omitted, the client starts with an empty configuration.
            extra_param_mode (str): How to handle unknown ASR parameters.
                - "strict": Raise ValueError on unknown params (production)
                - "warn": Log warning on unknown params (default, development)
                - "permissive": Allow all params without validation (testing)
        """
        self.providers = {}
        # Build a fresh dict per instance. A literal `{}` default would be a
        # single object shared by every Client, and configure() mutates it in
        # place, leaking configuration from one client into another.
        self.provider_configs = {} if provider_configs is None else provider_configs
        self.extra_param_mode = extra_param_mode
        self.param_validator = ParamValidator(extra_param_mode)
        # API namespaces are created lazily by the `chat` / `audio` properties.
        self._chat = None
        self._audio = None

    def _initialize_providers(self):
        """Helper method to initialize or update providers."""
        for provider_key, config in self.provider_configs.items():
            provider_key = self._validate_provider_key(provider_key)
            self.providers[provider_key] = ProviderFactory.create_provider(
                provider_key, config
            )

    def _validate_provider_key(self, provider_key):
        """
        Validate if the provider key corresponds to a supported provider.

        Returns:
            The provider key unchanged when it is supported.

        Raises:
            ValueError: If the key is not among the supported providers.
        """
        supported_providers = ProviderFactory.get_supported_providers()

        if provider_key not in supported_providers:
            raise ValueError(
                f"Invalid provider key '{provider_key}'. Supported providers: {supported_providers}. "
                "Make sure the model string is formatted correctly as 'provider:model'."
            )

        return provider_key

    def configure(self, provider_configs: Optional[dict] = None):
        """
        Merge additional provider configurations into the client.

        Passing ``None`` (or nothing) is a no-op. Entries for provider keys
        that are already configured are replaced.
        """
        if provider_configs is None:
            return

        self.provider_configs.update(provider_configs)
        # Providers will be lazily initialized when needed

    @property
    def chat(self):
        """Return the chat API interface."""
        if self._chat is None:
            self._chat = Chat(self)
        return self._chat

    @property
    def audio(self):
        """Return the audio API interface."""
        if self._audio is None:
            self._audio = Audio(self)
        return self._audio


class Chat:
    """Chat namespace of a client; gives access to the completions interface."""

    def __init__(self, client: "Client"):
        # A single Completions object is built up front and handed out on
        # every access of the `completions` property.
        self._completions = Completions(client)
        self.client = client

    @property
    def completions(self):
        """Completions interface created for this chat namespace."""
        return self._completions


class Completions:
    """
    Chat-completions interface.

    Resolves the provider from a ``provider:model`` string, optionally expands
    MCP config dicts into callable tools, and can run an automatic
    tool-execution loop when ``max_turns`` is given.
    """

    def __init__(self, client: "Client"):
        self.client = client

    @staticmethod
    def _looks_like_mcp_config(tool) -> bool:
        """
        Return True when *tool* is a dict tagged ``{"type": "mcp", ...}``.

        This is a dependency-free check used only when the optional MCP
        helpers could not be imported, so that the user still gets a clear
        installation hint.
        """
        return isinstance(tool, dict) and tool.get("type") == "mcp"

    def _process_mcp_configs(self, tools: list) -> tuple[list, list]:
        """
        Process tools list and convert MCP config dicts to callable tools.

        This method:
        1. Detects MCP config dicts ({"type": "mcp", ...})
        2. Creates MCPClient instances from configs
        3. Extracts callable tools with filtering and prefixing
        4. Mixes MCP tools with regular callable tools
        5. Returns both processed tools and MCP clients for cleanup

        Args:
            tools: List of tools (mix of callables and MCP configs)

        Returns:
            Tuple of (processed_tools, mcp_clients):
                - processed_tools: List of tools with MCP configs expanded
                - mcp_clients: List of MCPClient instances to be cleaned up

        Raises:
            ImportError: If an MCP config is present but MCP support is not installed.
            ValueError: If an MCP client cannot be created from a config. Any
                MCP clients created earlier in the same call are closed first.

        Example:
            >>> tools = [
            ...     my_function,
            ...     {"type": "mcp", "name": "fs", "command": "npx", "args": [...]},
            ...     another_function
            ... ]
            >>> callable_tools, mcp_clients = self._process_mcp_configs(tools)
            >>> # Returns: ([my_function, fs_tool1, fs_tool2, ..., another_function], [mcp_client])
        """
        if not MCP_AVAILABLE:
            # The MCP helpers (is_mcp_config included) may not have been
            # imported at all, so detection must not depend on them here.
            if any(self._looks_like_mcp_config(tool) for tool in tools):
                raise ImportError(
                    "MCP tools require the 'mcp' package. "
                    "Install it with: pip install 'aisuite[mcp]' or pip install mcp"
                )
            return tools, []

        processed_tools = []
        mcp_clients = []

        # `cleanup` closes every client created so far if a later config
        # fails; on success ownership is handed to the caller via pop_all().
        with ExitStack() as cleanup:
            for tool in tools:
                if not (isinstance(tool, dict) and is_mcp_config(tool)):
                    # Regular tool - pass through
                    processed_tools.append(tool)
                    continue

                # It's an MCP config dict - convert to callable tools
                try:
                    mcp_client = MCPClient.from_config(tool)
                    cleanup.callback(mcp_client.close)
                    mcp_clients.append(mcp_client)

                    # Get tools with config settings
                    mcp_tools = mcp_client.get_callable_tools(
                        allowed_tools=tool.get("allowed_tools"),
                        use_tool_prefix=tool.get("use_tool_prefix", False),
                    )
                except Exception as e:
                    raise ValueError(
                        f"Failed to create MCP client from config: {e}\n"
                        f"Config: {tool}"
                    ) from e

                processed_tools.extend(mcp_tools)

            # Everything succeeded: cancel the pending close callbacks.
            cleanup.pop_all()

        return processed_tools, mcp_clients

    def _extract_thinking_content(self, response):
        """
        Extract content between <think> tags if present and store it in reasoning_content.

        Only the first choice is inspected, and only when its content is a
        string that starts with ``<think>`` and contains ``</think>``.
        Non-string content (for example a list of content parts) is left
        untouched.

        Args:
            response: The response object from the provider

        Returns:
            The same response object, possibly modified in place
        """
        choices = getattr(response, "choices", None)
        if not choices:
            return response

        message = choices[0].message
        raw_content = getattr(message, "content", None)
        if not isinstance(raw_content, str):
            return response

        content = raw_content.strip()
        if content.startswith("<think>") and "</think>" in content:
            # Extract content between think tags
            start_idx = len("<think>")
            end_idx = content.find("</think>")

            # Store the thinking content
            message.reasoning_content = content[start_idx:end_idx].strip()

            # Remove the think block from the visible content
            message.content = content[end_idx + len("</think>") :].strip()

        return response

    def _tool_runner(
        self,
        provider,
        model_name: str,
        messages: list,
        tools: Any,
        max_turns: int,
        **kwargs,
    ):
        """
        Handle tool execution loop for max_turns iterations.

        Args:
            provider: The provider instance to use for completions
            model_name: Name of the model to use
            messages: List of conversation messages (extended in place with
                assistant and tool messages)
            tools: Tools instance or list of callable tools
            max_turns: Maximum number of tool execution turns (must be >= 1)
            **kwargs: Additional arguments to pass to the provider

        Returns:
            The final response from the model with intermediate responses and messages

        Raises:
            ValueError: If max_turns is less than 1, or a tool is not callable
        """
        # Without at least one turn no request is made and there would be no
        # response to return.
        if max_turns < 1:
            raise ValueError(f"max_turns must be at least 1, got {max_turns}")

        # Handle tools validation and conversion
        if isinstance(tools, Tools):
            tools_instance = tools
        else:
            # Check if passed tools are callable
            if not all(callable(tool) for tool in tools):
                raise ValueError("One or more tools is not callable")
            tools_instance = Tools(tools)
        kwargs["tools"] = tools_instance.tools()

        turns = 0
        intermediate_responses = []  # Store intermediate responses
        intermediate_messages = []  # Store all messages including tool interactions

        while turns < max_turns:
            # Make the API call
            response = provider.chat_completions_create(model_name, messages, **kwargs)
            response = self._extract_thinking_content(response)

            # Store intermediate response and the model's message
            intermediate_responses.append(response)
            assistant_message = response.choices[0].message
            intermediate_messages.append(assistant_message)

            tool_calls = getattr(assistant_message, "tool_calls", None)
            if not tool_calls:
                # The model answered without requesting tools: finished.
                break

            # Execute tools and get results
            results, tool_messages = tools_instance.execute_tool(tool_calls)

            # Add tool messages to intermediate messages
            intermediate_messages.extend(tool_messages)

            # Add the assistant's response and tool results to messages
            messages.extend([assistant_message, *tool_messages])

            turns += 1

        # Set the intermediate data in the final response (which is either the
        # first tool-free answer or the last response before turns ran out).
        response.intermediate_responses = intermediate_responses[
            :-1
        ]  # Exclude final response
        response.choices[0].intermediate_messages = intermediate_messages
        return response

    def create(self, model: str, messages: list, **kwargs):
        """
        Create chat completion based on the model, messages, and any extra arguments.
        Supports automatic tool execution when max_turns is specified.

        Args:
            model: Provider and model in the format 'provider:model'
            messages: List of conversation messages
            **kwargs: Extra arguments for the provider. ``tools`` and
                ``max_turns`` are handled here: with both present the
                tool-execution loop runs; with only ``tools`` they are
                forwarded to the provider for manual tool handling.

        Returns:
            The provider response, after <think> content extraction

        Raises:
            ValueError: If the model string is malformed or the provider is
                unsupported or cannot be loaded
        """
        # Check that correct format is used
        if ":" not in model:
            raise ValueError(
                f"Invalid model format. Expected 'provider:model', got '{model}'"
            )

        # Extract the provider key from the model identifier, e.g., "google:gemini-xx"
        provider_key, model_name = model.split(":", 1)

        # Validate if the provider is supported
        supported_providers = ProviderFactory.get_supported_providers()
        if provider_key not in supported_providers:
            raise ValueError(
                f"Invalid provider key '{provider_key}'. Supported providers: {supported_providers}. "
                "Make sure the model string is formatted correctly as 'provider:model'."
            )

        # Initialize provider if not already initialized
        # TODO: Add thread-safe provider initialization with lock to prevent race conditions
        # when multiple threads try to initialize the same provider simultaneously.
        if provider_key not in self.client.providers:
            config = self.client.provider_configs.get(provider_key, {})
            self.client.providers[provider_key] = ProviderFactory.create_provider(
                provider_key, config
            )

        provider = self.client.providers.get(provider_key)
        if not provider:
            raise ValueError(f"Could not load provider for '{provider_key}'.")

        # Extract tool-related parameters
        max_turns = kwargs.pop("max_turns", None)
        tools = kwargs.pop("tools", None)

        # Use ExitStack to manage MCP client cleanup automatically
        with ExitStack() as stack:
            # Convert MCP config dicts to callable tools and get MCP clients.
            # A Tools instance is handed to the tool runner untouched.
            if tools is not None and not isinstance(tools, Tools):
                tools, mcp_clients = self._process_mcp_configs(tools)
                # Register all MCP clients for automatic cleanup
                for mcp_client in mcp_clients:
                    stack.enter_context(mcp_client)

            # Automatic multi-turn tool execution needs both max_turns and tools
            if max_turns is not None and tools is not None:
                return self._tool_runner(
                    provider,
                    model_name,
                    messages.copy(),
                    tools,
                    max_turns,
                    **kwargs,
                )

            # Default behavior without tool execution. Tools were popped from
            # kwargs above, so put them back: otherwise the model never sees
            # them and manual tool calling cannot work.
            if tools is not None:
                kwargs["tools"] = tools.tools() if isinstance(tools, Tools) else tools

            # Delegate the chat completion to the correct provider's implementation
            response = provider.chat_completions_create(model_name, messages, **kwargs)
            return self._extract_thinking_content(response)


class Audio:
    """Audio namespace of a client; gives access to the transcriptions interface."""

    def __init__(self, client: "Client"):
        # A single Transcriptions object is built up front and handed out on
        # every access of the `transcriptions` property.
        self._transcriptions = Transcriptions(client)
        self.client = client

    @property
    def transcriptions(self):
        """Transcriptions interface created for this audio namespace."""
        return self._transcriptions


class Transcriptions:
    """Audio transcription endpoint: validates parameters, then dispatches to a provider."""

    def __init__(self, client: "Client"):
        self.client = client

    def create(
        self,
        *,
        model: str,
        file: Union[str, BinaryIO],
        **kwargs,
    ) -> TranscriptionResponse:
        """
        Transcribe audio through the provider named in ``model``.

        The keyword arguments are run through the client's parameter
        validator before the call, and the validated result is what the
        provider receives. When the validated parameters contain a truthy
        ``stream`` entry, the provider's ``create_stream_output`` is used;
        otherwise its ``create`` is used.

        Args:
            model: Provider and model in format 'provider:model' (e.g., 'openai:whisper-1')
            file: Audio file to transcribe (file path or file-like object)
            **kwargs: Transcription parameters, either common ones such as
                ``language``, ``prompt`` and ``temperature`` or
                provider-specific ones. Handling of unknown parameters
                depends on the client's extra_param_mode.

        Returns:
            TranscriptionResponse: Whatever the provider's transcription call returns

        Raises:
            ValueError: If the model format is invalid, the provider is
                unsupported, unavailable or cannot be loaded, or the provider
                lacks the requested (batch or streaming) transcription support

        Examples:
            >>> result = client.audio.transcriptions.create(
            ...     model="openai:whisper-1",
            ...     file="audio.mp3",
            ...     language="en"
            ... )

            >>> result = client.audio.transcriptions.create(
            ...     model="deepgram:nova-2",
            ...     file="audio.mp3",
            ...     language="en",
            ...     punctuate=True,
            ...     diarize=True
            ... )
        """
        # --- Resolve "provider:model" ---------------------------------------
        if ":" not in model:
            raise ValueError(
                f"Invalid model format. Expected 'provider:model', got '{model}'"
            )
        provider_key, _, model_name = model.partition(":")

        known_providers = ProviderFactory.get_supported_providers()
        if provider_key not in known_providers:
            raise ValueError(
                f"Invalid provider key '{provider_key}'. "
                f"Supported providers: {known_providers}"
            )

        # --- Validate / map the caller's parameters -------------------------
        validated_params = self.client.param_validator.validate_and_map(
            provider_key, kwargs
        )

        # --- Fetch the provider, creating it on first use -------------------
        registry = self.client.providers
        if provider_key not in registry:
            provider_config = self.client.provider_configs.get(provider_key, {})
            try:
                registry[provider_key] = ProviderFactory.create_provider(
                    provider_key, provider_config
                )
            except ImportError as e:
                raise ValueError(f"Provider '{provider_key}' is not available: {e}")

        provider = registry.get(provider_key)
        if not provider:
            raise ValueError(f"Could not load provider for '{provider_key}'.")

        if not (hasattr(provider, "audio") and provider.audio is not None):
            raise ValueError(
                f"Provider '{provider_key}' does not support audio transcription."
            )

        # --- Pick the streaming or batch entry point ------------------------
        if validated_params.get("stream", False):
            method_name = "create_stream_output"
            unsupported_msg = (
                f"Provider '{provider_key}' does not support streaming transcription."
            )
        else:
            method_name = "create"
            unsupported_msg = (
                f"Provider '{provider_key}' does not support audio transcription."
            )

        try:
            endpoint_ready = hasattr(provider.audio, "transcriptions") and hasattr(
                provider.audio.transcriptions, method_name
            )
            if not endpoint_ready:
                raise ValueError(unsupported_msg)

            handler = getattr(provider.audio.transcriptions, method_name)
            return handler(model_name, file, **validated_params)
        except NotImplementedError:
            # A provider may expose the method but leave it unimplemented.
            raise ValueError(
                f"Provider '{provider_key}' does not support audio transcription."
            )


================================================
FILE: aisuite/design-notes/asr-parameter-design-motivation.md
================================================
# ASR - API Parameter Design Philosophy

## Design Goal: Portable Code with Provider Flexibility

The ASR parameter system is designed around a core principle: **developers should write portable code that works across providers, while retaining the ability to use provider-specific features when needed**. This document explains the rationale behind our parameter classification and validation approach.

---

## Mandatory Parameters and Common Mappings

### The Foundation: Minimal Requirements

Every transcription needs just two things:
- **`model`**: Which model/provider to use
- **`file`**: What audio to transcribe

By keeping mandatory parameters minimal, we maximize compatibility and reduce the barrier to getting started.

### Common Parameters: Write Once, Run Anywhere

Beyond the basics, there are concepts that exist across providers but use different names or formats. We handle three common parameters (`language`, `prompt`, and `temperature`) that auto-map to each provider's native API:

**Example: Same code, different providers**

```python
# Works with OpenAI
result = client.audio.transcriptions.create(
    model="openai:whisper-1",
    file="meeting.mp3",
    language="en",
    prompt="discussion about API design"
)

# Exact same code works with Deepgram
result = client.audio.transcriptions.create(
    model="deepgram:nova-2",
    file="meeting.mp3",
    language="en",
    prompt="discussion about API design"
)
```

Behind the scenes:
- **`language`** passes through as `language` for both OpenAI and Deepgram, but expands to `language_code: "en-US"` for Google
- **`prompt`** passes as `prompt` to OpenAI, transforms to `keywords: ["discussion", "about", "API", "design"]` for Deepgram, and becomes `speech_contexts: [{"phrases": ["discussion about API design"]}]` for Google
- **`temperature`** passes through to OpenAI (which supports it) and is silently ignored by Deepgram and Google (which don't)

**Why auto-mapping?** Developers shouldn't need to remember that Google uses `language_code` while others use `language`, or that Deepgram expects a list of keywords. The framework handles these provider quirks transparently, letting you write portable code.

---

## Provider-Specific Features: Pass-Through for Power Users

Each provider has unique features that give them competitive advantages. We don't limit you to the "lowest common denominator" - if you need provider-specific functionality, it's available:

**Deepgram's advanced features:**
```python
result = client.audio.transcriptions.create(
    model="deepgram:nova-2",
    file="meeting.mp3",
    language="en",
    punctuate=True,        # Deepgram-specific
    diarize=True,          # Deepgram-specific
    sentiment=True,        # Deepgram-specific
    smart_format=True      # Deepgram-specific
)
```

**Google-specific options (including speech contexts):**
```python
result = client.audio.transcriptions.create(
    model="google:latest_long",
    file="meeting.mp3",
    language_code="en-US",
    enable_automatic_punctuation=True,  # Google-specific
    max_alternatives=3,                  # Google-specific
    speech_contexts=[{"phrases": ["API", "SDK", "REST"]}]  # Google-specific
)
```

These provider-specific parameters pass through directly to the provider's SDK. The framework validates them based on your configured mode (see next section), but doesn't block access to unique features.

---

## Progressive Validation: Safety When You Need It

The validation system supports three modes to match different development stages:

### Development Mode: `"warn"` (Default)
```python
client = Client(extra_param_mode="warn")
```
Unknown parameters trigger warnings but continue execution. Perfect for exploration and prototyping. You see *"OpenAI doesn't support 'punctuate'"* but your code keeps running.

### Strict Mode: `"strict"`
```python
client = Client(extra_param_mode="strict")
```
Unknown parameters raise errors immediately. Use in production to catch typos, configuration mistakes, or provider API changes early. Ensures no silent failures.

### Permissive Mode: `"permissive"`
```python
client = Client(extra_param_mode="permissive")
```
All parameters pass through without validation. Use for beta features, experimental parameters, or when providers add new capabilities faster than framework updates.

**Progressive workflow:**
1. **Develop** with `warn` - explore freely, see warnings
2. **Refactor** - fix warnings to make code portable
3. **Deploy** with `strict` - ensure production safety

---

## Developer Experience Benefits

### 1. Write Portable Code Naturally
The same parameter names work across providers. Switch from OpenAI to Deepgram by changing one word: the model identifier.

### 2. Progressive Enhancement
Start with portable common parameters. Add provider-specific features only where you need them. Your core logic remains portable even when using advanced features for specific providers.

### 3. Zero Framework Lock-in
Parameter names come directly from provider APIs, not framework abstractions. If you need to remove the framework, you already know the native API - the names are identical.

### 4. Validation That Adapts to You
Choose your safety level based on context. Strict for production, warn for development, permissive for bleeding-edge features. The framework supports your workflow rather than constraining it.

### 5. No Documentation Friction
Copy parameters from provider docs directly. No need to learn our abstraction layer or figure out mappings - we handle the common cases, you use native names for everything else.

---

## Alternative Design Considered

We considered creating a unified options object (`TranscriptionOptions`) that explicitly defines all parameters with framework-specific names. We chose pass-through instead because:

1. **Provider APIs evolve faster than frameworks** - New parameters appear frequently. Pass-through lets developers use them immediately (in permissive mode) without waiting for framework updates.

2. **Provider features don't map cleanly** - Deepgram's sentiment analysis, Google's complex speech contexts, OpenAI's timestamp granularities - each is unique. A unified object means either losing functionality or creating complex provider-specific abstractions.

3. **Direct API access reduces friction** - Developers already know their provider's API from official docs. They can use parameter names directly rather than learning another abstraction layer.

The pass-through approach with progressive validation provides the best of both worlds: portability for common cases, power for advanced features, and safety when you need it.

---

## Design Principles Summary

- **Mandatory Minimal**: Only `model` and `file` required
- **Common Auto-Mapped**: Frequent cross-provider concepts map transparently
- **Provider-Specific Pass-Through**: Unique features remain accessible
- **Progressive Validation**: Three modes for different development stages
- **Zero Abstraction Tax**: Use provider APIs directly with optional safety nets

This design prioritizes developer experience through portability without sacrificing power, validation without blocking experimentation, and simplicity without limiting functionality.


================================================
FILE: aisuite/framework/__init__.py
================================================
from .provider_interface import ProviderInterface
from .chat_completion_response import ChatCompletionResponse
from .message import Message


================================================
FILE: aisuite/framework/asr_params.py
================================================
"""
ASR parameter registry and validation.

This module provides a unified parameter validation system for audio transcription
across different providers. It supports:
- Common parameters (OpenAI-style) that are auto-mapped to provider equivalents
- Provider-specific parameters that are passed through directly
- Three validation modes: strict, warn, and permissive
"""

from typing import Dict, Set, Any, Optional, Literal
import logging

logger = logging.getLogger(__name__)


# Common parameters that get auto-mapped across providers
# These follow OpenAI's API conventions for maximum portability
#
# Layout: common parameter name -> {provider key -> provider-native parameter
# name}. A value of None marks a provider that has no equivalent for that
# common parameter.
COMMON_PARAMS: Dict[str, Dict[str, Optional[str]]] = {
    "language": {
        "openai": "language",
        "deepgram": "language",
        "google": "language_code",
        "huggingface": None,  # Not supported by Inference API
    },
    "prompt": {
        "openai": "prompt",
        "deepgram": "keywords",
        "google": "speech_contexts",
        "huggingface": None,  # Not supported
    },
    "temperature": {
        "openai": "temperature",
        "deepgram": None,  # Not supported
        "google": None,  # Not supported
        "huggingface": "temperature",  # Supported as generation param
    },
}


# Valid provider-specific parameters
# Each provider has its own set of supported parameters
#
# Layout: provider key -> set of parameter names recognised for that provider.
# The trailing comments on each entry describe the expected value.
PROVIDER_PARAMS: Dict[str, Set[str]] = {
    "openai": {
        # Basic parameters
        "language",
        "prompt",
        "temperature",
        # Output format
        "response_format",  # "json" | "text" | "srt" | "verbose_json" | "vtt"
        "timestamp_granularities",  # ["word"] | ["segment"] | ["word", "segment"]
        # Streaming
        "stream",  # Boolean
    },
    "deepgram": {
        # Basic parameters
        "language",
        "model",
        # Text enhancement
        "punctuate",  # Auto-add punctuation
        "diarize",  # Speaker diarization
        "utterances",  # Sentence-level timestamps
        "paragraphs",  # Paragraph segmentation
        "smart_format",  # Format numbers, dates, etc.
        "profanity_filter",  # Filter profanity
        # Advanced features
        "search",  # Search for keywords: ["keyword1", "keyword2"]
        "replace",  # Replace words: {"um": "", "uh": ""}
        "keywords",  # Boost keywords: ["important", "technical"]
        "numerals",  # Format numerals
        "measurements",  # Format measurements
        # AI features
        "sentiment",  # Sentiment analysis
        "topics",  # Topic detection
        "intents",  # Intent recognition
        "summarize",  # Auto-summarization
        # Audio format
        "encoding",  # "linear16" | "mp3" | "flac"
        "sample_rate",  # Integer (Hz)
        "channels",  # Integer
        # Quality and alternatives
        "confidence",  # Include confidence scores
        "alternatives",  # Number of alternative transcripts
        # Streaming
        "interim_results",  # Get interim results while streaming
    },
    "google": {
        # Basic parameters
        "language_code",  # BCP-47 code like "en-US"
        "model",  # "latest_long" | "latest_short" | "default"
        # Audio format
        "encoding",  # "LINEAR16" | "FLAC" | "MP3"
        "sample_rate_hertz",  # Integer
        "audio_channel_count",  # Integer
        # Text enhancement
        "enable_automatic_punctuation",  # Boolean
        "profanity_filter",  # Boolean
        "enable_spoken_punctuation",  # Boolean
        "enable_spoken_emojis",  # Boolean
        # Speaker features
        "enable_speaker_diarization",  # Boolean
        "diarization_speaker_count",  # Integer (max speakers)
        "min_speaker_count",  # Integer
        # Metadata
        "enable_word_time_offsets",  # Word-level timestamps
        "enable_word_confidence",  # Word-level confidence
        "max_alternatives",  # Number of alternatives
        # Context
        "speech_contexts",  # [{"phrases": [...], "boost": float}]
        "boost",  # Float (phraseHint boost)
        # Streaming
        "interim_results",  # Boolean
        "single_utterance",  # Boolean (stop after one utterance)
    },
    "huggingface": {
        # Basic parameters
        "model",  # Model ID on Hugging Face Hub
        "temperature",  # Generation temperature
        # API options
        "return_timestamps",  # Boolean or "word" or "char"
        "use_cache",  # Boolean: use cached inference
        "wait_for_model",  # Boolean: wait if model is loading
        # Generation parameters
        "top_k",  # Integer: top-k sampling
        "top_p",  # Float: nucleus sampling
        "max_length",  # Integer: maximum output length
        "do_sample",  # Boolean: enable sampling
    },
}


# Language code expansion for Google (2-letter to locale codes)
#
# Each 2-letter code maps to exactly one default locale (e.g. "pt" -> "pt-BR",
# "zh" -> "zh-CN"). Note that "no" maps to "nb-NO", i.e. the key and the
# language part of the value differ for that entry.
GOOGLE_LANGUAGE_MAP: Dict[str, str] = {
    "en": "en-US",
    "es": "es-ES",
    "fr": "fr-FR",
    "de": "de-DE",
    "it": "it-IT",
    "pt": "pt-BR",
    "ja": "ja-JP",
    "ko": "ko-KR",
    "zh": "zh-CN",
    "ar": "ar-SA",
    "hi": "hi-IN",
    "ru": "ru-RU",
    "nl": "nl-NL",
    "pl": "pl-PL",
    "sv": "sv-SE",
    "da": "da-DK",
    "no": "nb-NO",
    "fi": "fi-FI",
    "tr": "tr-TR",
    "th": "th-TH",
    "vi": "vi-VN",
}


class ParamValidator:
    """
    Validates and maps ASR parameters for different providers.

    This class handles three types of parameters:
    1. Common parameters (OpenAI-style) - auto-mapped to provider equivalents
    2. Provider-specific parameters - passed through with validation
    3. Unknown parameters - handled based on extra_param_mode
    """

    def __init__(self, extra_param_mode: Literal["strict", "warn", "permissive"]):
        """
        Initialize the parameter validator.

        Args:
            extra_param_mode: How to handle unknown parameters
                - "strict": Raise ValueError on unknown params
                - "warn": Emit a UserWarning and drop unknown params
                - "permissive": Pass unknown params through unchanged
        """
        self.extra_param_mode = extra_param_mode

    def validate_and_map(
        self, provider_key: str, params: Dict[str, Any]
    ) -> Dict[str, Any]:
        """
        Validate and map parameters for the given provider.

        This method:
        1. Maps common parameters to provider-specific equivalents
        2. Validates provider-specific parameters
        3. Handles unknown parameters based on extra_param_mode

        Args:
            provider_key: Provider identifier (e.g., "openai", "deepgram")
            params: Raw parameters from user

        Returns:
            Validated and mapped parameters ready for provider API. Common
            parameters the provider has no equivalent for are silently
            dropped (logged at debug level).

        Raises:
            ValueError: If extra_param_mode="strict" and unknown params found
        """
        result = {}
        unknown_params = []
        # Providers without an entry are treated as having no specific params.
        provider_params = PROVIDER_PARAMS.get(provider_key, set())

        for key, value in params.items():
            # Check if it's a common param that needs mapping
            if key in COMMON_PARAMS:
                mapped_key = COMMON_PARAMS[key].get(provider_key)

                # Provider doesn't support this common param
                if mapped_key is None:
                    logger.debug(
                        f"Parameter '{key}' not supported by {provider_key}, ignoring"
                    )
                    continue

                # Transform value if needed (e.g., "en" -> "en-US" for Google)
                result[mapped_key] = self._transform_value(provider_key, key, value)

            # Check if it's a valid provider-specific param
            elif key in provider_params:
                result[key] = value

            # Unknown parameter
            else:
                unknown_params.append(key)

        # Handle unknown parameters based on mode
        if unknown_params:
            # Raises in strict mode, warns in warn mode, no-op otherwise.
            self._handle_unknown(provider_key, unknown_params)

            # In permissive mode, still pass them through
            if self.extra_param_mode == "permissive":
                for key in unknown_params:
                    result[key] = params[key]

        return result

    def _transform_value(self, provider_key: str, param_key: str, value: Any) -> Any:
        """
        Transform parameter values during mapping.

        This handles provider-specific transformations like:
        - Google: Expanding "en" to "en-US"
        - Google: Wrapping prompt in speech_contexts structure
        - Deepgram: Converting prompt string to keywords list

        Args:
            provider_key: Provider identifier
            param_key: Parameter name (from COMMON_PARAMS)
            value: Parameter value to transform

        Returns:
            Transformed parameter value; the input value unchanged when no
            transformation applies.
        """
        # Google: Expand 2-letter language codes to locale codes
        if provider_key == "google" and param_key == "language":
            if isinstance(value, str) and len(value) == 2:
                # Codes missing from the table fall back to "<code>-US".
                return GOOGLE_LANGUAGE_MAP.get(value, f"{value}-US")

        # Google: Wrap prompt in speech_contexts structure
        if provider_key == "google" and param_key == "prompt":
            # A prompt that is already a sequence of phrases must not be
            # wrapped a second time, otherwise "phrases" becomes a nested list.
            if isinstance(value, (list, tuple)):
                phrases = list(value)
            else:
                phrases = [value]
            return [{"phrases": phrases}]

        # Deepgram: Split prompt into keywords list
        if provider_key == "deepgram" and param_key == "prompt":
            if isinstance(value, str):
                return value.split()
            return value

        return value

    def _handle_unknown(self, provider_key: str, unknown_params: list):
        """
        Handle unknown parameters based on extra_param_mode.

        Args:
            provider_key: Provider identifier
            unknown_params: List of unknown parameter names

        Raises:
            ValueError: If extra_param_mode="strict"
        """
        msg = (
            f"Unknown parameters for {provider_key}: {unknown_params}. "
            f"See {provider_key} documentation for valid parameters."
        )

        if self.extra_param_mode == "strict":
            raise ValueError(msg)
        elif self.extra_param_mode == "warn":
            import warnings

            warnings.warn(msg, UserWarning)
        # permissive mode: do nothing


================================================
FILE: aisuite/framework/chat_completion_response.py
================================================
"""Defines the ChatCompletionResponse class."""

from typing import Optional

from aisuite.framework.choice import Choice
from aisuite.framework.message import CompletionUsage


# pylint: disable=too-few-public-methods
class ChatCompletionResponse:
    """Response container shaped after OpenAI's chat completion response.

    Attributes:
        choices: List of Choice objects; a new instance holds exactly one
            default-constructed Choice.
        usage: Token usage for the request, or None when not populated.
    """

    def __init__(self):
        """Create a response with a single blank choice and no usage data."""
        # Seed the list with one default choice; more can be appended later.
        initial_choice = Choice()
        self.choices = [initial_choice]
        self.usage: Optional[CompletionUsage] = None


================================================
FILE: aisuite/framework/choice.py
================================================
from aisuite.framework.message import Message
from typing import Literal, Optional, List


class Choice:
    """One candidate completion: its message, finish reason and side messages.

    Attributes:
        finish_reason: "stop", "tool_calls", or None while unset.
        message: The assistant Message for this choice, initially blank.
        intermediate_messages: Additional Message objects associated with this
            choice; starts empty.
    """

    def __init__(self):
        """Build a choice holding a blank assistant message."""
        self.finish_reason: Optional[Literal["stop", "tool_calls"]] = None

        # Every field is spelled out so the blank message is explicit.
        blank_fields = {
            "content": None,
            "tool_calls": None,
            "role": "assistant",
            "refusal": None,
            "reasoning_content": None,
        }
        self.message = Message(**blank_fields)

        self.intermediate_messages: List[Message] = []


================================================
FILE: aisuite/framework/message.py
================================================
"""
Interface to hold contents of API responses when they do not conform
to the OpenAI style response.
"""

from typing import Literal, Optional, List, AsyncGenerator, Union, Dict, Any
from pydantic import BaseModel
from dataclasses import dataclass, field


class Function(BaseModel):
    """Represents a function call: the target name plus its arguments."""

    # Arguments for the call, carried as one string
    # (presumably JSON-encoded, as in OpenAI tool calls; confirm with callers).
    arguments: str
    # Name of the function being called.
    name: str


class ChatCompletionMessageToolCall(BaseModel):
    """Represents a tool call in a chat completion message."""

    # Identifier of this tool call.
    id: str
    # The function name and arguments requested by the call.
    function: Function
    # Only "function" is accepted; any other value fails validation.
    type: Literal["function"]


class Message(BaseModel):
    """Represents a message in a chat completion.

    Every field is optional and defaults to None.
    """

    # Text content of the message.
    content: Optional[str] = None
    # Reasoning text kept separate from `content`.
    reasoning_content: Optional[str] = None
    # Tool calls attached to the message, if any.
    tool_calls: Optional[List[ChatCompletionMessageToolCall]] = None
    # Author role; restricted to these four values.
    role: Optional[Literal["user", "assistant", "system", "tool"]] = None
    # Refusal text, if any.
    refusal: Optional[str] = None


class CompletionTokensDetails(BaseModel):
    """Details about the tokens used in a completion.

    All counters are optional and default to None.
    """

    accepted_prediction_tokens: Optional[int] = None
    """
    When using Predicted Outputs, the number of tokens in the prediction that
    appeared in the completion.
    """

    # NOTE(review): the description below says "input" although this field
    # sits on the completion side - confirm the intended wording.
    audio_tokens: Optional[int] = None
    """Audio input tokens generated by the model."""

    reasoning_tokens: Optional[int] = None
    """Tokens generated by the model for reasoning."""

    rejected_prediction_tokens: Optional[int] = None
    """
    When using Predicted Outputs, the number of tokens in the prediction that did
    not appear in the completion. However, like reasoning tokens, these tokens are
    still counted in the total completion tokens for purposes of billing, output,
    and context window limits.
    """


class PromptTokensDetails(BaseModel):
    """Details about the tokens used in a prompt.

    All counters are optional and default to None.
    """

    # NOTE(review): the description below says "generated by the model" although
    # this is a prompt-side count - confirm the intended wording.
    text_tokens: Optional[int] = None
    """Tokens generated by the model for text."""

    audio_tokens: Optional[int] = None
    """Audio input tokens present in the prompt."""

    cached_tokens: Optional[int] = None
    """Cached tokens present in the prompt."""


class CompletionUsage(BaseModel):
    """Represents the token usage for a completion.

    Every field is optional and defaults to None, so a usage object can be
    built from whichever counters are available.
    """

    completion_tokens: Optional[int] = None
    """Number of tokens in the generated completion."""

    prompt_tokens: Optional[int] = None
    """Number of tokens in the prompt."""

    total_tokens: Optional[int] = None
    """Total number of tokens used in the request (prompt + completion)."""

    completion_tokens_details: Optional[CompletionTokensDetails] = None
    """Breakdown of tokens used in a completion."""

    prompt_tokens_details: Optional[PromptTokensDetails] = None
    """Breakdown of tokens used in the prompt."""


class Word(BaseModel):
    """Represents a single word with timing information.

    `word`, `start` and `end` are required; the remaining fields are optional
    and default to None.
    """

    # The word text.
    word: str
    # Start and end of the word (presumably seconds from the start of the
    # audio - confirm against the provider adapters).
    start: float
    end: float
    confidence: Optional[float] = None  # Common across Deepgram, Azure, AWS
    speaker: Optional[int] = None  # Speaker diarization (Deepgram, Azure, AWS)
    speaker_confidence: Optional[float] = None  # Speaker identification confidence
    punctuated_word: Optional[str] = None  # Word with punctuation (some providers)


class Segment(BaseModel):
    """Represents a segment of transcribed text with detailed information.

    `id`, `seek`, `start`, `end` and `text` are required; everything else is
    optional and defaults to None.
    """

    # Required core fields
    id: int
    seek: int
    # Segment boundaries (presumably seconds - confirm against the adapters).
    start: float
    end: float
    text: str
    # OpenAI Whisper specific fields
    tokens: Optional[List[int]] = None
    temperature: Optional[float] = None
    avg_logprob: Optional[float] = None
    compression_ratio: Optional[float] = None
    no_speech_prob: Optional[float] = None
    # Common ASR provider fields
    confidence: Optional[float] = None  # Segment-level confidence
    speaker: Optional[int] = None  # Primary speaker for this segment
    speaker_confidence: Optional[float] = None  # Speaker identification confidence
    words: Optional[List[Word]] = None  # Words within this segment


class Alternative(BaseModel):
    """Represents an alternative transcription hypothesis (common in many ASR APIs)."""

    # Text of this hypothesis (required).
    transcript: str
    # Confidence for this hypothesis, when available.
    confidence: Optional[float] = None
    # Word-level details for this hypothesis, when available.
    words: Optional[List[Word]] = None


class Channel(BaseModel):
    """Represents a single audio channel (for multi-channel audio)."""

    # Transcription hypotheses for this channel (required).
    alternatives: List[Alternative]
    search: Optional[List[dict]] = None  # Search results if keyword search enabled


class TranscriptionResult(BaseModel):
    """
    Unified transcription result format supporting multiple ASR providers.
    Based on OpenAI Whisper API but extended for common ASR features.

    Only `text` is required; every other field is optional and defaults to
    None.
    """

    # Core fields (supported by most providers)
    text: str
    language: Optional[str] = None
    confidence: Optional[float] = None  # Overall transcription confidence

    # OpenAI Whisper specific fields
    task: Optional[str] = None  # "transcribe" or "translate"
    duration: Optional[float] = None
    segments: Optional[List[Segment]] = None
    words: Optional[List[Word]] = None

    # Multi-channel and alternatives support (Deepgram, Azure, etc.)
    channels: Optional[List[Channel]] = None
    alternatives: Optional[List[Alternative]] = None

    # Advanced features (various providers); kept as plain dicts rather than
    # typed models
    utterances: Optional[List[dict]] = None  # Speaker utterances
    paragraphs: Optional[List[dict]] = None  # Paragraph detection
    topics: Optional[List[dict]] = None  # Topic detection
    intents: Optional[List[dict]] = None  # Intent recognition
    sentiment: Optional[dict] = None  # Sentiment analysis
    summary: Optional[dict] = None  # Auto-summarization

    # Metadata
    metadata: Optional[dict] = None  # Provider-specific metadata
    model_info: Optional[dict] = None  # Model information


class StreamingTranscriptionChunk(BaseModel):
    """Represents a single chunk of streaming transcription data.

    `text` and `is_final` are required; all other fields are optional and
    default to None.
    """

    # Transcribed text carried by this chunk.
    text: str
    # Whether this chunk is final (as opposed to an interim result).
    is_final: bool
    confidence: Optional[float] = None
    # Chunk boundaries (presumably seconds - confirm against the adapters).
    start_time: Optional[float] = None
    end_time: Optional[float] = None
    # Speaker attribution, when available.
    speaker_id: Optional[int] = None
    speaker_confidence: Optional[float] = None
    # Word-level details, when available.
    words: Optional[List[Word]] = None
    sequence_number: Optional[int] = None
    channel: Optional[int] = None
    # Untyped dict for extra provider data.
    provider_data: Optional[dict] = None


# Type alias for streaming transcription responses: an async generator that
# yields StreamingTranscriptionChunk objects and accepts no sent values.
StreamingTranscriptionResponse = AsyncGenerator[StreamingTranscriptionChunk, None]

# Union type for both batch (TranscriptionResult) and streaming responses
TranscriptionResponse = Union[TranscriptionResult, StreamingTranscriptionResponse]


@dataclass
class TranscriptionOptions:
    """Provider-neutral bundle of transcription settings.

    Every option defaults to None (meaning "not set") except
    ``custom_parameters``, which defaults to an empty dict. Range checks run
    in ``__post_init__`` and raise ValueError on invalid values.
    """

    # Core parameters
    language: Optional[str] = None

    # Audio format parameters
    audio_format: Optional[str] = None
    sample_rate: Optional[int] = None
    channels: Optional[int] = None
    encoding: Optional[str] = None  # Audio encoding type

    # Output format
    response_format: Optional[str] = None
    include_word_timestamps: Optional[bool] = None
    include_segment_timestamps: Optional[bool] = None
    timestamp_granularities: Optional[List[str]] = None  # OpenAI: ["word", "segment"]

    # Context and guidance
    prompt: Optional[str] = None
    context_phrases: Optional[List[str]] = None
    boost_phrases: Optional[List[str]] = None

    # Speaker features
    enable_speaker_diarization: Optional[bool] = None
    max_speakers: Optional[int] = None
    min_speakers: Optional[int] = None

    # Text processing
    enable_automatic_punctuation: Optional[bool] = None
    enable_profanity_filter: Optional[bool] = None
    enable_smart_formatting: Optional[bool] = None
    enable_word_confidence: Optional[bool] = None
    enable_spoken_punctuation: Optional[bool] = None
    enable_spoken_emojis: Optional[bool] = None

    # Advanced features
    enable_sentiment_analysis: Optional[bool] = None
    enable_topic_detection: Optional[bool] = None
    enable_intent_recognition: Optional[bool] = None
    enable_summarization: Optional[bool] = None
    enable_translation: Optional[bool] = None
    translation_target_language: Optional[str] = None

    # Confidence and alternatives
    include_confidence_scores: Optional[bool] = None
    max_alternatives: Optional[int] = None

    # Processing options
    temperature: Optional[float] = None
    interim_results: Optional[bool] = None
    vad_sensitivity: Optional[float] = None
    stream: Optional[bool] = None  # Enable streaming output

    # Custom parameters
    custom_parameters: Dict[str, Any] = field(default_factory=dict)

    def __post_init__(self):
        """Reject out-of-range option values.

        Raises:
            ValueError: If temperature or vad_sensitivity lies outside
                [0.0, 1.0], a speaker bound is below 1, or min_speakers
                exceeds max_speakers.
        """
        temp = self.temperature
        if temp is not None and not 0.0 <= temp <= 1.0:
            raise ValueError("temperature must be between 0.0 and 1.0")

        most, fewest = self.max_speakers, self.min_speakers
        if most is not None and most < 1:
            raise ValueError("max_speakers must be at least 1")
        if fewest is not None and fewest < 1:
            raise ValueError("min_speakers must be at least 1")
        # The cross-check only applies when both bounds were supplied.
        if most is not None and fewest is not None and fewest > most:
            raise ValueError("min_speakers cannot be greater than max_speakers")

        vad = self.vad_sensitivity
        if vad is not None and not 0.0 <= vad <= 1.0:
            raise ValueError("vad_sensitivity must be between 0.0 and 1.0")

    def has_any_parameters(self) -> bool:
        """Return True when at least one option carries a value.

        ``custom_parameters`` counts only when non-empty; every other
        attribute counts when it is not None.
        """
        return any(
            bool(value) if name == "custom_parameters" else value is not None
            for name, value in vars(self).items()
        )

    def get_set_parameters(self) -> Dict[str, Any]:
        """Return a dict of just the options that carry a value.

        Uses the same rule as ``has_any_parameters``: an empty
        ``custom_parameters`` and None-valued attributes are left out.
        """
        return {
            name: value
            for name, value in vars(self).items()
            if (bool(value) if name == "custom_parameters" else value is not None)
        }


================================================
FILE: aisuite/framework/parameter_mapper.py
================================================
"""
Parameter mapping utilities for ASR providers.
Maps unified TranscriptionOptions to provider-specific parameters.
"""

from typing import Dict, Any, List, TYPE_CHECKING

if TYPE_CHECKING:
    from .message import TranscriptionOptions


class ParameterMapper:
    """Translate unified TranscriptionOptions into per-provider API parameters.

    Each ``*_MAPPING`` table maps an option attribute name to the provider's
    parameter name. Several option names may map to the same provider key;
    in that case the entry listed later in the table wins.
    """

    # OpenAI Whisper API parameter mapping
    OPENAI_MAPPING = {
        "language": "language",
        "response_format": "response_format",
        "temperature": "temperature",
        "prompt": "prompt",
        "stream": "stream",
        "timestamp_granularities": "timestamp_granularities",
    }

    # Deepgram API parameter mapping
    DEEPGRAM_MAPPING = {
        "language": "language",
        "enable_automatic_punctuation": "punctuate",
        "enable_smart_formatting": "smart_format",
        "enable_speaker_diarization": "diarize",
        "include_word_timestamps": "utterances",
        "include_segment_timestamps": "paragraphs",
        "context_phrases": "keywords",
        "enable_profanity_filter": "profanity_filter",
        "enable_sentiment_analysis": "sentiment",
        "enable_topic_detection": "topics",
        "enable_intent_recognition": "intents",
        "enable_summarization": "summarize",
        "interim_results": "interim_results",
        "channels": "channels",
        "sample_rate": "sample_rate",
        "include_confidence_scores": "confidence",
        "enable_word_confidence": "confidence",
        "max_alternatives": "alternatives",
        "stream": "interim_results",
        "encoding": "encoding",
        # timestamp_granularities is handled specially for Deepgram
    }

    # Google API parameter mapping
    GOOGLE_MAPPING = {
        "language": "language_code",
        "sample_rate": "sample_rate_hertz",
        "channels": "audio_channel_count",
        "enable_automatic_punctuation": "enable_automatic_punctuation",
        "enable_speaker_diarization": "enable_speaker_diarization",
        "max_speakers": "diarization_speaker_count",
        "min_speakers": "min_speaker_count",
        "include_word_timestamps": "enable_word_time_offsets",
        "include_confidence_scores": "enable_word_confidence",
        "enable_word_confidence": "enable_word_confidence",
        "context_phrases": "speech_contexts",
        "enable_profanity_filter": "profanity_filter",
        "max_alternatives": "max_alternatives",
        "boost_phrases": "speech_contexts",
        "audio_format": "encoding",
        "encoding": "encoding",
        "interim_results": "interim_results",
        "stream": "interim_results",
        "enable_spoken_punctuation": "enable_spoken_punctuation",
        "enable_spoken_emojis": "enable_spoken_emojis",
    }

    # Google expects locale codes like "en-US", not just "en".
    _GOOGLE_LOCALES = {
        "en": "en-US",
        "es": "es-ES",
        "fr": "fr-FR",
        "de": "de-DE",
        "it": "it-IT",
        "pt": "pt-BR",  # Portuguese -> Brazilian Portuguese
        "ja": "ja-JP",
        "ko": "ko-KR",
        "zh": "zh-CN",  # Chinese -> Simplified Chinese
        "ar": "ar-SA",  # Arabic -> Saudi Arabia
        "hi": "hi-IN",  # Hindi -> India
        "ru": "ru-RU",  # Russian -> Russia
        "nl": "nl-NL",  # Dutch -> Netherlands
        "pl": "pl-PL",  # Polish -> Poland
        "sv": "sv-SE",  # Swedish -> Sweden
        "da": "da-DK",  # Danish -> Denmark
        "no": "nb-NO",  # Norwegian -> Norway
        "fi": "fi-FI",  # Finnish -> Finland
        "tr": "tr-TR",  # Turkish -> Turkey
        "th": "th-TH",  # Thai -> Thailand
        "vi": "vi-VN",  # Vietnamese -> Vietnam
    }

    # Lower-cased audio_format value -> Google encoding name.
    _GOOGLE_ENCODINGS = {
        "wav": "LINEAR16",
        "flac": "FLAC",
        "mp3": "MP3",
        "ogg": "OGG_OPUS",
        "webm": "WEBM_OPUS",
    }

    @classmethod
    def map_to_openai(cls, options: "TranscriptionOptions") -> Dict[str, Any]:
        """Build OpenAI Whisper API parameters from ``options``.

        The include_*_timestamps flags are folded into a
        ``timestamp_granularities`` list first; an explicitly set
        ``options.timestamp_granularities`` then replaces that list.
        """
        params = {}

        # Derive granularities from the boolean convenience flags.
        flag_pairs = (
            ("word", options.include_word_timestamps),
            ("segment", options.include_segment_timestamps),
        )
        granularities = [level for level, wanted in flag_pairs if wanted]
        if granularities:
            params["timestamp_granularities"] = granularities

        # Copy across every mapped option that has a value.
        for opt_key, api_key in cls.OPENAI_MAPPING.items():
            if opt_key.startswith("include_"):
                continue
            value = getattr(options, opt_key, None)
            if value is not None:
                params[api_key] = value

        cls._apply_custom_parameters(params, options.custom_parameters, "openai")
        return params

    @classmethod
    def map_to_deepgram(cls, options: "TranscriptionOptions") -> Dict[str, Any]:
        """Build Deepgram API parameters from ``options``.

        ``timestamp_granularities`` has no direct counterpart: "word" turns
        on ``utterances`` and "segment" turns on ``paragraphs``.
        """
        params = {}

        for opt_key, api_key in cls.DEEPGRAM_MAPPING.items():
            value = getattr(options, opt_key, None)
            if value is not None:
                params[api_key] = value

        # Non-empty context phrases are always sent as keywords.
        if options.context_phrases:
            params["keywords"] = options.context_phrases

        granularities = getattr(options, "timestamp_granularities", None)
        if granularities:
            if "word" in granularities:
                params["utterances"] = True
            if "segment" in granularities:
                params["paragraphs"] = True

        cls._apply_custom_parameters(params, options.custom_parameters, "deepgram")
        return params

    @classmethod
    def map_to_google(cls, options: "TranscriptionOptions") -> Dict[str, Any]:
        """Build Google Speech-to-Text API parameters from ``options``.

        Two-character language codes are expanded to a locale (unknown codes
        get "-US" appended), phrase lists are collected under
        ``speech_contexts``, and a set ``audio_format`` determines the final
        ``encoding`` (unrecognised formats fall back to "LINEAR16").
        """
        params = {}

        for opt_key, api_key in cls.GOOGLE_MAPPING.items():
            value = getattr(options, opt_key, None)
            if value is None:
                continue

            if opt_key in ("context_phrases", "boost_phrases"):
                # Each phrase list becomes its own speech context entry.
                params.setdefault("speech_contexts", []).append({"phrases": value})
            elif opt_key == "language" and len(value) == 2:
                # Convert "en" to "en-US"
                params[api_key] = cls._GOOGLE_LOCALES.get(value, f"{value}-US")
            else:
                params[api_key] = value

        # A set audio_format overrides whatever the loop stored as encoding.
        if options.audio_format:
            format_key = options.audio_format.lower()
            params["encoding"] = cls._GOOGLE_ENCODINGS.get(format_key, "LINEAR16")

        # Only word-level granularity has a Google counterpart.
        granularities = getattr(options, "timestamp_granularities", None)
        if granularities and "word" in granularities:
            params["enable_word_time_offsets"] = True

        cls._apply_custom_parameters(params, options.custom_parameters, "google")
        return params

    @classmethod
    def _apply_custom_parameters(
        cls, params: Dict[str, Any], custom_params: Dict[str, Any], provider: str
    ):
        """
        Merge the caller's provider-namespaced custom parameters into ``params``.

        ``custom_params`` must be keyed by provider name, e.g.:
        {
          "openai": {"response_format": "srt", "temperature": 0.2},
          "deepgram": {"search": ["keyword"], "numerals": True},
          "google": {"use_enhanced": True, "adaptation": {...}}
        }
        Only the entry for ``provider`` is applied (overwriting existing
        keys in ``params``); anything outside a provider key is IGNORED.
        """
        if custom_params and provider in custom_params:
            params.update(custom_params[provider])


================================================
FILE: aisuite/framework/provider_interface.py
================================================
"""The shared interface for model providers."""


# TODO(rohit): Remove this. This interface is obsolete in favor of Provider.
class ProviderInterface:
    """Base contract that provider-specific interfaces are expected to follow."""

    def chat_completion_create(self, messages=None, model=None, temperature=0) -> None:
        """Produce a chat completion; this base version always raises.

        Subclasses override this method to perform the actual completion.

        Args:
        ----
            messages (list): The chat history.
            model (str): The identifier of the model to be used in the completion.
            temperature (float): The temperature to use in the completion.

        Raises:
        ------
            NotImplementedError: Always, unless overridden by a subclass.

        """
        missing_impl_message = (
            "Provider Interface has not implemented " "chat_completion_create()"
        )
        raise NotImplementedError(missing_impl_message)


================================================
FILE: aisuite/mcp/__init__.py
================================================
"""
MCP (Model Context Protocol) integration for aisuite.

This module provides support for using MCP servers and their tools with aisuite's
unified interface for AI providers.

MCP allows AI applications to connect to external data sources and tools through
a standardized protocol. This integration makes MCP tools available as Python
callables that work seamlessly with aisuite's existing tool calling infrastructure.

Example:
    >>> from aisuite import Client
    >>> from aisuite.mcp import MCPClient
    >>>
    >>> # Connect to an MCP server
    >>> mcp = MCPClient(
    ...     command="npx",
    ...     args=["-y", "@modelcontextprotocol/server-filesystem", "/docs"]
    ... )
    >>>
    >>> # Use MCP tools with any provider
    >>> client = Client()
    >>> response = client.chat.completions.create(
    ...     model="openai:gpt-4o",
    ...     messages=[{"role": "user", "content": "Read README.md"}],
    ...     tools=mcp.get_callable_tools(),
    ...     max_turns=2
    ... )
"""

from .client import MCPClient

__all__ = ["MCPClient"]


================================================
FILE: aisuite/mcp/client.py
================================================
"""
MCP Client for aisuite.

This module provides the MCPClient class that connects to MCP servers and
exposes their tools as Python callables compatible with aisuite's tool system.
"""

import asyncio
import json
from typing import Any, Callable, Dict, List, Optional
from contextlib import contextmanager

try:
    from mcp import ClientSession, StdioServerParameters
    from mcp.client.stdio import stdio_client
    import httpx
except ImportError as e:
    if "mcp" in str(e):
        raise ImportError(
            "MCP support requires the 'mcp' package. "
            "Install it with: pip install 'aisuite[mcp]' or pip install mcp"
        )
    elif "httpx" in str(e):
        raise ImportError(
            "HTTP transport requires the 'httpx' package. "
            "Install it with: pip install httpx"
        )
    raise

from .tool_wrapper import create_mcp_tool_wrapper
from .config import MCPConfig, validate_mcp_config, get_transport_type


class MCPClient:
    """
    Client for connecting to MCP servers and using their tools with aisuite.

    This class manages the connection to an MCP server, discovers available tools,
    and creates Python callable wrappers that work seamlessly with aisuite's
    existing tool calling infrastructure.

    Example:
        >>> # Connect to an MCP server
        >>> mcp = MCPClient(
        ...     command="npx",
        ...     args=["-y", "@modelcontextprotocol/server-filesystem", "/path"]
        ... )
        >>>
        >>> # Get tools and use with aisuite
        >>> import aisuite as ai
        >>> client = ai.Client()
        >>> response = client.chat.completions.create(
        ...     model="openai:gpt-4o",
        ...     messages=[{"role": "user", "content": "List files"}],
        ...     tools=mcp.get_callable_tools(),
        ...     max_turns=2
        ... )

    The MCPClient handles:
    - Starting and managing the MCP server process
    - Performing the MCP handshake
    - Discovering available tools
    - Creating callable wrappers for tools
    - Executing tool calls via the MCP protocol
    """

    def __init__(
        self,
        command: Optional[str] = None,
        args: Optional[List[str]] = None,
        env: Optional[Dict[str, str]] = None,
        server_url: Optional[str] = None,
        headers: Optional[Dict[str, str]] = None,
        timeout: float = 30.0,
        name: Optional[str] = None,
    ):
        """
        Initialize the MCP client and connect to an MCP server.

        Supports both stdio and HTTP transports. Provide either stdio parameters
        (command) OR HTTP parameters (server_url), but not both.

        Args:
            command: Command to start the MCP server (e.g., "npx", "python") - for stdio transport
            args: Arguments to pass to the command (e.g., ["-y", "server-package"]) - for stdio transport
            env: Optional environment variables for the server process - for stdio transport
            server_url: Base URL of the MCP server (e.g., "http://localhost:8000") - for HTTP transport
            headers: Optional HTTP headers (e.g., for authentication) - for HTTP transport
            timeout: Request timeout in seconds - for HTTP transport (default: 30.0)
            name: Optional name for this MCP client (used for logging and prefixing)

        Raises:
            ImportError: If the mcp or httpx package is not installed
            ValueError: If both stdio and HTTP parameters are provided, or neither
            RuntimeError: If connection to the MCP server fails
        """
        # Validate transport parameters
        has_stdio = command is not None
        has_http = server_url is not None

        if not (has_stdio ^ has_http):
            raise ValueError(
                "Must provide exactly one transport: either 'command' (stdio) or 'server_url' (HTTP)."
            )

        # Store parameters based on transport type
        if has_stdio:
            self.server_params = StdioServerParameters(
                command=command,
                args=args or [],
                env=env,
            )
            self.name = name or command
            # Stdio-specific state
            self._session: Optional[ClientSession] = None
            self._read = None
            self._write = None
            self._stdio_context = None
        else:  # HTTP
            self.server_url = server_url
            self.headers = headers or {}
            self.timeout = timeout
            self.name = name or server_url
            # HTTP-specific state (initialized in _async_connect_http)
            self._http_client = None
            self._request_id = 0
            self._session_id: Optional[str] = None  # MCP session ID from server

        # Shared state
        self._tools_cache: Optional[List[Dict[str, Any]]] = None
        self._event_loop: Optional[asyncio.AbstractEventLoop] = None

        # Initialize connection
        self._connect()

    @classmethod
    def from_config(cls, config: Dict[str, Any]) -> "MCPClient":
        """
        Create an MCPClient from a configuration dictionary.

        The config is validated and normalized with ``validate_mcp_config`` and
        the transport (stdio or HTTP) is derived from it.

        Args:
            config: MCP configuration dictionary

        Returns:
            A connected MCPClient instance

        Raises:
            ValueError: If configuration is invalid

        Example (stdio):
            >>> config = {
            ...     "type": "mcp",
            ...     "name": "filesystem",
            ...     "command": "npx",
            ...     "args": ["-y", "@modelcontextprotocol/server-filesystem", "/docs"]
            ... }
            >>> mcp = MCPClient.from_config(config)

        Example (HTTP):
            >>> config = {
            ...     "type": "mcp",
            ...     "name": "api-server",
            ...     "server_url": "http://localhost:8000",
            ...     "headers": {"Authorization": "Bearer token"}
            ... }
            >>> mcp = MCPClient.from_config(config)
        """
        validated_config = validate_mcp_config(config)

        if get_transport_type(validated_config) == "stdio":
            # NOTE(review): validate_mcp_config also accepts "cwd", but __init__
            # has no parameter for it, so it cannot be forwarded from here.
            return cls(
                command=validated_config["command"],
                args=validated_config.get("args", []),
                env=validated_config.get("env"),
                name=validated_config["name"],
            )

        # HTTP transport. An explicit "timeout" wins; otherwise honour the
        # normalized "timeout_seconds" value instead of silently ignoring it.
        timeout = validated_config.get(
            "timeout", validated_config.get("timeout_seconds", 30.0)
        )
        return cls(
            server_url=validated_config["server_url"],
            headers=validated_config.get("headers"),
            timeout=timeout,
            name=validated_config["name"],
        )

    @staticmethod
    def get_tools_from_config(config: Dict[str, Any]) -> List[Callable]:
        """
        Build an MCPClient from ``config`` and return its callable tools.

        Shorthand for ``from_config()`` followed by ``get_callable_tools()``,
        forwarding the config's ``allowed_tools`` and ``use_tool_prefix``
        settings.

        Args:
            config: MCP configuration dictionary

        Returns:
            List of callable tool wrappers, filtered and prefixed per config

        Example:
            >>> tools = MCPClient.get_tools_from_config({
            ...     "type": "mcp",
            ...     "name": "filesystem",
            ...     "command": "npx",
            ...     "args": ["..."],
            ...     "allowed_tools": ["read_file"],
            ...     "use_tool_prefix": True,
            ... })
        """
        settings = validate_mcp_config(config)
        return MCPClient.from_config(settings).get_callable_tools(
            allowed_tools=settings.get("allowed_tools"),
            use_tool_prefix=settings.get("use_tool_prefix", False),
        )

    def _connect(self):
        """
        Establish the connection to the MCP server (blocking).

        Steps:
        1. Reuse the running event loop, or create and install a new one.
        2. Apply ``nest_asyncio`` when available so ``run_until_complete()``
           also works while a loop is already running (Jupyter/IPython).
        3. Run the transport-specific async connect routine, which performs
           the handshake and fills the tool cache.

        Raises:
            RuntimeError: If an event loop is already running and
                ``nest_asyncio`` is not installed (the connection could not
                be driven synchronously in that situation).
        """
        try:
            self._event_loop = asyncio.get_running_loop()
            loop_already_running = True
        except RuntimeError:
            # No loop is running in this thread: create our own
            self._event_loop = asyncio.new_event_loop()
            asyncio.set_event_loop(self._event_loop)
            loop_already_running = False

        try:
            import nest_asyncio

            nest_asyncio.apply()
        except ImportError as exc:
            # Without nest_asyncio a running loop rejects run_until_complete()
            # with "This event loop is already running"; fail early with a
            # message that tells the user how to fix it.
            if loop_already_running:
                raise RuntimeError(
                    "MCPClient was created while an asyncio event loop is already "
                    "running (e.g. in Jupyter/IPython). Install nest-asyncio to "
                    "support this: pip install nest-asyncio"
                ) from exc

        # The HTTP transport is identified by the presence of server_url
        if hasattr(self, "server_url"):
            connect_coro = self._async_connect_http()
        else:
            connect_coro = self._async_connect()
        self._event_loop.run_until_complete(connect_coro)

    async def _async_connect(self):
        """
        Async connection initialization for stdio transport.

        Starts the server process, opens a ClientSession on its streams,
        performs the MCP handshake and caches the advertised tools as plain
        dicts (``name``, ``description``, ``inputSchema``).

        If any step fails, everything that was already opened is torn down
        again before the error is re-raised, so a failed constructor does not
        leave a server process behind.
        """
        self._stdio_context = stdio_client(self.server_params)
        try:
            self._read, self._write = await self._stdio_context.__aenter__()

            session = ClientSession(self._read, self._write)
            await session.__aenter__()
            # Publish the session only once it has been entered, so cleanup
            # never exits a session that was not opened.
            self._session = session

            await session.initialize()
            tools_result = await session.list_tools()
        except Exception:
            try:
                await self._async_close()
            except Exception:
                # Best effort: the original connection error is the one that
                # matters to the caller.
                pass
            self._session = None
            self._stdio_context = None
            self._read = None
            self._write = None
            raise

        # Convert Tool objects to dicts for easier handling
        if hasattr(tools_result, "tools"):
            self._tools_cache = [
                {
                    "name": tool.name,
                    "description": getattr(tool, "description", ""),
                    "inputSchema": getattr(tool, "inputSchema", {}),
                }
                for tool in tools_result.tools
            ]
        else:
            self._tools_cache = []

    async def _parse_sse_response(
        self, response: httpx.Response, request_id: int
    ) -> Dict[str, Any]:
        """
        Parse SSE stream and extract JSON-RPC response.

        SSE format per spec:
            data: {"jsonrpc": "2.0", "id": 1, "result": {...}}

            data: {"jsonrpc": "2.0", "method": "notification", ...}

        The server may send multiple events (notifications, requests) before
        sending the final response. We collect events until we find the
        response matching our request_id.

        Args:
            response: HTTP response with text/event-stream content type
            request_id: The JSON-RPC request ID to match

        Returns:
            Response result dictionary

        Raises:
            RuntimeError: If server returns an error or no matching response found
        """
        result = None

        async for line in response.aiter_lines():
            line = line.strip()

            # Skip empty lines and comments
            if not line or line.startswith(":"):
                continue

            # Parse SSE data field
            if line.startswith("data: "):
                data = line[6:]  # Remove 'data: ' prefix

                try:
                    message = json.loads(data)

                    # Check if this is the response to our request
                    if message.get("id") == request_id:
                        if "error" in message:
                            error = message["error"]
                            raise RuntimeError(
                                f"MCP server error: {error.get('message', 'Unknown error')} "
                                f"(code: {error.get('code', 'unknown')})"
                            )
                        result = message.get("result", {})
                        # Found our response, can stop parsing
                        break

                    # Note: Server may send other notifications/requests
                    # which we ignore for now (future enhancement for bidirectional comms)

                except json.JSONDecodeError:
                    # Invalid JSON in SSE data, skip this event
                    continue

        if result is None:
            raise RuntimeError(
                f"No response received in SSE stream for request {request_id}"
            )

        return result

    async def _send_http_request(
        self, method: str, params: Optional[Dict[str, Any]] = None
    ) -> Dict[str, Any]:
        """
        Send JSON-RPC request to MCP server via HTTP.

        Args:
            method: JSON-RPC method name
            params: Optional parameters

        Returns:
            Response result

        Raises:
            RuntimeError: If HTTP request fails or server returns an error
        """
        # Increment request ID
        self._request_id += 1

        # Build JSON-RPC 2.0 request
        request_data = {
            "jsonrpc": "2.0",
            "id": self._request_id,
            "method": method,
        }

        if params:
            request_data["params"] = params

        # Use the exact server URL provided by the user
        url = self.server_url.rstrip("/")

        # Build headers: MCP requires Accept header with both content types
        # Merge with any user-provided headers and session ID
        request_headers = {
            "Accept": "application/json, text/event-stream",
        }
        if self._session_id:
            request_headers["Mcp-Session-Id"] = self._session_id
        if self.headers:
            request_headers.update(self.headers)

        try:
            response = await self._http_client.post(
                url, json=request_data, headers=request_headers
            )
            response.raise_for_status()

            # Check for MCP session ID in response headers
            if "Mcp-Session-Id" in response.headers and not self._session_id:
                self._session_id = response.headers["Mcp-Session-Id"]

            # Check Content-Type to determine response format
            content_type = response.headers.get("content-type", "").lower()

            if "application/json" in content_type:
                # Handle JSON response (simple request-response)
                result = response.json()

                # Check for JSON-RPC error
                if "error" in result:
                    error = result["error"]
                    raise RuntimeError(
                        f"MCP server error: {error.get('message', 'Unknown error')} "
                        f"(code: {error.get('code', 'unknown')})"
                    )

                return result.get("result", {})

            elif "text/event-stream" in content_type:
                # Handle SSE stream response
                return await self._parse_sse_response(response, request_data["id"])

            else:
                raise RuntimeError(
                    f"Unexpected Content-Type from MCP server: {content_type}"
                )

        except httpx.HTTPError as e:
            raise RuntimeError(
                f"HTTP request to MCP server failed: {type(e).__name__}: {str(e)}"
            )

    async def _send_notification(
        self, method: str, params: Optional[Dict[str, Any]] = None
    ):
        """
        Send a JSON-RPC notification (no response expected).

        Notifications are JSON-RPC messages without an ID field.
        Per the spec, the server should not send a response.

        Args:
            method: JSON-RPC method name
            params: Optional parameters
        """
        # Build JSON-RPC notification (no id field)
        notification = {
            "jsonrpc": "2.0",
            "method": method,
        }

        if params:
            notification["params"] = params

        # Build headers
        url = self.server_url.rstrip("/")
        request_headers = {
            "Accept": "application/json, text/event-stream",
        }
        if self._session_id:
            request_headers["Mcp-Session-Id"] = self._session_id
        if self.headers:
            request_headers.update(self.headers)

        try:
            # Send notification - don't wait for/expect a response
            await self._http_client.post(
                url, json=notification, headers=request_headers
            )
            # Note: We don't check response for notifications
        except httpx.HTTPError:
            # Notifications may timeout or fail, which is acceptable
            pass

    async def _async_connect_http(self):
        """
        Async connection initialization for HTTP transport.

        Creates the HTTP client, sends ``initialize`` followed by the
        ``notifications/initialized`` notification, then lists the server's
        tools and caches them as dicts (``name``, ``description``,
        ``inputSchema``).

        If any step fails, the HTTP client is closed again before the error is
        re-raised, so a failed constructor does not leak open connections.
        """
        self._http_client = httpx.AsyncClient(timeout=self.timeout)

        init_params = {
            "protocolVersion": "2024-11-05",
            "capabilities": {"roots": {"listChanged": True}, "sampling": {}},
            "clientInfo": {"name": "aisuite-mcp-client", "version": "1.0.0"},
        }

        try:
            await self._send_http_request("initialize", init_params)

            # The initialized notification completes the handshake
            await self._send_notification("notifications/initialized")

            tools_result = await self._send_http_request("tools/list")

            self._tools_cache = [
                {
                    "name": tool["name"],
                    "description": tool.get("description", ""),
                    "inputSchema": tool.get("inputSchema", {}),
                }
                for tool in tools_result.get("tools", [])
            ]
        except Exception:
            try:
                await self._http_client.aclose()
            except Exception:
                # Best effort: the original connection error is the one that
                # matters to the caller.
                pass
            self._http_client = None
            raise

    def list_tools(self) -> List[Dict[str, Any]]:
        """
        List all available tools from the MCP server.

        Returns:
            List of tool schemas in MCP format

        Example:
            >>> tools = mcp.list_tools()
            >>> for tool in tools:
            ...     print(tool['name'], '-', tool['description'])
        """
        if self._tools_cache is None:
            raise RuntimeError("Not connected to MCP server")
        return self._tools_cache

    def get_callable_tools(
        self,
        allowed_tools: Optional[List[str]] = None,
        use_tool_prefix: bool = False,
    ) -> List[Callable]:
        """
        Get all MCP tools as Python callables compatible with aisuite.

        This is the primary method for using MCP tools with aisuite. It returns
        a list of callable wrappers that can be passed directly to the `tools`
        parameter of `client.chat.completions.create()`.

        Args:
            allowed_tools: Optional list of tool names to include. If None, all tools are included.
            use_tool_prefix: If True, prefix tool names with "{client_name}__"

        Returns:
            List of callable tool wrappers

        Example:
            >>> # Get all tools
            >>> mcp_tools = mcp.get_callable_tools()
            >>>
            >>> # Get specific tools only
            >>> mcp_tools = mcp.get_callable_tools(allowed_tools=["read_file"])
            >>>
            >>> # Get tools with name prefixing
            >>> mcp_tools = mcp.get_callable_tools(use_tool_prefix=True)
            >>> # Tools will be named "filesystem__read_file", etc.
        """
        all_tools = self.list_tools()

        # Filter tools if allowed_tools is specified
        if allowed_tools is not None:
            all_tools = [t for t in all_tools if t["name"] in allowed_tools]

        # Create wrappers
        wrappers = []
        for tool in all_tools:
            wrapper = create_mcp_tool_wrapper(self, tool["name"], tool)

            # Apply prefix if requested
            if use_tool_prefix:
                original_name = wrapper.__name__
                wrapper.__name__ = f"{self.name}__{original_name}"

            wrappers.append(wrapper)

        return wrappers

    def get_tool(self, tool_name: str) -> Optional[Callable]:
        """
        Get a specific MCP tool by name as a Python callable.

        Args:
            tool_name: Name of the tool to retrieve

        Returns:
            Callable wrapper for the tool, or None if not found

        Example:
            >>> read_file = mcp.get_tool("read_file")
            >>> write_file = mcp.get_tool("write_file")
            >>> tools = [read_file, write_file]
        """
        tools = self.list_tools()
        for tool in tools:
            if tool["name"] == tool_name:
                return create_mcp_tool_wrapper(self, tool_name, tool)
        return None

    def call_tool(self, tool_name: str, arguments: Dict[str, Any]) -> Any:
        """
        Execute an MCP tool call.

        This method is called by MCPToolWrapper when the LLM requests a tool.
        It handles the async MCP protocol communication and returns the result.
        Automatically routes to the appropriate transport (stdio or HTTP).

        Args:
            tool_name: Name of the tool to call
            arguments: Tool arguments as a dictionary

        Returns:
            The result from the MCP tool execution

        Raises:
            RuntimeError: If not connected or tool call fails
        """
        # Detect transport type and route to appropriate method
        if hasattr(self, "_http_client") and self._http_client is not None:
            # HTTP transport
            if self._http_client is None:
                raise RuntimeError("Not connected to MCP server (HTTP)")
            result = self._event_loop.run_until_complete(
                self._async_call_tool_http(tool_name, arguments)
            )
        else:
            # Stdio transport
            if self._session is None:
                raise RuntimeError("Not connected to MCP server (stdio)")
            result = self._event_loop.run_until_complete(
                self._async_call_tool(tool_name, arguments)
            )
        return result

    async def _async_call_tool(self, tool_name: str, arguments: Dict[str, Any]) -> Any:
        """
        Async implementation of tool calling for stdio transport.

        Args:
            tool_name: Name of the tool
            arguments: Tool arguments

        Returns:
            Tool execution result
        """
        result = await self._session.call_tool(tool_name, arguments)

        # Extract content from MCP result
        # MCP returns results in various formats, we try to extract the most useful content
        if hasattr(result, "content"):
            if isinstance(result.content, list) and len(result.content) > 0:
                # Get first content item
                content_item = result.content[0]
                if hasattr(content_item, "text"):
                    return content_item.text
                elif hasattr(content_item, "data"):
                    return content_item.data
                return str(content_item)
            return result.content

        # If no content attribute, return the whole result
        return str(result)

    async def _async_call_tool_http(
        self, tool_name: str, arguments: Dict[str, Any]
    ) -> Any:
        """
        Async implementation of tool calling for HTTP transport.

        Args:
            tool_name: Name of the tool
            arguments: Tool arguments

        Returns:
            Tool execution result
        """
        params = {"name": tool_name, "arguments": arguments}

        result = await self._send_http_request("tools/call", params)

        # Extract content from MCP result (HTTP format)
        # Similar to stdio, but result is already a dict
        if "content" in result:
            content = result["content"]
            if isinstance(content, list) and len(content) > 0:
                # Get first content item
                content_item = content[0]
                if isinstance(content_item, dict):
                    if "text" in content_item:
                        return content_item["text"]
                    elif "data" in content_item:
                        return content_item["data"]
                return str(content_item)
            return content

        # If no content field, return the whole result
        return json.dumps(result)

    def close(self):
        """
        Close the connection to the MCP server.

        Works for both stdio and HTTP transports. It's recommended to use
        the MCPClient as a context manager to ensure proper cleanup, but
        this method can be called manually if needed.

        Example:
            >>> mcp = MCPClient(command="npx", args=["server"])
            >>> try:
            ...     # Use mcp
            ...     pass
            ... finally:
            ...     mcp.close()
        """
        # Check if we need to cleanup (either stdio or HTTP)
        needs_cleanup = (hasattr(self, "_session") and self._session is not None) or (
            hasattr(self, "_http_client") and self._http_client is not None
        )

        if needs_cleanup:
            self._event_loop.run_until_complete(self._async_close())

    async def _async_close(self):
        """Async cleanup for both stdio and HTTP transports."""
        # Cleanup stdio transport
        try:
            if hasattr(self, "_session") and self._session:
                await self._session.__aexit__(None, None, None)
        except RuntimeError as e:
            # Suppress anyio cancel scope errors that occur in Jupyter/nest_asyncio environments
            # This is a known incompatibility between nest_asyncio and anyio task groups
            if "cancel scope" not in str(e).lower():
                raise
        except Exception:
            pass  # Ignore other errors during session cleanup

        try:
            if hasattr(self, "_stdio_context") and self._stdio_context:
                await self._stdio_context.__aexit__(None, None, None)
        except RuntimeError as e:
            # Suppress anyio cancel scope errors that occur in Jupyter/nest_asyncio environments
            # This is a known incompatibility between nest_asyncio and anyio task groups
            if "cancel scope" not in str(e).lower():
                raise
        except Exception:
            pass  # Ignore other errors during stdio cleanup

        # Cleanup HTTP transport
        try:
            if hasattr(self, "_http_client") and self._http_client:
                await self._http_client.aclose()
        except Exception:
            pass  # Ignore errors during HTTP client cleanup

    def __enter__(self):
        """Context manager entry."""
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        """Context manager exit."""
        self.close()
        return False

    def __repr__(self) -> str:
        """String representation."""
        num_tools = len(self._tools_cache) if self._tools_cache else 0
        if hasattr(self, "server_url"):
            return f"MCPClient(server_url={self.server_url!r}, tools={num_tools})"
        else:
            return (
                f"MCPClient(command={self.server_params.command!r}, tools={num_tools})"
            )


================================================
FILE: aisuite/mcp/config.py
================================================
"""
MCP configuration validation and normalization.

This module provides utilities for validating and normalizing MCP tool
configuration dictionaries passed to aisuite's chat completion API.
"""

from typing import Any, Dict, List, Literal, Optional, TypedDict


class MCPConfig(TypedDict, total=False):
    """Type definition for MCP tool configuration.

    ``total=False`` makes every key optional for type checkers; the keys
    marked as required below are enforced at runtime by
    ``validate_mcp_config``.
    """

    # Required fields (checked by validate_mcp_config)
    type: Literal["mcp"]
    name: str

    # Transport: stdio
    command: str
    args: List[str]
    env: Dict[str, str]
    cwd: str

    # Transport: http
    server_url: str
    headers: Dict[str, str]
    # Positive number; validated and copied by validate_mcp_config
    timeout: float

    # Tool filtering
    allowed_tools: List[str]

    # Namespacing
    use_tool_prefix: bool

    # Safety limits
    timeout_seconds: int
    response_bytes_cap: int

    # Connection behavior
    lazy_connect: bool


# Fallbacks that validate_mcp_config() fills in for keys missing from a config
DEFAULT_USE_TOOL_PREFIX = False
DEFAULT_LAZY_CONNECT = False
DEFAULT_TIMEOUT_SECONDS = 30
DEFAULT_RESPONSE_BYTES_CAP = 10 * 1024**2  # 10 MB


def validate_mcp_config(config: Dict[str, Any]) -> MCPConfig:
    """
    Validate and normalize an MCP tool configuration.

    This function:
    1. Validates required fields are present (``type`` and ``name``)
    2. Auto-detects transport type (stdio via ``command``, http via ``server_url``)
    3. Validates transport-specific fields
    4. Validates optional fields and fills in defaults
    5. Returns a new, normalized config dict (the input is not modified)

    Booleans and NaN are rejected for the numeric limits (``timeout``,
    ``timeout_seconds``, ``response_bytes_cap``) even though ``bool`` is a
    subclass of ``int``.

    Args:
        config: Raw MCP configuration dictionary

    Returns:
        Validated and normalized MCP configuration

    Raises:
        ValueError: If configuration is invalid

    Example:
        >>> config = {
        ...     "type": "mcp",
        ...     "name": "filesystem",
        ...     "command": "npx",
        ...     "args": ["-y", "@modelcontextprotocol/server-filesystem", "/docs"]
        ... }
        >>> validated = validate_mcp_config(config)
        >>> validated['timeout_seconds']
        30
    """
    # Check type field
    if config.get("type") != "mcp":
        raise ValueError(f"Invalid config type: {config.get('type')}. Expected 'mcp'")

    # Check name field (required)
    if "name" not in config:
        raise ValueError(
            "MCP config must have 'name' field. "
            "Example: {'type': 'mcp', 'name': 'my_server', ...}"
        )

    name = config["name"]
    if not isinstance(name, str) or not name.strip():
        raise ValueError(f"MCP 'name' must be a non-empty string, got: {name}")

    # Auto-detect transport type: exactly one of the two keys must be present
    has_stdio = "command" in config
    has_http = "server_url" in config

    if has_stdio == has_http:
        raise ValueError(
            "MCP config must have either 'command' or 'server_url'. "
            "Use one or the other to specify transport type."
        )

    if has_stdio:
        if not isinstance(config["command"], str):
            raise ValueError(
                f"MCP 'command' must be a string, got: {type(config['command'])}"
            )

        # args is optional but should be a list if present
        if "args" in config and not isinstance(config["args"], list):
            raise ValueError(f"MCP 'args' must be a list, got: {type(config['args'])}")

        # env is optional but should be a dict if present
        if "env" in config and not isinstance(config["env"], dict):
            raise ValueError(f"MCP 'env' must be a dict, got: {type(config['env'])}")
    else:
        server_url = config["server_url"]
        if not isinstance(server_url, str):
            raise ValueError(
                f"MCP 'server_url' must be a string, got: {type(server_url)}"
            )

        if not server_url.startswith(("http://", "https://")):
            raise ValueError(
                f"MCP 'server_url' must start with http:// or https://, got: {server_url}"
            )

        # headers is optional but should be a dict if present
        if "headers" in config and not isinstance(config["headers"], dict):
            raise ValueError(
                f"MCP 'headers' must be a dict, got: {type(config['headers'])}"
            )

        # timeout is optional but should be a positive number if present
        if "timeout" in config:
            _require_positive_number(config, "timeout")

    # Validate optional fields
    if "allowed_tools" in config:
        if not isinstance(config["allowed_tools"], list):
            raise ValueError(
                f"MCP 'allowed_tools' must be a list, got: {type(config['allowed_tools'])}"
            )
        if not all(isinstance(t, str) for t in config["allowed_tools"]):
            raise ValueError("MCP 'allowed_tools' must be a list of strings")

    for flag in ("use_tool_prefix", "lazy_connect"):
        if flag in config and not isinstance(config[flag], bool):
            raise ValueError(
                f"MCP '{flag}' must be a boolean, got: {type(config[flag])}"
            )

    if "timeout_seconds" in config:
        _require_positive_number(config, "timeout_seconds")

    if "response_bytes_cap" in config:
        _require_positive_number(config, "response_bytes_cap", integer_only=True)

    # Create normalized config with defaults
    normalized: MCPConfig = {
        "type": "mcp",
        "name": config["name"],
    }

    # Copy transport fields
    if has_stdio:
        normalized["command"] = config["command"]
        normalized["args"] = config.get("args", [])
        if "env" in config:
            normalized["env"] = config["env"]
        if "cwd" in config:
            normalized["cwd"] = config["cwd"]
    else:  # has_http
        normalized["server_url"] = config["server_url"]
        if "headers" in config:
            normalized["headers"] = config["headers"]
        if "timeout" in config:
            normalized["timeout"] = config["timeout"]

    # Copy optional fields with defaults
    if "allowed_tools" in config:
        normalized["allowed_tools"] = config["allowed_tools"]

    normalized["use_tool_prefix"] = config.get(
        "use_tool_prefix", DEFAULT_USE_TOOL_PREFIX
    )
    normalized["timeout_seconds"] = config.get(
        "timeout_seconds", DEFAULT_TIMEOUT_SECONDS
    )
    normalized["response_bytes_cap"] = config.get(
        "response_bytes_cap", DEFAULT_RESPONSE_BYTES_CAP
    )
    normalized["lazy_connect"] = config.get("lazy_connect", DEFAULT_LAZY_CONNECT)

    return normalized


def _require_positive_number(
    config: Dict[str, Any], key: str, *, integer_only: bool = False
) -> None:
    """Raise ValueError unless ``config[key]`` is a positive int (or float)."""
    value = config[key]
    accepted = int if integer_only else (int, float)

    # bool is a subclass of int, but True/False are not meaningful limits
    if isinstance(value, bool) or not isinstance(value, accepted):
        expected = "an integer" if integer_only else "a number"
        raise ValueError(f"MCP '{key}' must be {expected}, got: {type(value)}")

    # "not value > 0" (rather than "value <= 0") also rejects NaN
    if not value > 0:
        raise ValueError(f"MCP '{key}' must be positive, got: {value}")


def is_mcp_config(obj: Any) -> bool:
    """
    Tell whether an object looks like an MCP config dictionary.

    Only the container type and the ``"type"`` discriminator are inspected;
    no other keys are checked here.

    Args:
        obj: Arbitrary object to inspect

    Returns:
        True when obj is a dict whose "type" entry equals "mcp", False otherwise

    Example:
        >>> is_mcp_config({"type": "mcp", "name": "test"})
        True
        >>> is_mcp_config(lambda: None)
        False
    """
    # Guard clause: anything that is not a dict cannot be a config.
    if not isinstance(obj, dict):
        return False
    return obj.get("type") == "mcp"


def get_transport_type(config: MCPConfig) -> Literal["stdio", "http"]:
    """
    Report which transport a validated MCP config selects.

    The decision is made purely on the presence of the "command" key:
    a config that has it is treated as stdio, every other config as http.

    Args:
        config: Validated MCP configuration

    Returns:
        "stdio" when the config contains "command", otherwise "http"
    """
    return "stdio" if "command" in config else "http"


================================================
FILE: aisuite/mcp/schema_converter.py
================================================
"""
Schema conversion utilities for MCP tools.

This module provides functionality to convert MCP JSON Schema tool definitions
to Python type annotations that are compatible with aisuite's existing Tools class.
"""

from typing import Any, Dict, List, Optional, Union, get_args, get_origin
import inspect


def json_schema_to_python_type(schema: Dict[str, Any]) -> type:
    """
    Convert a JSON Schema type definition to a Python type annotation.

    Supported shapes:
    - a single type name (``{"type": "string"}``)
    - a list of type names (``{"type": ["string", "null"]}``), mapped to a Union
    - arrays with an ``items`` schema, mapped to ``List[item_type]``
    - ``anyOf`` / ``oneOf``, mapped to a Union of the member types

    Anything that cannot be resolved (missing/unknown type, empty union,
    non-dict schema such as the boolean schema ``true``) maps to ``Any``.

    Args:
        schema: JSON Schema type definition (e.g., {"type": "string"})

    Returns:
        Python type annotation (e.g., str, int, List[str], etc.)
    """
    # Boolean schemas (e.g. "items": true) and other non-mapping values carry
    # no type information we can translate.
    if not isinstance(schema, dict):
        return Any

    schema_type = schema.get("type")

    # JSON Schema allows "type" to be a list of type names. Resolve each name
    # against the same schema so that e.g. "items" still applies to "array".
    if isinstance(schema_type, (list, tuple)):
        member_types = [
            json_schema_to_python_type({**schema, "type": name})
            for name in schema_type
        ]
        if member_types:
            return Union[tuple(member_types)]
        # An empty list tells us nothing; fall through as if "type" were absent.
        schema_type = None

    # Handle null/None
    if schema_type == "null":
        return type(None)

    # Handle basic types
    type_mapping = {
        "string": str,
        "number": float,
        "integer": int,
        "boolean": bool,
        "object": dict,
        "array": list,
    }

    # The isinstance check keeps unhashable or otherwise malformed "type"
    # values away from the dict lookup.
    if isinstance(schema_type, str) and schema_type in type_mapping:
        # Handle arrays with item type
        if schema_type == "array" and "items" in schema:
            item_type = json_schema_to_python_type(schema["items"])
            return List[item_type]

        return type_mapping[schema_type]

    # Handle anyOf/oneOf (union types)
    if "anyOf" in schema or "oneOf" in schema:
        union_schemas = schema.get("anyOf") or schema.get("oneOf") or []
        types = [json_schema_to_python_type(s) for s in union_schemas]
        # Union[()] is a TypeError, so an empty alternative list means "unknown".
        if not types:
            return Any
        return Union[tuple(types)]

    # Default to Any if we can't determine the type
    return Any


def mcp_schema_to_annotations(input_schema: Dict[str, Any]) -> Dict[str, type]:
    """
    Derive Python type annotations from an MCP tool input schema.

    Each entry under "properties" is converted with
    json_schema_to_python_type. Properties that are not named in the
    schema's "required" list are wrapped in Optional. A schema whose
    top-level "type" is not "object" yields no annotations at all.

    Args:
        input_schema: MCP tool input schema (JSON Schema format)

    Returns:
        Dictionary mapping parameter names to Python types

    Example:
        >>> schema = {
        ...     "type": "object",
        ...     "properties": {
        ...         "location": {"type": "string"},
        ...         "count": {"type": "integer"}
        ...     },
        ...     "required": ["location"]
        ... }
        >>> annotations = mcp_schema_to_annotations(schema)
        >>> annotations
        {'location': <class 'str'>, 'count': typing.Optional[int]}
    """
    # Only object schemas describe named parameters.
    if input_schema.get("type") != "object":
        return {}

    required_names = input_schema.get("required", [])
    resolved = {}

    for name, spec in input_schema.get("properties", {}).items():
        python_type = json_schema_to_python_type(spec)
        # Parameters missing from "required" may be omitted, hence Optional.
        resolved[name] = (
            python_type if name in required_names else Optional[python_type]
        )

    return resolved


def create_function_signature(
    func_name: str, annotations: Dict[str, type], docstring: Optional[str] = None
) -> inspect.Signature:
    """
    Build an inspect.Signature of keyword-only parameters from annotations.

    A parameter whose annotation is a Union that includes NoneType (i.e. an
    Optional) receives a default of None; every other parameter has no
    default and is therefore required.

    Args:
        func_name: Name of the function (accepted but not used here)
        annotations: Dictionary mapping parameter names to types
        docstring: Optional docstring for the function (accepted but not used here)

    Returns:
        inspect.Signature object
    """

    def _accepts_none(annotation) -> bool:
        # True only for Union[...] annotations that list NoneType as a member.
        return get_origin(annotation) is Union and type(None) in get_args(annotation)

    return inspect.Signature(
        [
            inspect.Parameter(
                name,
                inspect.Parameter.KEYWORD_ONLY,
                # Parameter.empty is the "no default" marker, so passing it is
                # the same as omitting the default altogether.
                default=(
                    None if _accepts_none(annotation) else inspect.Parameter.empty
                ),
                annotation=annotation,
            )
            for name, annotation in annotations.items()
        ]
    )


def extract_parameter_descriptions(input_schema: Dict[str, Any]) -> Dict[str, str]:
    """
    Collect the per-parameter descriptions found in an MCP schema.

    Properties without a "description" key are left out of the result.

    Args:
        input_schema: MCP tool input schema

    Returns:
        Dictionary mapping parameter names to their descriptions
    """
    return {
        name: spec["description"]
        for name, spec in input_schema.get("properties", {}).items()
        if "description" in spec
    }


def build_docstring(
    tool_description: str, parameter_descriptions: Dict[str, str]
) -> str:
    """
    Assemble a docstring from a tool description and its parameter descriptions.

    The result is the description followed by a blank line and, when any
    parameter descriptions are given, an "Args:" section with one indented
    line per parameter.

    Args:
        tool_description: Overall description of the tool
        parameter_descriptions: Dictionary of parameter descriptions

    Returns:
        Formatted docstring
    """
    doc_lines = [tool_description, ""]

    if parameter_descriptions:
        doc_lines += [
            "Args:",
            *(
                f"    {name}: {text}"
                for name, text in parameter_descriptions.items()
            ),
        ]

    return "\n".join(doc_lines)


================================================
FILE: aisuite/mcp/tool_wrapper.py
================================================
"""
MCP Tool Wrapper for aisuite.

This module provides the MCPToolWrapper class, which creates Python callable
wrappers around MCP tools that are compatible with aisuite's existing tool
calling infrastructure.
"""

from typing import Any, Callable, Dict, Optional
import asyncio
import inspect
from .schema_converter import (
    mcp_schema_to_annotations,
    extract_parameter_descriptions,
    build_docstring,
)


class MCPToolWrapper:
    """
    A callable wrapper around an MCP tool that makes it compatible with aisuite.

    This class wraps an MCP tool and exposes it as a Python callable with proper
    type annotations and docstrings that aisuite's Tools class can inspect and use.

    The wrapper sets the following attributes that aisuite's Tools class reads:
    - __name__: The tool name
    - __doc__: The tool description and parameter documentation
    - __annotations__: Python type annotations for parameters
    - __signature__: Signature returned by inspect.signature() for this object
    - __mcp_input_schema__: The original MCP inputSchema, unmodified

    When called, the wrapper executes the MCP tool via the MCP protocol.

    Example:
        >>> wrapper = MCPToolWrapper(mcp_client, "read_file", tool_schema)
        >>> result = wrapper(path="/path/to/file")
    """

    def __init__(
        self,
        mcp_client: "MCPClient",  # Forward reference to avoid circular import
        tool_name: str,
        tool_schema: Dict[str, Any],
    ):
        """
        Initialize the MCP tool wrapper.

        Args:
            mcp_client: The MCPClient instance that manages the connection
            tool_name: Name of the MCP tool
            tool_schema: MCP tool schema definition
        """
        self.mcp_client = mcp_client
        self.tool_name = tool_name
        self.schema = tool_schema

        # Set attributes that aisuite's Tools class will inspect
        self.__name__ = tool_name

        # Build docstring from MCP schema.
        # `dict.get(key, default)` only applies the default when the key is
        # absent, so use `or` to also cover keys that are present but None.
        description = tool_schema.get("description") or ""
        input_schema = tool_schema.get("inputSchema") or {}
        param_descriptions = extract_parameter_descriptions(input_schema)
        self.__doc__ = build_docstring(description, param_descriptions)

        # Convert MCP JSON Schema to Python type annotations
        self.__annotations__ = mcp_schema_to_annotations(input_schema)

        # Create a proper signature for inspect.signature() to read
        # This allows aisuite's Tools class to introspect the parameters
        self.__signature__ = self._create_signature(input_schema)

        # Store the original MCP inputSchema for direct use by Tools class
        # This avoids lossy round-trip conversion through Python type annotations
        # and preserves all JSON Schema details (arrays, nested objects, etc.)
        self.__mcp_input_schema__ = input_schema

    def _create_signature(self, input_schema: Dict[str, Any]) -> inspect.Signature:
        """
        Create a signature for this wrapper based on MCP tool schema.

        This allows inspect.signature() to see the proper parameters with
        type annotations, rather than just **kwargs.

        Required parameters are emitted first (in schema order), followed by
        optional ones (also in schema order). inspect.Signature rejects a
        positional-or-keyword parameter without a default that follows one
        with a default, and JSON Schema places no ordering constraint on
        "properties", so schema order alone cannot be used.

        Args:
            input_schema: MCP tool input schema; only "required" is read here,
                parameter names and types come from self.__annotations__

        Returns:
            inspect.Signature whose return annotation is Any
        """
        required = input_schema.get("required") or []

        required_params = []
        optional_params = []
        for param_name, annotation in self.__annotations__.items():
            if param_name in required:
                # Required parameter (no default)
                required_params.append(
                    inspect.Parameter(
                        param_name,
                        inspect.Parameter.POSITIONAL_OR_KEYWORD,
                        annotation=annotation,
                    )
                )
            else:
                # Optional parameter (with None default)
                optional_params.append(
                    inspect.Parameter(
                        param_name,
                        inspect.Parameter.POSITIONAL_OR_KEYWORD,
                        default=None,
                        annotation=annotation,
                    )
                )

        return inspect.Signature(
            required_params + optional_params, return_annotation=Any
        )

    def __call__(self, **kwargs) -> Any:
        """
        Execute the MCP tool with the given arguments.

        This method is called by aisuite's tool execution loop when the LLM
        requests this tool.

        Args:
            **kwargs: Tool arguments as keyword arguments

        Returns:
            The result from the MCP tool execution
        """
        # Filter out None values - only pass parameters that have actual values
        # This prevents passing null to MCP tools that expect specific types
        # (e.g., a tool expecting number won't accept null, it wants the param omitted)
        filtered_kwargs = {k: v for k, v in kwargs.items() if v is not None}

        # Delegate to the MCP client, which performs the actual tool call
        return self.mcp_client.call_tool(self.tool_name, filtered_kwargs)

    def __repr__(self) -> str:
        """Return a string representation of the wrapper."""
        return f"MCPToolWrapper(name={self.tool_name!r})"


def create_mcp_tool_wrapper(
    mcp_client: "MCPClient",
    tool_name: str,
    tool_schema: Dict[str, Any],
) -> Callable:
    """
    Build an MCPToolWrapper for a single MCP tool.

    This is a thin factory: the three arguments are handed to the
    MCPToolWrapper constructor unchanged.

    Args:
        mcp_client: The MCPClient instance
        tool_name: Name of the tool
        tool_schema: MCP tool schema

    Returns:
        Callable wrapper for the MCP tool
    """
    wrapper: Callable = MCPToolWrapper(mcp_client, tool_name, tool_schema)
    return wrapper


================================================
FILE: aisuite/provider.py
================================================
from abc import ABC, abstractmethod
from pathlib import Path
import importlib
import os
import functools
from typing import Union, BinaryIO, Optional


class LLMError(Exception):
    """Exception type used to report LLM errors."""

    def __init__(self, message):
        """Create the error with ``message`` as its single exception argument."""
        super().__init__(message)


class ASRError(Exception):
    """Exception type used to report ASR errors."""

    def __init__(self, message):
        """Create the error with ``message`` as its single exception argument."""
        super().__init__(message)


class Provider(ABC):
    """Abstract base class that every provider implementation derives from."""

    # Class-level default so that subclasses whose __init__ does not call
    # super().__init__() still expose an ``audio`` attribute (as None) instead
    # of raising AttributeError on access.
    audio: Optional["Audio"] = None

    def __init__(self):
        """Initialize provider with optional audio functionality."""
        self.audio = None

    @abstractmethod
    def chat_completions_create(self, model, messages, **kwargs):
        """
        Abstract method for chat completion calls, to be implemented by each provider.

        Args:
            model: Identifier of the model to use
            messages: Conversation messages to send
            **kwargs: Additional provider-specific request options
        """
        pass


class ProviderFactory:
    """Factory to dynamically load provider instances based on naming conventions."""

    PROVIDERS_DIR = Path(__file__).parent / "providers"

    @classmethod
    def create_provider(cls, provider_key, config):
        """
        Dynamically load and create an instance of a provider based on the naming convention.

        For a key such as "aws" the module ``aisuite.providers.aws_provider``
        is imported and its ``AwsProvider`` class is instantiated with
        ``**config``.

        Args:
            provider_key: Provider name used to derive the module and class names
            config: Mapping of keyword arguments passed to the provider class

        Returns:
            An instance of the resolved provider class

        Raises:
            ImportError: If the provider module cannot be imported. The
                original import error is attached as ``__cause__``.
            AttributeError: If the module does not define the expected class.
        """
        # Convert provider_key to the expected module and class names
        provider_class_name = f"{provider_key.capitalize()}Provider"
        provider_module_name = f"{provider_key}_provider"

        module_path = f"aisuite.providers.{provider_module_name}"

        # Lazily load the module
        try:
            module = importlib.import_module(module_path)
        except ImportError as e:
            # Chain explicitly so the traceback shows the underlying failure
            # as the direct cause of this error.
            raise ImportError(
                f"Could not import module {module_path}: {str(e)}. Please ensure the provider is supported by doing ProviderFactory.get_supported_providers()"
            ) from e

        # Instantiate the provider class
        provider_class = getattr(module, provider_class_name)
        return provider_class(**config)

    @classmethod
    @functools.cache
    def get_supported_providers(cls):
        """
        List all supported provider names based on files present in the providers directory.

        Returns:
            Set of provider keys, one per ``*_provider.py`` file found in
            PROVIDERS_DIR. The result is cached after the first call.
        """
        provider_files = Path(cls.PROVIDERS_DIR).glob("*_provider.py")
        # Strip only the trailing "_provider"; str.replace would also remove
        # any earlier occurrence inside the file name.
        return {file.stem.removesuffix("_provider") for file in provider_files}


class Audio:
    """Root container for audio-related functionality."""

    def __init__(self):
        # Starts out as None; nothing in this base class assigns an implementation.
        self.transcriptions: Optional["Audio.Transcription"] = None

    class Transcription(ABC):
        """Base class for audio transcription; both methods raise until overridden."""

        def create(
            self,
            model: str,
            file: Union[str, BinaryIO],
            options=None,
            **kwargs,
        ):
            """
            Create audio transcription.

            Raises:
                NotImplementedError: Always, in this base implementation.
            """
            reason = "Transcription not supported by this provider"
            raise NotImplementedError(reason)

        async def create_stream_output(
            self,
            model: str,
            file: Union[str, BinaryIO],
            options=None,
            **kwargs,
        ):
            """
            Create streaming audio transcription.

            Raises:
                NotImplementedError: Always, in this base implementation.
            """
            reason = "Streaming transcription not supported by this provider"
            raise NotImplementedError(reason)


================================================
FILE: aisuite/providers/__init__.py
================================================


================================================
FILE: aisuite/providers/anthropic_provider.py
================================================
# Anthropic provider
# Links:
# Tool calling docs - https://docs.anthropic.com/en/docs/build-with-claude/tool-use

import anthropic
import json
from aisuite.provider import Provider
from aisuite.framework import ChatCompletionResponse
from aisuite.framework.message import (
    Message,
    ChatCompletionMessageToolCall,
    Function,
    CompletionUsage,
    PromptTokensDetails,
)

# Define a constant for the default max_tokens value
DEFAULT_MAX_TOKENS = 4096


class AnthropicMessageConverter:
    """Translate between the framework's OpenAI-style messages and Anthropic's format."""

    # Role constants
    ROLE_USER = "user"
    ROLE_ASSISTANT = "assistant"
    ROLE_TOOL = "tool"
    ROLE_SYSTEM = "system"

    # Finish reason mapping
    FINISH_REASON_MAPPING = {
        "end_turn": "stop",
        "max_tokens": "length",
        "tool_use": "tool_calls",
    }

    def convert_request(self, messages):
        """
        Convert framework messages to Anthropic format.

        The caller's list is never modified: a leading system message is
        split off from a shallow copy.

        Args:
            messages: Sequence of message dicts and/or Message objects

        Returns:
            Tuple of (system_message, converted_messages). system_message is
            the content of a leading system message, or [] when there is none.
        """
        # _extract_system_message pops from the list it is given, so hand it a
        # copy. Otherwise a second call with the same list would no longer see
        # the system message.
        remaining = list(messages)
        system_message = self._extract_system_message(remaining)
        converted_messages = [self._convert_single_message(msg) for msg in remaining]
        return system_message, converted_messages

    def convert_response(self, response):
        """Normalize the response from the Anthropic API to match OpenAI's response format."""
        normalized_response = ChatCompletionResponse()
        normalized_response.choices[0].finish_reason = self._get_finish_reason(response)
        normalized_response.usage = self._get_completion_usage(response)
        normalized_response.choices[0].message = self._get_message(response)
        return normalized_response

    def _convert_single_message(self, msg):
        """Convert a single message (dict or Message object) to Anthropic format."""
        if isinstance(msg, dict):
            return self._convert_dict_message(msg)
        return self._convert_message_object(msg)

    def _convert_dict_message(self, msg):
        """Convert a dictionary message to Anthropic format."""
        if msg["role"] == self.ROLE_TOOL:
            return self._create_tool_result_message(msg["tool_call_id"], msg["content"])
        # Truthiness check (not key presence): a dict may carry
        # "tool_calls": None, which must be treated as "no tool calls".
        # This mirrors the Message-object path below.
        elif msg["role"] == self.ROLE_ASSISTANT and msg.get("tool_calls"):
            return self._create_assistant_tool_message(
                msg.get("content"), msg["tool_calls"]
            )
        return {"role": msg["role"], "content": msg["content"]}

    def _convert_message_object(self, msg):
        """Convert a Message object to Anthropic format."""
        if msg.role == self.ROLE_TOOL:
            return self._create_tool_result_message(msg.tool_call_id, msg.content)
        elif msg.role == self.ROLE_ASSISTANT and msg.tool_calls:
            return self._create_assistant_tool_message(msg.content, msg.tool_calls)
        return {"role": msg.role, "content": msg.content}

    def _create_tool_result_message(self, tool_call_id, content):
        """Create a tool result message in Anthropic format (sent with the user role)."""
        return {
            "role": self.ROLE_USER,
            "content": [
                {
                    "type": "tool_result",
                    "tool_use_id": tool_call_id,
                    "content": content,
                }
            ],
        }

    def _create_assistant_tool_message(self, content, tool_calls):
        """
        Create an assistant message with tool calls in Anthropic format.

        Args:
            content: Optional assistant text; emitted as a leading text block
            tool_calls: Iterable of tool calls, each a dict or an object with
                ``id`` and ``function.name`` / ``function.arguments``

        Returns:
            Assistant message whose content is a list of text/tool_use blocks
        """
        message_content = []
        if content:
            message_content.append({"type": "text", "text": content})

        for tool_call in tool_calls:
            if isinstance(tool_call, dict):
                call_id = tool_call["id"]
                name = tool_call["function"]["name"]
                tool_input = tool_call["function"]["arguments"]
            else:
                call_id = tool_call.id
                name = tool_call.function.name
                tool_input = tool_call.function.arguments

            message_content.append(
                {
                    "type": "tool_use",
                    "id": call_id,
                    "name": name,
                    # Arguments normally arrive as a JSON string; accept an
                    # already-decoded dict as well.
                    "input": (
                        tool_input
                        if isinstance(tool_input, dict)
                        else json.loads(tool_input)
                    ),
                }
            )

        return {"role": self.ROLE_ASSISTANT, "content": message_content}

    def _extract_system_message(self, messages):
        """
        Extract system message if present, otherwise return empty list.

        NOTE: when a leading system message is found it is removed from
        ``messages`` in place; callers that must keep their list intact
        should pass a copy.
        """
        # TODO: This is a temporary solution to extract the system message.
        # Users can pass multiple system messages, which can be mingled with
        # other messages. This needs to be fixed to handle that case.
        if not messages:
            return []

        first = messages[0]
        # The first message may be a dict or a Message object.
        if isinstance(first, dict):
            role, content = first.get("role"), first.get("content")
        else:
            role = getattr(first, "role", None)
            content = getattr(first, "content", None)

        if role == self.ROLE_SYSTEM:
            messages.pop(0)
            return content
        return []

    def _get_finish_reason(self, response):
        """Get the normalized finish reason; unknown stop reasons map to "stop"."""
        return self.FINISH_REASON_MAPPING.get(response.stop_reason, "stop")

    def _get_completion_usage(self, response):
        """Get the usage statistics."""
        return CompletionUsage(
            completion_tokens=response.usage.output_tokens,
            prompt_tokens=response.usage.input_tokens,
            total_tokens=response.usage.input_tokens + response.usage.output_tokens,
            prompt_tokens_details=PromptTokensDetails(
                cached_tokens=response.usage.cache_read_input_tokens,
            ),
        )

    def _get_message(self, response):
        """Get the appropriate message based on response type."""
        # Check if response contains any tool use blocks (regardless of stop_reason)
        has_tool_use = any(content.type == "tool_use" for content in response.content)

        if has_tool_use:
            tool_message = self.convert_response_with_tool_use(response)
            if tool_message:
                return tool_message

        # Safely extract text content from any position in content blocks
        text_content = next(
            (content.text for content in response.content if content.type == "text"),
            "",
        )

        return Message(
            content=text_content or None,
            role="assistant",
            tool_calls=None,
            refusal=None,
        )

    def convert_response_with_tool_use(self, response):
        """
        Convert Anthropic tool use response to the framework's format.

        Every ``tool_use`` block in the response becomes one tool call, in
        the order the blocks appear, so none of them is dropped when the
        response contains more than one.

        Returns:
            A Message carrying the tool calls (and the first text block, if
            any), or None when the response has no tool_use block.
        """
        tool_calls = [
            ChatCompletionMessageToolCall(
                id=block.id,
                function=Function(
                    name=block.name, arguments=json.dumps(block.input)
                ),
                type="function",
            )
            for block in response.content
            if block.type == "tool_use"
        ]

        if not tool_calls:
            return None

        text_content = next(
            (content.text for content in response.content if content.type == "text"),
            "",
        )

        return Message(
            content=text_content or None,
            tool_calls=tool_calls,
            role="assistant",
            refusal=None,
        )

    def convert_tool_spec(self, openai_tools):
        """
        Convert OpenAI tool specification to Anthropic format.

        Entries whose "type" is not "function" are skipped. A missing
        description or parameters block is tolerated and becomes an empty
        description / empty object schema.
        """
        anthropic_tools = []

        for tool in openai_tools:
            if tool.get("type") != "function":
                continue

            function = tool["function"]
            parameters = function.get("parameters") or {}
            anthropic_tool = {
                "name": function["name"],
                "description": function.get("description", ""),
                "input_schema": {
                    "type": "object",
                    "properties": parameters.get("properties", {}),
                    "required": parameters.get("required", []),
                },
            }
            anthropic_tools.append(anthropic_tool)

        return anthropic_tools


class AnthropicProvider(Provider):
    """Provider that sends chat completions to Anthropic via the ``anthropic`` client."""

    def __init__(self, **config):
        """
        Initialize the Anthropic provider with the given configuration.

        Args:
            **config: Keyword arguments forwarded to ``anthropic.Anthropic``
        """
        # Run the base initializer so that attributes it defines (such as
        # ``audio``) exist on this instance.
        super().__init__()
        self.client = anthropic.Anthropic(**config)
        self.converter = AnthropicMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Create a chat completion using the Anthropic API.

        Args:
            model: Model identifier passed to the API
            messages: Framework-format messages; converted before sending
            **kwargs: Extra request options (see _prepare_kwargs)

        Returns:
            The API response normalized by the converter
        """
        kwargs = self._prepare_kwargs(kwargs)
        system_message, converted_messages = self.converter.convert_request(messages)

        response = self.client.messages.create(
            model=model, system=system_message, messages=converted_messages, **kwargs
        )
        return self.converter.convert_response(response)

    def _prepare_kwargs(self, kwargs):
        """
        Prepare kwargs for the API call.

        Works on a copy of ``kwargs``: fills in ``max_tokens`` with
        DEFAULT_MAX_TOKENS when absent and converts an OpenAI-style "tools"
        entry to Anthropic's tool format.
        """
        kwargs = kwargs.copy()
        kwargs.setdefault("max_tokens", DEFAULT_MAX_TOKENS)

        if "tools" in kwargs:
            kwargs["tools"] = self.converter.convert_tool_spec(kwargs["tools"])

        return kwargs


================================================
FILE: aisuite/providers/aws_provider.py
================================================
"""AWS Bedrock provider for the aisuite."""

import os
import json
from typing import List, Dict, Any, Tuple, Optional

import boto3
import botocore

from aisuite.provider import Provider, LLMError
from aisuite.framework import ChatCompletionResponse
from aisuite.framework.message import Message, CompletionUsage


# pylint: disable=too-few-public-methods
class BedrockConfig:
    """Settings holder used to build the AWS Bedrock runtime client."""

    # Request keys that are routed into the Bedrock inference configuration.
    INFERENCE_PARAMETERS = ["maxTokens", "temperature", "topP", "stopSequences"]

    def __init__(self, **config):
        """
        Initialize the BedrockConfig.

        The region is taken from ``config["region_name"]`` when given,
        otherwise from the AWS_REGION environment variable, otherwise
        "us-west-2".
        """
        env_region = os.getenv("AWS_REGION", "us-west-2")
        self.region_name = config.get("region_name", env_region)

    def create_client(self):
        """Create a Bedrock runtime client for the configured region."""
        return boto3.client("bedrock-runtime", region_name=self.region_name)


# AWS Bedrock API Example -
# https://docs.aws.amazon.com/bedrock/latest/userguide/tool-use-inference-call.html
# https://docs.aws.amazon.com/bedrock/latest/userguide/tool-use-examples.html
class BedrockMessageConverter:
    """Converts messages between OpenAI and AWS Bedrock formats."""

    # Bedrock stopReason -> OpenAI finish_reason. Stop reasons that are not
    # listed here are passed through unchanged.
    FINISH_REASON_MAPPING = {
        "end_turn": "stop",
        "stop_sequence": "stop",
        "complete": "stop",
        "max_tokens": "length",
    }

    @staticmethod
    def convert_request(
        messages: List[Dict[str, Any]],
    ) -> Tuple[List[Dict], List[Dict]]:
        """
        Convert messages to AWS Bedrock format.

        Args:
            messages: OpenAI-style messages as dicts or objects exposing
                ``model_dump()``

        Returns:
            Tuple of (system_message, formatted_messages). system_message is
            a one-element list holding the text of a leading system message,
            or an empty list. System messages in later positions are skipped.
        """
        # Convert all messages to dicts if they're Message objects
        messages = [
            message.model_dump() if hasattr(message, "model_dump") else message
            for message in messages
        ]

        # Handle system message
        system_message = []
        if messages and messages[0]["role"] == "system":
            system_message = [{"text": messages[0]["content"]}]
            messages = messages[1:]

        formatted_messages = []
        for message in messages:
            # Skip any additional system messages
            if message["role"] == "system":
                continue

            if message["role"] == "tool":
                bedrock_message = BedrockMessageConverter.convert_tool_result(message)
                if bedrock_message:
                    formatted_messages.append(bedrock_message)
            elif message["role"] == "assistant":
                bedrock_message = BedrockMessageConverter.convert_assistant(message)
                if bedrock_message:
                    formatted_messages.append(bedrock_message)
            else:  # user messages
                formatted_messages.append(
                    {
                        "role": message["role"],
                        "content": [{"text": message["content"]}],
                    }
                )

        return system_message, formatted_messages

    @staticmethod
    def convert_response_tool_call(
        response: Dict[str, Any],
    ) -> Optional[Dict[str, Any]]:
        """
        Convert AWS Bedrock tool call response to OpenAI format.

        Returns:
            An assistant message dict with one tool call per ``toolUse``
            block, or None when the stop reason is not "tool_use" or no
            ``toolUse`` block is present.
        """
        if response.get("stopReason") != "tool_use":
            return None

        tool_calls = []
        for content in response["output"]["message"]["content"]:
            if "toolUse" in content:
                tool = content["toolUse"]
                tool_calls.append(
                    {
                        "type": "function",
                        "id": tool["toolUseId"],
                        "function": {
                            "name": tool["name"],
                            "arguments": json.dumps(tool["input"]),
                        },
                    }
                )

        if not tool_calls:
            return None

        return {
            "role": "assistant",
            "content": None,
            "tool_calls": tool_calls,
            "refusal": None,
        }

    @staticmethod
    def convert_tool_result(message: Dict[str, Any]) -> Optional[Dict[str, Any]]:
        """
        Convert OpenAI tool result format to AWS Bedrock format.

        Content that parses as JSON is sent as a ``json`` block, anything
        else as a ``text`` block.

        Raises:
            LLMError: If the message has no ``tool_call_id``.
        """
        if message["role"] != "tool" or "content" not in message:
            return None

        tool_call_id = message.get("tool_call_id")
        if not tool_call_id:
            raise LLMError("Tool result message must include tool_call_id")

        try:
            content_json = json.loads(message["content"])
            content = [{"json": content_json}]
        except json.JSONDecodeError:
            content = [{"text": message["content"]}]

        return {
            "role": "user",
            "content": [
                {"toolResult": {"toolUseId": tool_call_id, "content": content}}
            ],
        }

    @staticmethod
    def convert_assistant(message: Dict[str, Any]) -> Optional[Dict[str, Any]]:
        """
        Convert OpenAI assistant format to AWS Bedrock format.

        Returns:
            An assistant message with text and/or ``toolUse`` blocks, or None
            when the message is not an assistant message or yields no blocks.
        """
        if message["role"] != "assistant":
            return None

        content = []

        if message.get("content"):
            content.append({"text": message["content"]})

        if message.get("tool_calls"):
            for tool_call in message["tool_calls"]:
                if tool_call["type"] == "function":
                    try:
                        input_json = json.loads(tool_call["function"]["arguments"])
                    except json.JSONDecodeError:
                        # Arguments that are not valid JSON are forwarded as-is.
                        input_json = tool_call["function"]["arguments"]

                    content.append(
                        {
                            "toolUse": {
                                "toolUseId": tool_call["id"],
                                "name": tool_call["function"]["name"],
                                "input": input_json,
                            }
                        }
                    )

        return {"role": "assistant", "content": content} if content else None

    @staticmethod
    def convert_response(response: Dict[str, Any]) -> ChatCompletionResponse:
        """
        Normalize the response from the Bedrock API to match OpenAI's response format.

        Usage data, when present, is attached for both tool-call and plain
        text responses.
        """
        norm_response = ChatCompletionResponse()

        # Parse usage first so the early return for tool calls below does not
        # skip it.
        if usage_data := response.get("usage"):
            norm_response.usage = BedrockMessageConverter.get_completion_usage(
                usage_data
            )

        # Check if the model is requesting tool use
        if response.get("stopReason") == "tool_use":
            tool_message = BedrockMessageConverter.convert_response_tool_call(response)
            if tool_message:
                norm_response.choices[0].message = Message(**tool_message)
                norm_response.choices[0].finish_reason = "tool_calls"
                return norm_response

        # Handle regular text response: take the first block that carries
        # text rather than assuming it is the first block in the list.
        content_blocks = response["output"]["message"]["content"]
        norm_response.choices[0].message.content = next(
            (block["text"] for block in content_blocks if "text" in block),
            None,
        )

        # Map Bedrock stopReason to OpenAI finish_reason
        stop_reason = response.get("stopReason")
        norm_response.choices[0].finish_reason = (
            BedrockMessageConverter.FINISH_REASON_MAPPING.get(stop_reason, stop_reason)
        )

        return norm_response

    @staticmethod
    def get_completion_usage(usage_data: dict):
        """Get the usage statistics from a usage data dictionary."""
        return CompletionUsage(
            completion_tokens=usage_data.get("outputTokens"),
            prompt_tokens=usage_data.get("inputTokens"),
            total_tokens=usage_data.get("totalTokens"),
        )


class AwsProvider(Provider):
    """Chat-completion provider that talks to AWS Bedrock via ``converse``."""

    def __init__(self, **config):
        """Create the Bedrock config, client and message converter from ``config``."""
        self.config = BedrockConfig(**config)
        self.client = self.config.create_client()
        self.transformer = BedrockMessageConverter()

    def convert_response(self, response: Dict[str, Any]) -> ChatCompletionResponse:
        """Translate a raw Bedrock response into the OpenAI-style response object."""
        return self.transformer.convert_response(response)

    def _convert_tool_spec(self, kwargs: Dict[str, Any]) -> Optional[Dict[str, Any]]:
        """Build Bedrock's tool configuration from OpenAI-style ``tools``.

        Returns ``None`` when ``kwargs`` has no ``tools`` entry. A tool without a
        description gets a single space as its description.
        """
        if "tools" not in kwargs:
            return None

        bedrock_tools = []
        for tool in kwargs["tools"]:
            function = tool["function"]
            bedrock_tools.append(
                {
                    "toolSpec": {
                        "name": function["name"],
                        "description": function.get("description", " "),
                        "inputSchema": {"json": function["parameters"]},
                    }
                }
            )
        return {"tools": bedrock_tools}

    def _prepare_request_config(self, kwargs: Dict[str, Any]) -> Dict[str, Any]:
        """Split ``kwargs`` into the keyword arguments expected by ``converse``.

        ``tools`` is converted and removed from ``kwargs``; the remaining keys
        are routed to ``inferenceConfig`` when listed in
        ``BedrockConfig.INFERENCE_PARAMETERS`` and to
        ``additionalModelRequestFields`` otherwise.
        """
        tool_config = self._convert_tool_spec(kwargs)
        # Tools travel in their own ``toolConfig`` entry, not as a model field.
        kwargs.pop("tools", None)

        known_params = BedrockConfig.INFERENCE_PARAMETERS

        inference_config = {}
        for name in known_params:
            if name in kwargs:
                inference_config[name] = kwargs[name]

        additional_fields = {}
        for name, value in kwargs.items():
            if name not in known_params:
                additional_fields[name] = value

        request_config = {
            "inferenceConfig": inference_config,
            "additionalModelRequestFields": additional_fields,
        }
        if tool_config is not None:
            request_config["toolConfig"] = tool_config
        return request_config

    def chat_completions_create(
        self, model: str, messages: List[Dict[str, Any]], **kwargs
    ) -> ChatCompletionResponse:
        """Send a chat completion request to AWS Bedrock and normalize the reply.

        Raises:
            LLMError: When Bedrock rejects the request with a
                ``ValidationException``. Other client errors propagate unchanged.
        """
        system_message, formatted_messages = self.transformer.convert_request(messages)
        request_config = self._prepare_request_config(kwargs)

        try:
            response = self.client.converse(
                modelId=model,
                messages=formatted_messages,
                system=system_message,
                **request_config,
            )
        except botocore.exceptions.ClientError as e:
            error = e.response["Error"]
            if error["Code"] != "ValidationException":
                raise
            raise LLMError(error["Message"]) from e

        return self.convert_response(response)


================================================
FILE: aisuite/providers/azure_provider.py
================================================
import urllib.request
import json
import os

from aisuite.provider import Provider
from aisuite.framework import ChatCompletionResponse
from aisuite.framework.message import Message, ChatCompletionMessageToolCall, Function

# Azure provider is based on the documentation here -
# https://learn.microsoft.com/en-us/azure/machine-learning/reference-model-inference-api?view=azureml-api-2&source=recommendations&tabs=python
# Azure AI Model Inference API is used.
# From the documentation -
# """
# The Azure AI Model Inference is an API that exposes a common set of capabilities for foundational models
# and that can be used by developers to consume predictions from a diverse set of models in a uniform and consistent way.
# Developers can talk with different models deployed in Azure AI Foundry portal without changing the underlying code they are using.
#
# The Azure AI Model Inference API is available in the following models:
#
# Models deployed to serverless API endpoints:
#   Cohere Embed V3 family of models
#   Cohere Command R family of models
#   Meta Llama 2 chat family of models
#   Meta Llama 3 instruct family of models
#   Mistral-Small
#   Mistral-Large
#   Jais family of models
#   Jamba family of models
#   Phi-3 family of models
#
# Models deployed to managed inference:
#   Meta Llama 3 instruct family of models
#   Phi-3 family of models
#   Mixtral family of models
#
# The API is compatible with Azure OpenAI model deployments.
# """


class AzureMessageConverter:
    """Convert messages and responses between aisuite and the Azure API."""

    @staticmethod
    def convert_request(messages):
        """Return ``messages`` with ``Message`` objects dumped to JSON-ready dicts.

        Entries that are not ``Message`` instances are passed through unchanged.
        """
        return [
            message.model_dump(mode="json") if isinstance(message, Message) else message
            for message in messages
        ]

    @staticmethod
    def convert_response(resp_json) -> ChatCompletionResponse:
        """Build an OpenAI-style response from the first choice of ``resp_json``."""
        completion_response = ChatCompletionResponse()
        azure_message = resp_json["choices"][0]["message"]
        first_choice = completion_response.choices[0]

        # Basic message fields; the role falls back to "assistant" when absent.
        first_choice.message.content = azure_message.get("content")
        first_choice.message.role = azure_message.get("role", "assistant")

        # Tool calls are copied over only when the key is present and not None.
        raw_tool_calls = azure_message.get("tool_calls")
        if raw_tool_calls is not None:
            converted_calls = []
            for raw_call in raw_tool_calls:
                raw_function = raw_call["function"]
                converted_calls.append(
                    ChatCompletionMessageToolCall(
                        id=raw_call["id"],
                        type=raw_call["type"],
                        function={
                            "name": raw_function["name"],
                            "arguments": raw_function["arguments"],
                        },
                    )
                )
            first_choice.message.tool_calls = converted_calls

        return completion_response


class AzureProvider(Provider):
    """Provider that posts chat completion requests to an Azure endpoint."""

    def __init__(self, **config):
        """Read connection settings from ``config`` or the environment.

        ``base_url``, ``api_key`` and ``api_version`` fall back to the
        ``AZURE_BASE_URL``, ``AZURE_API_KEY`` and ``AZURE_API_VERSION``
        environment variables respectively.

        Raises:
            ValueError: If no API key or no base URL can be determined.
        """
        self.base_url = config.get("base_url") or os.getenv("AZURE_BASE_URL")
        self.api_key = config.get("api_key") or os.getenv("AZURE_API_KEY")
        self.api_version = config.get("api_version") or os.getenv("AZURE_API_VERSION")
        if not self.api_key:
            raise ValueError("For Azure, api_key is required.")
        if not self.base_url:
            raise ValueError(
                "For Azure, base_url is required. Check your deployment page for a URL like this - https://<model-deployment-name>.<region>.models.ai.azure.com"
            )
        self.transformer = AzureMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """POST a chat completion request and return the normalized response.

        Args:
            model: Accepted for interface compatibility; this implementation
                does not include it in the request.
            messages: Conversation messages (dicts or ``Message`` objects).
            **kwargs: Extra request fields merged into the JSON payload.
                ``stream`` is discarded.

        Raises:
            Exception: When the endpoint answers with an HTTP error; the message
                carries the status code, response headers and response body.
        """
        # Strip trailing slashes so a base URL ending in "/" does not produce
        # ".../​/chat/completions" with an empty path segment.
        url = f"{self.base_url.rstrip('/')}/chat/completions"

        if self.api_version:
            url = f"{url}?api-version={self.api_version}"

        # Remove 'stream' from kwargs if present
        kwargs.pop("stream", None)

        # Transform messages using converter
        transformed_messages = self.transformer.convert_request(messages)

        # Prepare the request payload: messages first, then tool settings,
        # then every remaining keyword argument.
        data = {"messages": transformed_messages}
        for key in ("tools", "tool_choice"):
            if key in kwargs:
                data[key] = kwargs.pop(key)
        data.update(kwargs)

        body = json.dumps(data).encode("utf-8")
        headers = {"Content-Type": "application/json", "Authorization": self.api_key}

        try:
            req = urllib.request.Request(url, body, headers)
            with urllib.request.urlopen(req) as response:
                result = response.read()
                resp_json = json.loads(result)
                return self.transformer.convert_response(resp_json)

        except urllib.error.HTTPError as error:
            error_message = f"The request failed with status code: {error.code}\n"
            error_message += f"Headers: {error.info()}\n"
            error_message += error.read().decode("utf-8", "ignore")
            # Chain explicitly so the original HTTPError stays attached as the cause.
            raise Exception(error_message) from error


================================================
FILE: aisuite/providers/cerebras_provider.py
================================================
"""Cerebras provider for the aisuite."""

import cerebras.cloud.sdk as cerebras
from aisuite.provider import Provider, LLMError
from aisuite.providers.message_converter import OpenAICompliantMessageConverter


class CerebrasMessageConverter(OpenAICompliantMessageConverter):
    """Message converter for Cerebras.

    Currently adds nothing to ``OpenAICompliantMessageConverter``; it exists as
    the place for Cerebras-specific overrides should any become necessary.
    """


# pylint: disable=too-few-public-methods
class CerebrasProvider(Provider):
    """Chat-completion provider for Cerebras, built on the official SDK client."""

    def __init__(self, **config):
        """Create the Cerebras SDK client from ``config`` and the response converter."""
        self.client = cerebras.Cerebras(**config)
        self.transformer = CerebrasMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Call the Cerebras chat completions endpoint and normalize the response.

        Permission, authentication and rate-limit errors from the SDK propagate
        unchanged; any other exception is wrapped in ``LLMError``.
        """
        try:
            # Extra keyword arguments are forwarded to the Cerebras API as-is.
            raw_response = self.client.chat.completions.create(
                model=model, messages=messages, **kwargs
            )
            return self.transformer.convert_response(raw_response.model_dump())
        except (
            cerebras.PermissionDeniedError,
            cerebras.AuthenticationError,
            cerebras.RateLimitError,
        ):
            # Cerebras API-specific exceptions are re-raised untouched.
            raise
        except Exception as e:
            raise LLMError(f"An error occurred: {e}") from e


================================================
FILE: aisuite/providers/cohere_provider.py
================================================
import os
import cohere
import json
from aisuite.framework import ChatCompletionResponse
from aisuite.framework.message import Message, ChatCompletionMessageToolCall, Function
from aisuite.provider import Provider, LLMError


class CohereMessageConverter:
    """
    Cohere-specific message converter
    """

    def convert_request(self, messages):
        """Convert framework messages to Cohere format.

        Args:
            messages: Iterable of messages, each either a dict or an object
                exposing ``role``, ``content`` and ``tool_calls`` attributes.

        Returns:
            A list of dicts, one per input message, in input order.
        """
        converted_messages = []

        for message in messages:
            if isinstance(message, dict):
                role = message.get("role")
                content = message.get("content")
                tool_calls = message.get("tool_calls")
                tool_plan = message.get("tool_plan")
            else:
                role = message.role
                content = message.content
                tool_calls = message.tool_calls
                tool_plan = getattr(message, "tool_plan", None)

            # Convert to Cohere's format
            if role == "tool":
                # Handle tool response messages
                converted_message = {
                    "role": role,
                    "tool_call_id": (
                        message.get("tool_call_id")
                        if isinstance(message, dict)
                        else message.tool_call_id
                    ),
                    "content": self._convert_tool_content(content),
                }
            elif role == "assistant" and tool_calls:
                # Handle assistant messages with tool calls; each call may be a
                # dict or an object with ``id`` / ``function`` attributes.
                converted_message = {
                    "role": role,
                    "tool_calls": [
                        {
                            "id": tc.id if not isinstance(tc, dict) else tc["id"],
                            "function": {
                                "name": (
                                    tc.function.name
                                    if not isinstance(tc, dict)
                                    else tc["function"]["name"]
                                ),
                                "arguments": (
                                    tc.function.arguments
                                    if not isinstance(tc, dict)
                                    else tc["function"]["arguments"]
                                ),
                            },
                            "type": "function",
                        }
                        for tc in tool_calls
                    ],
                    "tool_plan": tool_plan,
                }
                # Content is only attached when it is non-empty.
                if content:
                    converted_message["content"] = content
            else:
                # Handle regular messages
                converted_message = {"role": role, "content": content}

            converted_messages.append(converted_message)

        return converted_messages

    def _convert_tool_content(self, content):
        """Convert tool response content to Cohere's expected format.

        A string that parses as JSON becomes a single ``document`` entry holding
        the re-serialized JSON; any other string and any list are returned
        unchanged; every other value is converted with ``str``.
        """
        if isinstance(content, str):
            try:
                # Try to parse as JSON first
                data = json.loads(content)
                return [{"type": "document", "document": {"data": json.dumps(data)}}]
            except json.JSONDecodeError:
                # If not JSON, return as plain text
                return content
        elif isinstance(content, list):
            # If content is already in Cohere's format, return as is
            return content
        else:
            # For other types, convert to string
            return str(content)

    @staticmethod
    def convert_response(response_data) -> ChatCompletionResponse:
        """Convert Cohere's response to our standard format.

        Token usage is always copied. When the finish reason is ``TOOL_CALL``,
        every tool call in the response is converted (in order) and the tool
        plan becomes the message content; otherwise the text of the first
        content item is used and the finish reason is reported as ``stop``.
        """
        normalized_response = ChatCompletionResponse()

        # Set usage information
        tokens = response_data.usage.tokens
        normalized_response.usage = {
            "prompt_tokens": tokens.input_tokens,
            "completion_tokens": tokens.output_tokens,
            "total_tokens": tokens.input_tokens + tokens.output_tokens,
        }

        # Handle tool calls
        if response_data.finish_reason == "TOOL_CALL":
            # Convert every requested tool call, not just the first one, so
            # that multiple calls in a single response are not dropped.
            tool_call_objs = [
                ChatCompletionMessageToolCall(
                    id=tool_call.id,
                    function=Function(
                        name=tool_call.function.name,
                        arguments=tool_call.function.arguments,
                    ),
                    type="function",
                )
                for tool_call in response_data.message.tool_calls
            ]
            normalized_response.choices[0].message = Message(
                content=response_data.message.tool_plan,  # Use tool_plan as content
                tool_calls=tool_call_objs,
                role="assistant",
                refusal=None,
            )
            normalized_response.choices[0].finish_reason = "tool_calls"
        else:
            # Handle regular text response
            normalized_response.choices[0].message.content = (
                response_data.message.content[0].text
            )
            normalized_response.choices[0].finish_reason = "stop"

        return normalized_response


class CohereProvider(Provider):
    """Chat-completion provider for Cohere, built on the official v2 client."""

    def __init__(self, **config):
        """
        Initialize the Cohere provider with the given configuration.
        Pass the entire configuration dictionary to the Cohere client constructor.

        Raises:
            ValueError: If no API key is given in ``config`` or ``CO_API_KEY``.
        """
        # Fall back to the environment whenever the configured key is missing
        # or empty (including an explicit ``api_key=None``).
        config["api_key"] = config.get("api_key") or os.getenv("CO_API_KEY")
        if not config["api_key"]:
            raise ValueError(
                "Cohere API key is missing. Please provide it in the config or set the CO_API_KEY environment variable."
            )
        self.client = cohere.ClientV2(**config)
        self.transformer = CohereMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Makes a request to Cohere using the official client.

        Raises:
            LLMError: Wrapping any exception raised while converting the
                messages, calling the API or converting the response.
        """
        try:
            # Transform messages using converter
            transformed_messages = self.transformer.convert_request(messages)

            # Make the request to Cohere
            response = self.client.chat(
                model=model, messages=transformed_messages, **kwargs
            )

            return self.transformer.convert_response(response)
        except Exception as e:
            # Chain the original exception so its traceback is kept as the cause.
            raise LLMError(f"An error occurred: {e}") from e


================================================
FILE: aisuite/providers/deepgram_provider.py
================================================
import os
import json
import numpy as np
import queue
import threading
import time
from typing import Union, BinaryIO, AsyncGenerator

from aisuite.provider import Provider, ASRError, Audio
from aisuite.framework.message import (
    TranscriptionResult,
    Segment,
    Word,
    Alternative,
    Channel,
    StreamingTranscriptionChunk,
)


class DeepgramProvider(Provider):
    """Deepgram ASR provider."""

    def __init__(self, **config):
        """Initialize the Deepgram provider with the given configuration.

        The API key is read from ``config["api_key"]`` or, failing that, the
        ``DEEPGRAM_API_KEY`` environment variable.

        Raises:
            ValueError: If no API key is available.
            ImportError: If the Deepgram SDK cannot be imported.
        """
        super().__init__()

        # Ensure API key is provided either in config or via environment variable
        self.api_key = config.get("api_key") or os.getenv("DEEPGRAM_API_KEY")
        if not self.api_key:
            raise ValueError(
                "Deepgram API key is missing. Please provide it in the config or set the DEEPGRAM_API_KEY environment variable."
            )

        # Initialize Deepgram client (v5.0.0+); imported lazily so the SDK is
        # only needed when this provider is actually instantiated.
        try:
            from deepgram import DeepgramClient

            self.client = DeepgramClient(api_key=self.api_key)
        except ImportError as exc:
            raise ImportError(
                "Deepgram SDK is required. Install it with: pip install deepgram-sdk"
            ) from exc

        # Initialize audio functionality
        self.audio = DeepgramAudio(self.client)

    def chat_completions_create(self, model, messages, **kwargs):
        """Deepgram does not support chat completions.

        Extra keyword arguments are accepted (and ignored) so that a call made
        with additional parameters fails with ``NotImplementedError`` rather
        than a ``TypeError`` about unexpected arguments.
        """
        raise NotImplementedError(
            "Deepgram provider only supports audio transcription, not chat completions."
        )


# Audio Classes
class DeepgramAudio(Audio):
    """Deepgram Audio functionality container."""

    def __init__(self, client):
        """Expose transcription functionality bound to the given Deepgram client."""
        super().__init__()
        self.transcriptions = self.Transcriptions(client)

    class Transcriptions(Audio.Transcription):
        """Deepgram Audio Transcriptions functionality."""

        def __init__(self, client):
            """Store the Deepgram SDK client used for all requests."""
            self.client = client

        def create(
            self,
            model: str,
            file: Union[str, BinaryIO],
            **kwargs,
        ) -> TranscriptionResult:
            """
            Create audio transcription using Deepgram SDK v5.

            All parameters are already validated and mapped by the Client layer.
            This is a simple pass-through to the Deepgram API.

            Raises:
                ASRError: Wrapping any failure while reading the audio, calling
                    the API or parsing the response.
            """
            try:
                # Add model to params and set defaults
                kwargs["model"] = model
                kwargs.setdefault("smart_format", True)
                kwargs.setdefault("punctuate", True)
                kwargs.setdefault("language", "en")

                # Get audio bytes
                audio_bytes = self._prepare_audio_payload(file)

                # Use v5 API: client.listen.v1.media.transcribe_file()
                # All parameters passed as kwargs, no PrerecordedOptions needed
                response = self.client.listen.v1.media.transcribe_file(
                    request=audio_bytes, **kwargs
                )

                # Convert the response object to a dict, trying the known
                # serialization methods in turn; fall back to the object itself.
                if hasattr(response, "model_dump"):
                    response_dict = response.model_dump()
                elif hasattr(response, "to_dict"):
                    response_dict = response.to_dict()
                elif hasattr(response, "dict"):
                    response_dict = response.dict()
                else:
                    response_dict = response

                return self._parse_deepgram_response(response_dict)

            except Exception as e:
                raise ASRError(f"Deepgram transcription error: {e}") from e

        async def create_stream_output(
            self,
            model: str,
            file: Union[str, BinaryIO],
            chunk_size_minutes: float = 3.0,
            **kwargs,
        ) -> AsyncGenerator[StreamingTranscriptionChunk, None]:
            """
            Create streaming audio transcription using Deepgram SDK v5 with chunked processing.

            All parameters are already validated and mapped by the Client layer.
            This implementation handles audio chunking and streaming.

            Yields:
                ``StreamingTranscriptionChunk`` objects for every non-empty
                transcript event received from the connection.

            Raises:
                ASRError: On audio loading, connection or streaming failures.
            """
            try:
                # Load and prepare audio
                audio_data, sample_rate = await self._load_and_prepare_audio(file)

                # Calculate chunking strategy
                duration_seconds = len(audio_data) / sample_rate
                chunk_duration_seconds = chunk_size_minutes * 60

                if duration_seconds <= chunk_duration_seconds:
                    chunks = [audio_data]
                else:
                    chunk_size_samples = int(chunk_duration_seconds * sample_rate)
                    chunks = []
                    num_chunks = int(np.ceil(duration_seconds / chunk_duration_seconds))
                    for i in range(num_chunks):
                        start_sample = i * chunk_size_samples
                        end_sample = min(
                            start_sample + chunk_size_samples, len(audio_data)
                        )
                        chunks.append(audio_data[start_sample:end_sample])

                # Setup API parameters for v5
                kwargs["model"] = model
                kwargs.setdefault("smart_format", "true")
                kwargs.setdefault("punctuate", "true")
                kwargs.setdefault("language", "en")
                kwargs["interim_results"] = "true"  # Enable interim results for streaming

                # Remove parameters not supported by streaming
                kwargs.pop("utterances", None)

                # Add critical audio format parameters (as strings for v5)
                kwargs["encoding"] = "linear16"  # PCM16 format
                kwargs["sample_rate"] = "16000"  # Match our target sample rate
                kwargs["channels"] = "1"  # Mono audio

                # Use thread-safe queue for cross-thread communication
                transcript_queue = queue.Queue()
                connection_closed = threading.Event()

                def on_message(*args, **message_kwargs):
                    """Handle transcript events"""
                    # Extract result from args or kwargs
                    result = None
                    if len(args) >= 2:
                        result = args[1]
                    elif "result" in message_kwargs:
                        result = message_kwargs["result"]
                    else:
                        return

                    if hasattr(result, "channel") and result.channel.alternatives:
                        alt = result.channel.alternatives[0]
                        if alt.transcript:
                            chunk = StreamingTranscriptionChunk(
                                text=alt.transcript,
                                is_final=getattr(result, "is_final", False),
                                confidence=getattr(alt, "confidence", None),
                            )
                            transcript_queue.put(chunk)

                def on_error(*args, **error_kwargs):
                    """Handle error events"""
                    error = None
                    if len(args) >= 2:
                        error = args[1]
                    elif "error" in error_kwargs:
                        error = error_kwargs["error"]

                    if error:
                        # Errors travel through the same queue and are raised
                        # by the consumer loop below.
                        transcript_queue.put(
                            ASRError(f"Deepgram streaming error: {error}")
                        )

                def on_close(*args, **close_kwargs):
                    """Handle connection close events"""
                    connection_closed.set()

                # Use v5 streaming API with context manager
                from deepgram.core.events import EventType

                async with self.client.listen.v1.connect(**kwargs) as connection:
                    # Register event handlers
                    connection.on(EventType.Transcript, on_message)
                    connection.on(EventType.Error, on_error)
                    connection.on(EventType.Close, on_close)

                    # Send all chunks through connection
                    for audio_chunk in chunks:
                        self._send_audio_chunk(connection, audio_chunk)

                    # Send CloseStream message to signal end
                    close_stream_message = json.dumps({"type": "CloseStream"})
                    connection.send(close_stream_message)

                    # Yield results until connection closes
                    while not connection_closed.is_set():
                        try:
                            chunk = transcript_queue.get(timeout=0.1)
                            if isinstance(chunk, Exception):
                                raise chunk
                            yield chunk
                        except queue.Empty:
                            continue

                    # Get any remaining results
                    while not transcript_queue.empty():
                        try:
                            chunk = transcript_queue.get_nowait()
                            if isinstance(chunk, Exception):
                                raise chunk
                            yield chunk
                        except queue.Empty:
                            break

            except ASRError:
                # Already a provider-level error (audio loading or a queued
                # streaming error); re-raise as-is instead of wrapping it again.
                raise
            except Exception as e:
                raise ASRError(f"Deepgram streaming transcription error: {e}") from e

        def _prepare_audio_payload(self, file: Union[str, BinaryIO]) -> bytes:
            """Prepare audio payload for Deepgram API v5.

            Returns raw bytes instead of dict payload (v5 API change).

            Raises:
                ValueError: If ``file`` is neither a path string nor an object
                    with a ``read`` method.
            """
            if isinstance(file, str):
                with open(file, "rb") as audio_file:
                    buffer_data = audio_file.read()
            else:
                if hasattr(file, "read"):
                    buffer_data = file.read()
                else:
                    raise ValueError(
                        "File must be a file path string or file-like object"
                    )
            return buffer_data

        async def _load_and_prepare_audio(
            self, file: Union[str, BinaryIO]
        ) -> tuple[np.ndarray, int]:
            """Load and prepare audio file for streaming.

            Conversions performed only when necessary:
            - Stereo to mono: Required for multi-channel audio
            - Sample rate conversion: Required when input != 16kHz
            - Other formats: Error out as unsupported

            Returns:
                A tuple of the float32 sample array and the target sample rate
                (16000).

            Raises:
                ASRError: If a required library is missing, the channel layout
                    is unsupported, or the file cannot be read.
            """
            try:
                try:
                    import soundfile as sf
                except ImportError as exc:
                    raise ASRError(
                        "soundfile is required for audio processing. Install with: pip install soundfile"
                    ) from exc

                # The same call is used for both path strings and file-like objects.
                audio_data, original_sample_rate = sf.read(file)

                audio_data = np.asarray(audio_data, dtype=np.float32)

                # Convert to mono if stereo
                if len(audio_data.shape) > 1:
                    if audio_data.shape[1] == 2:
                        audio_data = np.mean(audio_data, axis=1)
                    else:
                        raise ASRError(
                            f"Unsupported audio format: {audio_data.shape[1]} channels. Only mono and stereo are supported."
                        )

                # Resample to 16kHz if needed
                target_sample_rate = 16000
                if original_sample_rate != target_sample_rate:
                    try:
                        from scipy import signal

                        num_samples = int(
                            len(audio_data) * target_sample_rate / original_sample_rate
                        )
                        audio_data = signal.resample(audio_data, num_samples)
                    except ImportError as exc:
                        raise ASRError(
                            f"Audio resampling required but scipy not available. "
                            f"Input is {original_sample_rate}Hz, need {target_sample_rate}Hz. "
                            f"Install scipy or provide audio at {target_sample_rate}Hz."
                        ) from exc

                return np.asarray(audio_data, dtype=np.float32), target_sample_rate

            except ASRError:
                raise
            except Exception as e:
                raise ASRError(f"Error loading audio file: {e}") from e

        def _send_audio_chunk(self, connection, audio_chunk: np.ndarray) -> None:
            """Send audio chunk data through the connection.

            The chunk is sent in fixed-size pieces of 16-bit PCM; the last piece
            is zero-padded to the full piece size.
            """
            streaming_chunk_size = 8000  # Match reference BLOCKSIZE (~0.5s @16kHz mono)
            send_delay = 0.01

            for i in range(0, len(audio_chunk), streaming_chunk_size):
                piece = audio_chunk[i : i + streaming_chunk_size]

                if len(piece) < streaming_chunk_size:
                    piece = np.pad(
                        piece, (0, streaming_chunk_size - len(piece)), mode="constant"
                    )

                # Clip to [-1, 1] before scaling: samples outside that range
                # (e.g. overshoot introduced by resampling) would otherwise
                # overflow the int16 conversion and wrap around.
                pcm16 = (
                    (np.clip(piece, -1.0, 1.0) * 32767).astype(np.int16).tobytes()
                )
                connection.send(pcm16)
                time.sleep(send_delay)  # Use synchronous sleep like reference

        def _parse_deepgram_response(self, response_dict: dict) -> TranscriptionResult:
            """Convert Deepgram API response to unified TranscriptionResult.

            Keys that are present but set to ``None`` (as a dumped response
            model can contain) are treated like missing keys for the
            containers this method iterates over.

            Raises:
                ASRError: If the response does not have the expected structure.
            """
            try:
                # ``x.get(key) or default`` rather than ``x.get(key, default)``:
                # the latter returns None when the key exists with a None value.
                results = response_dict.get("results") or {}
                channels = results.get("channels") or []

                if not channels or not channels[0].get("alternatives"):
                    return TranscriptionResult(
                        text="", language=None, confidence=None, task="transcribe"
                    )

                # The first alternative of the first channel is the primary result.
                best_alternative = channels[0]["alternatives"][0]
                text = best_alternative.get("transcript", "")
                confidence = best_alternative.get("confidence", None)

                words = [
                    Word(
                        word=word_data.get("word", ""),
                        start=word_data.get("start", None),
                        end=word_data.get("end", None),
                        confidence=word_data.get("confidence", None),
                    )
                    for word_data in best_alternative.get("words") or []
                ]

                # One segment per sentence of every paragraph, numbered in order.
                segments = []
                paragraph_data = results.get("paragraphs") or {}
                paragraphs = paragraph_data.get("paragraphs") or []
                for para in paragraphs:
                    for sentence in para.get("sentences") or []:
                        segments.append(
                            Segment(
                                id=len(segments),
                                seek=0,
                                start=sentence.get("start", None),
                                end=sentence.get("end", None),
                                text=sentence.get("text", ""),
                                tokens=[],
                                temperature=0.0,
                                avg_logprob=0.0,
                                compression_ratio=0.0,
                                no_speech_prob=0.0,
                            )
                        )

                # Remaining alternatives of the first channel (best one excluded).
                alternatives_list = [
                    Alternative(
                        transcript=alt.get("transcript", ""),
                        confidence=alt.get("confidence", None),
                    )
                    for alt in channels[0]["alternatives"][1:]
                ]

                channels_list = [
                    Channel(
                        alternatives=[
                            Alternative(
                                transcript=alt.get("transcript", ""),
                                confidence=alt.get("confidence", None),
                            )
                            for alt in channel.get("alternatives") or []
                        ]
                    )
                    for channel in channels
                ]

                metadata = response_dict.get("metadata", {})

                return TranscriptionResult(
                    text=text,
                    language=results.get("language", None),
                    confidence=confidence,
                    task="transcribe",
                    duration=metadata.get("duration", None) if metadata else None,
                    segments=segments or None,
                    words=words or None,
                    channels=channels_list or None,
                    alternatives=alternatives_list or None,
                    utterances=results.get("utterances", []),
                    paragraphs=results.get("paragraphs", None),
                    topics=results.get("topics", []),
                    intents=results.get("intents", []),
                    sentiment=results.get("sentiment", None),
                    summary=results.get("summary", None),
                    metadata=metadata,
                )

            except (KeyError, TypeError, IndexError) as e:
                raise ASRError(f"Error parsing Deepgram response: {e}") from e


================================================
FILE: aisuite/providers/deepseek_provider.py
================================================
"""Deepseek provider for the aisuite."""

import os
import openai
from aisuite.provider import Provider, LLMError
from aisuite.providers.message_converter import OpenAICompliantMessageConverter


# pylint: disable=too-few-public-methods
class DeepseekProvider(Provider):
    """Provider for DeepSeek, reached through the OpenAI-compatible client."""

    def __init__(self, **config):
        """
        Initialize the DeepSeek provider with the given configuration.

        The API key is read from ``config["api_key"]`` and, when that is absent
        or empty, from the ``DEEPSEEK_API_KEY`` environment variable. The whole
        configuration dictionary is then passed to the OpenAI client constructor
        with ``base_url`` forced to the DeepSeek endpoint.

        Raises:
            ValueError: If no API key is found in the config or the environment.
        """
        # Use `or` rather than setdefault so an explicit `api_key=None` still
        # falls back to the environment variable.
        config["api_key"] = config.get("api_key") or os.getenv("DEEPSEEK_API_KEY")
        if not config["api_key"]:
            raise ValueError(
                "DeepSeek API key is missing. Please provide it in the config or "
                "set the DEEPSEEK_API_KEY environment variable."
            )
        # The OpenAI client is reused as-is; only the endpoint differs, so the
        # base URL always points at DeepSeek regardless of what the caller passed.
        config["base_url"] = "https://api.deepseek.com"

        # Pass the entire config to the OpenAI client constructor
        self.client = openai.OpenAI(**config)
        # Using OpenAICompliantMessageConverter since DeepSeek's response format is
        # the same as OpenAI's.
        self.transformer = OpenAICompliantMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Request a chat completion from DeepSeek.

        Args:
            model: Model identifier forwarded to the API.
            messages: Chat history forwarded unchanged to the client.
            **kwargs: Additional arguments passed straight to the OpenAI client.

        Returns:
            The response converted by ``self.transformer.convert_response``.

        Raises:
            LLMError: Wrapping any exception raised by the client or the converter.
        """
        try:
            response = self.client.chat.completions.create(
                model=model,
                messages=messages,
                **kwargs,  # Pass any additional arguments to the OpenAI API
            )
            return self.transformer.convert_response(response.model_dump())
        except Exception as e:
            raise LLMError(f"An error occurred: {e}") from e


================================================
FILE: aisuite/providers/fireworks_provider.py
================================================
import os
import httpx
import json
from aisuite.provider import Provider, LLMError
from aisuite.framework import ChatCompletionResponse
from aisuite.framework.message import Message, ChatCompletionMessageToolCall


class FireworksMessageConverter:
    """Translate between aisuite messages and the Fireworks chat payload format."""

    @staticmethod
    def convert_request(messages):
        """
        Build the list of messages to send to Fireworks.

        ``Message`` instances are dumped to JSON-compatible dicts with the
        ``refusal`` key removed; anything else is forwarded untouched.
        """

        def _to_payload(entry):
            if not isinstance(entry, Message):
                return entry
            dumped = entry.model_dump(mode="json")
            dumped.pop("refusal", None)  # drop the refusal field when present
            return dumped

        return [_to_payload(entry) for entry in messages]

    @staticmethod
    def convert_response(resp_json) -> ChatCompletionResponse:
        """
        Map a Fireworks JSON response onto a ``ChatCompletionResponse``.

        Only the first choice is read. Content, role (defaulting to
        ``"assistant"``) and any tool calls are copied over.
        """
        normalized = ChatCompletionResponse()
        raw_message = resp_json["choices"][0]["message"]
        target = normalized.choices[0].message

        # Plain content and role
        target.content = raw_message.get("content")
        target.role = raw_message.get("role", "assistant")

        # Tool calls are copied only when the key exists with a non-None value
        raw_calls = raw_message.get("tool_calls")
        if raw_calls is not None:
            target.tool_calls = [
                ChatCompletionMessageToolCall(
                    id=call["id"],
                    type=call["type"],
                    function={
                        "name": call["function"]["name"],
                        "arguments": call["function"]["arguments"],
                    },
                )
                for call in raw_calls
            ]

        return normalized


# Models that support tool calls:
# [As of 01/20/2025 from https://docs.fireworks.ai/guides/function-calling]
# Llama 3.1 405B Instruct
# Llama 3.1 70B Instruct
# Qwen 2.5 72B Instruct
# Mixtral MoE 8x22B Instruct
# Firefunction-v2: Latest and most performant model, optimized for complex function calling scenarios (on-demand only)
# Firefunction-v1: Previous generation, Mixtral-based function calling model optimized for fast routing and structured output (on-demand only)
class FireworksProvider(Provider):
    """
    Fireworks AI Provider using httpx for direct API calls.
    """

    BASE_URL = "https://api.fireworks.ai/inference/v1/chat/completions"

    def __init__(self, **config):
        """
        Initialize the Fireworks provider with the given configuration.

        The API key is read from ``config["api_key"]`` and, when that is absent
        or empty, from the ``FIREWORKS_API_KEY`` environment variable. An
        optional ``timeout`` (seconds, default 30) is used for every request.

        Raises:
            ValueError: If no API key is found in the config or the environment.
        """
        # `or` (not a .get default) so an explicit `api_key=None` still falls
        # back to the environment variable.
        self.api_key = config.get("api_key") or os.getenv("FIREWORKS_API_KEY")
        if not self.api_key:
            raise ValueError(
                "Fireworks API key is missing. Please provide it in the config or set the FIREWORKS_API_KEY environment variable."
            )

        # Optionally set a custom timeout (default to 30s)
        self.timeout = config.get("timeout", 30)
        self.transformer = FireworksMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Make a request to the Fireworks AI chat completions endpoint using httpx.

        Args:
            model: Model identifier placed in the request payload.
            messages: Chat history; converted with ``self.transformer``.
            **kwargs: Extra payload fields (``tools``, ``tool_choice``, ...).
                A ``stream`` entry is discarded before the request is built.

        Returns:
            The response converted by ``self.transformer.convert_response``.

        Raises:
            LLMError: On a non-2xx HTTP status (message includes the status code,
                response headers and body) or on any other failure.
        """
        # Remove 'stream' from kwargs if present
        kwargs.pop("stream", None)

        # model/messages are named parameters, so kwargs can never collide with
        # them; tools, tool_choice and everything else are merged in as-is.
        data = {
            "model": model,
            "messages": self.transformer.convert_request(messages),
            **kwargs,
        }

        headers = {
            "Authorization": f"Bearer {self.api_key}",
            "Content-Type": "application/json",
        }

        try:
            # Make the request to Fireworks AI endpoint.
            response = httpx.post(
                self.BASE_URL, json=data, headers=headers, timeout=self.timeout
            )
            response.raise_for_status()
            return self.transformer.convert_response(response.json())
        except httpx.HTTPStatusError as error:
            # HTTPStatusError exposes the failing response via `.response`; the
            # status code and headers live on that object, not on the exception.
            failed = error.response
            error_message = (
                f"The request failed with status code: {failed.status_code}\n"
            )
            error_message += f"Headers: {failed.headers}\n"
            error_message += failed.text
            raise LLMError(error_message) from error
        except Exception as e:
            raise LLMError(f"An error occurred: {e}") from e

    def _normalize_response(self, response_data):
        """
        Normalize the response to a common format (ChatCompletionResponse).

        Copies only the first choice's message content.
        """
        normalized_response = ChatCompletionResponse()
        normalized_response.choices[0].message.content = response_data["choices"][0][
            "message"
        ]["content"]
        return normalized_response


================================================
FILE: aisuite/providers/google_provider.py
================================================
"""The interface to Google's Vertex AI."""

import os
import json
from typing import List, Dict, Any, Optional, Union, BinaryIO, AsyncGenerator

import vertexai
from vertexai.generative_models import (
    GenerativeModel,
    GenerationConfig,
    Content,
    Part,
    Tool,
    FunctionDeclaration,
)
import pprint

from aisuite.framework import ChatCompletionResponse, Message
from aisuite.framework.message import (
    TranscriptionResult,
    Word,
    Segment,
    Alternative,
    StreamingTranscriptionChunk,
)
from aisuite.provider import Provider, ASRError, Audio


# Sampling temperature used when the caller does not pass `temperature`.
DEFAULT_TEMPERATURE = 0.7
# When True, requests and responses are pretty-printed to stdout for debugging.
ENABLE_DEBUG_MESSAGES = False

# Links.
# https://codelabs.developers.google.com/codelabs/gemini-function-calling#6
# https://cloud.google.com/vertex-ai/generative-ai/docs/multimodal/function-calling#chat-samples


class GoogleMessageConverter:
    """Convert between OpenAI-style chat messages and Vertex AI objects."""

    @staticmethod
    def convert_user_role_message(message: Dict[str, Any]) -> Content:
        """Convert user or system messages to Google Vertex AI format."""
        parts = [Part.from_text(message["content"])]
        return Content(role="user", parts=parts)

    @staticmethod
    def convert_assistant_role_message(message: Dict[str, Any]) -> Content:
        """
        Convert assistant messages to Google Vertex AI format.

        A message carrying tool calls becomes a ``function_call`` part built
        from the first tool call only; any other message becomes a text part.
        The returned ``Content`` always has role ``model``.
        """
        if message.get("tool_calls"):
            # Assuming single function call for now
            function_call = message["tool_calls"][0]["function"]

            # NOTE(review): only the function name is replayed; the call
            # arguments are not forwarded to Vertex AI here.
            parts = [
                Part.from_dict(
                    {
                        "function_call": {
                            "name": function_call["name"],
                        }
                    }
                )
            ]
        else:
            # Handle regular text messages
            parts = [Part.from_text(message["content"])]

        return Content(role="model", parts=parts)

    @staticmethod
    def convert_tool_role_message(message: Dict[str, Any]) -> Part:
        """
        Convert tool messages to Google Vertex AI format.

        Raises:
            ValueError: If the message has no ``content`` field or the content
                is not valid JSON.
        """
        if "content" not in message:
            raise ValueError("Tool result message must have a content field")

        try:
            content_json = json.loads(message["content"])
        except json.JSONDecodeError as e:
            raise ValueError("Tool result message must be valid JSON") from e

        # TODO: Return Content instead of Part. But returning Content is not working.
        return Part.from_function_response(name=message["name"], response=content_json)

    @staticmethod
    def convert_request(messages: List[Dict[str, Any]]) -> List[Content]:
        """
        Convert messages to Google Vertex AI format.

        ``tool`` messages become function-response ``Part`` objects, while
        ``assistant`` and all remaining roles become ``Content`` objects, so the
        returned list may contain both kinds.
        """
        # Convert all messages to dicts if they're Message objects
        messages = [
            message.model_dump() if hasattr(message, "model_dump") else message
            for message in messages
        ]

        formatted_messages = []
        for message in messages:
            role = message["role"]
            if role == "tool":
                vertex_message = GoogleMessageConverter.convert_tool_role_message(
                    message
                )
                if vertex_message:
                    formatted_messages.append(vertex_message)
            elif role == "assistant":
                formatted_messages.append(
                    GoogleMessageConverter.convert_assistant_role_message(message)
                )
            else:  # user or system role
                formatted_messages.append(
                    GoogleMessageConverter.convert_user_role_message(message)
                )

        return formatted_messages

    @staticmethod
    def convert_response(response) -> ChatCompletionResponse:
        """
        Normalize the response from Vertex AI to match OpenAI's response format.

        Every part of the first candidate is scanned for a function call,
        because the model may emit a text part before the ``function_call``
        part. The first function call found is returned as a single tool call
        with ``finish_reason`` set to ``"tool_calls"``. When no part carries a
        function call, the first part's text is returned with ``finish_reason``
        set to ``"stop"``.
        """
        openai_response = ChatCompletionResponse()

        if ENABLE_DEBUG_MESSAGES:
            print("Dumping the response")
            pprint.pprint(response)

        parts = response.candidates[0].content.parts

        # Checking that the attribute exists is not enough: it must also be
        # truthy, so parts without a populated function call are skipped.
        function_call = next(
            (
                part.function_call
                for part in parts
                if getattr(part, "function_call", None)
            ),
            None,
        )

        if function_call:
            # args is a MapComposite; copy it into a plain dictionary.
            args_dict = {key: value for key, value in function_call.args.items()}
            if ENABLE_DEBUG_MESSAGES:
                print("Dumping the args_dict")
                pprint.pprint(args_dict)

            openai_response.choices[0].message = Message(
                role="assistant",
                content=None,
                tool_calls=[
                    {
                        "type": "function",
                        # ID derived from the function name
                        "id": f"call_{hash(function_call.name)}",
                        "function": {
                            "name": function_call.name,
                            "arguments": json.dumps(args_dict),
                        },
                    }
                ],
                refusal=None,
            )
            openai_response.choices[0].finish_reason = "tool_calls"
        else:
            # Handle regular text response
            openai_response.choices[0].message.content = parts[0].text
            openai_response.choices[0].finish_reason = "stop"

        return openai_response


class GoogleProvider(Provider):
    """Implements the ProviderInterface for interacting with Google's Vertex AI."""

    def __init__(self, **config):
        """
        Set up the Google AI client with a project ID.

        ``project_id``, ``region`` and ``application_credentials`` are read from
        the config, falling back to the ``GOOGLE_PROJECT_ID``, ``GOOGLE_REGION``
        and ``GOOGLE_APPLICATION_CREDENTIALS`` environment variables.

        Raises:
            EnvironmentError: If any of the three values is missing.
        """
        super().__init__()

        self.project_id = config.get("project_id") or os.getenv("GOOGLE_PROJECT_ID")
        self.location = config.get("region") or os.getenv("GOOGLE_REGION")
        self.app_creds_path = config.get("application_credentials") or os.getenv(
            "GOOGLE_APPLICATION_CREDENTIALS"
        )

        if not self.project_id or not self.location or not self.app_creds_path:
            raise EnvironmentError(
                "Missing one or more required Google environment variables: "
                "GOOGLE_PROJECT_ID, GOOGLE_REGION, GOOGLE_APPLICATION_CREDENTIALS. "
                "Please refer to the setup guide: /guides/google.md."
            )

        vertexai.init(project=self.project_id, location=self.location)

        self.transformer = GoogleMessageConverter()

        # Initialize Speech client lazily
        self._speech_client = None

        # Initialize audio functionality
        self.audio = GoogleAudio(self)

    @staticmethod
    def _build_function_declaration(tool):
        """Build a Vertex AI FunctionDeclaration from one OpenAI-style tool spec."""
        function_spec = tool["function"]
        # `parameters` is optional for functions that take no arguments.
        parameters = function_spec.get("parameters") or {}
        properties = {}
        for param_name, param_info in (parameters.get("properties") or {}).items():
            # Only type, description and enum are carried over per parameter.
            schema = {
                "type": param_info.get("type", "string"),
                "description": param_info.get("description", ""),
            }
            if "enum" in param_info:
                schema["enum"] = param_info["enum"]
            properties[param_name] = schema

        return FunctionDeclaration(
            name=function_spec["name"],
            description=function_spec.get("description", ""),
            parameters={
                "type": "object",
                "properties": properties,
                "required": parameters.get("required", []),
            },
        )

    def chat_completions_create(self, model, messages, **kwargs):
        """Request chat completions from the Google AI API.

        Args:
        ----
            model (str): Identifies the specific provider/model to use.
            messages (list of dict): A list of message objects in chat history.
            kwargs (dict): Optional arguments for the Google AI API. Only
                ``temperature`` and ``tools`` are read here.

        Returns:
        -------
            The ChatCompletionResponse with the completion result.

        Raises:
        ------
            ValueError: If ``messages`` is empty.

        """
        if not messages:
            raise ValueError("messages must contain at least one message")

        # Set the temperature if provided, otherwise use the default
        temperature = kwargs.get("temperature", DEFAULT_TEMPERATURE)

        # Convert messages to Vertex AI format
        message_history = self.transformer.convert_request(messages)

        # All declarations are grouped under a single Tool; a missing, None or
        # empty `tools` argument means no tools are attached.
        tools = None
        if kwargs.get("tools"):
            tools = [
                Tool(
                    function_declarations=[
                        self._build_function_declaration(tool)
                        for tool in kwargs["tools"]
                    ]
                )
            ]

        # Create the GenerativeModel
        generative_model = GenerativeModel(
            model,
            generation_config=GenerationConfig(temperature=temperature),
            tools=tools,
        )

        if ENABLE_DEBUG_MESSAGES:
            print("Dumping the message_history")
            pprint.pprint(message_history)

        # Everything but the last message seeds the chat history; the last one
        # is what actually gets sent.
        chat = generative_model.start_chat(history=message_history[:-1])
        last_message = message_history[-1]

        # If the last message is a function response, send the Part object directly
        # Otherwise, send just the text content
        if isinstance(last_message, Part):
            message_to_send = Content(role="function", parts=[last_message])
        else:
            message_to_send = last_message.parts[0].text
        response = chat.send_message(message_to_send)

        # Convert and return the response
        return self.transformer.convert_response(response)

    @property
    def speech_client(self):
        """Lazy initialization of Google Cloud Speech client.

        Raises:
            ImportError: If ``google-cloud-speech`` is not installed.
        """
        if self._speech_client is None:
            try:
                from google.cloud import speech

                self._speech_client = speech.SpeechClient()
            except ImportError as e:
                raise ImportError(
                    "google-cloud-speech is required for ASR functionality. "
                    "Install it with: pip install google-cloud-speech"
                ) from e
        return self._speech_client


# Audio Classes
class GoogleAudio(Audio):
    """Google Audio functionality container."""

    def __init__(self, provider):
        super().__init__()
        self.provider = provider
        self.transcriptions = self.Transcriptions(provider)

    class Transcriptions(Audio.Transcription):
        """Google Audio Transcriptions functionality."""

        # File suffix -> name of the RecognitionConfig.AudioEncoding member.
        _ENCODING_BY_SUFFIX = (
            (".mp3", "MP3"),
            (".flac", "FLAC"),
            (".wav", "LINEAR16"),
            (".ogg", "OGG_OPUS"),
            (".webm", "WEBM_OPUS"),
        )

        def __init__(self, provider):
            self.provider = provider

        def create(
            self,
            model: str,
            file: Union[str, BinaryIO],
            **kwargs,
        ) -> TranscriptionResult:
            """
            Create audio transcription using Google Cloud Speech-to-Text API.

            All parameters are already validated and mapped by the Client layer.
            This is a simple pass-through to the Google API.

            Args:
                model: Recognition model; ``"default"`` is mapped to ``"latest_long"``.
                file: Path to an audio file or a binary file-like object.
                **kwargs: Recognition options (see ``_build_recognition_config``).

            Raises:
                ASRError: If ``google-cloud-speech`` is missing or the request fails.
            """
            try:
                from google.cloud import speech

                # Set defaults
                kwargs["model"] = model if model != "default" else "latest_long"
                kwargs.setdefault("sample_rate_hertz", 16000)
                kwargs.setdefault("enable_automatic_punctuation", True)

                audio_data = self._read_audio_data(file)
                audio = speech.RecognitionAudio(content=audio_data)
                config = self._build_recognition_config(kwargs, speech, file)

                response = self.provider.speech_client.recognize(
                    config=config, audio=audio
                )
                return self._parse_google_response(response)

            except ImportError as e:
                raise ASRError(
                    "google-cloud-speech is required for ASR functionality. "
                    "Install it with: pip install google-cloud-speech"
                ) from e
            except Exception as e:
                raise ASRError(f"Google Speech-to-Text error: {e}") from e

        async def create_stream_output(
            self,
            model: str,
            file: Union[str, BinaryIO],
            **kwargs,
        ) -> AsyncGenerator[StreamingTranscriptionChunk, None]:
            """
            Create streaming audio transcription using Google Cloud Speech-to-Text API.

            All parameters are already validated and mapped by the Client layer.
            The whole file is read up front and sent in fixed-size chunks; one
            ``StreamingTranscriptionChunk`` is yielded per result that has at
            least one alternative (interim results included).

            Raises:
                ASRError: If ``google-cloud-speech`` is missing or the request fails.
            """
            try:
                from google.cloud import speech

                # Set defaults
                kwargs["model"] = model if model != "default" else "latest_long"
                kwargs.setdefault("sample_rate_hertz", 16000)
                kwargs.setdefault("enable_automatic_punctuation", True)

                config = self._build_recognition_config(kwargs, speech, file)
                streaming_config = speech.StreamingRecognitionConfig(
                    config=config, interim_results=True, single_utterance=False
                )

                audio_data = self._read_audio_data(file)
                request_generator = self._create_streaming_requests(
                    speech, streaming_config, audio_data
                )

                responses = self.provider.speech_client.streaming_recognize(
                    config=streaming_config, requests=request_generator
                )

                # NOTE: the response iterator is consumed with a plain `for`
                # loop inside this async generator.
                for response in responses:
                    for result in response.results:
                        if result.alternatives:
                            alternative = result.alternatives[0]
                            yield StreamingTranscriptionChunk(
                                text=alternative.transcript,
                                is_final=result.is_final,
                                confidence=getattr(alternative, "confidence", None),
                            )

            except ImportError as e:
                raise ASRError(
                    "google-cloud-speech is required for ASR functionality. "
                    "Install it with: pip install google-cloud-speech"
                ) from e
            except Exception as e:
                raise ASRError(f"Google Speech-to-Text streaming error: {e}") from e

        def _read_audio_data(self, file: Union[str, BinaryIO]) -> bytes:
            """Read audio data from file or file-like object."""
            if isinstance(file, str):
                with open(file, "rb") as audio_file:
                    return audio_file.read()
            return file.read()

        def _detect_audio_encoding(self, file: Union[str, BinaryIO], speech):
            """
            Detect audio encoding based on the file extension.

            Only string paths are inspected; file-like objects and unknown
            extensions fall back to LINEAR16.
            """
            encodings = speech.RecognitionConfig.AudioEncoding
            if isinstance(file, str):
                file_lower = file.lower()
                for suffix, member in self._ENCODING_BY_SUFFIX:
                    if file_lower.endswith(suffix):
                        return getattr(encodings, member)

            # Default to LINEAR16 for unknown formats
            return encodings.LINEAR16

        def _build_recognition_config(
            self, params: dict, speech, file: Union[str, BinaryIO]
        ):
            """
            Build Google Speech RecognitionConfig from parameters.

            ``params["model"]`` is required. Word time offsets and word
            confidence are always enabled. ``max_alternatives``,
            ``profanity_filter`` and ``speech_contexts`` are forwarded only when
            present.
            """
            # Auto-detect encoding if not specified
            encoding = params.get("encoding")
            if encoding is None:
                encoding = self._detect_audio_encoding(file, speech)

            config_params = {
                "encoding": encoding,
                "sample_rate_hertz": params.get("sample_rate_hertz", 16000),
                "language_code": params.get("language_code", "en-US"),
                "enable_word_time_offsets": True,
                "enable_word_confidence": True,
                "enable_automatic_punctuation": params.get(
                    "enable_automatic_punctuation", True
                ),
                "model": params["model"],
            }

            for param in ("max_alternatives", "profanity_filter", "speech_contexts"):
                if param in params:
                    config_params[param] = params[param]

            return speech.RecognitionConfig(**config_params)

        def _create_streaming_requests(
            self, speech, streaming_config, audio_data: bytes
        ):
            """
            Create streaming requests generator for Google Speech API.

            The audio is split into 8192-byte chunks. ``streaming_config`` is
            accepted for signature compatibility but not used here.
            """

            def request_generator():
                chunk_size = 8192
                for i in range(0, len(audio_data), chunk_size):
                    chunk = audio_data[i : i + chunk_size]
                    yield speech.StreamingRecognizeRequest(audio_content=chunk)

            return request_generator()

        @staticmethod
        def _to_word(word) -> Word:
            """Convert one Google word-info entry to the unified Word type."""
            return Word(
                word=word.word,
                start=(
                    word.start_time.total_seconds()
                    if hasattr(word, "start_time")
                    else 0.0
                ),
                end=(
                    word.end_time.total_seconds() if hasattr(word, "end_time") else 0.0
                ),
                confidence=getattr(word, "confidence", None),
            )

        def _parse_google_response(self, response) -> TranscriptionResult:
            """
            Convert Google Speech-to-Text response to unified TranscriptionResult.

            The response holds one result per sequential portion of the audio,
            so every result with at least one alternative contributes:

            * ``text`` is the top transcript of each result, joined in order
              (a single result's transcript is returned unchanged);
            * ``words`` is the concatenation of each top alternative's words;
            * ``segments`` has one entry per result that carries word timings;
            * ``confidence`` is the mean of the top alternatives' confidences;
            * ``alternatives`` lists the alternatives of the first result.

            An empty result is returned when nothing usable is present.
            """
            results = [
                result for result in (response.results or []) if result.alternatives
            ]
            if not results:
                return TranscriptionResult(
                    text="", language=None, confidence=None, task="transcribe"
                )

            transcripts = []
            confidences = []
            words = []
            segments = []
            for result in results:
                best_alternative = result.alternatives[0]
                transcripts.append(best_alternative.transcript)

                result_confidence = getattr(best_alternative, "confidence", None)
                if result_confidence is not None:
                    confidences.append(result_confidence)

                result_words = [
                    self._to_word(word)
                    for word in (getattr(best_alternative, "words", None) or [])
                ]
                if result_words:
                    # Segment bounds come from the first and last word timings.
                    segments.append(
                        Segment(
                            id=len(segments),
                            seek=0,
                            start=result_words[0].start,
                            end=result_words[-1].end,
                            text=best_alternative.transcript,
                            tokens=[],
                            temperature=0.0,
                            avg_logprob=0.0,
                            compression_ratio=0.0,
                            no_speech_prob=0.0,
                        )
                    )
                    words.extend(result_words)

            if len(transcripts) == 1:
                text = transcripts[0]
            else:
                # Per-portion transcripts may or may not carry their own leading
                # whitespace, so normalize before joining.
                text = " ".join(
                    piece.strip() for piece in transcripts if piece.strip()
                )

            confidence = sum(confidences) / len(confidences) if confidences else None

            alternatives = [
                Alternative(
                    transcript=alt.transcript,
                    confidence=getattr(alt, "confidence", None),
                )
                for alt in results[0].alternatives
            ]

            return TranscriptionResult(
                text=text,
                language=None,
                confidence=confidence,
                task="transcribe",
                words=words or None,
                alternatives=alternatives or None,
                segments=segments or None,
            )


================================================
FILE: aisuite/providers/groq_provider.py
================================================
import os
import groq
from aisuite.provider import Provider, LLMError
from aisuite.providers.message_converter import OpenAICompliantMessageConverter

# Implementation of Groq provider.
# Groq's message format is the same as OpenAI's.
# Tool calling specification is also exactly the same as OpenAI's.
# Links:
# https://console.groq.com/docs/tool-use
# Groq supports tool calling for the following models, as of 16th Nov 2024:
#   llama3-groq-70b-8192-tool-use-preview
#   llama3-groq-8b-8192-tool-use-preview
#   llama-3.1-70b-versatile
#   llama-3.1-8b-instant
#   llama3-70b-8192
#   llama3-8b-8192
#   mixtral-8x7b-32768 (parallel tool use not supported)
#   gemma-7b-it (parallel tool use not supported)
#   gemma2-9b-it (parallel tool use not supported)


class GroqMessageConverter(OpenAICompliantMessageConverter):
    """Converter used for Groq; inherits the OpenAI-compliant behavior unchanged.

    Exists as a hook for Groq-specific conversions should they become necessary.
    """


class GroqProvider(Provider):
    """Provider for Groq, using the official ``groq`` client."""

    def __init__(self, **config):
        """
        Initialize the Groq provider with the given configuration.

        The API key is read from ``config["api_key"]`` and, when that is absent
        or empty, from the ``GROQ_API_KEY`` environment variable. The entire
        configuration dictionary is then passed to the Groq client constructor.

        Raises:
            ValueError: If no API key is found in the config or the environment.
        """
        # `or` (not a .get default) so an explicit `api_key=None` still falls
        # back to the environment variable.
        self.api_key = config.get("api_key") or os.getenv("GROQ_API_KEY")
        if not self.api_key:
            raise ValueError(
                "Groq API key is missing. Please provide it in the config or set the GROQ_API_KEY environment variable."
            )
        config["api_key"] = self.api_key
        self.client = groq.Groq(**config)
        self.transformer = GroqMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Make a request to the Groq chat completions endpoint using the official client.

        Args:
            model: Model identifier forwarded to the API.
            messages: Chat history; converted with ``self.transformer``.
            **kwargs: Additional arguments passed straight to the Groq API.

        Returns:
            The response converted by ``self.transformer.convert_response``.

        Raises:
            LLMError: Wrapping any exception raised while converting or calling.
        """
        try:
            # Transform messages using converter
            transformed_messages = self.transformer.convert_request(messages)

            response = self.client.chat.completions.create(
                model=model,
                messages=transformed_messages,
                **kwargs,  # Pass any additional arguments to the Groq API
            )
            return self.transformer.convert_response(response.model_dump())
        except Exception as e:
            # Chain the cause so the original traceback is preserved.
            raise LLMError(f"An error occurred: {e}") from e


================================================
FILE: aisuite/providers/huggingface_provider.py
================================================
import os
import json
import time
from typing import Union, BinaryIO
import requests
from huggingface_hub import InferenceClient
from aisuite.provider import Provider, LLMError, ASRError, Audio
from aisuite.framework import ChatCompletionResponse
from aisuite.framework.message import Message, TranscriptionResult, Word


class HuggingfaceProvider(Provider):
    """
    HuggingFace Provider using the official InferenceClient.
    This provider supports calls to HF serverless Inference Endpoints
    which use Text Generation Inference (TGI) as the backend.
    TGI is OpenAI protocol compliant.
    https://huggingface.co/inference-endpoints/
    """

    def __init__(self, **config):
        """
        Initialize the provider with the given configuration.

        The token is taken from ``config["token"]``, then the ``HF_TOKEN``
        environment variable, then ``HUGGINGFACE_API_KEY``. Optional ``model``
        and ``timeout`` (default 30) config entries are forwarded to the
        InferenceClient.

        Raises:
            ValueError: If no token is available from any source.
        """
        # Ensure API key is provided either in config or via environment variable
        self.token = (
            config.get("token")
            or os.getenv("HF_TOKEN")
            or os.getenv("HUGGINGFACE_API_KEY")
        )
        if not self.token:
            raise ValueError(
                "Hugging Face token is missing. Please provide it in the config or set the HF_TOKEN or HUGGINGFACE_API_KEY environment variable."
            )

        # Initialize the InferenceClient with the specified model and timeout if provided
        self.model = config.get("model")
        self.timeout = config.get("timeout", 30)
        self.client = InferenceClient(
            token=self.token, model=self.model, timeout=self.timeout
        )

        # Initialize audio functionality
        super().__init__()
        self.audio = HuggingfaceAudio(self.token, self.timeout)

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Makes a request to the Inference API endpoint using InferenceClient.

        Args:
            model: Model identifier forwarded to ``chat_completion``.
            messages: Iterable of framework ``Message`` objects and/or dicts.
            **kwargs: Other parameters like temperature, max_tokens, etc.

        Returns:
            A ChatCompletionResponse built from the first returned choice.

        Raises:
            ValueError: If a message is neither a ``Message`` nor a dict.
            LLMError: If the API call or response normalization fails; the
                original exception is attached as the cause.
        """
        # Validate and transform messages
        transformed_messages = []
        for message in messages:
            if isinstance(message, Message):
                transformed_message = self.transform_from_message(message)
            elif isinstance(message, dict):
                # Shallow copy: the content fix-up below must not edit the
                # caller's own message dict.
                transformed_message = dict(message)
            else:
                raise ValueError(f"Invalid message format: {message}")

            # Ensure 'content' is always a string: missing/None becomes ""
            if transformed_message.get("content") is None:
                transformed_message["content"] = ""

            transformed_messages.append(transformed_message)

        try:
            # Make the API call using the client
            response = self.client.chat_completion(
                model=model,
                messages=transformed_messages,
                **kwargs,  # Include other parameters like temperature, max_tokens, etc.
            )

            return self._normalize_response(response)

        except Exception as e:
            # Chain the cause so the underlying client error stays visible.
            raise LLMError(f"An error occurred: {e}") from e

    def transform_from_message(self, message: Message):
        """
        Transform framework Message to a format that HuggingFace understands.

        Returns a dict with ``role`` and ``content`` (``None`` content becomes
        ``""``), plus ``tool_calls`` when the message carries any.
        """
        transformed_message = {
            "role": message.role,
            # Ensure content is a string
            "content": message.content if message.content is not None else "",
        }

        # Include tool_calls if present
        if message.tool_calls:
            transformed_message["tool_calls"] = [
                {
                    "id": tool_call.id,
                    "function": {
                        "name": tool_call.function.name,
                        "arguments": tool_call.function.arguments,
                    },
                    "type": tool_call.type,
                }
                for tool_call in message.tool_calls
            ]

        return transformed_message

    def transform_to_message(self, message_dict: dict):
        """
        Transform HuggingFace message (dict) to a format that the framework Message understands.

        Note: ``message_dict`` is updated in place (defaults are filled in and
        dict-valued tool-call arguments are replaced by their JSON string).
        """
        # Ensure required fields are present
        message_dict.setdefault("content", "")  # Set empty string if content is missing
        message_dict.setdefault("refusal", None)  # Set None if refusal is missing
        message_dict.setdefault("tool_calls", None)  # Set None if tool_calls is missing

        # Handle tool calls if present and not None
        for tool_call in message_dict.get("tool_calls") or []:
            if "function" not in tool_call:
                continue
            function = tool_call["function"]
            # Ensure function arguments are stringified
            if isinstance(function.get("arguments"), dict):
                function["arguments"] = json.dumps(function["arguments"])

        return Message(**message_dict)

    def _normalize_response(self, response_data):
        """
        Normalize the response to a common format (ChatCompletionResponse).

        Only the message of the first choice is carried over.
        """
        normalized_response = ChatCompletionResponse()
        message_data = response_data["choices"][0]["message"]
        normalized_response.choices[0].message = self.transform_to_message(message_data)
        return normalized_response


# Audio Classes
class HuggingfaceAudio(Audio):
    """Hugging Face Audio functionality container."""

    def __init__(self, token, timeout=120):
        """Create the container and its ``transcriptions`` helper.

        Args:
            token: Hugging Face API token used as the bearer credential.
            timeout: Per-request timeout in seconds handed to ``requests``.
        """
        super().__init__()
        self.transcriptions = self.Transcriptions(token, timeout)

    class Transcriptions(Audio.Transcription):
        """Hugging Face Audio Transcriptions functionality."""

        # Recognised file extensions and the Content-Type sent for each.
        # HF API requires audio/mpeg for MP3.
        _CONTENT_TYPES = (
            (".wav", "audio/wav"),
            (".mp3", "audio/mpeg"),
            (".flac", "audio/flac"),
        )

        def __init__(self, token, timeout=120):
            self.token = token
            self.timeout = timeout

        def create(
            self,
            model: str,
            file: Union[str, BinaryIO],
            **kwargs,
        ) -> TranscriptionResult:
            """
            Create audio transcription using Hugging Face Inference API.

            All parameters are already validated and mapped by the Client layer.
            This makes an HTTP POST request to the Hugging Face Inference API.

            Note: Whisper-based models have a 30-second processing window.
            For longer audio, users should deploy custom Inference Endpoints.

            Args:
                model: Model id, optionally prefixed as "huggingface:model-id".
                file: Path to an audio file, or an open binary file-like object.
                **kwargs: Accepted for interface compatibility; not sent with
                    the request by this implementation.

            Returns:
                The parsed TranscriptionResult.

            Raises:
                ASRError: On any file, HTTP, or parsing failure; the original
                    exception is attached as the cause.
            """
            try:
                # Extract model ID from format "huggingface:model-id"
                model_id = model.split(":", 1)[1] if ":" in model else model

                # Prepare API endpoint
                url = f"https://api-inference.huggingface.co/models/{model_id}"

                # Prepare audio data
                if isinstance(file, str):
                    with open(file, "rb") as audio_file:
                        audio_bytes = audio_file.read()
                    content_type = self._detect_content_type(file)
                else:
                    audio_bytes = file.read()
                    # Use the object's file name when it has one so that e.g.
                    # an opened .mp3 is not mislabelled; otherwise fall back
                    # to wav as before.
                    source_name = getattr(file, "name", None)
                    content_type = self._detect_content_type(
                        source_name if isinstance(source_name, str) else ""
                    )

                # Prepare headers
                headers = {
                    "Authorization": f"Bearer {self.token}",
                    "Content-Type": content_type,
                }

                # First attempt without wait_for_model
                try:
                    response = requests.post(
                        url,
                        headers=headers,
                        data=audio_bytes,
                        timeout=self.timeout,
                    )
                    response.raise_for_status()
                except requests.exceptions.HTTPError as e:
                    # Anything other than 503 (model loading) is a real failure
                    if e.response.status_code != 503:
                        raise
                    # Retry once with the x-wait-for-model header
                    headers["x-wait-for-model"] = "true"
                    response = requests.post(
                        url,
                        headers=headers,
                        data=audio_bytes,
                        timeout=self.timeout,
                    )
                    response.raise_for_status()

                # Parse response
                response_data = response.json()
                return self._parse_huggingface_response(response_data, model_id)

            except Exception as e:
                # A single handler suffices: request errors are Exceptions too
                # and were reported with the same message.
                raise ASRError(f"Hugging Face transcription error: {e}") from e

        def _detect_content_type(self, file_path: str) -> str:
            """Detect audio content type from file extension (default: audio/wav)."""
            lowered = file_path.lower()
            for extension, content_type in self._CONTENT_TYPES:
                if lowered.endswith(extension):
                    return content_type
            # Default to wav if unknown
            return "audio/wav"

        def _parse_huggingface_response(
            self, response_data, model_id: str
        ) -> TranscriptionResult:
            """
            Parse Hugging Face API response into TranscriptionResult.

            Response format can vary:
            - Standard: {"text": "...", "chunks": [...]}
            - Text only: {"text": "..."}
            - Some models may use different keys

            A plain string response is used as the text directly; any other
            non-dict value is converted with ``str()``. ``model_id`` is
            currently unused.

            Raises:
                ASRError: If the response structure cannot be interpreted.
            """
            try:
                is_mapping = isinstance(response_data, dict)

                # Extract text
                if is_mapping:
                    text = response_data.get("text", "")
                elif isinstance(response_data, str):
                    # Some models return plain string
                    text = response_data
                else:
                    text = str(response_data)

                # Extract words from chunks if available; stays None when the
                # response has no (or empty) chunks.
                words = None
                if is_mapping and response_data.get("chunks"):
                    words = []
                    for chunk in response_data["chunks"]:
                        if not isinstance(chunk, dict):
                            continue
                        timestamp = chunk.get("timestamp")

                        # timestamp can be [start, end] or (start, end)
                        start, end = None, None
                        if timestamp and len(timestamp) >= 2:
                            start, end = timestamp[0], timestamp[1]

                        words.append(
                            Word(
                                word=chunk.get("text", ""),
                                start=start,
                                end=end,
                                confidence=None,  # HF doesn't provide confidence
                            )
                        )

                return TranscriptionResult(
                    text=text,
                    language=None,  # HF API doesn't return language
                    confidence=None,  # HF API doesn't return confidence
                    words=words,
                    task="transcribe",
                )

            except (KeyError, TypeError, IndexError) as e:
                raise ASRError(f"Error parsing Hugging Face response: {e}") from e


================================================
FILE: aisuite/providers/inception_provider.py
================================================
import openai
import os
from aisuite.provider import Provider, LLMError


class InceptionProvider(Provider):
    """Chat-completions provider for Inception, accessed through the OpenAI client."""

    def __init__(self, **config):
        """
        Initialize the Inception provider with the given configuration.

        The API key is read from ``config["api_key"]`` or, when that is missing
        or empty, from the ``INCEPTION_API_KEY`` environment variable.
        ``base_url`` is always set to the Inception endpoint, and the entire
        configuration dictionary is then passed to ``openai.OpenAI``.

        Raises:
            ValueError: If no API key is available from either source.
        """
        # Use `or` rather than setdefault so that an explicit api_key=None
        # still falls back to the environment variable.
        config["api_key"] = config.get("api_key") or os.getenv("INCEPTION_API_KEY")
        if not config["api_key"]:
            raise ValueError(
                "Inception API key is missing. Please provide it in the config or set the INCEPTION_API_KEY environment variable."
            )
        config["base_url"] = "https://api.inceptionlabs.ai/v1"

        # Pass the entire config to the Inception client constructor using openai
        self.client = openai.OpenAI(**config)

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Request a chat completion from Inception.

        Args:
            model: Model identifier forwarded to the API.
            messages: Conversation messages, sent as given.
            **kwargs: Any additional arguments, passed through to the API.

        Returns:
            The response object returned by the OpenAI client, unmodified.

        Raises:
            LLMError: If the client raises; the original exception is attached
                as the cause.
        """
        try:
            return self.client.chat.completions.create(
                model=model,
                messages=messages,
                **kwargs,  # Pass any additional arguments to the Inception API
            )
        except Exception as e:
            # Client errors are wrapped in LLMError, with the cause chained.
            raise LLMError(f"An error occurred: {e}") from e


================================================
FILE: aisuite/providers/lmstudio_provider.py
================================================
import os
import httpx
from aisuite.provider import Provider, LLMError
from aisuite.framework import ChatCompletionResponse


class LmstudioProvider(Provider):
    """
    LM Studio Provider that makes HTTP calls. Inspired by OllamaProvider in aisuite.
    It uses the /v1/chat/completions endpoint.
    Read more here - https://lmstudio.ai/docs/api and on your local instance in the "Developer" tab.
    If LMSTUDIO_API_URL is not set and not passed in config, then it will default to "http://localhost:1234"
    """

    _CHAT_COMPLETION_ENDPOINT = "/v1/chat/completions"
    # The previous text told users to run `ollama serve`, which starts Ollama,
    # not LM Studio.
    _CONNECT_ERROR_MESSAGE = (
        "LM Studio is likely not running. Start the LM Studio local server "
        "(from the Developer tab or by running `lms server start`) on your host."
    )

    def __init__(self, **config):
        """
        Initialize the LM Studio provider with the given configuration.

        Recognised config keys: ``api_url`` (falls back to the
        ``LMSTUDIO_API_URL`` environment variable, then
        "http://localhost:1234") and ``timeout`` in seconds (default 300).
        """
        self.url = config.get("api_url") or os.getenv(
            "LMSTUDIO_API_URL", "http://localhost:1234"
        )

        # Optionally set a custom timeout (default to 300s)
        self.timeout = config.get("timeout", 300)

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Makes a request to the chat completions endpoint using httpx.

        Streaming is always disabled, overriding any ``stream`` value passed in.

        Args:
            model: Model identifier placed in the request body.
            messages: Conversation messages, sent as given.
            **kwargs: Any additional arguments, merged into the request body.

        Returns:
            A ChatCompletionResponse holding the first choice's content.

        Raises:
            LLMError: On connection failure, a non-success HTTP status, or any
                other request error; the original exception is the cause.
        """
        kwargs["stream"] = False
        data = {
            "model": model,
            "messages": messages,
            **kwargs,  # Pass any additional arguments to the API
        }

        try:
            response = httpx.post(
                self.url.rstrip("/") + self._CHAT_COMPLETION_ENDPOINT,
                json=data,
                timeout=self.timeout,
            )
            response.raise_for_status()
        except httpx.ConnectError as conn_err:  # Handle connection errors
            raise LLMError(
                f"Connection failed: {self._CONNECT_ERROR_MESSAGE}"
            ) from conn_err
        except httpx.HTTPStatusError as http_err:
            raise LLMError(f"LM Studio request failed: {http_err}") from http_err
        except Exception as e:
            raise LLMError(f"An error occurred: {e}") from e

        # Return the normalized response
        return self._normalize_response(response.json())

    def _normalize_response(self, response_data):
        """
        Normalize the API response to a common format (ChatCompletionResponse).

        Only the content of the first choice's message is carried over.
        """
        normalized_response = ChatCompletionResponse()
        first_message = response_data["choices"][0]["message"]
        normalized_response.choices[0].message.content = first_message["content"]

        return normalized_response


================================================
FILE: aisuite/providers/message_converter.py
================================================
"""Base message converter for OpenAI-compliant providers."""

from aisuite.framework import ChatCompletionResponse
from aisuite.framework.message import (
    Message,
    ChatCompletionMessageToolCall,
    CompletionUsage,
)


class OpenAICompliantMessageConverter:
    """
    Base class for message converters that are compatible with OpenAI's API.
    """

    # Class variable that derived classes can override. When True, the content
    # of every "tool" role message is converted with str() before sending.
    tool_results_as_strings = False

    @classmethod
    def convert_request(cls, messages):
        """
        Convert messages to OpenAI-compatible format.

        This is a classmethod (rather than a staticmethod) so that the
        ``tool_results_as_strings`` flag is read from the class actually in
        use; reading it from the base class by name would ignore subclass
        overrides. It can still be called on the class or on an instance.

        Args:
            messages: Iterable of dicts, framework ``Message`` objects, or
                other objects exposing ``role``/``content`` attributes.

        Returns:
            A new list. ``Message`` objects become JSON-mode dicts without the
            ``refusal`` field; other items are passed through. Dict tool
            messages that need stringifying are copied, not edited in place.
        """
        transformed_messages = []
        for message in messages:
            if isinstance(message, dict):
                tmsg = message
            elif isinstance(message, Message):
                tmsg = message.model_dump(mode="json")
                tmsg.pop("refusal", None)  # Remove refusal field if present
            else:
                tmsg = message

            # Check if tmsg is a dict, otherwise get role attribute
            role = tmsg["role"] if isinstance(tmsg, dict) else tmsg.role
            if role == "tool" and cls.tool_results_as_strings:
                # Handle both dict and object cases for content
                if isinstance(tmsg, dict):
                    # Build a new dict so the caller's message is left untouched
                    tmsg = {**tmsg, "content": str(tmsg["content"])}
                else:
                    tmsg.content = str(tmsg.content)

            transformed_messages.append(tmsg)
        return transformed_messages

    def convert_response(self, response_data) -> "ChatCompletionResponse":
        """
        Normalize the response to match OpenAI's response format.

        Args:
            response_data: Dict-form response; only ``choices[0]`` is read,
                plus ``usage`` when present and truthy.

        Returns:
            A ChatCompletionResponse with content, role (default "assistant"),
            usage, and tool calls filled in from the first choice.
        """
        completion_response = ChatCompletionResponse()
        message = response_data["choices"][0]["message"]
        normalized_message = completion_response.choices[0].message

        # Set basic message content; a missing key is treated like null content
        normalized_message.content = message.get("content")
        normalized_message.role = message.get("role", "assistant")

        # Conditionally parse usage data if it exists.
        if usage_data := response_data.get("usage"):
            completion_response.usage = self.get_completion_usage(usage_data)

        # Handle tool calls if present (an empty list is preserved as [])
        raw_tool_calls = message.get("tool_calls")
        if raw_tool_calls is not None:
            normalized_message.tool_calls = [
                ChatCompletionMessageToolCall(
                    id=tool_call.get("id"),
                    type="function",  # Always set to "function" as it's the only valid value
                    function=tool_call.get("function"),
                )
                for tool_call in raw_tool_calls
            ]

        return completion_response

    def get_completion_usage(self, usage_data: dict):
        """Get the usage statistics from a usage data dictionary.

        Keys that are absent from ``usage_data`` are passed on as ``None``.
        """
        return CompletionUsage(
            completion_tokens=usage_data.get("completion_tokens"),
            prompt_tokens=usage_data.get("prompt_tokens"),
            total_tokens=usage_data.get("total_tokens"),
            prompt_tokens_details=usage_data.get("prompt_tokens_details"),
            completion_tokens_details=usage_data.get("completion_tokens_details"),
        )


================================================
FILE: aisuite/providers/mistral_provider.py
================================================
"""Mistral provider for the aisuite."""

import os
from mistralai import Mistral
from aisuite.framework import ChatCompletionResponse
from aisuite.provider import Provider, LLMError
from aisuite.providers.message_converter import OpenAICompliantMessageConverter


# Implementation of Mistral provider.
# Mistral's message format is the same as OpenAI's. Just different class names,
# but fully cross-compatible.
# Links:
# https://docs.mistral.ai/capabilities/function_calling/


class MistralMessageConverter(OpenAICompliantMessageConverter):
    """
    Message converter for the Mistral client.
    """

    def convert_response(self, response_data) -> ChatCompletionResponse:
        """Dump Mistral's response object to a dict and normalize it via the base converter."""
        return super().convert_response(response_data.model_dump())


# Function calling is available for the following models:
# [As of 01/19/2025 from https://docs.mistral.ai/capabilities/function_calling/]
# Mistral Large
# Mistral Small
# Codestral 22B
# Ministral 8B
# Ministral 3B
# Pixtral 12B
# Mixtral 8x22B
# Mistral Nemo
# pylint: disable=too-few-public-methods
class MistralProvider(Provider):
    """
    Provider that reaches Mistral AI through the official Mistral client.
    """

    def __init__(self, **config):
        """
        Build the Mistral client from the supplied configuration.

        When ``api_key`` is not present in the config it is filled in from the
        MISTRAL_API_KEY environment variable; the complete config dictionary
        is then handed to the Mistral client constructor.

        Raises:
            ValueError: If the resulting API key is empty or missing.
        """
        # setdefault returns the value now stored under "api_key"
        api_key = config.setdefault("api_key", os.getenv("MISTRAL_API_KEY"))
        if not api_key:
            raise ValueError(
                "Mistral API key is missing. Please provide it in the config or set the "
                "MISTRAL_API_KEY environment variable."
            )
        self.client = Mistral(**config)
        self.transformer = MistralMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Send a chat completion request to Mistral through the official client.

        Messages are run through the converter first, and the client's
        response is converted back before being returned. Any failure is
        re-raised as LLMError with the original exception as its cause.
        """
        try:
            outgoing = self.transformer.convert_request(messages)
            raw_response = self.client.chat.complete(
                model=model, messages=outgoing, **kwargs
            )
            return self.transformer.convert_response(raw_response)
        except Exception as exc:
            raise LLMError(f"An error occurred: {exc}") from exc


================================================
FILE: aisuite/providers/nebius_provider.py
================================================
import os
from aisuite.provider import Provider
from openai import Client


BASE_URL = "https://api.studio.nebius.ai/v1"


# TODO(rohitcp): This needs to be added to our internal testbed. Tool calling not tested.
class NebiusProvider(Provider):
    """Provider for Nebius AI Studio, accessed through the OpenAI client."""

    def __init__(self, **config):
        """
        Set up the Nebius AI Studio provider from the supplied configuration.

        When ``api_key`` is not present in the config it is filled in from the
        NEBIUS_API_KEY environment variable. ``base_url`` is always set to the
        module-level BASE_URL before the complete config dictionary is handed
        to the OpenAI client constructor.

        Raises:
            ValueError: If the resulting API key is empty or missing.
        """
        # setdefault returns the value now stored under "api_key"
        api_key = config.setdefault("api_key", os.getenv("NEBIUS_API_KEY"))
        if not api_key:
            raise ValueError(
                "Nebius AI Studio API key is missing. Please provide it in the config or set the NEBIUS_API_KEY environment variable. You can get your API key at https://studio.nebius.ai/settings/api-keys"
            )

        config["base_url"] = BASE_URL
        self.client = Client(**config)

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Request a chat completion and return the client's response as is.

        Extra keyword arguments are forwarded to the Nebius API. Exceptions
        raised by the client are not caught here.
        """
        completions = self.client.chat.completions
        return completions.create(model=model, messages=messages, **kwargs)


================================================
FILE: aisuite/providers/ollama_provider.py
================================================
import os
import httpx
from aisuite.provider import Provider, LLMError
from aisuite.framework import ChatCompletionResponse


class OllamaProvider(Provider):
    """
    Ollama Provider that makes HTTP calls instead of using SDK.
    It uses the /api/chat endpoint.
    Read more here - https://github.com/ollama/ollama/blob/main/docs/api.md#generate-a-chat-completion
    If OLLAMA_API_URL is not set and not passed in config, then it will default to "http://localhost:11434"
    """

    _CHAT_COMPLETION_ENDPOINT = "/api/chat"
    _CONNECT_ERROR_MESSAGE = "Ollama is likely not running. Start Ollama by running `ollama serve` on your host."

    def __init__(self, **config):
        """
        Initialize the Ollama provider with the given configuration.

        Recognised config keys: ``api_url`` (falls back to the
        ``OLLAMA_API_URL`` environment variable, then
        "http://localhost:11434") and ``timeout`` in seconds (default 30).
        """
        self.url = config.get("api_url") or os.getenv(
            "OLLAMA_API_URL", "http://localhost:11434"
        )

        # Optionally set a custom timeout (default to 30s)
        self.timeout = config.get("timeout", 30)

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Makes a request to the chat completions endpoint using httpx.

        Streaming is always disabled, overriding any ``stream`` value passed in.

        Args:
            model: Model identifier placed in the request body.
            messages: Conversation messages, sent as given.
            **kwargs: Any additional arguments, merged into the request body.

        Returns:
            A ChatCompletionResponse holding the returned message content.

        Raises:
            LLMError: On connection failure, a non-success HTTP status, or any
                other request error; the original exception is the cause.
        """
        kwargs["stream"] = False
        data = {
            "model": model,
            "messages": messages,
            **kwargs,  # Pass any additional arguments to the API
        }

        try:
            response = httpx.post(
                self.url.rstrip("/") + self._CHAT_COMPLETION_ENDPOINT,
                json=data,
                timeout=self.timeout,
            )
            response.raise_for_status()
        except httpx.ConnectError as conn_err:  # Handle connection errors
            raise LLMError(
                f"Connection failed: {self._CONNECT_ERROR_MESSAGE}"
            ) from conn_err
        except httpx.HTTPStatusError as http_err:
            raise LLMError(f"Ollama request failed: {http_err}") from http_err
        except Exception as e:
            raise LLMError(f"An error occurred: {e}") from e

        # Return the normalized response
        return self._normalize_response(response.json())

    def _normalize_response(self, response_data):
        """
        Normalize the API response to a common format (ChatCompletionResponse).

        Only ``response_data["message"]["content"]`` is carried over.
        """
        normalized_response = ChatCompletionResponse()
        normalized_response.choices[0].message.content = response_data["message"][
            "content"
        ]
        return normalized_response


================================================
FILE: aisuite/providers/openai_provider.py
================================================
import openai
import os
from typing import Union, BinaryIO, AsyncGenerator
from aisuite.provider import Provider, LLMError, ASRError, Audio
from aisuite.providers.message_converter import OpenAICompliantMessageConverter
from aisuite.framework.message import (
    TranscriptionResult,
    Segment,
    Word,
    StreamingTranscriptionChunk,
)


class OpenaiProvider(Provider):
    """Chat-completions and audio provider backed by the official OpenAI client."""

    def __init__(self, **config):
        """
        Initialize the OpenAI provider with the given configuration.

        The API key is read from ``config["api_key"]`` or, when that is missing
        or empty, from the ``OPENAI_API_KEY`` environment variable. The entire
        configuration dictionary is then passed to the OpenAI client
        constructor, and the audio helper is attached as ``self.audio``.

        Raises:
            ValueError: If no API key is available from either source.
        """
        # Use `or` rather than setdefault so that an explicit api_key=None
        # still falls back to the environment variable.
        config["api_key"] = config.get("api_key") or os.getenv("OPENAI_API_KEY")
        if not config["api_key"]:
            raise ValueError(
                "OpenAI API key is missing. Please provide it in the config or set the OPENAI_API_KEY environment variable."
            )

        # NOTE: We could choose to remove above lines for api_key since OpenAI will automatically
        # infer certain values from the environment variables.
        # Eg: OPENAI_API_KEY, OPENAI_ORG_ID, OPENAI_PROJECT_ID, OPENAI_BASE_URL, etc.

        # Pass the entire config to the OpenAI client constructor
        self.client = openai.OpenAI(**config)
        self.transformer = OpenAICompliantMessageConverter()

        # Initialize audio functionality
        super().__init__()
        self.audio = OpenAIAudio(self.client)

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Request a chat completion from OpenAI.

        Args:
            model: Model identifier forwarded to the API.
            messages: Conversation messages; converted by the message
                converter before being sent.
            **kwargs: Any additional arguments, passed through to the API.

        Returns:
            The response object returned by the OpenAI client, unmodified.

        Raises:
            LLMError: If conversion or the API call fails; the original
                exception is attached as the cause.
        """
        try:
            transformed_messages = self.transformer.convert_request(messages)
            return self.client.chat.completions.create(
                model=model,
                messages=transformed_messages,
                **kwargs,  # Pass any additional arguments to the OpenAI API
            )
        except Exception as e:
            # Client errors are wrapped in LLMError, with the cause chained.
            raise LLMError(f"An error occurred: {e}") from e


# Audio Classes
class OpenAIAudio(Audio):
    """OpenAI Audio functionality container."""

    def __init__(self, client):
        """Attach a transcriptions helper bound to the given OpenAI client."""
        super().__init__()
        self.transcriptions = self.Transcriptions(client)

    class Transcriptions(Audio.Transcription):
        """OpenAI Audio Transcriptions functionality."""

        def __init__(self, client):
            """Store the OpenAI client used for all transcription calls."""
            self.client = client

        @staticmethod
        def _apply_options_object(kwargs):
            """
            Fold an ``options`` object (if present) into ``kwargs`` in place.

            The ``options`` entry is removed from ``kwargs``. Every non-None
            attribute found in its ``__dict__`` is copied over unless the
            caller already supplied that key explicitly.
            """
            if "options" not in kwargs:
                return
            options = kwargs.pop("options")
            if not hasattr(options, "__dict__"):
                return
            for key, value in options.__dict__.items():
                if value is not None and key not in kwargs:
                    kwargs[key] = value

        def create(
            self,
            model: str,
            file: Union[str, BinaryIO],
            **kwargs,
        ) -> TranscriptionResult:
            """
            Create audio transcription using OpenAI Whisper API.

            All parameters are already validated and mapped by the Client layer.
            This is a simple pass-through to the OpenAI API.

            Args:
                model: Transcription model identifier.
                file: Path to an audio file (opened here in binary mode) or an
                    already-open binary file object.
                **kwargs: Extra API arguments. An ``options`` object, if
                    given, is expanded into individual arguments.

            Returns:
                The parsed transcription result.

            Raises:
                ASRError: Wraps any failure while reading the file, calling
                    the API or parsing the response.
            """
            try:
                # Handle TranscriptionOptions object if passed
                self._apply_options_object(kwargs)

                # OpenAI requires verbose_json format for timestamp_granularities,
                # so the format is forced here regardless of what was requested.
                if "timestamp_granularities" in kwargs:
                    kwargs["response_format"] = "verbose_json"

                # Handle file input
                if isinstance(file, str):
                    with open(file, "rb") as audio_file:
                        response = self.client.audio.transcriptions.create(
                            file=audio_file, model=model, **kwargs
                        )
                else:
                    response = self.client.audio.transcriptions.create(
                        file=file, model=model, **kwargs
                    )

                return self._parse_openai_response(response)

            except Exception as e:
                raise ASRError(f"OpenAI transcription error: {e}") from e

        async def create_stream_output(
            self,
            model: str,
            file: Union[str, BinaryIO],
            **kwargs,
        ) -> AsyncGenerator[StreamingTranscriptionChunk, None]:
            """
            Create streaming audio transcription using OpenAI Whisper API.

            All parameters are already validated and mapped by the Client layer.
            This is a simple pass-through to the OpenAI API with streaming enabled.

            Args:
                model: Transcription model identifier.
                file: Path to an audio file or an open binary file object.
                **kwargs: Extra API arguments. An ``options`` object, if
                    given, is expanded into individual arguments. ``stream``
                    is always set to True.

            Yields:
                One non-final chunk per ``transcript.text.delta`` event with a
                non-empty delta, and one final chunk for a
                ``transcript.text.done`` event with non-empty text.

            Raises:
                ASRError: If ``timestamp_granularities`` is combined with a
                    ``response_format`` other than ``verbose_json``, or
                    wrapping any other failure. Each failure is wrapped
                    exactly once.
            """
            try:
                # Handle TranscriptionOptions object if passed
                self._apply_options_object(kwargs)

                # Enable streaming
                kwargs["stream"] = True

                # Handle timestamp_granularities requirement
                if "timestamp_granularities" in kwargs:
                    # OpenAI requires verbose_json format for timestamp_granularities
                    if (
                        "response_format" in kwargs
                        and kwargs["response_format"] != "verbose_json"
                    ):
                        raise ASRError(
                            f"OpenAI timestamp_granularities requires response_format='verbose_json', "
                            f"but got '{kwargs['response_format']}'. "
                            f"Either remove timestamp_granularities or use response_format='verbose_json'."
                        )
                    kwargs["response_format"] = "verbose_json"

                # NOTE(review): for path inputs the file is closed before the
                # events are consumed; this presumes the SDK has finished
                # reading the upload by the time create() returns - confirm.
                if isinstance(file, str):
                    with open(file, "rb") as audio_file:
                        response_stream = self.client.audio.transcriptions.create(
                            file=audio_file, model=model, **kwargs
                        )
                else:
                    response_stream = self.client.audio.transcriptions.create(
                        file=file, model=model, **kwargs
                    )

                # Process streaming response - handle event types.
                # NOTE(review): this is a plain (synchronous) for-loop inside
                # an async generator - confirm that is acceptable for callers.
                for event in response_stream:
                    event_type = getattr(event, "type", None)
                    # TranscriptionTextDeltaEvent (incremental text)
                    if event_type == "transcript.text.delta":
                        if getattr(event, "delta", None):
                            yield StreamingTranscriptionChunk(
                                text=event.delta,
                                is_final=False,  # Delta events are interim
                                confidence=getattr(event, "confidence", None),
                            )
                    # TranscriptionTextDoneEvent (final complete text)
                    elif event_type == "transcript.text.done":
                        if getattr(event, "text", None):
                            yield StreamingTranscriptionChunk(
                                text=event.text,
                                is_final=True,  # Done event is final
                                confidence=getattr(event, "confidence", None),
                            )

            except ASRError:
                # Already a domain error (e.g. the validation error above);
                # re-raise untouched instead of wrapping it a second time.
                raise
            except Exception as e:
                raise ASRError(f"OpenAI streaming transcription error: {e}") from e

        def _parse_openai_response(self, response) -> TranscriptionResult:
            """
            Parse OpenAI API response into TranscriptionResult.

            Missing attributes are tolerated: ``text`` defaults to an empty
            string, ``language`` to ``"unknown"``, and segments/words to
            empty lists.
            """
            segments = []
            for seg in getattr(response, "segments", None) or []:
                words = [
                    Word(
                        word=word.word,
                        start=word.start,
                        end=word.end,
                        confidence=getattr(word, "confidence", None),
                    )
                    for word in (getattr(seg, "words", None) or [])
                ]
                segments.append(
                    Segment(
                        id=getattr(seg, "id", 0),
                        seek=getattr(seg, "seek", 0),
                        text=seg.text,
                        start=seg.start,
                        end=seg.end,
                        words=words,
                        # The segment's avg_logprob is surfaced as its confidence.
                        confidence=getattr(seg, "avg_logprob", None),
                    )
                )

            return TranscriptionResult(
                text=getattr(response, "text", ""),
                language=getattr(response, "language", "unknown"),
                confidence=getattr(response, "confidence", None),
                segments=segments,
            )


================================================
FILE: aisuite/providers/sambanova_provider.py
================================================
import os
from aisuite.provider import Provider, LLMError
from openai import OpenAI
from aisuite.providers.message_converter import OpenAICompliantMessageConverter


class SambanovaMessageConverter(OpenAICompliantMessageConverter):
    """
    Message converter used by the SambaNova provider.

    Adds no overrides; all behavior comes from OpenAICompliantMessageConverter.
    """


class SambanovaProvider(Provider):
    """
    SambaNova Provider using OpenAI client for API calls.
    """

    def __init__(self, **config):
        """
        Initialize the SambaNova provider with the given configuration.
        Pass the entire configuration dictionary to the OpenAI client constructor.

        Args:
            **config: Keyword arguments for the OpenAI client. ``api_key``
                falls back to the ``SAMBANOVA_API_KEY`` environment variable
                when absent or empty. ``base_url`` is always set to the
                SambaNova endpoint.

        Raises:
            ValueError: If no API key can be resolved.
        """
        # `or` (rather than a dict.get default) also covers an explicit
        # api_key=None, so the environment variable is still consulted.
        self.api_key = config.get("api_key") or os.getenv("SAMBANOVA_API_KEY")
        if not self.api_key:
            raise ValueError(
                "Sambanova API key is missing. Please provide it in the config or set the SAMBANOVA_API_KEY environment variable."
            )

        config["api_key"] = self.api_key
        config["base_url"] = "https://api.sambanova.ai/v1/"
        # Pass the entire config to the OpenAI client constructor
        self.client = OpenAI(**config)
        self.transformer = SambanovaMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Makes a request to the SambaNova chat completions endpoint using the OpenAI client.

        Args:
            model: Model identifier forwarded to the API.
            messages: Conversation messages; converted before sending.
            **kwargs: Additional arguments passed through to the API.

        Returns:
            The converter's representation of the dumped API response.

        Raises:
            LLMError: Wraps any exception raised during conversion or the API
                call; the original exception is attached as the cause.
        """
        try:
            # Transform messages using converter
            transformed_messages = self.transformer.convert_request(messages)

            response = self.client.chat.completions.create(
                model=model,
                messages=transformed_messages,
                **kwargs,  # Pass any additional arguments to the Sambanova API
            )
            return self.transformer.convert_response(response.model_dump())
        except Exception as e:
            raise LLMError(f"An error occurred: {e}") from e


================================================
FILE: aisuite/providers/together_provider.py
================================================
import os
import httpx
from aisuite.provider import Provider, LLMError
from aisuite.providers.message_converter import OpenAICompliantMessageConverter


class TogetherMessageConverter(OpenAICompliantMessageConverter):
    """
    Message converter used by the Together provider.

    Adds no overrides; all behavior comes from OpenAICompliantMessageConverter.
    """


class TogetherProvider(Provider):
    """
    Together AI Provider using httpx for direct API calls.
    """

    BASE_URL = "https://api.together.xyz/v1/chat/completions"

    def __init__(self, **config):
        """
        Initialize the Together provider with the given configuration.
        The API key is fetched from the config or environment variables.

        Args:
            **config: ``api_key`` (falls back to ``TOGETHER_API_KEY`` when
                absent or empty) and optional ``timeout`` (defaults to 30).

        Raises:
            ValueError: If no API key can be resolved.
        """
        # `or` also covers an explicit api_key=None, which a dict.get default
        # would not replace with the environment value.
        self.api_key = config.get("api_key") or os.getenv("TOGETHER_API_KEY")
        if not self.api_key:
            raise ValueError(
                "Together API key is missing. Please provide it in the config or set the TOGETHER_API_KEY environment variable."
            )

        # Optionally set a custom timeout (default to 30s)
        self.timeout = config.get("timeout", 30)
        self.transformer = TogetherMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Makes a request to the Together AI chat completions endpoint using httpx.

        Args:
            model: Model identifier placed in the request body.
            messages: Conversation messages; converted before sending.
            **kwargs: Additional fields merged into the JSON request body.

        Returns:
            The converter's representation of the JSON response.

        Raises:
            LLMError: On a non-success HTTP status or any other failure during
                the request; the original exception is attached as the cause.
        """
        # Transform messages using converter
        transformed_messages = self.transformer.convert_request(messages)

        headers = {
            "Authorization": f"Bearer {self.api_key}",
            "Content-Type": "application/json",
        }

        data = {
            "model": model,
            "messages": transformed_messages,
            **kwargs,  # Pass any additional arguments to the API
        }

        try:
            # Make the request to Together AI endpoint.
            response = httpx.post(
                self.BASE_URL, json=data, headers=headers, timeout=self.timeout
            )
            response.raise_for_status()
            return self.transformer.convert_response(response.json())
        except httpx.HTTPStatusError as http_err:
            raise LLMError(f"Together AI request failed: {http_err}") from http_err
        except Exception as e:
            raise LLMError(f"An error occurred: {e}") from e


================================================
FILE: aisuite/providers/watsonx_provider.py
================================================
from aisuite.provider import Provider
import os
from ibm_watsonx_ai import Credentials
from ibm_watsonx_ai.foundation_models import ModelInference
from aisuite.framework import ChatCompletionResponse


class WatsonxProvider(Provider):
    """Provider that runs chat requests through IBM watsonx ``ModelInference``."""

    def __init__(self, **config):
        """
        Resolve the service URL, API key and project id.

        Each value is read from ``config`` first and from its ``WATSONX_*``
        environment variable when the config value is missing or falsy.

        Raises:
            EnvironmentError: If any of the three settings is unresolved.
        """

        def resolve(key, env_name):
            # Config wins; the environment is only consulted as a fallback.
            return config.get(key) or os.getenv(env_name)

        self.service_url = resolve("service_url", "WATSONX_SERVICE_URL")
        self.api_key = resolve("api_key", "WATSONX_API_KEY")
        self.project_id = resolve("project_id", "WATSONX_PROJECT_ID")

        if not (self.service_url and self.api_key and self.project_id):
            raise EnvironmentError(
                "Missing one or more required WatsonX environment variables: "
                "WATSONX_SERVICE_URL, WATSONX_API_KEY, WATSONX_PROJECT_ID. "
                "Please refer to the setup guide: /guides/watsonx.md."
            )

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Run a chat request against the given watsonx model.

        A new ``ModelInference`` is built for every call. ``messages`` are
        passed through as-is and ``kwargs`` are sent as the ``params`` dict.

        Returns:
            The normalized response (see ``normalize_response``).
        """
        credentials = Credentials(
            api_key=self.api_key,
            url=self.service_url,
        )
        inference = ModelInference(
            model_id=model,
            credentials=credentials,
            project_id=self.project_id,
        )

        raw_response = inference.chat(messages=messages, params=kwargs)
        return self.normalize_response(raw_response)

    def normalize_response(self, response):
        """
        Copy the first choice's message content into a ChatCompletionResponse.

        Only the content is carried over; nothing else from ``response`` is
        read.
        """
        normalized = ChatCompletionResponse()
        first_choice = response["choices"][0]
        normalized.choices[0].message.content = first_choice["message"]["content"]
        return normalized


================================================
FILE: aisuite/providers/xai_provider.py
================================================
import os
import httpx
from aisuite.provider import Provider, LLMError
from aisuite.framework import ChatCompletionResponse
from aisuite.providers.message_converter import OpenAICompliantMessageConverter


class XaiMessageConverter(OpenAICompliantMessageConverter):
    """
    Message converter used by the xAI provider.

    Adds no overrides; all behavior comes from OpenAICompliantMessageConverter.
    """


class XaiProvider(Provider):
    """
    xAI Provider using httpx for direct API calls.
    """

    BASE_URL = "https://api.x.ai/v1/chat/completions"

    def __init__(self, **config):
        """
        Initialize the xAI provider with the given configuration.
        The API key is fetched from the config or environment variables.

        Args:
            **config: ``api_key`` (falls back to ``XAI_API_KEY`` when absent
                or empty) and optional ``timeout`` (defaults to 30).

        Raises:
            ValueError: If no API key can be resolved.
        """
        # `or` also covers an explicit api_key=None, which a dict.get default
        # would not replace with the environment value.
        self.api_key = config.get("api_key") or os.getenv("XAI_API_KEY")
        if not self.api_key:
            raise ValueError(
                "xAI API key is missing. Please provide it in the config or set the XAI_API_KEY environment variable."
            )

        # Optionally set a custom timeout (default to 30s)
        self.timeout = config.get("timeout", 30)
        self.transformer = XaiMessageConverter()

    def chat_completions_create(self, model, messages, **kwargs):
        """
        Makes a request to the xAI chat completions endpoint using httpx.

        Args:
            model: Model identifier placed in the request body.
            messages: Conversation messages; converted before sending.
            **kwargs: Additional fields merged into the JSON request body.

        Returns:
            The converter's representation of the JSON response.

        Raises:
            LLMError: On a non-success HTTP status or any other failure during
                the request; the original exception is attached as the cause.
        """
        # Transform messages using converter
        transformed_messages = self.transformer.convert_request(messages)

        headers = {
            "Authorization": f"Bearer {self.api_key}",
            "Content-Type": "application/json",
        }

        data = {
            "model": model,
            "messages": transformed_messages,
            **kwargs,  # Pass any additional arguments to the API
        }

        try:
            # Make the request to xAI endpoint.
            response = httpx.post(
                self.BASE_URL, json=data, headers=headers, timeout=self.timeout
            )
            response.raise_for_status()
            return self.transformer.convert_response(response.json())
        except httpx.HTTPStatusError as http_err:
            raise LLMError(f"xAI request failed: {http_err}") from http_err
        except Exception as e:
            raise LLMError(f"An error occurred: {e}") from e


================================================
FILE: aisuite/utils/tools.py
================================================
from typing import Callable, Dict, Any, Type, Optional, get_origin, get_args, Union
from pydantic import BaseModel, create_model, Field, ValidationError
import inspect
import json
from docstring_parser import parse


class Tools:
    """
    Registry of Python callables exposed to a model as function-calling tools.

    For every registered tool the registry keeps the callable itself, a
    Pydantic model used to validate call arguments, and a spec dictionary
    (name, description, JSON-schema-like parameters).
    """

    def __init__(self, tools: Optional[list[Callable]] = None):
        """Register each callable in ``tools`` (if any), inferring its spec."""
        self._tools = {}
        for tool in tools or []:
            self._add_tool(tool)

    # Add a tool function with or without a Pydantic model.
    def _add_tool(self, func: Callable, param_model: Optional[Type[BaseModel]] = None):
        """Register a tool function with metadata. If no param_model is provided, infer from function signature."""
        # Check if this is an MCP tool with original schema
        if getattr(func, "__mcp_input_schema__", None):
            # Use the original MCP schema directly to preserve all JSON Schema details
            tool_spec = self._convert_mcp_schema_to_tool_spec(func)
            # Create Pydantic model from MCP schema for validation
            param_model = self._create_pydantic_model_from_mcp_schema(func)
        elif param_model:
            tool_spec = self._convert_to_tool_spec(func, param_model)
        else:
            tool_spec, param_model = self.__infer_from_signature(func)

        self._tools[func.__name__] = {
            "function": func,
            "param_model": param_model,
            "spec": tool_spec,
        }

    # Return tools in the specified format (default OpenAI).
    def tools(self, format="openai") -> list:
        """
        Return tools in the specified format (default OpenAI).

        Any format other than ``"openai"`` yields the raw spec dictionaries.
        """
        if format == "openai":
            return self.__convert_to_openai_format()
        return [tool["spec"] for tool in self._tools.values()]

    def _unwrap_optional(self, field_type: Type) -> tuple[Type, bool]:
        """
        Unwrap Optional[T] to get the base type T.

        Both ``Optional[T]`` / ``Union[T, None]`` and the PEP 604 spelling
        ``T | None`` are recognised. Unions with more than one non-None
        member are returned unchanged.

        Returns:
            tuple: (base_type, is_optional)
        """
        # Local import keeps this block self-contained; UnionType only exists
        # on Python 3.10+, hence the getattr guard.
        import types as _types

        pep604_union = getattr(_types, "UnionType", None)
        origin = get_origin(field_type)
        is_union = origin is Union or (
            pep604_union is not None and origin is pep604_union
        )
        if is_union:
            args = get_args(field_type)
            # Optional[T] is Union[T, None]
            if type(None) in args:
                non_none_types = [arg for arg in args if arg is not type(None)]
                if len(non_none_types) == 1:
                    return non_none_types[0], True
        return field_type, False

    # Convert the function and its Pydantic model to a unified tool specification.
    def _convert_to_tool_spec(
        self, func: Callable, param_model: Type[BaseModel]
    ) -> Dict[str, Any]:
        """
        Convert the function and its Pydantic model to a unified tool specification.

        Args:
            func: The tool callable; supplies the spec's name and description.
            param_model: Pydantic model whose fields describe the parameters.

        Returns:
            Dict with ``name``, ``description`` and a ``parameters`` object
            schema (``properties`` plus the list of ``required`` names).
        """
        type_mapping = {str: "string", int: "integer", float: "number", bool: "boolean"}

        properties = {}
        for field_name, field in param_model.model_fields.items():
            # Unwrap Optional[T] to get base type T
            field_type, _is_optional = self._unwrap_optional(field.annotation)
            has_default = str(field.default) != "PydanticUndefined"

            if hasattr(field_type, "__members__"):  # Check if it's an enum
                prop = {
                    "type": "string",
                    "enum": [
                        member.value if hasattr(member, "value") else member.name
                        for member in field_type
                    ],
                    "description": field.description or "",
                }
                # Emit the enum member's underlying value as the default.
                if has_default:
                    prop["default"] = (
                        field.default.value
                        if hasattr(field.default, "value")
                        else field.default
                    )
            else:
                prop = {
                    # Unmapped types fall back to their string representation.
                    "type": type_mapping.get(field_type, str(field_type)),
                    "description": field.description or "",
                }
                if has_default:
                    prop["default"] = field.default
            properties[field_name] = prop

        return {
            "name": func.__name__,
            "description": func.__doc__ or "",
            "parameters": {
                "type": "object",
                "properties": properties,
                # is_required is a method on pydantic v2 FieldInfo; it must be
                # called, otherwise the bound method is always truthy.
                "required": [
                    name
                    for name, field in param_model.model_fields.items()
                    if field.is_required()
                ],
            },
        }

    def __extract_param_descriptions(self, func: Callable) -> dict[str, str]:
        """Extract parameter descriptions from function docstring.

        Args:
            func: The function to extract parameter descriptions from

        Returns:
            Dictionary mapping parameter names to their descriptions
        """
        parsed_docstring = parse(inspect.getdoc(func) or "")
        return {
            param.arg_name: param.description or ""
            for param in parsed_docstring.params
        }

    def _convert_mcp_schema_to_tool_spec(self, func: Callable) -> Dict[str, Any]:
        """
        Convert MCP tool with original inputSchema to tool spec.

        This preserves the original JSON Schema from MCP without round-trip conversion,
        avoiding information loss for complex types like arrays and nested objects.

        Args:
            func: MCP tool wrapper with __mcp_input_schema__ attribute

        Returns:
            Tool specification compatible with OpenAI format
        """
        return {
            "name": func.__name__,
            "description": func.__doc__ or "",
            "parameters": func.__mcp_input_schema__,  # Use original schema directly!
        }

    def _create_pydantic_model_from_mcp_schema(self, func: Callable) -> Type[BaseModel]:
        """
        Create a Pydantic model from MCP inputSchema for parameter validation.

        This is needed for the execute() method to validate tool call arguments.
        Parameters listed in the schema's ``required`` array become required
        fields; all others default to None.

        Args:
            func: MCP tool wrapper with __mcp_input_schema__ attribute

        Returns:
            Pydantic model for parameter validation
        """
        from ..mcp.schema_converter import mcp_schema_to_annotations

        input_schema = func.__mcp_input_schema__
        properties = input_schema.get("properties", {})
        required = input_schema.get("required", [])

        # Get type annotations from MCP schema
        annotations = mcp_schema_to_annotations(input_schema)

        fields = {}
        for param_name, param_type in annotations.items():
            description = properties.get(param_name, {}).get("description", "")
            if param_name in required:
                field_info = Field(..., description=description)
            else:
                field_info = Field(default=None, description=description)
            fields[param_name] = (param_type, field_info)

        return create_model(f"{func.__name__.capitalize()}Params", **fields)

    def __infer_from_signature(
        self, func: Callable
    ) -> tuple[Dict[str, Any], Type[BaseModel]]:
        """
        Infer parameters(required and optional) and requirements directly from the function signature.

        Args:
            func: The tool callable; every parameter must be type-annotated.

        Returns:
            Tuple of (tool spec, dynamically created Pydantic model).

        Raises:
            TypeError: If a parameter has no type annotation.
        """
        signature = inspect.signature(func)
        empty = inspect.Parameter.empty

        # Get function's docstring and parse parameter descriptions
        param_descriptions = self.__extract_param_descriptions(func)

        # Parse the docstring to get the main function description
        parsed_docstring = parse(inspect.getdoc(func) or "")
        function_description = parsed_docstring.short_description or ""
        if parsed_docstring.long_description:
            function_description += "\n\n" + parsed_docstring.long_description

        fields = {}
        for param_name, param in signature.parameters.items():
            # Identity checks against the sentinel: `==` would invoke the
            # default value's own __eq__, which may not return a plain bool.
            if param.annotation is empty:
                raise TypeError(
                    f"Parameter '{param_name}' in function '{func.__name__}' must have a type annotation."
                )

            description = param_descriptions.get(param_name, "")
            if param.default is empty:
                field_info = Field(..., description=description)
            else:
                field_info = Field(default=param.default, description=description)
            fields[param_name] = (param.annotation, field_info)

        # Dynamically create a Pydantic model based on inferred fields
        param_model = create_model(f"{func.__name__.capitalize()}Params", **fields)

        # Convert inferred model to a tool spec format
        tool_spec = self._convert_to_tool_spec(func, param_model)

        # Update the tool spec with the parsed function description instead of raw docstring
        tool_spec["description"] = function_description

        return tool_spec, param_model

    def __convert_to_openai_format(self) -> list:
        """Convert tools to OpenAI's format."""
        return [
            {"type": "function", "function": tool["spec"]}
            for tool in self._tools.values()
        ]

    def results_to_messages(self, results: list, message: Any) -> list:
        """
        Converts results to messages.

        Args:
            results: Dicts with ``tool_call_id``, ``name`` and ``content``.
            message: Assistant message whose ``tool_calls`` carry the ids to
                match against.

        Returns:
            One ``role="tool"`` message per result whose id matches a tool
            call; an empty list when there is nothing to match.
        """
        # if message is empty return empty list
        if not message or not results:
            return []

        # A message without tool calls simply matches nothing.
        tool_calls = getattr(message, "tool_calls", None) or []

        messages = []
        for result in results:
            # Find matching tool call from message.tool_calls (first match wins)
            for tool_call in tool_calls:
                if tool_call.id == result["tool_call_id"]:
                    messages.append(
                        {
                            "role": "tool",
                            "name": result["name"],
                            "content": json.dumps(result["content"]),
                            "tool_call_id": tool_call.id,
                        }
                    )
                    break

        return messages

    def _run_tool_call(self, tool_call) -> tuple[str, Any]:
        """
        Validate and execute a single tool call.

        Accepts dictionary or object-style tool calls. String arguments are
        decoded as JSON; missing or blank arguments are treated as ``{}``.

        Returns:
            Tuple of (tool name, value returned by the tool function).

        Raises:
            ValueError: If the tool is not registered or validation fails.
        """
        if isinstance(tool_call, dict):
            tool_name = tool_call["function"]["name"]
            arguments = tool_call["function"]["arguments"]
        else:
            tool_name = tool_call.function.name
            arguments = tool_call.function.arguments

        # Ensure arguments is a dict
        if arguments is None:
            arguments = {}
        elif isinstance(arguments, str):
            arguments = json.loads(arguments) if arguments.strip() else {}

        if tool_name not in self._tools:
            raise ValueError(f"Tool '{tool_name}' not registered.")

        tool = self._tools[tool_name]
        tool_func = tool["function"]
        param_model = tool["param_model"]

        # Validate and parse the arguments with Pydantic, then call the tool.
        try:
            validated_args = param_model(**arguments)
            return tool_name, tool_func(**validated_args.model_dump())
        except ValidationError as e:
            raise ValueError(f"Error in tool '{tool_name}' parameters: {e}") from e

    def execute(self, tool_calls) -> list:
        """Executes registered tools based on the tool calls from the model.

        Args:
            tool_calls: List of tool calls from the model

        Returns:
            List of results from executing each tool call
        """
        # Handle single tool call or list of tool calls
        if not isinstance(tool_calls, list):
            tool_calls = [tool_calls]

        return [self._run_tool_call(tool_call)[1] for tool_call in tool_calls]

    def execute_tool(self, tool_calls) -> tuple[list, list]:
        """Executes registered tools based on the tool calls from the model.

        Args:
            tool_calls: List of tool calls from the model

        Returns:
            Tuple ``(results, messages)``: the raw results and the matching
            ``role="tool"`` messages, in call order
        """
        results = []
        messages = []

        # Handle single tool call or list of tool calls
        if not isinstance(tool_calls, list):
            tool_calls = [tool_calls]

        for tool_call in tool_calls:
            # The id is read before the call runs, so a call without one
            # fails before its tool executes.
            if isinstance(tool_call, dict):
                tool_call_id = tool_call["id"]
            else:
                tool_call_id = tool_call.id

            tool_name, result = self._run_tool_call(tool_call)
            results.append(result)
            messages.append(
                {
                    "role": "tool",
                    "name": tool_name,
                    "content": json.dumps(result),
                    "tool_call_id": tool_call_id,
                }
            )

        return results, messages


================================================
FILE: aisuite/utils/utils.py
================================================
"""Utility functions for aisuite."""

import json
from unittest.mock import MagicMock
from pydantic import BaseModel


# pylint: disable=too-few-public-methods
class Utils:
    """
    Debugging helpers for dumping arbitrary objects in a readable form.
    """

    @staticmethod
    def spew(obj):
        """
        Print ``obj`` to stdout as indented JSON.

        Values the ``json`` module cannot serialize natively are routed
        through a fallback encoder that understands MagicMock instances,
        Pydantic models, objects exposing ``__dict__`` and sets; anything
        else is rendered with ``str()``. An object reaching the fallback
        encoder a second time is replaced by a "Circular reference" marker
        instead of being expanded again.
        """
        seen_ids = set()

        def _mock_label(mock):
            # Mocks are summarized by name rather than expanded, which avoids
            # circular reference errors in tests.
            try:
                # pylint: disable=protected-access
                mock_name = mock._extract_mock_name()
            # pylint: disable=broad-exception-caught
            except Exception:
                mock_name = "unknown"
            return f'<MagicMock name="{mock_name}">'

        def _encode_fallback(value):
            if isinstance(value, MagicMock):
                return _mock_label(value)

            # Remember every object handled here so that a repeat visit is
            # reported as a marker string instead of being expanded again.
            identity = id(value)
            if identity in seen_ids:
                return f"<Circular reference to {type(value).__name__} at {identity}>"
            seen_ids.add(identity)

            if isinstance(value, BaseModel):
                # Pydantic models know how to turn themselves into a dict.
                encoded = value.model_dump()
            elif hasattr(value, "__dict__"):
                # Generic objects are represented by their attribute dict.
                encoded = value.__dict__
            elif isinstance(value, set):
                # JSON has no set type; emit the members as a list.
                encoded = list(value)
            else:
                # Last resort: the string form of the value.
                try:
                    encoded = str(value)
                # pylint: disable=broad-exception-caught
                except Exception:
                    encoded = f"<Unserializable: {type(value).__name__}>"
            return encoded

        rendered = json.dumps(obj, default=_encode_fallback, indent=2)
        print(rendered)


================================================
FILE: aisuite-js/README.md
================================================
# AISuite

AISuite is a unified TypeScript library that provides a single, consistent interface for interacting with multiple Large Language Model (LLM) providers. The library uses OpenAI's API format as the standard interface while supporting OpenAI and Anthropic Claude.

npm package - `npm i aisuite`

## Features

- **Unified API**: Single interface compatible with OpenAI's API structure
- **Multi-Provider Support**: Currently supports OpenAI and Anthropic
- **Provider Selection**: Use `provider:model` format (e.g., `openai:gpt-4o`, `anthropic:claude-3-haiku-20240307`)
- **Tool Calling**: Transparent tool/function calling across all providers
- **Streaming**: Real-time streaming responses with consistent API
- **Type Safety**: Full TypeScript support with comprehensive type definitions
- **Error Handling**: Unified error handling across providers
- **Speech-to-Text**: Automatic Speech Recognition (ASR) support with multiple providers (OpenAI Whisper, Deepgram)

## Installation

```bash
npm install aisuite
```

## Quick Start

```typescript
import { Client } from 'aisuite';

const client = new Client({
  openai: { 
    apiKey: process.env.OPENAI_API_KEY,    
  },
  anthropic: { apiKey: process.env.ANTHROPIC_API_KEY },
  deepgram: { apiKey: process.env.DEEPGRAM_API_KEY },
});

// Use any provider with identical interface
const response = await client.chat.completions.create({
  model: 'openai:gpt-4o',
  messages: [
    { role: 'system', content: 'You are a helpful assistant.' },
    { role: 'user', content: 'Hello!' }
  ],
});

console.log(response.choices[0].message.content);
```

## Usage Examples

### Basic Chat Completion

```typescript
// OpenAI
const openaiResponse = await client.chat.completions.create({
  model: 'openai:gpt-4o',
  messages: [
    { role: 'system', content: 'You are a helpful assistant.' },
    { role: 'user', content: 'What is TypeScript?' }
  ],
  temperature: 0.7,
  max_tokens: 1000,
});

// Anthropic - exact same interface
const anthropicResponse = await client.chat.completions.create({
  model: 'anthropic:claude-3-haiku-20240307',
  messages: [
    { role: 'system', content: 'You are a helpful assistant.' },
    { role: 'user', content: 'What is TypeScript?' }
  ],
  temperature: 0.7,
  max_tokens: 1000,
});
```

### Tool/Function Calling

```typescript
const tools = [
  {
    type: 'function' as const,
    function: {
      name: 'get_weather',
      description: 'Get current weather for a location',
      parameters: {
        type: 'object',
        properties: {
          location: { type: 'string', description: 'City name' }
        },
        required: ['location']
      }
    }
  }
];

// Works identically across all providers
const response = await client.chat.completions.create({
  model: 'anthropic:claude-3-haiku-20240307',
  messages: [{ role: 'user', content: 'What\'s the weather in NYC?' }],
  tools,
  tool_choice: 'auto'
});

if (response.choices[0].message.tool_calls) {
  console.log('Tool calls:', response.choices[0].message.tool_calls);
}
```

### Streaming Responses

```typescript
const stream = await client.chat.completions.create({
  model: 'openai:gpt-4o',
  messages: [{ role: 'user', content: 'Tell me a story' }],
  stream: true
});

// TypeScript: cast to AsyncIterable<ChatCompletionChunk>
for await (const chunk of stream as AsyncIterable<ChatCompletionChunk>) {
  process.stdout.write(chunk.choices[0]?.delta?.content || '');
}
```

### Streaming with Abort Controller

```typescript
const controller = new AbortController();

// Abort after 5 seconds
setTimeout(() => controller.abort(), 5000);

const stream = await client.chat.completions.create({
  model: 'anthropic:claude-3-haiku-20240307',
  messages: [{ role: 'user', content: 'Write a long story' }],
  stream: true
}, { signal: controller.signal });

try {
  for await (const chunk of stream as AsyncIterable<ChatCompletionChunk>) {
    process.stdout.write(chunk.choices[0]?.delta?.content || '');
  }
} catch (error) {
  if (error.name === 'AbortError') {
    console.log('Stream aborted');
  }
}
```

### Speech-to-Text Transcription

```typescript
// Initialize client with audio support for OpenAI
const client = new Client({
  openai: { 
    apiKey: process.env.OPENAI_API_KEY,    
  },
  deepgram: { apiKey: process.env.DEEPGRAM_API_KEY }
});

// Using Deepgram
const deepgramResponse = await client.audio.transcriptions.create({
  model: 'deepgram:nova-2',
  file: audioBuffer,  // Buffer containing audio data
  language: 'en-US',
  timestamps: true,
  word_confidence: true,
  speaker_labels: true,
});

// Using OpenAI Whisper
const openaiResponse = await client.audio.transcriptions.create({
  model: 'openai:whisper-1',
  file: audioBuffer,
  language: 'en',
  response_format: 'verbose_json',
  temperature: 0,
  timestamps: true,
});

console.log('Transcribed Text:', openaiResponse.text);
console.log('Words with timestamps:', openaiResponse.words);
```

### Error Handling

```typescript
import { AISuiteError, ProviderNotConfiguredError } from 'aisuite';

try {
  const response = await client.chat.completions.create({
    model: 'invalid:model',
    messages: [{ role: 'user', content: 'Hello' }]
  });
} catch (error) {
  if (error instanceof ProviderNotConfiguredError) {
    console.error('Provider not configured:', error.message);
  } else if (error instanceof AISuiteError) {
    console.error('AISuite error:', error.message, error.provider);
  } else {
    console.error('Unknown error:', error);
  }
}
```

## API Reference

### Client Configuration

```typescript
const client = new Client({
  openai?: {
    apiKey: string;
    baseURL?: string;
    organization?: string;    
  },
  anthropic?: {
    apiKey: string;
    baseURL?: string;
  },
  deepgram?: {
    apiKey: string;
    baseURL?: string;
  }
});
```

### Chat Completion Request

All providers use the standard OpenAI chat completion format:

```typescript
interface ChatCompletionRequest {
  model: string;              // "provider:model" format
  messages: ChatMessage[];
  tools?: Tool[];
  tool_choice?: ToolChoice;
  temperature?: number;
  max_tokens?: number;
  stop?: string | string[];
  stream?: boolean;
}
```

### Transcription Request

All ASR providers use a standard transcription request format with additional provider-specific parameters:

```typescript
interface TranscriptionRequest {
  model: string;              // "provider:model" format
  file: Buffer;              // Audio file as Buffer
  language?: string;         // Language code (e.g., "en", "en-US")
  timestamps?: boolean;      // Include word-level timestamps
  [key: string]: any;        // Additional provider-specific parameters:
                            // For OpenAI: See https://platform.openai.com/docs/api-reference/audio/createTranscription
                            // For Deepgram: See https://developers.deepgram.com/reference/speech-to-text-api/listen  
}
```

### Helper Methods

```typescript
// List all configured providers (including ASR)
client.listProviders(); // ['openai', 'anthropic']
client.listASRProviders(); // ['deepgram', 'openai']

// Check if a provider is configured
client.isProviderConfigured('openai'); // true
client.isASRProviderConfigured('deepgram'); // true
```

## Current Limitations

- Only OpenAI and Anthropic providers are currently supported for chat (Gemini, Mistral, and Bedrock coming soon)
- Tool calling requires handling tool responses manually
- Streaming tool calls require manual accumulation of arguments
- ASR support is limited to OpenAI Whisper (requires explicit audio configuration) and Deepgram
- Some provider-specific ASR features might require using provider-specific parameters

## Development

```bash
# Install dependencies
npm install

# Build the project
npm run build

# Run tests
npm test

# Run examples
# Run basic usage example only:
npm run example:basic
# Run tool calling example only:
npm run example:tools
# Run the full test suite:
npm run test:examples
```

## License

MIT


================================================
FILE: aisuite-js/examples/basic-usage.ts
================================================
import 'dotenv/config';
import { Client } from '../src';

/**
 * Walks through the basic chat-completion flow: builds a client for OpenAI
 * and Anthropic, sends the same prompt to each provider in turn, and finally
 * issues a request with an unknown provider to show the error path.
 * Each request is wrapped in its own try/catch so one failure does not stop
 * the remaining examples.
 */
async function main() {
  // One client, configured with the API keys of both chat providers
  const client = new Client({
    openai: { apiKey: process.env.OPENAI_API_KEY! },
    anthropic: { apiKey: process.env.ANTHROPIC_API_KEY! },
  });

  console.log('Available providers:', client.listProviders());

  // Examples 1 and 2: the identical request, sent to each provider in order
  const chatExamples = [
    { label: 'OpenAI', model: 'openai:gpt-4o-mini' },
    { label: 'Anthropic', model: 'anthropic:claude-3-haiku-20240307' },
  ];

  for (const { label, model } of chatExamples) {
    console.log(`\n--- ${label} Example ---`);
    try {
      const completion = await client.chat.completions.create({
        model,
        messages: [
          { role: 'system', content: 'You are a helpful assistant.' },
          { role: 'user', content: 'What is TypeScript in one sentence?' }
        ],
        temperature: 0.7,
        max_tokens: 100,
      });

      console.log(`${label} Response:`, completion.choices[0].message.content);
      console.log('Usage:', completion.usage);
      console.log('Full response:', JSON.stringify(completion, null, 2));
    } catch (error) {
      console.error(`${label} Error:`, error);
    }
  }

  // Example 3: Error handling - the provider prefix is not a configured one
  console.log('\n--- Error Handling Example ---');
  try {
    await client.chat.completions.create({
      model: 'invalid:model',
      messages: [{ role: 'user', content: 'Hello' }]
    });
  } catch (error) {
    console.error('Expected error:', error);
  }
}

// Kick off the examples; anything that escapes main() is printed
main().catch(console.error);

================================================
FILE: aisuite-js/examples/chat-app/.eslintrc.cjs
================================================
module.exports = {
  root: true,
  env: { browser: true, es2020: true },
  extends: [
    'eslint:recommended',
    '@typescript-eslint/recommended',
    'plugin:react-hooks/recommended',
  ],
  ignorePatterns: ['dist', '.eslintrc.cjs'],
  parser: '@typescript-eslint/parser',
  plugins: ['react-refresh'],
  rules: {
    'react-refresh/only-export-components': [
      'warn',
      { allowConstantExport: true },
    ],
  },
} 

================================================
FILE: aisuite-js/examples/chat-app/.gitignore
================================================
# Logs
logs
*.log
npm-debug.log*
yarn-debug.log*
yarn-error.log*
pnpm-debug.log*
lerna-debug.log*

node_modules
dist
dist-ssr
*.local

# Editor directories and files
.vscode/*
!.vscode/extensions.json
.idea
.DS_Store
*.suo
*.ntvs*
*.njsproj
*.sln
*.sw?

# Environment variables
.env
.env.local
.env.development.local
.env.test.local
.env.production.local 

================================================
FILE: aisuite-js/examples/chat-app/README.md
================================================
# AISuite Chat App

A modern React TypeScript chat application built with AISuite, allowing you to chat with multiple AI models and compare their responses in real-time.

## Features

- **Multi-Provider Support**: Chat with OpenAI, Anthropic, Groq, and Mistral models
- **Comparison Mode**: Compare responses from two different AI models side-by-side
- **Modern UI**: Clean, responsive interface built with React and Tailwind CSS
- **Real-time Chat**: Instant messaging with AI models
- **API Key Management**: Secure storage and management of API keys
- **Error Handling**: Comprehensive error handling and user feedback
- **TypeScript**: Full type safety throughout the application

## Prerequisites

- Node.js 18+ 
- npm or yarn
- API keys for the AI providers you want to use:
  - OpenAI API key
  - Anthropic API key
  - Groq API key
  - Mistral API key

## Installation

1. Clone the repository and navigate to the chat app directory:
```bash
cd aisuite-js/examples/chat-app
```

2. Install dependencies:
```bash
npm install
```

3. Start the development server:
```bash
npm run dev
```

4. Open your browser and navigate to `http://localhost:3000`

## Configuration

### API Keys

1. Click the "Configure API Keys" button in the header
2. Enter your API keys for the providers you want to use
3. Click "Save" to store the configuration

The app will automatically save your API keys to localStorage for future use.

### Supported Models

The app comes pre-configured with the following models:

**OpenAI:**
- GPT-4o
- GPT-4o Mini

**Anthropic:**
- Claude 3.5 Sonnet
- Claude 3 Haiku

**Groq:**
- Llama 3.1 8B
- Mixtral 8x7B

**Mistral:**
- Mistral 7B
- Mistral Large

## Usage

### Basic Chat

1. Configure your API keys
2. Select a provider, then choose a model from the dropdown
3. Type your message and press Enter or click Send
4. View the AI response

### Comparison Mode

1. Enable "Comparison Mode" checkbox
2. Select two different models
3. Send a message to see responses from both models side-by-side
4. Compare the different responses and capabilities

### Chat Management

- **Reset Chat**: Click the reset button to clear all chat history
- **Model Switching**: Change models at any time during the conversation
- **Error Handling**: The app displays clear error messages for API issues

## Sample Queries

Try these sample queries to test the different models:

```
"What is the weather in Tokyo?"
```

```
"Write a poem about the weather in Tokyo."
```

```
"Write a python program to print the fibonacci sequence."
```

```
"Write test cases for this program."
```

## Development

### Project Structure

```
src/
├── components/          # React components
│   ├── ApiKeyModal.tsx
│   ├── ChatContainer.tsx
│   ├── ChatInput.tsx
│   ├── ChatMessage.tsx
│   ├── ModelSelector.tsx
│   └── ProviderSelector.tsx
├── config/             # Configuration files
│   └── llm-config.ts
├── services/           # Business logic
│   └── aisuite-service.ts
├── types/              # TypeScript type definitions
│   └── chat.ts
├── App.tsx            # Main application component
├── main.tsx           # Application entry point
└── index.css          # Global styles
```

### Available Scripts

- `npm run dev` - Start development server
- `npm run build` - Build for production
- `npm run preview` - Preview production build
- `npm run lint` - Run ESLint

### Adding New Models

To add new models, edit `src/config/llm-config.ts`:

```typescript
export const configuredLLMs: LLMConfig[] = [
  // ... existing models
  {
    name: "Your New Model",
    provider: "provider-name",
    model: "model-name"
  }
];
```

### Styling

The app uses Tailwind CSS for styling. The design system includes:

- Light and dark mode support
- Responsive design
- Custom scrollbars
- Loading animations
- Error states

## Technologies Used

- **React 18** - UI framework
- **TypeScript** - Type safety
- **Vite** - Build tool and dev server
- **Tailwind CSS** - Styling
- **Lucide React** - Icons
- **AISuite** - AI provider abstraction

## Browser Support

- Chrome 90+
- Firefox 88+
- Safari 14+
- Edge 90+

## Contributing

1. Fork the repository
2. Create a feature branch
3. Make your changes
4. Add tests if applicable
5. Submit a pull request

## License

MIT License - see the main repository for details.

## Support

For issues and questions:
- Check the [AISuite documentation](https://github.com/andrewyng/aisuite)
- Open an issue in the repository
- Check the console for error messages

## Security Notes

- API keys are stored in localStorage (client-side only)
- No API keys are sent to any server except the AI providers
- Consider using environment variables for production deployments 

================================================
FILE: aisuite-js/examples/chat-app/index.html
================================================
<!doctype html>
<html lang="en">
  <head>
    <meta charset="UTF-8" />
    <link rel="icon" type="image/svg+xml" href="/vite.svg" />
    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
    <title>AISuite Chat App</title>
  </head>
  <body>
    <div id="root"></div>
    <script type="module" src="/src/main.tsx"></script>
  </body>
</html> 

================================================
FILE: aisuite-js/examples/chat-app/package.json
================================================
{
  "name": "aisuite-chat-app",
  "version": "1.0.0",
  "description": "A React TypeScript chat application using AISuite",
  "private": true,
  "scripts": {
    "dev": "vite",
    "build": "tsc && vite build",
    "preview": "vite preview",
    "lint": "eslint . --ext ts,tsx --report-unused-disable-directives --max-warnings 0"
  },
  "dependencies": {
    "react": "^18.2.0",
    "react-dom": "^18.2.0",    
    "lucide-react": "^0.263.1",
    "clsx": "^2.0.0",
    "tailwind-merge": "^1.14.0"
  },
  "devDependencies": {
    "@types/react": "^18.2.15",
    "@types/react-dom": "^18.2.7",
    "@typescript-eslint/eslint-plugin": "^6.0.0",
    "@typescript-eslint/parser": "^6.0.0",
    "@vitejs/plugin-react": "^4.0.3",
    "autoprefixer": "^10.4.14",
    "eslint": "^8.45.0",
    "eslint-plugin-react-hooks": "^4.6.0",
    "eslint-plugin-react-refresh": "^0.4.3",
    "postcss": "^8.4.27",
    "tailwindcss": "^3.3.3",
    "typescript": "^5.0.2",
    "vite": "^4.4.5"
  }
} 

================================================
FILE: aisuite-js/examples/chat-app/postcss.config.js
================================================
// PostCSS configuration for the chat-app example: registers the Tailwind CSS
// and Autoprefixer plugins, each with an empty options object.
export default {
  plugins: {
    tailwindcss: {},
    autoprefixer: {},
  },
} 

================================================
FILE: aisuite-js/examples/chat-app/src/App.tsx
================================================
import React, { useState, useEffect } from 'react';
import { Settings, AlertCircle } from 'lucide-react';
import { Message, AISuiteConfig } from './types/chat';
import { configuredLLMs, getLLMConfigByName } from './config/llm-config';
import { aiSuiteService } from './services/aisuite-service';
import { ChatContainer } from './components/ChatContainer';
import { ChatInput } from './components/ChatInput';
import { ModelSelector } from './components/ModelSelector';
import { ProviderSelector } from './components/ProviderSelector';
import { ApiKeyModal } from './components/ApiKeyModal';

/**
 * Root component of the chat app.
 *
 * Holds the API-key configuration (persisted in localStorage under
 * 'aisuite-config'), the provider/model selection, and one chat history per
 * model panel. In comparison mode the same user message is sent to two models
 * of the selected provider and the answers are shown side by side.
 */
function App() {
  const [chatHistory1, setChatHistory1] = useState<Message[]>([]);
  const [chatHistory2, setChatHistory2] = useState<Message[]>([]);
  const [isProcessing, setIsProcessing] = useState(false);
  const [useComparisonMode, setUseComparisonMode] = useState(false);
  const [selectedProvider, setSelectedProvider] = useState('');
  const [selectedModel1, setSelectedModel1] = useState('');
  const [selectedModel2, setSelectedModel2] = useState('');
  const [showApiKeyModal, setShowApiKeyModal] = useState(false);
  const [apiConfig, setApiConfig] = useState<AISuiteConfig>({});
  const [error, setError] = useState<string | null>(null);

  // Comparison is only active when the mode is enabled AND a second model is
  // actually selected. The send handler and the rendering below share this
  // flag so they can never disagree about whether a second panel exists.
  const isComparing = useComparisonMode && Boolean(selectedModel2);

  // Initialize AISuite service when API config changes
  useEffect(() => {
    if (Object.keys(apiConfig).length > 0) {
      try {
        aiSuiteService.initialize(apiConfig);
        setError(null);
      } catch (err) {
        setError('Failed to initialize AISuite client');
      }
    }
  }, [apiConfig]);

  // Load API config from localStorage on mount
  useEffect(() => {
    const savedConfig = localStorage.getItem('aisuite-config');
    if (savedConfig) {
      try {
        const config = JSON.parse(savedConfig);
        setApiConfig(config);
      } catch (err) {
        // Keep the underlying parse error visible for debugging
        console.error('Failed to load saved config', err);
      }
    }
  }, []);

  // Sends one user message to the selected model (and to the second model
  // when comparing), appending the user message and each answer to the
  // matching chat history. Failures are surfaced through the error banner.
  const handleSendMessage = async (message: string) => {
    if (!message.trim()) return;

    // Check if provider is selected
    if (!selectedProvider) {
      setError('Please select a provider first');
      return;
    }

    // Check if API key is configured for the selected provider
    if (!apiConfig[selectedProvider as keyof AISuiteConfig]?.apiKey) {
      setError(`API key for ${selectedProvider} is not configured. Please configure it first.`);
      setShowApiKeyModal(true);
      return;
    }

    const userMessage: Message = {
      role: 'user',
      content: message,
      timestamp: new Date()
    };

    setIsProcessing(true);
    setError(null);

    try {
      // Add user message to every active chat history
      setChatHistory1(prev => [...prev, userMessage]);
      if (isComparing) {
        setChatHistory2(prev => [...prev, userMessage]);
      }

      // Get model configurations
      const modelConfig1 = getLLMConfigByName(selectedModel1);
      if (!modelConfig1) {
        throw new Error(`Model ${selectedModel1} not found`);
      }

      // Query first model
      const response1 = await aiSuiteService.queryLLM(modelConfig1, [...chatHistory1, userMessage]);
      const assistantMessage1: Message = {
        role: 'assistant',
        content: response1,
        timestamp: new Date()
      };
      setChatHistory1(prev => [...prev, assistantMessage1]);

      // Query second model only when a second model is really in play;
      // otherwise an empty model name would fail the lookup below.
      if (isComparing) {
        const modelConfig2 = getLLMConfigByName(selectedModel2);
        if (!modelConfig2) {
          throw new Error(`Model ${selectedModel2} not found`);
        }

        const response2 = await aiSuiteService.queryLLM(modelConfig2, [...chatHistory2, userMessage]);
        const assistantMessage2: Message = {
          role: 'assistant',
          content: response2,
          timestamp: new Date()
        };
        setChatHistory2(prev => [...prev, assistantMessage2]);
      }
    } catch (err) {
      setError(err instanceof Error ? err.message : 'An error occurred');
    } finally {
      setIsProcessing(false);
    }
  };

  // Clears both chat histories and any displayed error
  const handleResetChat = () => {
    setChatHistory1([]);
    setChatHistory2([]);
    setError(null);
  };

  // Stores the new API configuration in state and in localStorage
  const handleSaveApiConfig = (config: AISuiteConfig) => {
    setApiConfig(config);
    localStorage.setItem('aisuite-config', JSON.stringify(config));
  };

  // Get all available providers (show all by default)
  const allProviders = ['openai', 'anthropic', 'groq', 'mistral'];
  const availableProviders = allProviders;

  // Get configured providers (those with API keys)
  const configuredProviders = Object.keys(apiConfig).filter(provider =>
    apiConfig[provider as keyof AISuiteConfig]?.apiKey
  );

  // Get models for the selected provider
  const availableModels = selectedProvider
    ? configuredLLMs.filter(model => model.provider === selectedProvider)
    : [];

  // Reset model selections when the provider or the comparison mode changes:
  // model 1 becomes the provider's first model, model 2 its second model
  // (only in comparison mode and only if the provider has one).
  useEffect(() => {
    if (selectedProvider) {
      const providerModels = configuredLLMs.filter(model => model.provider === selectedProvider);
      if (providerModels.length > 0) {
        setSelectedModel1(providerModels[0].name);
        if (useComparisonMode && providerModels.length > 1) {
          setSelectedModel2(providerModels[1].name);
        } else {
          setSelectedModel2('');
        }
      } else {
        setSelectedModel1('');
        setSelectedModel2('');
      }
    } else {
      setSelectedModel1('');
      setSelectedModel2('');
    }
  }, [selectedProvider, useComparisonMode]);

  const hasConfiguredProviders = Object.keys(apiConfig).length > 0;

  return (
    <div className="min-h-screen bg-background">
      {/* Header */}
      <header className="border-b bg-card">
        <div className="container mx-auto px-4 py-4">
          <div className="flex items-center justify-between">
            <h1 className="text-2xl font-bold">AISuite Chat</h1>
            <button
              onClick={() => setShowApiKeyModal(true)}
              className="flex items-center gap-2 rounded-lg border border-input bg-background px-3 py-2 text-sm font-medium ring-offset-background placeholder:text-muted-foreground hover:bg-accent hover:text-accent-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2"
            >
              <Settings className="w-4 h-4" />
              Configure API Keys
            </button>
          </div>
        </div>
      </header>

      {/* Main Content */}
      <main className="container mx-auto px-4 py-6">
        {!hasConfiguredProviders ? (
          <div className="flex items-center justify-center min-h-[400px]">
            <div className="text-center">
              <AlertCircle className="w-12 h-12 text-muted-foreground mx-auto mb-4" />
              <h2 className="text-xl font-semibold mb-2">No API Keys Configured</h2>
              <p className="text-muted-foreground mb-4">
                Please configure your API keys to start chatting with AI models.
              </p>
              <button
                onClick={() => setShowApiKeyModal(true)}
                className="rounded-lg bg-primary px-4 py-2 text-sm font-medium text-primary-foreground hover:bg-primary/90"
              >
                Configure API Keys
              </button>
            </div>
          </div>
        ) : (
          <div className="space-y-6">
            {/* Error Display */}
            {error && (
              <div className="rounded-lg border border-destructive/50 bg-destructive/10 p-4">
                <div className="flex items-center gap-2 text-destructive">
                  <AlertCircle className="w-4 h-4" />
                  <span className="text-sm font-medium">{error}</span>
                </div>
              </div>
            )}

            {/* Controls */}
            <div className="space-y-4">
              {/* Provider Selection */}
              <div className="grid grid-cols-1 md:grid-cols-2 gap-4">
                <ProviderSelector
                  selectedProvider={selectedProvider}
                  onProviderChange={setSelectedProvider}
                  availableProviders={availableProviders}
                  configuredProviders={configuredProviders}
                  label="Select AI Provider"
                  disabled={isProcessing}
                />
                <div className="flex items-center justify-center">
                  <label className="flex items-center gap-2">
                    <input
                      type="checkbox"
                      checked={useComparisonMode}
                      onChange={(e) => setUseComparisonMode(e.target.checked)}
                      className="rounded border-input"
                    />
                    <span className="text-sm font-medium">Comparison Mode</span>
                  </label>
                </div>
              </div>

              {/* Model Selection - Only show if provider is selected */}
              {selectedProvider && (
                <div className="grid grid-cols-1 md:grid-cols-2 gap-4">
                  <ModelSelector
                    selectedModel={selectedModel1}
                    onModelChange={setSelectedModel1}
                    availableModels={availableModels}
                    label="Choose LLM Model 1"
                    disabled={isProcessing}
                  />
                  {useComparisonMode && availableModels.length > 1 && (
                    <ModelSelector
                      selectedModel={selectedModel2}
                      onModelChange={setSelectedModel2}
                      availableModels={availableModels}
                      label="Choose LLM Model 2"
                      disabled={isProcessing}
                    />
                  )}
                </div>
              )}
            </div>

            {/* Chat Containers */}
            {selectedProvider && selectedModel1 && (
              <div className="grid grid-cols-1 gap-6" style={{
                gridTemplateColumns: isComparing ? '1fr 1fr' : '1fr'
              }}>
                <div className="border rounded-lg bg-card h-[500px] flex flex-col">
                  <div className="border-b p-4">
                    <h3 className="font-medium">{selectedModel1}</h3>
                  </div>
                  <div className="flex-1 overflow-hidden">
                    <ChatContainer
                      messages={chatHistory1}
                      modelName={selectedModel1}
                      isLoading={isProcessing}
                    />
                  </div>
                </div>

                {isComparing && (
                  <div className="border rounded-lg bg-card h-[500px] flex flex-col">
                    <div className="border-b p-4">
                      <h3 className="font-medium">{selectedModel2}</h3>
                    </div>
                    <div className="flex-1 overflow-hidden">
                      <ChatContainer
                        messages={chatHistory2}
                        modelName={selectedModel2}
                        isLoading={isProcessing}
                      />
                    </div>
                  </div>
                )}
              </div>
            )}

            {/* No Provider Selected State */}
            {!selectedProvider && hasConfiguredProviders && (
              <div className="flex items-center justify-center min-h-[400px]">
                <div className="text-center">
                  <AlertCircle className="w-12 h-12 text-muted-foreground mx-auto mb-4" />
                  <h2 className="text-xl font-semibold mb-2">Select a Provider</h2>
                  <p className="text-muted-foreground mb-4">
                    Please select an AI provider to start chatting.
                  </p>
                </div>
              </div>
            )}

            {/* Chat Input */}
            <ChatInput
              onSendMessage={handleSendMessage}
              onResetChat={handleResetChat}
              isLoading={isProcessing}
              placeholder={selectedProvider ? "Enter your query..." : "Select a provider to start chatting..."}
              disabled={!selectedProvider}
            />
          </div>
        )}
      </main>

      {/* API Key Modal */}
      <ApiKeyModal
        isOpen={showApiKeyModal}
        onClose={() => setShowApiKeyModal(false)}
        onSave={handleSaveApiConfig}
        initialConfig={apiConfig}
      />
    </div>
  );
}

export default App; 

================================================
FILE: aisuite-js/examples/chat-app/src/components/ApiKeyModal.tsx
================================================
import React, { useState } from 'react';
import { X, Eye, EyeOff } from 'lucide-react';
import { AISuiteConfig } from '../types/chat';

interface ApiKeyModalProps {
  isOpen: boolean;
  onClose: () => void;
  onSave: (config: AISuiteConfig) => void;
  initialConfig?: AISuiteConfig;
}

/** Providers offered in the modal, in display order, with a hint of each key's format. */
const API_KEY_PROVIDERS: ReadonlyArray<{
  id: keyof AISuiteConfig;
  label: string;
  placeholder: string;
}> = [
  { id: 'openai', label: 'OpenAI', placeholder: 'sk-...' },
  { id: 'anthropic', label: 'Anthropic', placeholder: 'sk-ant-...' },
  { id: 'groq', label: 'Groq', placeholder: 'gsk_...' },
  { id: 'mistral', label: 'Mistral', placeholder: '...' },
];

/**
 * Modal dialog for entering one API key per provider.
 *
 * Props:
 * - `isOpen`: when false the component renders nothing.
 * - `onClose`: called by the X button, by Cancel, and after a successful save.
 * - `onSave`: receives only the providers whose key is non-blank; each saved
 *   entry carries the trimmed key and `dangerouslyAllowBrowser: true`.
 * - `initialConfig`: values used to seed the draft each time the modal opens.
 *
 * Edits are kept in a local draft, so Cancel discards them.
 */
export const ApiKeyModal: React.FC<ApiKeyModalProps> = ({
  isOpen,
  onClose,
  onSave,
  initialConfig = {}
}) => {
  const [config, setConfig] = useState<AISuiteConfig>(initialConfig);
  const [showKeys, setShowKeys] = useState<Record<string, boolean>>({});
  const [wasOpen, setWasOpen] = useState(isOpen);

  // The component stays mounted while closed, so re-seed the draft on every
  // closed -> open transition. Without this, edits abandoned via Cancel would
  // reappear and keys revealed earlier would stay revealed. State is adjusted
  // during render (instead of in an effect) to avoid painting a stale draft.
  if (isOpen !== wasOpen) {
    setWasOpen(isOpen);
    if (isOpen) {
      setConfig(initialConfig);
      setShowKeys({});
    }
  }

  const toggleKeyVisibility = (provider: string) => {
    setShowKeys(prev => ({
      ...prev,
      [provider]: !prev[provider]
    }));
  };

  const handleSave = () => {
    // Keep only providers with a non-blank key. Entries are copied rather than
    // mutated because `config` is React state.
    const filteredConfig: AISuiteConfig = {};
    Object.entries(config).forEach(([provider, providerConfig]) => {
      const apiKey = providerConfig?.apiKey?.trim();
      if (!apiKey) {
        return;
      }
      filteredConfig[provider as keyof AISuiteConfig] = {
        ...providerConfig,
        // Store the trimmed key: stray whitespace from a paste is never part of a key.
        apiKey,
        // The example app calls the provider SDKs directly from the browser.
        dangerouslyAllowBrowser: true
      };
    });
    onSave(filteredConfig);
    onClose();
  };

  const updateConfig = (provider: string, field: string, value: string) => {
    setConfig(prev => ({
      ...prev,
      [provider]: {
        ...prev[provider as keyof AISuiteConfig],
        [field]: value
      }
    }));
  };

  if (!isOpen) return null;

  return (
    <div
      className="fixed inset-0 bg-black/50 flex items-center justify-center z-50"
      role="dialog"
      aria-modal="true"
      aria-labelledby="api-key-modal-title"
    >
      <div className="bg-background rounded-lg p-6 w-full max-w-md mx-4">
        <div className="flex items-center justify-between mb-4">
          <h2 id="api-key-modal-title" className="text-lg font-semibold">Configure API Keys</h2>
          <button
            type="button"
            onClick={onClose}
            aria-label="Close"
            className="text-muted-foreground hover:text-foreground"
          >
            <X className="w-5 h-5" />
          </button>
        </div>

        <div className="space-y-4">
          {API_KEY_PROVIDERS.map(({ id, label, placeholder }) => {
            const inputId = `api-key-${id}`;
            const isVisible = Boolean(showKeys[id]);
            return (
              <div key={id} className="space-y-2">
                <label htmlFor={inputId} className="text-sm font-medium">{label}</label>
                <div className="relative">
                  <input
                    id={inputId}
                    type={isVisible ? 'text' : 'password'}
                    placeholder={placeholder}
                    value={config[id]?.apiKey || ''}
                    onChange={(e) => updateConfig(id, 'apiKey', e.target.value)}
                    className="w-full rounded-lg border border-input bg-background px-3 py-2 text-sm ring-offset-background placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2"
                  />
                  <button
                    type="button"
                    onClick={() => toggleKeyVisibility(id)}
                    aria-label={isVisible ? `Hide ${label} API key` : `Show ${label} API key`}
                    className="absolute right-2 top-1/2 -translate-y-1/2 text-muted-foreground hover:text-foreground"
                  >
                    {isVisible ? <EyeOff className="w-4 h-4" /> : <Eye className="w-4 h-4" />}
                  </button>
                </div>
              </div>
            );
          })}
        </div>

        <div className="mt-6 flex gap-2">
          <button
            type="button"
            onClick={onClose}
            className="flex-1 rounded-lg border border-input bg-background px-3 py-2 text-sm font-medium ring-offset-background placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2"
          >
            Cancel
          </button>
          <button
            type="button"
            onClick={handleSave}
            className="flex-1 rounded-lg bg-primary px-3 py-2 text-sm font-medium text-primary-foreground hover:bg-primary/90 focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2"
          >
            Save
          </button>
        </div>
      </div>
    </div>
  );
};

================================================
FILE: aisuite-js/examples/chat-app/src/components/ChatContainer.tsx
================================================
import React, { useRef, useEffect } from 'react';
import { Message } from '../types/chat';
import { ChatMessage } from './ChatMessage';

interface ChatContainerProps {
  messages: Message[];
  modelName: string;
  isLoading?: boolean;
}

/**
 * Scrollable transcript for one model's conversation.
 *
 * Renders an empty-state prompt when `messages` is empty, otherwise one
 * `ChatMessage` per entry, followed by a "Thinking..." bubble while
 * `isLoading` is true. Whenever `messages` changes, the sentinel element at
 * the end of the list is smoothly scrolled into view.
 */
export const ChatContainer: React.FC<ChatContainerProps> = (props) => {
  const { messages, modelName, isLoading = false } = props;
  const bottomSentinelRef = useRef<HTMLDivElement>(null);

  useEffect(() => {
    bottomSentinelRef.current?.scrollIntoView({ behavior: 'smooth' });
  }, [messages]);

  // Placeholder shown before the first message is sent.
  const emptyState = (
    <div className="flex items-center justify-center h-full text-muted-foreground">
      <div className="text-center">
        <div className="text-lg font-medium mb-2">No messages yet</div>
        <div className="text-sm">Start a conversation with {modelName}</div>
      </div>
    </div>
  );

  // Assistant-styled bubble with three staggered bouncing dots.
  const bounceDelays = ['0ms', '150ms', '300ms'];
  const thinkingBubble = (
    <div className="flex gap-3 p-4 justify-start">
      <div className="flex-shrink-0 w-8 h-8 bg-primary rounded-full flex items-center justify-center">
        <div className="w-4 h-4 border-2 border-primary-foreground border-t-transparent rounded-full animate-spin" />
      </div>
      <div className="max-w-[80%]">
        <div className="rounded-lg p-3 bg-muted text-foreground">
          <div className="text-sm font-medium mb-1 opacity-70">
            {modelName}
          </div>
          <div className="flex items-center gap-2">
            <div className="flex gap-1">
              {bounceDelays.map((delay) => (
                <div
                  key={delay}
                  className="w-2 h-2 bg-muted-foreground rounded-full animate-bounce"
                  style={{ animationDelay: delay }}
                />
              ))}
            </div>
            <span className="text-sm text-muted-foreground">Thinking...</span>
          </div>
        </div>
      </div>
    </div>
  );

  const transcript =
    messages.length === 0
      ? emptyState
      : messages.map((entry, position) => (
          <ChatMessage key={position} message={entry} modelName={modelName} />
        ));

  return (
    <div className="flex flex-col h-full">
      <div className="flex-1 overflow-y-auto custom-scrollbar">
        <div className="min-h-full">
          {transcript}

          {isLoading && thinkingBubble}

          <div ref={bottomSentinelRef} />
        </div>
      </div>
    </div>
  );
};

================================================
FILE: aisuite-js/examples/chat-app/src/components/ChatInput.tsx
================================================
import React, { useState, KeyboardEvent } from 'react';
import { Send, RotateCcw } from 'lucide-react';

interface ChatInputProps {
  onSendMessage: (message: string) => void;
  onResetChat: () => void;
  isLoading: boolean;
  placeholder?: string;
  disabled?: boolean;
}

/**
 * Message composer with Send and Reset buttons.
 *
 * Props:
 * - `onSendMessage`: receives the trimmed draft; the draft is then cleared.
 * - `onResetChat`: invoked by the reset button.
 * - `isLoading`: disables the textarea and both buttons and shows a
 *   "Processing..." indicator.
 * - `placeholder`: textarea placeholder text.
 * - `disabled`: disables the textarea and the Send button (Reset stays active).
 *
 * Enter sends the message; Shift+Enter inserts a newline.
 */
export const ChatInput: React.FC<ChatInputProps> = ({
  onSendMessage,
  onResetChat,
  isLoading,
  placeholder = "Enter your query...",
  disabled = false
}) => {
  const [message, setMessage] = useState('');

  const handleSend = () => {
    if (message.trim() && !isLoading && !disabled) {
      onSendMessage(message.trim());
      setMessage('');
    }
  };

  // `keydown` replaces the deprecated `keypress` event.
  const handleKeyDown = (e: KeyboardEvent<HTMLTextAreaElement>) => {
    // While an IME composition is active, Enter confirms the candidate text
    // and must not submit the message.
    if (e.nativeEvent.isComposing) {
      return;
    }
    if (e.key === 'Enter' && !e.shiftKey) {
      e.preventDefault();
      handleSend();
    }
  };

  return (
    <div className="border-t bg-background p-4">
      <div className="flex gap-2">
        <div className="flex-1 relative">
          <textarea
            value={message}
            onChange={(e) => setMessage(e.target.value)}
            onKeyDown={handleKeyDown}
            placeholder={placeholder}
            disabled={isLoading || disabled}
            className="w-full resize-none rounded-lg border border-input bg-background px-3 py-2 text-sm ring-offset-background placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2 disabled:cursor-not-allowed disabled:opacity-50"
            rows={3}
            style={{ minHeight: '60px', maxHeight: '120px' }}
          />
        </div>
        
        <div className="flex flex-col gap-2">
          <button
            type="button"
            onClick={handleSend}
            disabled={!message.trim() || isLoading || disabled}
            className="flex items-center justify-center w-10 h-10 rounded-lg bg-primary text-primary-foreground hover:bg-primary/90 disabled:opacity-50 disabled:cursor-not-allowed transition-colors"
            title="Send Message"
            aria-label="Send Message"
          >
            <Send className="w-4 h-4" />
          </button>
          
          <button
            type="button"
            onClick={onResetChat}
            disabled={isLoading}
            className="flex items-center justify-center w-10 h-10 rounded-lg bg-secondary text-secondary-foreground hover:bg-secondary/90 disabled:opacity-50 disabled:cursor-not-allowed transition-colors"
            title="Reset Chat"
            aria-label="Reset Chat"
          >
            <RotateCcw className="w-4 h-4" />
          </button>
        </div>
      </div>
      
      {isLoading && (
        <div className="mt-2 text-sm text-muted-foreground flex items-center gap-2">
          <div className="w-4 h-4 border-2 border-muted-foreground border-t-transparent rounded-full animate-spin" />
          Processing...
        </div>
      )}
    </div>
  );
};

================================================
FILE: aisuite-js/examples/chat-app/src/components/ChatMessage.tsx
================================================
import React from 'react';
import { Message } from '../types/chat';
import { User, Bot } from 'lucide-react';

interface ChatMessageProps {
  message: Message;
  modelName?: string;
}

/**
 * One chat bubble.
 *
 * Messages with role `user` are right-aligned with a user avatar; every other
 * role is left-aligned with a bot avatar and labelled with `modelName`
 * (falling back to "Assistant"). The local time is shown below the bubble when
 * the message has a `timestamp`.
 */
export const ChatMessage: React.FC<ChatMessageProps> = ({ message, modelName }) => {
  const fromUser = message.role === 'user';

  let senderLabel: string;
  if (fromUser) {
    senderLabel = 'User';
  } else {
    senderLabel = modelName || 'Assistant';
  }

  const rowClass = `flex gap-3 p-4 ${fromUser ? 'justify-end' : 'justify-start'}`;
  const columnClass = `max-w-[80%] ${fromUser ? 'order-first' : ''}`;
  const bubbleClass = `rounded-lg p-3 ${
    fromUser ? 'bg-primary text-primary-foreground' : 'bg-muted text-foreground'
  }`;
  const timeClass = `text-xs text-muted-foreground mt-1 ${
    fromUser ? 'text-right' : 'text-left'
  }`;

  return (
    <div className={rowClass}>
      {!fromUser && (
        <div className="flex-shrink-0 w-8 h-8 bg-primary rounded-full flex items-center justify-center">
          <Bot className="w-4 h-4 text-primary-foreground" />
        </div>
      )}

      <div className={columnClass}>
        <div className={bubbleClass}>
          <div className="text-sm font-medium mb-1 opacity-70">
            {senderLabel}
          </div>
          <div className="whitespace-pre-wrap break-words">
            {message.content}
          </div>
        </div>
        {message.timestamp && (
          <div className={timeClass}>
            {message.timestamp.toLocaleTimeString()}
          </div>
        )}
      </div>

      {fromUser && (
        <div className="flex-shrink-0 w-8 h-8 bg-secondary rounded-full flex items-center justify-center">
          <User className="w-4 h-4 text-secondary-foreground" />
        </div>
      )}
    </div>
  );
};

================================================
FILE: aisuite-js/examples/chat-app/src/components/ModelSelector.tsx
================================================
import React from 'react';
import { LLMConfig } from '../types/chat';

interface ModelSelectorProps {
  selectedModel: string;
  onModelChange: (modelName: string) => void;
  availableModels: LLMConfig[];
  label: string;
  disabled?: boolean;
}

/**
 * Labelled `<select>` listing the given models by `name`.
 *
 * The option value is the model's `name`, so `onModelChange` receives that
 * name (not the provider/model id) when the selection changes.
 */
export const ModelSelector: React.FC<ModelSelectorProps> = (props) => {
  const { selectedModel, onModelChange, availableModels, label, disabled = false } = props;

  const handleChange = (event: React.ChangeEvent<HTMLSelectElement>) => {
    onModelChange(event.target.value);
  };

  const options = availableModels.map(({ name }) => (
    <option key={name} value={name}>
      {name}
    </option>
  ));

  return (
    <div className="flex flex-col gap-2">
      <label className="text-sm font-medium text-foreground">
        {label}
      </label>
      <select
        value={selectedModel}
        onChange={handleChange}
        disabled={disabled}
        className="w-full rounded-lg border border-input bg-background px-3 py-2 text-sm ring-offset-background placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2 disabled:cursor-not-allowed disabled:opacity-50"
      >
        {options}
      </select>
    </div>
  );
};

================================================
FILE: aisuite-js/examples/chat-app/src/components/ProviderSelector.tsx
================================================
import React from 'react';

interface ProviderSelectorProps {
  selectedProvider: string;
  onProviderChange: (provider: string) => void;
  availableProviders: string[];
  configuredProviders: string[];
  label: string;
  disabled?: boolean;
}

/**
 * Labelled `<select>` for choosing a provider.
 *
 * Starts with an empty "Select a provider" option, then lists every entry of
 * `availableProviders` under its display name (or the raw id when no display
 * name is known). Providers missing from `configuredProviders` are suffixed
 * with "(API key needed)".
 */
export const ProviderSelector: React.FC<ProviderSelectorProps> = (props) => {
  const {
    selectedProvider,
    onProviderChange,
    availableProviders,
    configuredProviders,
    label,
    disabled = false
  } = props;

  // Human-readable names for the provider ids the app knows about.
  const displayNames = {
    openai: 'OpenAI',
    anthropic: 'Anthropic',
    groq: 'Groq',
    mistral: 'Mistral'
  };

  const handleChange = (event: React.ChangeEvent<HTMLSelectElement>) => {
    onProviderChange(event.target.value);
  };

  const providerOptions = availableProviders.map((providerId) => {
    const shownName = displayNames[providerId as keyof typeof displayNames] || providerId;
    const needsKey = !configuredProviders.includes(providerId);
    return (
      <option key={providerId} value={providerId}>
        {shownName} {needsKey ? '(API key needed)' : ''}
      </option>
    );
  });

  return (
    <div className="flex flex-col gap-2">
      <label className="text-sm font-medium text-foreground">
        {label}
      </label>
      <select
        value={selectedProvider}
        onChange={handleChange}
        disabled={disabled}
        className="w-full rounded-lg border border-input bg-background px-3 py-2 text-sm ring-offset-background placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2 disabled:cursor-not-allowed disabled:opacity-50"
      >
        <option value="">Select a provider</option>
        {providerOptions}
      </select>
    </div>
  );
};

================================================
FILE: aisuite-js/examples/chat-app/src/config/llm-config.ts
================================================
import { LLMConfig } from '../types/chat';

// Catalogue of models the example app can talk to.
// - `name` is the label shown in the model dropdown and the key matched by
//   `getLLMConfigByName`, so changing a name changes what lookups match.
// - `provider` and `model` are the values matched by
//   `getLLMConfigByProviderAndModel`.
export const configuredLLMs: LLMConfig[] = [
  {
    name: "OpenAI GPT-4o",
    provider: "openai",
    model: "gpt-4o"
  },
  {
    name: "OpenAI GPT-4o Mini",
    provider: "openai",
    model: "gpt-4o-mini"
  },
  {
    name: "Anthropic Claude 3.5 Sonnet",
    provider: "anthropic",
    model: "claude-3-5-sonnet-20241022"
  },
  {
    name: "Anthropic Claude 3 Haiku",
    provider: "anthropic",
    model: "claude-3-haiku-20240307"
  },
  {
    name: "Groq Llama 3.3-70b Versatile",
    provider: "groq",
    model: "llama-3.3-70b-versatile"
  },
  {
    // NOTE(review): the label says "Mixtral" but the model id is
    // `mistral-saba-24b` — confirm which one is intended before renaming.
    name: "Groq Mixtral 24B",
    provider: "groq",
    model: "mistral-saba-24b"
  },
  {
    name: "Groq Gemma 2 9B",
    provider: "groq",
    model: "gemma2-9b-it"
  },
  {
    name: "Mistral Medium",
    provider: "mistral",
    model: "mistral-medium"
  },
  {
    name: "Mistral Large",
    provider: "mistral",
    model: "mistral-large-latest"
  }
];

/**
 * Returns the first entry of `configuredLLMs` whose `name` equals `name`
 * exactly, or `undefined` when none matches.
 */
export const getLLMConfigByName = (name: string): LLMConfig | undefined => {
  for (const candidate of configuredLLMs) {
    if (candidate.name === name) {
      return candidate;
    }
  }
  return undefined;
};

/**
 * Returns the first entry of `configuredLLMs` matching both `provider` and
 * `model` exactly, or `undefined` when none matches.
 */
export const getLLMConfigByProviderAndModel = (provider: string, model: string): LLMConfig | undefined => {
  for (const candidate of configuredLLMs) {
    const sameProvider = candidate.provider === provider;
    if (sameProvider && candidate.model === model) {
      return candidate;
    }
  }
  return undefined;
};

================================================
FILE: aisuite-js/examples/chat-app/src/index.css
================================================
@tailwind base;
@tailwind components;
@tailwind utilities;

/*
 * Theme tokens.
 * Colour variables hold bare HSL components ("H S% L%") without the hsl()
 * wrapper; consumers wrap them, e.g. hsl(var(--background)) or
 * hsl(var(--muted-foreground) / 0.3) when an alpha value is needed.
 */
@layer base {
  /* Light theme (default). */
  :root {
    --background: 0 0% 100%;
    --foreground: 222.2 84% 4.9%;
    --card: 0 0% 100%;
    --card-foreground: 222.2 84% 4.9%;
    --popover: 0 0% 100%;
    --popover-foreground: 222.2 84% 4.9%;
    --primary: 222.2 47.4% 11.2%;
    --primary-foreground: 210 40% 98%;
    --secondary: 210 40% 96%;
    --secondary-foreground: 222.2 84% 4.9%;
    --muted: 210 40% 96%;
    --muted-foreground: 215.4 16.3% 46.9%;
    --accent: 210 40% 96%;
    --accent-foreground: 222.2 84% 4.9%;
    --destructive: 0 84.2% 60.2%;
    --destructive-foreground: 210 40% 98%;
    --border: 214.3 31.8% 91.4%;
    --input: 214.3 31.8% 91.4%;
    --ring: 222.2 84% 4.9%;
    /* Base corner radius; a length, not a colour. */
    --radius: 0.5rem;
    --chart-1: 12 76% 61%;
    --chart-2: 173 58% 39%;
    --chart-3: 197 37% 24%;
    --chart-4: 43 74% 66%;
    --chart-5: 27 87% 67%;
  }

  /* Dark theme overrides, active under an element with the `dark` class.
     --radius is not overridden here, so it keeps the :root value. */
  .dark {
    --background: 222.2 84% 4.9%;
    --foreground: 210 40% 98%;
    --card: 222.2 84% 4.9%;
    --card-foreground: 210 40% 98%;
    --popover: 222.2 84% 4.9%;
    --popover-foreground: 210 40% 98%;
    --primary: 210 40% 98%;
    --primary-foreground: 222.2 47.4% 11.2%;
    --secondary: 217.2 32.6% 17.5%;
    --secondary-foreground: 210 40% 98%;
    --muted: 217.2 32.6% 17.5%;
    --muted-foreground: 215 20.2% 65.1%;
    --accent: 217.2 32.6% 17.5%;
    --accent-foreground: 210 40% 98%;
    --destructive: 0 62.8% 30.6%;
    --destructive-foreground: 210 40% 98%;
    --border: 217.2 32.6% 17.5%;
    --input: 217.2 32.6% 17.5%;
    --ring: 212.7 26.8% 83.9%;
    --chart-1: 220 70% 50%;
    --chart-2: 160 60% 45%;
    --chart-3: 30 80% 55%;
    --chart-4: 280 65% 60%;
    --chart-5: 340 75% 55%;
  }
}

/* Global defaults built from the theme tokens. */
@layer base {
  /* Every element uses the theme border colour by default. */
  * {
    @apply border-border;
  }
  /* Page background and text colour follow the active theme. */
  body {
    @apply bg-background text-foreground;
  }
}

/*
 * Custom scrollbar styles for elements with the `custom-scrollbar` class.
 * These rules only use the ::-webkit-scrollbar pseudo-elements; no
 * scrollbar-width / scrollbar-color fallback is defined here.
 */
.custom-scrollbar::-webkit-scrollbar {
  width: 6px;
}

.custom-scrollbar::-webkit-scrollbar-track {
  background: transparent;
}

/* Thumb: muted foreground colour at 30% opacity. */
.custom-scrollbar::-webkit-scrollbar-thumb {
  background: hsl(var(--muted-foreground) / 0.3);
  border-radius: 3px;
}

/* Thumb on hover: same colour at 50% opacity. */
.custom-scrollbar::-webkit-scrollbar-thumb:hover {
  background: hsl(var(--muted-foreground) / 0.5);
} 

================================================
FILE: aisuite-js/examples/chat-app/src/main.tsx
================================================
import React from 'react'
import ReactDOM from 'react-dom/client'
import App from './App.tsx'
import './index.css'

// Mount the app into the #root element; the `!` asserts that the element exists.
const rootElement = document.getElementById('root')!
const reactRoot = ReactDOM.createRoot(rootElement)

reactRoot.render(
  <React.StrictMode>
    <App />
  </React.StrictMode>,
)

================================================
FILE: aisuite-js/examples/chat-app/src/services/aisuite-service.ts
================================================
import { Client } from '../../../../src/client';
import { Message, LLMConfig, AISuiteConfig } from '../types/chat';

/**
 * Thin wrapper around the aisuite `Client` used by the chat app.
 *
 * Holds one client built from the most recent `initialize` call. Every query
 * method degrades gracefully (empty list / `false`) or throws a descriptive
 * error when `initialize` has not been called yet.
 */
class AISuiteService {
  private client: Client | null = null;
  private config: AISuiteConfig | null = null;

  /** Stores `config` and builds a fresh client from it, replacing any previous one. */
  initialize(config: AISuiteConfig) {
    this.config = config;
    this.client = new Client(config);
  }

  /**
   * Sends `messages` to the model described by `modelConfig` (non-streaming)
   * and returns the text of the first choice.
   *
   * @param modelConfig Model to query; addressed as `"<provider>:<model>"`.
   * @param messages Conversation so far; only `role` and `content` are sent.
   * @param options Optional sampling overrides. Defaults: `temperature` 0.7,
   *   `maxTokens` 1000.
   * @returns The first choice's content, or "No response from model" when the
   *   response has no choices or the content is empty.
   * @throws Error when the client is not initialized, or — prefixed with the
   *   model's display name — when the request fails or the response has an
   *   unexpected shape.
   */
  async queryLLM(
    modelConfig: LLMConfig,
    messages: Message[],
    options: { temperature?: number; maxTokens?: number } = {}
  ): Promise<string> {
    if (!this.client) {
      throw new Error('AISuite client not initialized. Please check your API keys.');
    }

    const { temperature = 0.7, maxTokens = 1000 } = options;

    try {
      const model = `${modelConfig.provider}:${modelConfig.model}`;
      const response = await this.client.chat.completions.create({
        model,
        messages: messages.map(msg => ({
          role: msg.role,
          content: msg.content
        })),
        temperature,
        max_tokens: maxTokens,
        stream: false, // Explicitly set stream to false to get ChatCompletionResponse
      });

      // Type guard to ensure we have a ChatCompletionResponse
      if ('choices' in response && Array.isArray(response.choices)) {
        // Optional chaining: an empty `choices` array yields the fallback text
        // instead of a TypeError on `undefined.message`.
        return response.choices[0]?.message?.content || 'No response from model';
      } else {
        throw new Error('Unexpected response format from model');
      }
    } catch (error) {
      console.error(`Error querying ${modelConfig.name}:`, error);
      throw new Error(`Error with ${modelConfig.name}: ${error instanceof Error ? error.message : 'Unknown error'}`);
    }
  }

  /** Provider ids reported by the client, or an empty list before `initialize`. */
  getAvailableProviders(): string[] {
    if (!this.client) {
      return [];
    }
    return this.client.listProviders();
  }

  /** Whether the client reports `provider` as configured; `false` before `initialize`. */
  isProviderConfigured(provider: string): boolean {
    if (!this.client) {
      return false;
    }
    return this.client.isProviderConfigured(provider);
  }

  /** The config passed to the last `initialize` call, or `null` if never initialized. */
  getConfig(): AISuiteConfig | null {
    return this.config;
  }
}

// Single shared instance used across the app.
export const aiSuiteService = new AISuiteService();

================================================
FILE: aisuite-js/examples/chat-app/src/types/chat.ts
================================================
// A single chat turn.
export interface Message {
  // Who authored the turn.
  role: 'user' | 'assistant' | 'system';
  // Plain-text body of the turn.
  content: string;
  // When present, rendered under the bubble via `toLocaleTimeString()`.
  timestamp?: Date;
}

// A stored conversation with one model.
// NOTE(review): no usage of this type is visible in the surrounding files —
// confirm it is still needed.
export interface ChatHistory {
  id: string;
  messages: Message[];
  modelName: string;
  createdAt: Date;
  updatedAt: Date;
}

// Describes one selectable model.
export interface LLMConfig {
  // Display label; also the value used to look a model up by name.
  name: string;
  // Provider id, e.g. "openai"; combined with `model` as "<provider>:<model>" when querying.
  provider: string;
  // Provider-specific model id, e.g. "gpt-4o".
  model: string;
}

// Shape of the chat UI state for up to two side-by-side conversations.
// NOTE(review): the field names mirror state used in App.tsx, but whether App
// actually consumes this type is not visible here — confirm.
export interface ChatState {
  chatHistory1: Message[];
  chatHistory2: Message[];
  isProcessing: boolean;
  useComparisonMode: boolean;
  selectedModel1: string;
  selectedModel2: string;
}

/**
 * Per-provider client settings collected by the API key modal.
 *
 * A provider is considered configured when its entry is present. Every entry
 * accepts the optional `dangerouslyAllowBrowser` flag because the modal sets
 * it on each provider it saves, not only on groq.
 */
export interface AISuiteConfig {
  openai?: {
    apiKey: string;
    baseURL?: string;
    organization?: string;
    dangerouslyAllowBrowser?: boolean;
  };
  anthropic?: {
    apiKey: string;
    baseURL?: string;
    dangerouslyAllowBrowser?: boolean;
  };
  groq?: {
    apiKey: string;
    baseURL?: string;
    dangerouslyAllowBrowser?: boolean;
  };
  mistral?: {
    apiKey: string;
    baseURL?: string;
    dangerouslyAllowBrowser?: boolean;
  };
}

================================================
FILE: aisuite-js/examples/chat-app/src/utils/cn.ts
================================================
import { type ClassValue, clsx } from "clsx"
import { twMerge } from "tailwind-merge"

/**
 * Builds a class string from `inputs` with `clsx`, then passes it through
 * `twMerge`.
 */
export function cn(...inputs: ClassValue[]) {
  const combined = clsx(inputs)
  return twMerge(combined)
}

================================================
FILE: aisuite-js/examples/chat-app/tailwind.config.js
================================================
/** @type {import('tailwindcss').Config} */
export default {
  // Files scanned for class names.
  content: [
    "./index.html",
    "./src/**/*.{js,ts,jsx,tsx}",
  ],
  theme: {
    extend: {
      // Colour names map onto CSS custom properties. Each variable is wrapped
      // in hsl(), so the variables are expected to hold bare HSL components.
      colors: {
        background: "hsl(var(--background))",
        foreground: "hsl(var(--foreground))",
        card: {
          DEFAULT: "hsl(var(--card))",
          foreground: "hsl(var(--card-foreground))",
        },
        popover: {
          DEFAULT: "hsl(var(--popover))",
          foreground: "hsl(var(--popover-foreground))",
        },
        primary: {
          DEFAULT: "hsl(var(--primary))",
          foreground: "hsl(var(--primary-foreground))",
        },
        secondary: {
          DEFAULT: "hsl(var(--secondary))",
          foreground: "hsl(var(--secondary-foreground))",
        },
        muted: {
          DEFAULT: "hsl(var(--muted))",
          foreground: "hsl(var(--muted-foreground))",
        },
        accent: {
          DEFAULT: "hsl(var(--accent))",
          foreground: "hsl(var(--accent-foreground))",
        },
        destructive: {
          DEFAULT: "hsl(var(--destructive))",
          foreground: "hsl(var(--destructive-foreground))",
        },
        border: "hsl(var(--border))",
        input: "hsl(var(--input))",
        ring: "hsl(var(--ring))",
        chart: {
          "1": "hsl(var(--chart-1))",
          "2": "hsl(var(--chart-2))",
          "3": "hsl(var(--chart-3))",
          "4": "hsl(var(--chart-4))",
          "5": "hsl(var(--chart-5))",
        },
      },
      // Radii are derived from the single --radius variable.
      borderRadius: {
        lg: "var(--radius)",
        md: "calc(var(--radius) - 2px)",
        sm: "calc(var(--radius) - 4px)",
      },
    },
  },
  plugins: [],
} 

================================================
FILE: aisuite-js/examples/chat-app/tsconfig.json
================================================
{
  "compilerOptions": {
    "target": "ES2020",
    "useDefineForClassFields": true,
    "lib": ["ES2020", "DOM", "DOM.Iterable"],
    "module": "ESNext",
    "skipLibCheck": true,

    /* Bundler mode */
    "moduleResolution": "bundler",
    "allowImportingTsExtensions": true,
    "resolveJsonModule": true,
    "isolatedModules": true,
    "noEmit": true,
    "jsx": "react-jsx",

    /* Linting */
    "strict": true,
    "noUnusedLocals": true,
    "noUnusedParameters": true,
    "noFallthroughCasesInSwitch": true
  },
  "include": ["src"],
  "references": [{ "path": "./tsconfig.node.json" }]
} 

================================================
FILE: aisuite-js/examples/chat-app/tsconfig.node.json
================================================
{
  "compilerOptions": {
    "composite": true,
    "skipLibCheck": true,
    "module": "ESNext",
    "moduleResolution": "bundler",
    "allowSyntheticDefaultImports": true
  },
  "include": ["vite.config.ts"]
} 

================================================
FILE: aisuite-js/examples/chat-app/vite.config.ts
================================================
import { defineConfig } from 'vite'
import react from '@vitejs/plugin-react'

// https://vitejs.dev/config/
export default defineConfig({
  plugins: [react()],
  // Dev server options: fixed port, and `open` asks Vite to launch the browser on start.
  server: {
    port: 3000,
    open: true
  }
}) 

================================================
FILE: aisuite-js/examples/deepgram.ts
================================================
import { Client } from "../src";
import * as fs from "fs";
import * as path from "path";

/**
 * Example: transcribe a local audio file with Deepgram through aisuite.
 *
 * Looks for `test-audio.wav` in the current working directory. When the file
 * is missing, prints the expected absolute path and returns without calling
 * the API. Otherwise sends the file for transcription and prints the text,
 * language and confidence, the first five word timings, and every segment.
 *
 * Transcription failures are logged and reported through a non-zero exit code.
 */
async function main() {
  const apiKey = process.env.DEEPGRAM_API_KEY;
  if (!apiKey) {
    // Make the fallback visible; otherwise the only symptom is an API error later.
    console.warn(
      "DEEPGRAM_API_KEY is not set; falling back to a placeholder API key."
    );
  }

  // Initialize the client with Deepgram configuration
  // Using Deepgram SDK v4.11.2 with the new createClient API
  const client = new Client({
    deepgram: {
      apiKey: apiKey || "your-deepgram-api-key",
    },
  });

  console.log("Available ASR providers:", client.listASRProviders());

  // Example: Transcribe an audio file
  try {
    // Replace this with the path to your own audio file. Resolved to an
    // absolute path so the "Expected path" message below is unambiguous.
    const testAudioPath = path.resolve("test-audio.wav");

    // Nothing to transcribe without the file: explain where it should be and stop.
    if (!fs.existsSync(testAudioPath)) {
      console.log(
        "Test audio file not found. Please provide a valid audio file for transcription."
      );
      console.log("Expected path:", testAudioPath);
      return;
    }

    // Read the file as a buffer
    const audioBuffer = fs.readFileSync(testAudioPath);

    // Create the transcription request with the audio buffer
    const result = await client.audio.transcriptions.create({
      model: "deepgram:general",
      file: audioBuffer,
      language: "en-US",
      timestamps: true,
      word_confidence: true,
      speaker_labels: true,
    });

    console.log("Transcription Result:");
    console.log("Text:", result.text);
    console.log("Language:", result.language);
    console.log("Confidence:", result.confidence);

    if (result.words && result.words.length > 0) {
      console.log("\nWords with timestamps:");
      // Only the first five words, to keep the output short.
      result.words.slice(0, 5).forEach((word, index) => {
        console.log(
          `${index + 1}. "${word.text}" (${word.start}s - ${
            word.end
          }s, confidence: ${word.confidence})`
        );
      });
    }

    if (result.segments && result.segments.length > 0) {
      console.log("\nSegments:");
      result.segments.forEach((segment, index) => {
        console.log(
          `${index + 1}. [${segment.start}s - ${segment.end}s] ${segment.text}`
        );
      });
    }
  } catch (error) {
    console.error("Error during transcription:", error);
    // Signal the failure to the calling shell without aborting pending output.
    process.exitCode = 1;
  }
}

main().catch(console.error);


================================================
FILE: aisuite-js/examples/groq.ts
================================================
import "dotenv/config";
import { Client, ChatCompletionResponse, ChatMessage } from "../src";

/**
 * Mock weather lookup used by the tool-calling examples.
 *
 * Always reports sunny conditions: 22 when `unit` is 'celsius' (the default)
 * and 72 otherwise. `location` and `unit` are echoed back unchanged.
 */
function getWeather(location: string, unit: 'celsius' | 'fahrenheit' = 'celsius') {
  let temperature = 72;
  if (unit === 'celsius') {
    temperature = 22;
  }

  const report = {
    location,
    temperature,
    condition: 'sunny',
    unit
  };
  return report;
}

// Groq models used by the examples below, as "<provider>:<model>" identifiers.
// NOTE(review): the key names do not match the ids they map to
// (MIXTRAL -> mistral-saba-24b, LLAMA2 -> llama-3.3-70b-versatile); renaming
// them would also require updating the references in main().
const AVAILABLE_MODELS = {
  MIXTRAL: "groq:mistral-saba-24b",
  LLAMA2: "groq:llama-3.3-70b-versatile",
  GEMMA: "groq:gemma2-9b-it",
};

/**
 * Runs the Groq examples in sequence: a basic completion, a streamed
 * completion, a second basic completion, a multi-turn conversation, and a
 * tool-calling round trip.
 *
 * Each example sits in its own try/catch, so a failure is logged and the
 * remaining examples still run.
 */
async function main() {
  const client = new Client({
    groq: { apiKey: process.env.GROQ_API_KEY! },
  });

  console.log("\n🚀 Groq Chat Examples\n");

  // Example 1: Basic chat completion with Mixtral
  console.log("--- Basic Chat Completion with Mixtral ---");
  try {
    const response = (await client.chat.completions.create({
      model: AVAILABLE_MODELS.MIXTRAL,
      messages: [
        { role: "system", content: "You are a helpful assistant." },
        { role: "user", content: "What is TypeScript in one sentence?" },
      ],
      temperature: 0.7,
      max_tokens: 100,
      stream: false,
    })) as ChatCompletionResponse;

    console.log("Response:", response.choices[0].message.content);
    console.log("Usage:", response.usage);
    console.log("Full response:", JSON.stringify(response, null, 2));
  } catch (error) {
    console.error("Error:", error);
  }

  // Example 2: Streaming with LLaMA2
  console.log("\n--- Streaming Example with LLaMA2 ---");
  try {
    const stream = await client.chat.completions.create({
      model: AVAILABLE_MODELS.LLAMA2,
      messages: [
        { role: "system", content: "You are a helpful assistant." },
        {
          role: "user",
          content: "Write a haiku about artificial intelligence.",
        },
      ],
      stream: true,
      temperature: 0.7,
      max_tokens: 100,
    });

    console.log("Response:");
    for await (const chunk of stream as AsyncIterable<any>) {
      // Print each text delta as it arrives; a chunk without one prints nothing.
      process.stdout.write(chunk.choices[0]?.delta?.content || "");
    }
    console.log("\n");
  } catch (error) {
    console.error("Streaming error:", error);
  }

  // Example 3: Chat completion with Gemma
  console.log("\n--- Chat Completion with Gemma ---");
  try {
    const response = (await client.chat.completions.create({
      model: AVAILABLE_MODELS.GEMMA,
      messages: [
        { role: "system", content: "You are a helpful assistant." },
        {
          role: "user",
          content: "Explain how machine learning can be used in healthcare.",
        },
      ],
      temperature: 0.5,
      max_tokens: 200,
      stream: false,
    })) as ChatCompletionResponse;

    console.log("Response:", response.choices[0].message.content);
    console.log("Usage:", response.usage);
  } catch (error) {
    console.error("Error:", error);
  }

  // Example 4: Conversation with context
  console.log("\n--- Conversation with Context ---");
  try {
    const conversation = [
      { role: "system", content: "You are a helpful assistant." },
      { role: "user", content: "What is quantum computing?" },
      {
        role: "assistant",
        content:
          "Quantum computing is a type of computing that uses quantum mechanical phenomena like superposition and entanglement to perform calculations.",
      },
      { role: "user", content: "Can you give a practical example?" },
    ] as ChatMessage[];

    const response = (await client.chat.completions.create({
      model: AVAILABLE_MODELS.MIXTRAL,
      messages: conversation,
      temperature: 0.7,
      max_tokens: 150,
      stream: false,
    })) as ChatCompletionResponse;

    console.log("Response:", response.choices[0].message.content);
    console.log("Usage:", response.usage);
  } catch (error) {
    console.error("Error:", error);
  }

  // Example 5: Tool calling with Groq
  console.log("\n--- Tool Calling Example with Groq ---");
  try {
    // Define tools in OpenAI format
    const tools = [
      {
        type: 'function' as const,
        function: {
          name: 'get_weather',
          description: 'Get the current weather for a location',
          parameters: {
            type: 'object' as const,
            properties: {
              location: {
                type: 'string',
                description: 'The city and state, e.g. San Francisco, CA'
              },
              unit: {
                type: 'string',
                enum: ['celsius', 'fahrenheit'],
                description: 'The temperature unit'
              }
            },
            required: ['location']
          }
        }
      }
    ];

    // The opening turns are sent in both requests; defining them once keeps
    // the follow-up request from drifting away from the first one.
    const openingMessages: ChatMessage[] = [
      { role: 'system', content: 'You are a helpful weather assistant.' },
      { role: 'user', content: "What's the weather like in London?" }
    ];

    // Step 1: Initial request with tools
    const response = (await client.chat.completions.create({
      model: AVAILABLE_MODELS.MIXTRAL,
      messages: openingMessages,
      tools,
      tool_choice: 'auto'
    })) as ChatCompletionResponse;

    const message = response.choices[0]?.message;
    console.log('Step 1 - Initial response:', JSON.stringify(message, null, 2));

    if (message?.tool_calls) {
      // Step 2: Execute tool calls and send results back
      const messages: ChatMessage[] = [
        ...openingMessages,
        message // The assistant's message with tool calls
      ];

      console.log('\nTool calls detected:');
      for (const toolCall of message.tool_calls) {
        console.log(`- Function: ${toolCall.function.name}`);
        console.log(`  Arguments: ${toolCall.function.arguments}`);

        // Execute the function; the arguments arrive as a JSON string
        const args = JSON.parse(toolCall.function.arguments);
        const result = getWeather(args.location, args.unit);
        console.log(`  Result:`, result);

        // Add tool result to messages, linked to its call by tool_call_id
        messages.push({
          role: 'tool',
          tool_call_id: toolCall.id,
          content: JSON.stringify(result)
        });
      }

      // Step 3: Get final response with tool results
      console.log('\nStep 2 - Sending tool results back...');
      const finalResponse = (await client.chat.completions.create({
        model: AVAILABLE_MODELS.MIXTRAL,
        messages,
        temperature: 0.7,
        max_tokens: 200
      })) as ChatCompletionResponse;

      console.log('\nStep 3 - Final response:', finalResponse.choices[0].message.content);
    }
  } catch (error) {
    console.error("Tool calling error:", error);
  }
}

main().catch(console.error);


================================================
FILE: aisuite-js/examples/mistral.ts
================================================
import "dotenv/config";
import { Client, ChatCompletionResponse, ChatMessage } from "../src";

// Sample data store.
// Column-oriented: each key holds one field for every transaction, and the
// entries at the same index across the arrays belong to the same transaction
// (the lookup helpers find an index in `transactionId` and read the matching
// slot of another column).
const data = {
  transactionId: ["T1001", "T1002", "T1003", "T1004", "T1005"],
  customerId: ["C001", "C002", "C003", "C002", "C001"],
  paymentAmount: [125.5, 89.99, 120.0, 54.3, 210.2],
  paymentDate: [
    "2021-10-05",
    "2021-10-06",
    "2021-10-07",
    "2021-10-05",
    "2021-10-08",
  ],
  paymentStatus: ["Paid", "Unpaid", "Paid", "Paid", "Pending"],
};

/**
 * Retrieves the payment status for a given transaction.
 *
 * The parameter is explicitly typed so the destructured fields are not
 * implicitly `any`.
 *
 * @param params.data - Column-oriented store in which `transactionId[i]` and
 *   `paymentStatus[i]` describe the same transaction.
 * @param params.transactionId - Id of the transaction to look up.
 * @returns A JSON string of the form `{"status": ...}`; the status is
 *   "error - transaction id not found" when the id is not in the store.
 */
function retrievePaymentStatus({
  data,
  transactionId,
}: {
  data: { transactionId: string[]; paymentStatus: string[] };
  transactionId: string;
}): string {
  const transactionIndex = data.transactionId.indexOf(transactionId);
  if (transactionIndex === -1) {
    return JSON.stringify({ status: "error - transaction id not found" });
  }
  return JSON.stringify({ status: data.paymentStatus[transactionIndex] });
}

/**
 * Retrieves the payment date for a given transaction.
 *
 * The parameter is explicitly typed so the destructured fields are not
 * implicitly `any`.
 *
 * @param params.data - Column-oriented store in which `transactionId[i]` and
 *   `paymentDate[i]` describe the same transaction.
 * @param params.transactionId - Id of the transaction to look up.
 * @returns A JSON string of the form `{"date": ...}`; the date is
 *   "error - transaction id not found" when the id is not in the store.
 */
function retrievePaymentDate({
  data,
  transactionId,
}: {
  data: { transactionId: string[]; paymentDate: string[] };
  transactionId: string;
}): string {
  const transactionIndex = data.transactionId.indexOf(transactionId);
  if (transactionIndex === -1) {
    return JSON.stringify({ date: "error - transaction id not found" });
  }
  return JSON.stringify({ date: data.paymentDate[transactionIndex] });
}

// Map function names to their implementations.
// Each entry receives the tool call's parsed argument object (not a bare id)
// and merges it with the module-level `data` store before delegating.
// Typed as a string-keyed record because main() looks entries up by the
// function name returned from the model, which is an arbitrary string.
const namesToFunctions: Record<
  string,
  (args: { transactionId: string }) => string
> = {
  retrievePaymentStatus: (args) => retrievePaymentStatus({ data, ...args }),
  retrievePaymentDate: (args) => retrievePaymentDate({ data, ...args }),
};

// Define available tools (functions) for the model.
// Both tools take one required string `transactionId`, so the shared schema is
// generated from each tool's name and description.
const TOOLS = [
  {
    name: "retrievePaymentStatus",
    description: "Get payment status of a transaction id",
  },
  {
    name: "retrievePaymentDate",
    description: "Get payment date of a transaction id",
  },
].map(({ name, description }) => ({
  type: "function",
  function: {
    name,
    description,
    parameters: {
      type: "object",
      required: ["transactionId"],
      properties: {
        transactionId: { type: "string", description: "The transaction id." },
      },
    },
  },
}));

/**
 * Runs the Mistral examples in sequence: a basic completion, a streamed
 * completion, and a multi-turn tool-calling conversation that looks up a
 * transaction in the sample data store.
 *
 * Each example sits in its own try/catch, so a failure is logged and the
 * remaining examples still run.
 */
async function main() {
  const client = new Client({
    mistral: { apiKey: process.env.MISTRAL_API_KEY! },
  });

  console.log("\n🔮 Mistral Chat Examples\n");

  // Example 1: Basic chat completion
  console.log("--- Basic Chat Completion ---");
  try {
    const response = (await client.chat.completions.create({
      model: "mistral:mistral-medium",
      messages: [
        { role: "system", content: "You are a helpful assistant." },
        { role: "user", content: "What is TypeScript in one sentence?" },
      ],
      temperature: 0.7,
      max_tokens: 100,
      stream: false,
    })) as ChatCompletionResponse;

    console.log("Response:", response.choices[0].message.content);
    console.log("Usage:", response.usage);
    console.log("Full response:", JSON.stringify(response, null, 2));
  } catch (error) {
    console.error("Error:", error);
  }

  // Example 2: Streaming
  console.log("\n--- Streaming Example ---");
  try {
    const stream = await client.chat.completions.create({
      model: "mistral:mistral-medium",
      messages: [
        { role: "system", content: "You are a helpful assistant." },
        {
          role: "user",
          content: "Write a haiku about artificial intelligence.",
        },
      ],
      stream: true,
      temperature: 0.7,
      max_tokens: 100,
    });

    console.log("Response:");
    for await (const chunk of stream as AsyncIterable<any>) {
      // Print each text delta as it arrives; a chunk without one prints nothing.
      process.stdout.write(chunk.choices[0]?.delta?.content || "");
    }
  } catch (error) {
    console.error("Streaming error:", error);
  }

  // Example 3: Tool calling
  console.log("\n\n--- Tool Calling Example ---");
  try {
    const model = "mistral:mistral-large-latest";

    // Running transcript; every request below sends its current contents.
    const messages: ChatMessage[] = [
      { role: "user", content: "What's the status of my transaction?" },
    ];

    // First interaction - Model asks for transaction ID
    let response = (await client.chat.completions.create({
      model,
      messages,
      tools: TOOLS as any, // Type assertion for Mistral's string-based tools
    })) as ChatCompletionResponse;

    messages.push({
      role: "assistant",
      content: response.choices[0].message.content as string,
    });

    // User provides transaction ID
    messages.push({ role: "user", content: "My transaction ID is T1001." });

    // Second interaction - Model uses functions to get information
    response = (await client.chat.completions.create({
      model,
      messages,
      tools: TOOLS as any, // Type assertion for Mistral's string-based tools
    })) as ChatCompletionResponse;

    // The assistant turn (with its tool calls) must precede the tool results.
    messages.push(response.choices[0].message);

    // Process tool calls
    const toolCalls = response.choices[0].message.tool_calls || [];
    for (const toolCall of toolCalls) {
      const functionName = toolCall.function.name;
      // Arguments arrive as a JSON string.
      const functionParams = JSON.parse(toolCall.function.arguments);

      console.log(`Calling function: ${functionName}`);
      console.log(`Parameters: ${toolCall.function.arguments}`);

      const functionResult = namesToFunctions[functionName](functionParams);

      messages.push({
        role: "tool",
        name: functionName,
        content: functionResult,
        tool_call_id: toolCall.id,
      });
    }

    // Final response with the information
    response = (await client.chat.completions.create({
      model,
      messages,
      tools: TOOLS as any, // Type assertion for Mistral's string-based tools
    })) as ChatCompletionResponse;

    console.log("Final response:", response.choices[0].message.content);
  } catch (error) {
    console.error("Tool calling error:", error);
  }
}

main().catch(console.error);


================================================
FILE: aisuite-js/examples/openai-asr.ts
================================================
import { Client } from "../src";
import * as fs from "fs";
import * as path from "path";

/**
 * Transcribes `test-audio.wav` with OpenAI's whisper-1 model and prints the
 * text, language, confidence, the first five words and the first three
 * segments.
 *
 * If the audio file does not exist, a hint is printed and nothing is sent.
 * Any error raised while transcribing is logged, not rethrown.
 *
 * NOTE(review): this file does not import "dotenv/config", so OPENAI_API_KEY
 * must already be present in the environment; confirm that is intended.
 */
async function main() {
  // Initialize the client with OpenAI configuration
  const apiKey = process.env.OPENAI_API_KEY!;
  const client = new Client({ openai: { apiKey } });

  console.log("Available ASR providers:", client.listASRProviders());

  // Example: Transcribe an audio file
  try {
    // Path to your audio file
    const testAudioPath = path.join("test-audio.wav");

    // Bail out early with a hint when the test file is missing
    const audioExists = fs.existsSync(testAudioPath);
    if (!audioExists) {
      console.log(
        "Test audio file not found. Please provide a valid audio file for transcription."
      );
      console.log("Expected path:", testAudioPath);
      return;
    }

    // The whole file is read into memory and sent as a buffer
    const audioBuffer = fs.readFileSync(testAudioPath);

    // Transcribe using OpenAI Whisper model
    const result = await client.audio.transcriptions.create({
      model: "openai:whisper-1",
      file: audioBuffer,
      language: "en",
      response_format: "verbose_json",
      temperature: 0,
      timestamps: true,
    });

    console.log("Transcription Result:");
    console.log("Text:", result.text);
    console.log("Language:", result.language);
    console.log("Confidence:", result.confidence);

    if (result.words && result.words.length > 0) {
      console.log("\nWords with timestamps:");
      // Only the first five words are shown
      const firstWords = result.words.slice(0, 5);
      for (let i = 0; i < firstWords.length; i++) {
        const word = firstWords[i];
        console.log(
          `${i + 1}. "${word.text}" (${word.start}s - ${word.end}s, confidence: ${word.confidence})`
        );
      }
    }

    if (result.segments && result.segments.length > 0) {
      console.log("\nSegments:");
      // Only the first three segments are shown
      const firstSegments = result.segments.slice(0, 3);
      for (let i = 0; i < firstSegments.length; i++) {
        const segment = firstSegments[i];
        console.log(
          `${i + 1}. "${segment.text}" (${segment.start}s - ${segment.end}s)`
        );
      }
    }
  } catch (error) {
    console.error("Error:", error);
  }
}

main().catch(console.error);


================================================
FILE: aisuite-js/examples/streaming.ts
================================================
import 'dotenv/config';
import { Client, ChatCompletionChunk } from '../src';

/**
 * Runs the streaming examples in sequence: OpenAI streaming, Anthropic
 * streaming, streaming with a progress indicator, aborting a stream with an
 * AbortController, and streaming with tool calls.
 *
 * Each example sits in its own try/catch, so a failure is logged and the
 * remaining examples still run.
 */
async function main() {
  const client = new Client({
    openai: { apiKey: process.env.OPENAI_API_KEY! },
    anthropic: { apiKey: process.env.ANTHROPIC_API_KEY! },
  });

  console.log('🚀 AISuite Streaming Examples\n');

  // Example 1: Basic OpenAI Streaming
  console.log('--- OpenAI Streaming ---');
  try {
    const stream = await client.chat.completions.create({
      model: 'openai:gpt-3.5-turbo',
      messages: [
        { role: 'system', content: 'You are a helpful assistant.' },
        { role: 'user', content: 'Write a haiku about TypeScript' }
      ],
      stream: true,
      temperature: 0.7,
      max_tokens: 100,
    }) as AsyncIterable<ChatCompletionChunk>;

    console.log('Response: ');
    // Echo each delta immediately and also keep the full text for the summary.
    let fullContent = '';
    for await (const chunk of stream) {
      const content = chunk.choices[0]?.delta?.content || '';
      process.stdout.write(content);
      fullContent += content;
    }
    console.log('\n\nFull response:', fullContent);
  } catch (error) {
    console.error('OpenAI streaming error:', error);
  }

  // Example 2: Basic Anthropic Streaming
  console.log('\n--- Anthropic Streaming ---');
  try {
    const stream = await client.chat.completions.create({
      model: 'anthropic:claude-3-haiku-20240307',
      messages: [
        { role: 'system', content: 'You are a helpful assistant.' },
        { role: 'user', content: 'Write a haiku about JavaScript' }
      ],
      stream: true,
      temperature: 0.7,
      max_tokens: 100,
    }) as AsyncIterable<ChatCompletionChunk>;

    console.log('Response: ');
    let fullContent = '';
    for await (const chunk of stream) {
      const content = chunk.choices[0]?.delta?.content || '';
      process.stdout.write(content);
      fullContent += content;
    }
    console.log('\n\nFull response:', fullContent);
  } catch (error) {
    console.error('Anthropic streaming error:', error);
  }

  // Example 3: Streaming with Progress Indicator
  console.log('\n--- Streaming with Progress ---');
  try {
    const stream = await client.chat.completions.create({
      model: 'openai:gpt-3.5-turbo',
      messages: [
        { role: 'user', content: 'Count from 1 to 10 slowly' }
      ],
      stream: true,
      temperature: 0,
      max_tokens: 100,
    }) as AsyncIterable<ChatCompletionChunk>;

    console.log('Response: ');
    let charCount = 0;
    for await (const chunk of stream) {
      const content = chunk.choices[0]?.delta?.content || '';
      process.stdout.write(content);
      charCount += content.length;

      // Show progress in title (if supported): the escape sequence is only
      // written when stdout is a TTY.
      if (process.stdout.isTTY) {
        process.stdout.write(`\x1b]0;Streaming: ${charCount} chars\x07`);
      }
    }
    console.log(`\n\nTotal characters: ${charCount}`);
  } catch (error) {
    console.error('Streaming error:', error);
  }

  // Example 4: Abort Controller
  console.log('\n--- Streaming with Abort Controller ---');
  try {
    const controller = new AbortController();

    // Abort after 2 seconds
    const timeout = setTimeout(() => {
      console.log('\n\n⏹️  Aborting stream...');
      controller.abort();
    }, 2000);

    // The timer is already running, so everything from here on is covered by
    // the finally below. Otherwise a failed create() would leave the timer
    // live and it would fire in the middle of the next example.
    try {
      const stream = await client.chat.completions.create({
        model: 'anthropic:claude-3-haiku-20240307',
        messages: [
          { role: 'user', content: 'Tell me a very long story about a programmer' }
        ],
        stream: true,
        temperature: 0.7,
        max_tokens: 500,
      }, { signal: controller.signal }) as AsyncIterable<ChatCompletionChunk>;

      console.log('Response (will abort after 2 seconds): ');
      try {
        for await (const chunk of stream) {
          const content = chunk.choices[0]?.delta?.content || '';
          process.stdout.write(content);
        }
      } catch (error: any) {
        // An abort raised while iterating is the expected outcome here;
        // anything else is passed on to the outer handler.
        if (error.name === 'AbortError') {
          console.log('\n\n✅ Stream successfully aborted');
        } else {
          throw error;
        }
      }
    } finally {
      clearTimeout(timeout);
    }
  } catch (error) {
    console.error('Abort controller error:', error);
  }

  // Example 5: Streaming with Tool Calls
  console.log('\n--- Streaming with Tool Calls ---');
  try {
    const tools = [{
      type: 'function' as const,
      function: {
        name: 'get_weather',
        description: 'Get current weather',
        parameters: {
          type: 'object',
          properties: {
            location: { type: 'string' }
          },
          required: ['location']
        }
      }
    }];

    const stream = await client.chat.completions.create({
      model: 'openai:gpt-4o-mini',
      messages: [
        { role: 'user', content: 'What\'s the weather in Tokyo?' }
      ],
      tools,
      tool_choice: 'auto',
      stream: true,
    }) as AsyncIterable<ChatCompletionChunk>;

    console.log('Streaming response with potential tool calls:\n');

    // A delta that carries an id starts a new tool call; later deltas without
    // an id append argument text to the most recently started call.
    let currentToolCall: any = null;
    const toolCalls: any[] = [];

    for await (const chunk of stream) {
      // Handle text content
      const content = chunk.choices[0]?.delta?.content;
      if (content) {
        process.stdout.write(content);
      }

      // Handle tool calls
      const deltaToolCalls = chunk.choices[0]?.delta?.tool_calls;
      if (deltaToolCalls) {
        for (const toolCall of deltaToolCalls) {
          if (toolCall.id) {
            // New tool call
            currentToolCall = {
              id: toolCall.id,
              type: toolCall.type,
              function: {
                name: toolCall.function?.name || '',
                arguments: toolCall.function?.arguments || ''
              }
            };
            toolCalls.push(currentToolCall);
          } else if (currentToolCall && toolCall.function?.arguments) {
            // Accumulate arguments
            currentToolCall.function.arguments += toolCall.function.arguments;
          }
        }
      }

      // Check if we're done
      if (chunk.choices[0]?.finish_reason === 'tool_calls') {
        console.log('\n\nTool calls detected:');
        for (const tc of toolCalls) {
          console.log(`- ${tc.function.name}: ${tc.function.arguments}`);
        }
      }
    }
  } catch (error) {
    console.error('Streaming with tools error:', error);
  }

  console.log('\n\n✨ Streaming examples completed!');
}

// Run examples
main().catch(console.error);

================================================
FILE: aisuite-js/examples/test-suite.ts
================================================
import 'dotenv/config';
import { Client, AISuiteError, ProviderNotConfiguredError, ChatCompletionChunk } from '../src';

// Test configuration: a provider's live tests are enabled only when its API
// key is set and differs from the placeholder value compared against below.
const ENABLE_OPENAI_TESTS =
  Boolean(process.env.OPENAI_API_KEY) &&
  process.env.OPENAI_API_KEY !== 'your-openai-api-key-here';
const ENABLE_ANTHROPIC_TESTS =
  Boolean(process.env.ANTHROPIC_API_KEY) &&
  process.env.ANTHROPIC_API_KEY !== 'your-anthropic-api-key-here';

// Banner: one status line per provider, then a blank line.
console.log('🧪 AISuite Test Suite\n');
[
  { provider: 'OpenAI', enabled: ENABLE_OPENAI_TESTS },
  { provider: 'Anthropic', enabled: ENABLE_ANTHROPIC_TESTS },
].forEach(({ provider, enabled }) => {
  console.log(`${provider} tests: ${enabled ? '✅ Enabled' : '❌ Disabled (no API key)'}`);
});
console.log('');

/**
 * Helper function to run a test and report its outcome on the console.
 *
 * A failing `fn` is logged, not rethrown, so the remaining tests still run.
 * The failure is also recorded in `process.exitCode`, so the process ends
 * with a non-zero status instead of reporting success after failed tests.
 *
 * @param name - Label printed next to the pass/fail marker.
 * @param fn - Test body; a rejection (or throw) counts as a failure.
 */
async function runTest(name: string, fn: () => Promise<void>) {
  try {
    await fn();
    console.log(`✅ ${name}`);
  } catch (error) {
    // Mark the run as failed without stopping it.
    process.exitCode = 1;
    console.error(`❌ ${name}`);
    console.error(`   Error: ${error instanceof Error ? error.message : error}`);
  }
}

/**
 * Runs the live test suite: provider-independent checks first, then the
 * OpenAI and Anthropic groups when their flags are enabled, and finally a
 * cross-provider check when both are enabled.
 *
 * Every check goes through runTest.
 */
async function main() {
  // Initialize client with only the providers whose tests are enabled
  const client = new Client({
    ...(ENABLE_OPENAI_TESTS && { openai: { apiKey: process.env.OPENAI_API_KEY! } }),
    ...(ENABLE_ANTHROPIC_TESTS && { anthropic: { apiKey: process.env.ANTHROPIC_API_KEY! } }),
  });

  // Model ids shared by the provider test groups.
  const OPENAI_MODEL = 'openai:gpt-3.5-turbo';
  const ANTHROPIC_MODEL = 'anthropic:claude-3-haiku-20240307';

  // Drains a chunk stream and returns the concatenated text deltas.
  const collectText = async (stream: AsyncIterable<ChatCompletionChunk>): Promise<string> => {
    let text = '';
    for await (const chunk of stream) {
      text += chunk.choices[0]?.delta?.content || '';
    }
    return text;
  };

  console.log('📋 Available providers:', client.listProviders());
  console.log('');

  // Test 1: Basic functionality
  console.log('🔍 Testing basic functionality...\n');

  await runTest('Model parser - valid format', async () => {
    const { parseModel } = await import('../src');
    const parsed = parseModel('openai:gpt-4');
    const parsedCorrectly = parsed.provider === 'openai' && parsed.model === 'gpt-4';
    if (!parsedCorrectly) {
      throw new Error('Model parser failed');
    }
  });

  await runTest('Model parser - invalid format', async () => {
    const { parseModel } = await import('../src');
    try {
      parseModel('invalid-format');
      // Reaching this line means the parser accepted bad input.
      throw new Error('Should have thrown error');
    } catch (error) {
      // Only the parser's own "Invalid model format" error counts as a pass.
      const isExpected = error instanceof Error && error.message.includes('Invalid model format');
      if (!isExpected) {
        throw error;
      }
    }
  });

  await runTest('Provider not configured error', async () => {
    try {
      await client.chat.completions.create({
        model: 'invalid:model',
        messages: [{ role: 'user', content: 'test' }]
      });
      throw new Error('Should have thrown error');
    } catch (error) {
      const isExpected = error instanceof ProviderNotConfiguredError;
      if (!isExpected) {
        throw error;
      }
    }
  });

  // Test 2: OpenAI Provider
  if (ENABLE_OPENAI_TESTS) {
    console.log('\n🤖 Testing OpenAI provider...\n');

    await runTest('OpenAI - Basic chat completion', async () => {
      const response = await client.chat.completions.create({
        model: OPENAI_MODEL,
        messages: [
          { role: 'system', content: 'You are a test assistant. Respond with exactly: "Test successful"' },
          { role: 'user', content: 'Hello' }
        ],
        temperature: 0,
        max_tokens: 50,
      });

      const text = response.choices[0]?.message?.content;
      if (!text) {
        throw new Error('No response content');
      }
      console.log(`   Response: ${text.trim()}`);
    });

    await runTest('OpenAI - Multiple messages', async () => {
      const response = await client.chat.completions.create({
        model: OPENAI_MODEL,
        messages: [
          { role: 'system', content: 'You are a helpful assistant.' },
          { role: 'user', content: 'Say "A"' },
          { role: 'assistant', content: 'A' },
          { role: 'user', content: 'Say "B"' }
        ],
        temperature: 0,
        max_tokens: 10,
      });

      const reply = response.choices[0]?.message?.content;
      if (!reply?.includes('B')) {
        throw new Error('Multi-turn conversation failed');
      }
    });

    await runTest('OpenAI - Tool calling', async () => {
      const response = await client.chat.completions.create({
        model: OPENAI_MODEL,
        messages: [
          { role: 'user', content: 'What is the weather in San Francisco?' }
        ],
        tools: [{
          type: 'function',
          function: {
            name: 'get_weather',
            description: 'Get weather for a location',
            parameters: {
              type: 'object',
              properties: {
                location: { type: 'string' }
              },
              required: ['location']
            }
          }
        }],
        tool_choice: 'auto'
      });

      const requestedCalls = response.choices[0]?.message?.tool_calls;
      if (!requestedCalls || requestedCalls.length === 0) {
        throw new Error('No tool calls in response');
      }
      console.log(`   Tool called: ${requestedCalls[0].function.name}`);
    });

    await runTest('OpenAI - Streaming support', async () => {
      const stream = await client.chat.completions.create({
        model: OPENAI_MODEL,
        messages: [{ role: 'user', content: 'Say exactly: "Stream test"' }],
        stream: true,
        temperature: 0,
        max_tokens: 20,
      }) as AsyncIterable<ChatCompletionChunk>;

      const streamed = await collectText(stream);

      if (!streamed.toLowerCase().includes('stream')) {
        throw new Error('Streaming response did not contain expected content');
      }
      console.log(`   Streamed: ${streamed.trim()}`);
    });
  }

  // Test 3: Anthropic Provider
  if (ENABLE_ANTHROPIC_TESTS) {
    console.log('\n🔮 Testing Anthropic provider...\n');

    await runTest('Anthropic - Basic chat completion', async () => {
      const response = await client.chat.completions.create({
        model: ANTHROPIC_MODEL,
        messages: [
          { role: 'system', content: 'You are a test assistant. Respond with exactly: "Test successful"' },
          { role: 'user', content: 'Hello' }
        ],
        temperature: 0,
        max_tokens: 50,
      });

      const text = response.choices[0]?.message?.content;
      if (!text) {
        throw new Error('No response content');
      }
      console.log(`   Response: ${text.trim()}`);
    });

    await runTest('Anthropic - System message handling', async () => {
      const response = await client.chat.completions.create({
        model: ANTHROPIC_MODEL,
        messages: [
          { role: 'system', content: 'Always respond in uppercase.' },
          { role: 'system', content: 'Also end with an exclamation mark.' },
          { role: 'user', content: 'say hello' }
        ],
        temperature: 0,
        max_tokens: 50,
      });

      // This check only warns; it never fails the test.
      const content = response.choices[0]?.message?.content || '';
      const followsBothInstructions = content.includes('!') && content === content.toUpperCase();
      if (!followsBothInstructions) {
        console.log(`   Warning: System message may not be properly handled. Response: ${content}`);
      }
    });

    await runTest('Anthropic - Tool calling', async () => {
      const response = await client.chat.completions.create({
        model: ANTHROPIC_MODEL,
        messages: [
          { role: 'user', content: 'What is the weather in Paris?' }
        ],
        tools: [{
          type: 'function',
          function: {
            name: 'get_weather',
            description: 'Get weather for a location',
            parameters: {
              type: 'object',
              properties: {
                location: { type: 'string', description: 'The city name' }
              },
              required: ['location']
            }
          }
        }],
        tool_choice: 'auto'
      });

      const requestedCalls = response.choices[0]?.message?.tool_calls;
      if (!requestedCalls || requestedCalls.length === 0) {
        throw new Error('No tool calls in response');
      }
      console.log(`   Tool called: ${requestedCalls[0].function.name}`);
      console.log(`   Arguments: ${requestedCalls[0].function.arguments}`);
    });

    await runTest('Anthropic - Streaming support', async () => {
      const stream = await client.chat.completions.create({
        model: ANTHROPIC_MODEL,
        messages: [{ role: 'user', content: 'Say exactly: "Stream works"' }],
        stream: true,
        temperature: 0,
        max_tokens: 20,
      }) as AsyncIterable<ChatCompletionChunk>;

      const streamed = await collectText(stream);

      if (!streamed.toLowerCase().includes('stream')) {
        throw new Error('Streaming response did not contain expected content');
      }
      console.log(`   Streamed: ${streamed.trim()}`);
    });
  }

  // Test 4: Cross-provider compatibility
  if (ENABLE_OPENAI_TESTS && ENABLE_ANTHROPIC_TESTS) {
    console.log('\n🔄 Testing cross-provider compatibility...\n');

    await runTest('Same prompt - different providers', async () => {
      // Identical request body for both providers; only `model` differs.
      const prompt = {
        messages: [
          { role: 'system', content: 'You are a helpful assistant. Be concise.' },
          { role: 'user', content: 'What is 2+2?' }
        ] as const,
        temperature: 0,
        max_tokens: 50,
      };

      const openaiResponse = await client.chat.completions.create({
        ...prompt,
        model: OPENAI_MODEL,
      });

      const anthropicResponse = await client.chat.completions.create({
        ...prompt,
        model: ANTHROPIC_MODEL,
      });

      const openaiText = openaiResponse.choices[0].message.content;
      console.log(`   OpenAI: ${openaiText?.trim()}`);
      const anthropicText = anthropicResponse.choices[0].message.content;
      console.log(`   Anthropic: ${anthropicText?.trim()}`);

      // Both should mention "4" in their response
      const bothMentionFour = openaiText?.includes('4') && anthropicText?.includes('4');
      if (!bothMentionFour) {
        throw new Error('Providers gave inconsistent results');
      }
    });
  }

  console.log('\n✨ Test suite completed!\n');
}

// Entry point: kick off the suite. Any rejection that escapes main() is
// logged and converted into a non-zero exit status.
main().catch((failure) => {
  console.error('\n💥 Test suite failed:', failure);
  process.exit(1);
});

================================================
FILE: aisuite-js/examples/tool-calling.ts
================================================
import 'dotenv/config';
import { Client, ChatMessage } from '../src';

/**
 * Mock weather lookup used as the tool implementation in this example.
 *
 * @param location - Echoed back unchanged in the result.
 * @param unit - Temperature unit; defaults to 'celsius'.
 * @returns A canned report: 22 when the unit is 'celsius', 72 otherwise,
 *          always with condition 'sunny'.
 */
function getWeather(location: string, unit: 'celsius' | 'fahrenheit' = 'celsius') {
  // No real lookup happens here; the reading depends only on the unit.
  let temperature = 72;
  if (unit === 'celsius') {
    temperature = 22;
  }

  const report = { location, temperature, condition: 'sunny', unit };
  return report;
}

/**
 * Tool-calling walkthrough: runs the same three-step conversation against
 * OpenAI and then Anthropic, using one tool definition in OpenAI format.
 *
 * For each provider the flow is:
 *   1. send the question together with the tool definitions,
 *   2. execute every tool call the model requested (locally, via getWeather)
 *      and append the results as `tool` messages,
 *   3. send the extended conversation back to get the final answer.
 *
 * Errors from one provider are logged and do not stop the other from running.
 */
async function main() {
  const client = new Client({
    openai: { apiKey: process.env.OPENAI_API_KEY! },
    anthropic: { apiKey: process.env.ANTHROPIC_API_KEY! },
  });

  // Define tools in OpenAI format
  const tools = [
    {
      type: 'function' as const,
      function: {
        name: 'get_weather',
        description: 'Get the current weather for a location',
        parameters: {
          type: 'object',
          properties: {
            location: {
              type: 'string',
              description: 'The city and state, e.g. San Francisco, CA'
            },
            unit: {
              type: 'string',
              enum: ['celsius', 'fahrenheit'],
              description: 'The temperature unit'
            }
          },
          required: ['location']
        }
      }
    }
  ];

  /**
   * Runs one complete tool-calling round trip for a single provider.
   *
   * @param label - Provider name used in the error log line.
   * @param model - Fully qualified "provider:model" identifier.
   * @param question - The user question that should trigger the tool.
   */
  const runToolCallingDemo = async (label: string, model: string, question: string) => {
    try {
      const prompt: ChatMessage[] = [
        { role: 'system', content: 'You are a helpful weather assistant.' },
        { role: 'user', content: question }
      ];

      // Step 1: Initial request with tools
      const response = await client.chat.completions.create({
        model,
        messages: prompt,
        tools,
        tool_choice: 'auto'
      });

      const message = response.choices[0]?.message;
      console.log('Step 1 - Initial response:', JSON.stringify(message, null, 2));

      if (message?.tool_calls) {
        // Step 2: Execute tool calls and send results back.
        // The assistant's message (with its tool calls) must precede the
        // tool results in the follow-up conversation.
        const messages: ChatMessage[] = [...prompt, message];

        console.log('\nTool calls detected:');
        for (const toolCall of message.tool_calls) {
          console.log(`- Function: ${toolCall.function.name}`);
          console.log(`  Arguments: ${toolCall.function.arguments}`);

          // Execute the function
          const args = JSON.parse(toolCall.function.arguments);
          const result = getWeather(args.location, args.unit);
          console.log(`  Result:`, result);

          // Add tool result to messages
          messages.push({
            role: 'tool',
            tool_call_id: toolCall.id,
            content: JSON.stringify(result)
          });
        }

        // Step 3: Get final response with tool results
        console.log('\nStep 2 - Sending tool results back...');
        const finalResponse = await client.chat.completions.create({
          model,
          messages,
          temperature: 0.7,
          max_tokens: 200
        });

        console.log('\nStep 3 - Final response:', finalResponse.choices[0].message.content);
      }
    } catch (error) {
      console.error(`${label} Tool Calling Error:`, error);
    }
  };

  // Example 1: OpenAI Tool Calling
  console.log('--- OpenAI Tool Calling ---');
  await runToolCallingDemo(
    'OpenAI',
    'openai:gpt-4o-mini',
    "What's the weather like in San Francisco?"
  );

  // Example 2: Anthropic Tool Calling
  console.log('\n--- Anthropic Tool Calling ---');
  await runToolCallingDemo(
    'Anthropic',
    'anthropic:claude-3-haiku-20240307',
    "What's the weather like in New York?"
  );
}

main().catch(console.error);

================================================
FILE: aisuite-js/jest.config.ts
================================================
// Jest configuration for the aisuite-js package (TypeScript sources run
// through ts-jest in a Node environment).
export default {
  preset: 'ts-jest',
  testEnvironment: 'node',
  // Only the tests/ directory is searched for test files.
  roots: ['<rootDir>/tests'],
  // Test files are anything under a __tests__ folder, or any *.spec.ts / *.test.ts file.
  testMatch: [
    '**/__tests__/**/*.ts',
    '**/?(*.)+(spec|test).ts'
  ],
  // TypeScript goes through ts-jest, plain JavaScript through babel-jest.
  transform: {
    '^.+\\.ts$': 'ts-jest',
    '^.+\\.js$': 'babel-jest',
  },
  // The negative lookahead exempts the listed SDK packages from the
  // node_modules ignore rule, so they are transformed as well.
  transformIgnorePatterns: [
    'node_modules/(?!(@mistralai|@anthropic-ai|groq-sdk|openai)/)'
  ],
  extensionsToTreatAsEsm: ['.ts'],
  // NOTE(review): passing ts-jest options through `globals` is, as far as I
  // know, deprecated in ts-jest 29 in favour of the `transform` tuple form —
  // confirm against the installed ts-jest version before changing.
  globals: {
    'ts-jest': {
      useESM: true,
    },
  },
  // Coverage is collected from all sources except declaration files.
  collectCoverageFrom: [
    'src/**/*.ts',
    '!src/**/*.d.ts',
  ],
  coverageDirectory: 'coverage',
  coverageReporters: ['text', 'lcov', 'html'],
  // Resolves the "@/..." import alias to the src/ directory.
  moduleNameMapper: {
    '^@/(.*)$': '<rootDir>/src/$1',
  },
  setupFilesAfterEnv: [],
  // Per-test timeout (Jest interprets this value as milliseconds).
  testTimeout: 10000,
};

================================================
FILE: aisuite-js/package.json
================================================
{
  "name": "aisuite",
  "version": "0.1.1",
  "description": "Unified TypeScript library for multiple LLM providers",
  "main": "dist/index.js",
  "types": "dist/index.d.ts",
  "scripts": {
    "build": "tsc",
    "test": "jest --config=jest.config.ts",
    "test:examples": "tsx examples/test-suite.ts",
    "example:basic": "tsx examples/basic-usage.ts",
    "example:tools": "tsx examples/tool-calling.ts",
    "example:streaming": "tsx examples/streaming.ts",
    "example:mistral": "tsx examples/mistral.ts",
    "example:groq": "tsx examples/groq.ts",
    "example:deepgram": "tsx examples/deepgram.ts",
    "example:openai-asr": "tsx examples/openai-asr.ts",
    "lint": "eslint src/**/*.ts",
    "prepublishOnly": "npm run build",
    "dev": "tsc --watch"
  },
  "dependencies": {
    "@anthropic-ai/sdk": "^0.56.0",
    "@deepgram/sdk": "^4.11.2",
    "@mistralai/mistralai": "^0.1.3",
    "groq-sdk": "^0.29.0",
    "openai": "^4.0.0"
  },
  "peerDependencies": {
    "typescript": ">=4.5.0"
  },
  "devDependencies": {
    "@types/jest": "^29.0.0",
    "@types/node": "^20.0.0",
    "@typescript-eslint/eslint-plugin": "^6.0.0",
    "@typescript-eslint/parser": "^6.0.0",
    "dotenv": "^16.0.0",
    "eslint": "^8.0.0",
    "jest": "^29.0.0",
    "ts-jest": "^29.0.0",
    "tsx": "^4.0.0",
    "typescript": "^5.0.0"
  },
  "keywords": [
    "llm",
    "openai",
    "anthropic",
    "claude",
    "gpt",
    "ai",
    "typescript"
  ],
  "author": "Andrew Ng and Rohit P",
  "license": "MIT",
  "engines": {
    "node": ">=16.0.0"
  },
  "files": [
    "dist/**/*",
    "README.md",
    "LICENSE"
  ],
  "repository": {
    "type": "git",
    "url": "git+https://github.com/andrewyng/aisuite.git"
  },
  "bugs": {
    "url": "https://github.com/andrewyng/aisuite/issues"
  },
  "homepage": "https://github.com/andrewyng/aisuite#readme",
  "type": "module"
}


================================================
FILE: aisuite-js/src/asr-providers/deepgram/adapters.ts
================================================
import { TranscriptionResult, Word, Segment } from "../../types";

/**
 * Converts a Deepgram pre-recorded transcription payload into the
 * provider-neutral TranscriptionResult.
 *
 * Only the first alternative of the first channel is used. Word entries come
 * from that alternative; segments come from `results.utterances` when present.
 *
 * @param response - The Deepgram result object. May be null/undefined or have
 *                   an unexpected shape, in which case a fallback is returned.
 * @returns The normalized result. When no alternative can be found, the
 *          fallback carries `response.transcript` (or "") as text, language
 *          "unknown", and empty word/segment lists.
 */
export function adaptResponse(response: any): TranscriptionResult {
  // Optional chaining from the root so a null/undefined response reaches the
  // fallback below instead of throwing a TypeError.
  const alternative = response?.results?.channels?.[0]?.alternatives?.[0];

  if (!alternative) {
    // Fallback for unexpected response structure
    return {
      text: response?.transcript || "",
      language: "unknown",
      confidence: undefined,
      words: [],
      segments: [],
    };
  }

  // Extract words with timestamps and confidence
  const rawWords: any[] = Array.isArray(alternative.words)
    ? alternative.words
    : [];
  const words: Word[] = rawWords.map((word: any) => ({
    text: word.word,
    start: word.start,
    end: word.end,
    confidence: word.confidence,
    // Speaker ids arrive as numbers; the neutral type uses strings.
    speaker: word.speaker?.toString(),
  }));

  // Extract utterances/segments
  const rawUtterances: any[] = Array.isArray(response.results.utterances)
    ? response.results.utterances
    : [];
  const segments: Segment[] = rawUtterances.map((utterance: any) => ({
    text: utterance.transcript,
    start: utterance.start,
    end: utterance.end,
    speaker: utterance.speaker?.toString(),
  }));

  return {
    text: alternative.transcript,
    language: response.metadata?.language || "unknown",
    confidence: alternative.confidence,
    words,
    segments,
  };
}


================================================
FILE: aisuite-js/src/asr-providers/deepgram/index.ts
================================================
export { DeepgramASRProvider } from "./provider";
export type { DeepgramConfig } from "./types";


================================================
FILE: aisuite-js/src/asr-providers/deepgram/provider.ts
================================================
import { createClient, DeepgramClient } from "@deepgram/sdk";
import { ASRProvider } from "../../core/base-asr-provider";
import {
  TranscriptionRequest,
  TranscriptionResult,
  RequestOptions,
} from "../../types";
import { DeepgramConfig } from "./types";
import { adaptResponse } from "./adapters";
import { AISuiteError } from "../../core/errors";
import * as fs from "fs";

/**
 * ASR provider backed by the Deepgram SDK's pre-recorded transcription API.
 *
 * Accepts audio as a file path, a Buffer, or a Uint8Array and returns the
 * provider-neutral TranscriptionResult produced by `adaptResponse`.
 */
export class DeepgramASRProvider implements ASRProvider {
  public readonly name = "deepgram";
  private client: DeepgramClient;

  /**
   * @param config - API key and optional base URL override for the SDK client.
   */
  constructor(config: DeepgramConfig) {
    // Use the new createClient API instead of the deprecated Deepgram constructor
    this.client = createClient({
      key: config.apiKey,
      // Only set baseUrl when an override was supplied.
      ...(config.baseURL && { baseUrl: config.baseURL }),
    });
  }

  /**
   * Ensures the two mandatory request fields are present.
   *
   * @throws AISuiteError with code "MODEL_PARAMETER_REQUIRED" when `model`
   *         is missing, or "FILE_PARAMETER_REQUIRED" when `file` is missing.
   */
  validateParams(params: { [key: string]: any }): void {
    if (!params.model) {
      throw new AISuiteError(
        "Model parameter is required",
        this.name,
        "MODEL_PARAMETER_REQUIRED"
      );
    }

    if (!params.file) {
      // A missing file gets its own code so callers can tell the two
      // validation failures apart.
      throw new AISuiteError(
        "File parameter is required",
        this.name,
        "FILE_PARAMETER_REQUIRED"
      );
    }
  }

  /**
   * Maps neutral request parameters onto Deepgram option names.
   *
   * `model` and `file` are dropped (they are passed separately), a truthy
   * `timestamps` becomes `utterances: true`, and every other key is passed
   * through unchanged.
   */
  translateParams(params: { [key: string]: any }): { [key: string]: any } {
    const { model: _, file: __, ...rest } = params;
    return Object.entries(rest).reduce((translated, [key, value]) => {
      switch (key) {
        case "timestamps":
          if (value) translated.utterances = true;
          break;
        default:
          translated[key] = value;
      }
      return translated;
    }, {} as { [key: string]: any });
  }

  /**
   * Transcribes one audio input.
   *
   * @param request - Must contain `model` and `file`; remaining keys are
   *                  translated and forwarded as Deepgram options.
   * @param options - Accepted for interface compatibility; not used here.
   * @returns The normalized transcription result.
   * @throws AISuiteError - validation errors and "INVALID_INPUT" are rethrown
   *         as-is; every other failure is wrapped with code "API_ERROR".
   */
  async transcribe(
    request: TranscriptionRequest,
    options?: RequestOptions
  ): Promise<TranscriptionResult> {
    try {
      this.validateParams(request);
      // translateParams strips model/file itself, so the request can be
      // handed over directly.
      const translatedParams = this.translateParams(request);

      // Handle different input types
      let audioData: Buffer;
      if (typeof request.file === "string") {
        // A string is treated as a path on the local file system.
        audioData = fs.readFileSync(request.file);
      } else if (Buffer.isBuffer(request.file)) {
        audioData = request.file;
      } else if (request.file instanceof Uint8Array) {
        audioData = Buffer.from(request.file);
      } else {
        throw new AISuiteError(
          "Unsupported audio input type",
          this.name,
          "INVALID_INPUT"
        );
      }

      // Use the v4 SDK format for transcription
      const response = await this.client.listen.prerecorded.transcribeFile(
        audioData,
        {
          model: request.model,
          ...translatedParams,
        }
      );

      // Check for errors in the response
      if (response.error) {
        throw new AISuiteError(
          `Deepgram API error: ${response.error.message}`,
          this.name,
          "API_ERROR"
        );
      }

      return adaptResponse(response.result);
    } catch (error) {
      // Errors we raised ourselves already carry provider and code.
      if (error instanceof AISuiteError) {
        throw error;
      }
      throw new AISuiteError(
        `Deepgram ASR error: ${
          error instanceof Error ? error.message : "Unknown error"
        }`,
        this.name,
        "API_ERROR"
      );
    }
  }
}


================================================
FILE: aisuite-js/src/asr-providers/deepgram/types.ts
================================================
/**
 * Configuration accepted by the Deepgram ASR provider.
 */
export interface DeepgramConfig {
  /** Deepgram API key; DeepgramASRProvider passes it to the SDK client as `key`. */
  apiKey: string;
  /** Optional endpoint override; forwarded to the SDK client as `baseUrl` only when set. */
  baseURL?: string;
}


================================================
FILE: aisuite-js/src/asr-providers/index.ts
================================================
export { DeepgramASRProvider } from "./deepgram";
export type { DeepgramConfig } from "../types";


================================================
FILE: aisuite-js/src/client.ts
================================================
import {
  ChatCompletionRequest,
  ChatCompletionResponse,
  ChatCompletionChunk,
  ProviderConfigs,
  RequestOptions,
  TranscriptionRequest,
  TranscriptionResult,
} from "./types";
import { Provider } from "./core/base-provider";
import { ASRProvider } from "./core/base-asr-provider";
import { parseModel } from "./core/model-parser";
import { ProviderNotConfiguredError } from "./core/errors";
import { OpenAIProvider } from "./providers/openai";
import { AnthropicProvider } from "./providers/anthropic";
import { MistralProvider } from "./providers/mistral";
import { GroqProvider } from "./providers/groq";
import { DeepgramASRProvider } from "./asr-providers/deepgram";

/**
 * Unified entry point of the library.
 *
 * Builds one provider instance per configured backend and routes each
 * request to the right one based on the "provider:model" prefix of the
 * request's `model` field. Chat providers and ASR providers are kept in
 * separate registries; the OpenAI provider instance is registered in both.
 */
export class Client {
  private chatProviders: Map<string, Provider> = new Map();
  private asrProviders: Map<string, ASRProvider> = new Map();

  /**
   * @param config - Per-provider settings; only providers with an entry are
   *                 instantiated.
   */
  constructor(config: ProviderConfigs) {
    this.initializeProviders(config);
  }

  /** Instantiates and registers every provider that has a config entry. */
  private initializeProviders(config: ProviderConfigs): void {
    const { openai, anthropic, mistral, groq, deepgram } = config;

    if (openai) {
      // One OpenAI instance serves both chat and transcription.
      const sharedOpenAI = new OpenAIProvider(openai);
      this.chatProviders.set("openai", sharedOpenAI);
      this.asrProviders.set("openai", sharedOpenAI);
    }

    if (anthropic) {
      this.chatProviders.set("anthropic", new AnthropicProvider(anthropic));
    }

    if (mistral) {
      this.chatProviders.set("mistral", new MistralProvider(mistral));
    }

    if (groq) {
      this.chatProviders.set("groq", new GroqProvider(groq));
    }

    if (deepgram) {
      this.asrProviders.set("deepgram", new DeepgramASRProvider(deepgram));
    }
  }

  /**
   * Fetches a provider from the given registry.
   *
   * @throws ProviderNotConfiguredError listing the registry's configured
   *         names when `provider` is not among them.
   */
  private requireProvider<T>(registry: Map<string, T>, provider: string): T {
    const instance = registry.get(provider);
    if (!instance) {
      throw new ProviderNotConfiguredError(
        provider,
        Array.from(registry.keys())
      );
    }
    return instance;
  }

  public chat = {
    completions: {
      /**
       * Sends a chat completion request to the provider named in
       * `request.model`. Resolves to an async iterable of chunks when
       * `request.stream` is truthy, otherwise to a full response.
       */
      create: async (
        request: ChatCompletionRequest,
        options?: RequestOptions
      ): Promise<
        ChatCompletionResponse | AsyncIterable<ChatCompletionChunk>
      > => {
        const parsed = parseModel(request.model);
        const target = this.requireProvider(
          this.chatProviders,
          parsed.provider
        );

        // Providers receive the bare model name, without the prefix.
        const forwarded = { ...request, model: parsed.model };

        if (!request.stream) {
          return target.chatCompletion(forwarded, options);
        }
        return target.streamChatCompletion(forwarded, options);
      },
    },
  };

  public audio = {
    transcriptions: {
      /**
       * Sends a transcription request to the ASR provider named in
       * `request.model`.
       */
      create: async (
        request: TranscriptionRequest,
        options?: RequestOptions
      ): Promise<TranscriptionResult> => {
        const parsed = parseModel(request.model);
        const target = this.requireProvider(
          this.asrProviders,
          parsed.provider
        );

        // Providers receive the bare model name, without the prefix.
        const forwarded = { ...request, model: parsed.model };

        return target.transcribe(forwarded, options);
      },
    },
  };

  /** Names of the configured chat providers, in registration order. */
  public listProviders(): string[] {
    return Array.from(this.chatProviders.keys());
  }

  /** Names of the configured ASR providers, in registration order. */
  public listASRProviders(): string[] {
    return Array.from(this.asrProviders.keys());
  }

  /** Whether a chat provider with this name was configured. */
  public isProviderConfigured(provider: string): boolean {
    return this.chatProviders.has(provider);
  }

  /** Whether an ASR provider with this name was configured. */
  public isASRProviderConfigured(provider: string): boolean {
    return this.asrProviders.has(provider);
  }
}


================================================
FILE: aisuite-js/src/core/base-asr-provider.ts
================================================
import { 
  TranscriptionRequest, 
  TranscriptionResult,
  RequestOptions 
} from '../types';

/**
 * Contract every speech-to-text (ASR) backend implements so the Client can
 * route transcription requests to it.
 */
export interface ASRProvider {
  /** Provider identifier (e.g. the Deepgram implementation uses "deepgram"). */
  readonly name: string;
  
  /**
   * Transcribes the audio described by `request`.
   * The Client calls this with `request.model` already stripped of its
   * "provider:" prefix.
   */
  transcribe(
    request: TranscriptionRequest,
    options?: RequestOptions
  ): Promise<TranscriptionResult>;
  
  /**
   * Checks raw request parameters. Returns nothing; the Deepgram
   * implementation reports a missing `model` or `file` by throwing.
   */
  validateParams(    
    params: { [key: string]: any }
  ): void;
  
  /**
   * Converts provider-neutral parameters into the provider's own option
   * names and returns the translated object.
   */
  translateParams(    
    params: { [key: string]: any }
  ): { [key: string]: any };
}

================================================
FILE: aisuite-js/src/core/base-provider.ts
================================================
import { 
  ChatCompletionRequest, 
  ChatCompletionResponse, 
  ChatCompletionChunk,
  RequestOptions 
} from '../types';

/**
 * Contract every chat-completion backend implements so the Client can route
 * requests to it.
 */
export interface Provider {
  /** Provider identifier (e.g. "anthropic", "groq"). */
  readonly name: string;
  
  /**
   * Performs a non-streaming chat completion and resolves to the complete
   * response. The Client uses this when `request.stream` is falsy.
   */
  chatCompletion(
    request: ChatCompletionRequest,
    options?: RequestOptions
  ): Promise<ChatCompletionResponse>;
  
  /**
   * Performs a streaming chat completion, yielding chunks as they arrive.
   * The Client uses this when `request.stream` is truthy.
   */
  streamChatCompletion(
    request: ChatCompletionRequest,
    options?: RequestOptions
  ): AsyncIterable<ChatCompletionChunk>;
}

================================================
FILE: aisuite-js/src/core/errors.ts
================================================
/**
 * Base class for every error raised by the library.
 *
 * Carries the originating provider plus an optional machine-readable code
 * and HTTP status, so callers can branch without parsing the message.
 */
export class AISuiteError extends Error {
  /**
   * @param message - Human-readable description.
   * @param provider - Name of the provider the error relates to.
   * @param code - Optional machine-readable error code.
   * @param statusCode - Optional HTTP status associated with the failure.
   */
  constructor(
    message: string,
    public provider: string,
    public code?: string,
    public statusCode?: number
  ) {
    super(message);
    // When compiled to ES5, subclasses of built-ins lose their prototype
    // chain; restoring it keeps `instanceof` working for this class and
    // its subclasses. It is a no-op on ES2015+ targets.
    Object.setPrototypeOf(this, new.target.prototype);
    this.name = "AISuiteError";
  }
}

/**
 * Raised when a request names a provider that was not configured on the
 * client. The message lists the providers that are available.
 * Uses the code "PROVIDER_NOT_CONFIGURED".
 */
export class ProviderNotConfiguredError extends AISuiteError {
  /**
   * @param provider - The provider name that was requested.
   * @param availableProviders - Names that are configured; joined with ", ".
   */
  constructor(provider: string, availableProviders: string[]) {
    super(
      `Provider '${provider}' not configured. Available: ${availableProviders.join(
        ", "
      )}`,
      provider,
      "PROVIDER_NOT_CONFIGURED"
    );
    // Report the concrete class in logs and stack traces instead of the
    // generic base-class name.
    this.name = "ProviderNotConfiguredError";
  }
}

/**
 * Raised when a model identifier is not of the form "provider:model".
 * No provider can be determined in that case, so `provider` is "unknown".
 * Uses the code "INVALID_MODEL_FORMAT".
 */
export class InvalidModelFormatError extends AISuiteError {
  /**
   * @param model - The offending identifier, echoed in the message.
   */
  constructor(model: string) {
    super(
      `Invalid model format: ${model}. Expected "provider:model"`,
      "unknown",
      "INVALID_MODEL_FORMAT"
    );
    // Report the concrete class in logs and stack traces instead of the
    // generic base-class name.
    this.name = "InvalidModelFormatError";
  }
}

/**
 * Raised for failures related to tool/function calling.
 * Uses the code "TOOL_CALL_ERROR".
 */
export class ToolCallError extends AISuiteError {
  /**
   * @param message - Human-readable description.
   * @param provider - Name of the provider the error relates to.
   */
  constructor(message: string, provider: string) {
    super(message, provider, "TOOL_CALL_ERROR");
    // Report the concrete class in logs and stack traces instead of the
    // generic base-class name.
    this.name = "ToolCallError";
  }
}

/**
 * Raised for failures while handling audio input.
 * Uses the code "AUDIO_PROCESSING_ERROR" and its own class name.
 */
export class AudioProcessingError extends AISuiteError {
  /**
   * @param message - Human-readable description.
   * @param provider - Name of the provider the error relates to.
   */
  constructor(message: string, provider: string) {
    const errorCode = "AUDIO_PROCESSING_ERROR";
    super(message, provider, errorCode);
    this.name = "AudioProcessingError";
  }
}

/**
 * Raised when a request carries a parameter the target provider cannot
 * honour. Uses the code "UNSUPPORTED_PARAMETER" and its own class name.
 */
export class UnsupportedParameterError extends AISuiteError {
  /**
   * @param parameter - Name of the rejected parameter.
   * @param provider - Name of the provider that does not support it.
   */
  constructor(parameter: string, provider: string) {
    const description = `Parameter '${parameter}' is not supported by provider '${provider}'`;
    super(description, provider, "UNSUPPORTED_PARAMETER");
    this.name = "UnsupportedParameterError";
  }
}


================================================
FILE: aisuite-js/src/core/model-parser.ts
================================================
import { InvalidModelFormatError } from './errors';

/** Result of splitting a "provider:model" identifier. */
export interface ParsedModel {
  /** The part before the first ':'. */
  provider: string;
  /** Everything after the first ':' (may itself contain ':'). */
  model: string;
}

/**
 * Splits a "provider:model" identifier at its first ':'.
 *
 * Further colons stay part of the model name, so "openai:gpt-4:vision"
 * yields provider "openai" and model "gpt-4:vision".
 *
 * @param model - The fully qualified identifier.
 * @returns The provider prefix and the bare model name.
 * @throws InvalidModelFormatError when `model` is empty or not a string,
 *         has no ':' separator, or has an empty provider or model part
 *         (e.g. ":gpt-4" or "openai:").
 */
export function parseModel(model: string): ParsedModel {
  if (!model || typeof model !== 'string') {
    throw new InvalidModelFormatError(model);
  }

  const separatorIndex = model.indexOf(':');

  // -1: no separator at all; 0: nothing before the separator.
  if (separatorIndex <= 0) {
    throw new InvalidModelFormatError(model);
  }

  const provider = model.slice(0, separatorIndex);
  const modelName = model.slice(separatorIndex + 1); // Handle cases like "openai:gpt-4:vision"

  // An empty model name ("openai:") can never be served by a provider;
  // reject it here instead of letting it fail later at the API.
  if (!modelName) {
    throw new InvalidModelFormatError(model);
  }

  return {
    provider,
    model: modelName
  };
}

================================================
FILE: aisuite-js/src/index.ts
================================================
export { Client } from "./client";
export * from "./types";
export * from "./core/errors";
export { parseModel } from "./core/model-parser";

// Re-export providers for advanced usage
export {
  OpenAIProvider,
  AnthropicProvider,
  GroqProvider,
  MistralProvider,
} from "./providers";

export { DeepgramASRProvider } from "./asr-providers";


================================================
FILE: aisuite-js/src/providers/anthropic/adapters.ts
================================================
import { 
  ChatCompletionRequest, 
  ChatCompletionResponse, 
  ChatCompletionChunk,
  ChatMessage,
  Tool,
  ToolCall
} from '../../types';
import type { 
  Message, 
  MessageCreateParams,
  MessageStreamEvent
} from '@anthropic-ai/sdk/resources/messages';
import { generateId, createChunk } from '../../utils/streaming';

/**
 * Builds Anthropic `messages.create` parameters from a neutral chat request.
 *
 * System messages are lifted into the top-level `system` field, `stop` is
 * normalized to an array of stop sequences, and tools are converted with
 * `adaptTool`. `max_tokens` falls back to 1024 when the request gives none.
 * The `stream` flag is deliberately not copied; the caller decides that.
 */
export function adaptRequest(request: ChatCompletionRequest): MessageCreateParams {
  const { systemMessage, userMessages } = transformMessages(request.messages);

  // Normalize `stop`: an array is used as-is, a single value is wrapped,
  // anything falsy means no stop sequences.
  let stopSequences;
  if (Array.isArray(request.stop)) {
    stopSequences = request.stop;
  } else if (request.stop) {
    stopSequences = [request.stop];
  } else {
    stopSequences = undefined;
  }

  // Don't pass stream parameter to avoid accidental streaming
  const params: MessageCreateParams = {
    model: request.model,
    max_tokens: request.max_tokens || 1024,
    messages: userMessages,
    temperature: request.temperature,
    top_p: request.top_p,
    stop_sequences: stopSequences,
  };

  if (systemMessage) {
    params.system = systemMessage;
  }

  if (request.tools) {
    params.tools = request.tools.map(adaptTool);
  }

  return params;
}

/**
 * Splits neutral chat messages into Anthropic's shape.
 *
 * - `system` messages are removed from the list and their contents joined
 *   with newlines into one string (undefined when there are none).
 * - `tool` messages become `user` messages holding a `tool_result` block.
 * - `assistant` messages with tool calls become a content-block list: an
 *   optional `text` block followed by one `tool_use` block per call.
 * - Everything else is passed through with its role and content.
 *
 * @returns `systemMessage` for the top-level system field and `userMessages`
 *          for the conversation itself.
 */
function transformMessages(messages: ChatMessage[]) {
  const systemMessages = messages.filter(msg => msg.role === 'system');
  const otherMessages = messages.filter(msg => msg.role !== 'system');
  
  const systemMessage = systemMessages.map(msg => msg.content).join('\n') || undefined;
  
  const userMessages = otherMessages.map(msg => {
    if (msg.role === 'tool') {
      // Transform tool response to user message with tool_result
      return {
        role: 'user' as const,
        content: [
          {
            type: 'tool_result' as const,
            tool_use_id: msg.tool_call_id!,
            content: msg.content!,
          }
        ]
      };
    }
    
    if (msg.role === 'assistant' && msg.tool_calls) {
      // Transform assistant message with tool calls
      const content: any[] = [];
      
      if (msg.content) {
        content.push({
          type: 'text',
          text: msg.content
        });
      }
      
      msg.tool_calls.forEach(toolCall => {
        // A call without arguments may carry an empty string (the stream
        // adapter in this file emits exactly that); JSON.parse('') would
        // throw, so treat it as an empty argument object.
        const rawArguments = toolCall.function.arguments;
        const input = rawArguments && rawArguments.trim()
          ? JSON.parse(rawArguments)
          : {};

        content.push({
          type: 'tool_use',
          id: toolCall.id,
          name: toolCall.function.name,
          input
        });
      });
      
      return {
        role: 'assistant' as const,
        content
      };
    }
    
    return {
      role: msg.role as 'user' | 'assistant',
      content: msg.content!,
    };
  });
  
  return {
    systemMessage,
    userMessages,
  };
}

/**
 * Converts one OpenAI-format tool definition into Anthropic's tool shape.
 *
 * Only `properties` and `required` are carried over from the parameter
 * schema; the resulting `input_schema` type is always 'object'.
 */
function adaptTool(tool: Tool): any {
  const { name, description, parameters } = tool.function;

  const inputSchema = {
    type: 'object',
    properties: parameters.properties,
    required: parameters.required,
  };

  return { name, description, input_schema: inputSchema };
}

/**
 * Converts an Anthropic Message into the neutral chat completion response.
 *
 * The text of every `text` content block is concatenated into
 * `message.content` (empty string when there is none), and every `tool_use`
 * block becomes an OpenAI-style tool call whose arguments are the
 * JSON-serialized block input. Usage totals are the sum of input and output
 * tokens.
 *
 * @param response - The Anthropic message.
 * @param originalModel - Model name to report back to the caller.
 * @returns A single-choice response; `created` is the current time in Unix
 *          seconds and `finish_reason` is Anthropic's `stop_reason`, or
 *          'stop' when that is absent.
 */
export function adaptResponse(response: Message, originalModel: string): ChatCompletionResponse {
  let text = '';
  const toolCalls: ToolCall[] = [];

  if (Array.isArray(response.content)) {
    for (const block of response.content) {
      if (block.type === 'text') {
        // A message may contain several text blocks; keep all of them
        // rather than only the first.
        text += block.text;
      } else if (block.type === 'tool_use') {
        toolCalls.push({
          id: block.id,
          type: 'function',
          function: {
            name: block.name,
            arguments: JSON.stringify(block.input),
          },
        });
      }
    }
  }

  // Non-array content is passed through untouched.
  const content = Array.isArray(response.content) ? text : response.content;

  return {
    id: response.id,
    object: 'chat.completion',
    created: Math.floor(Date.now() / 1000),
    model: originalModel,
    choices: [{
      index: 0,
      message: {
        role: 'assistant',
        content,
        tool_calls: toolCalls.length > 0 ? toolCalls : undefined,
      },
      finish_reason: response.stop_reason || 'stop',
    }],
    usage: {
      prompt_tokens: response.usage.input_tokens,
      completion_tokens: response.usage.output_tokens,
      total_tokens: response.usage.input_tokens + response.usage.output_tokens,
    },
  };
}

/**
 * Translates one Anthropic stream event into a neutral chunk.
 *
 * Three event kinds produce output:
 *   - a `content_block_delta` carrying a text delta → a content chunk,
 *   - a `content_block_start` for a `tool_use` block → a chunk announcing
 *     the tool call (id and name, with empty arguments),
 *   - `message_stop` → a chunk with finish reason 'stop'.
 * Every other event yields null, which callers are expected to skip.
 */
export function adaptStreamEvent(
  event: MessageStreamEvent, 
  streamId: string, 
  originalModel: string
): ChatCompletionChunk | null {
  if (event.type === 'content_block_delta') {
    // Only text deltas are surfaced; other delta kinds are dropped.
    if (event.delta.type !== 'text_delta') {
      return null;
    }
    return createChunk(streamId, originalModel, event.delta.text);
  }

  if (event.type === 'content_block_start') {
    if (event.content_block.type !== 'tool_use') {
      return null;
    }
    const announcedCall = {
      id: event.content_block.id,
      type: 'function' as const,
      function: {
        name: event.content_block.name,
        arguments: '',
      },
    };
    return createChunk(streamId, originalModel, undefined, undefined, [announcedCall]);
  }

  if (event.type === 'message_stop') {
    return createChunk(streamId, originalModel, undefined, 'stop');
  }

  return null;
}

================================================
FILE: aisuite-js/src/providers/anthropic/index.ts
================================================
export { AnthropicProvider } from './provider';
export type { AnthropicConfig } from './types';

================================================
FILE: aisuite-js/src/providers/anthropic/provider.ts
================================================
import Anthropic from '@anthropic-ai/sdk';
import { Provider } from '../../core/base-provider';
import { 
  ChatCompletionRequest, 
  ChatCompletionResponse, 
  ChatCompletionChunk,
  RequestOptions 
} from '../../types';
import { AnthropicConfig } from './types';
import { adaptRequest, adaptResponse, adaptStreamEvent } from './adapters';
import { AISuiteError } from '../../core/errors';
import { generateId } from '../../utils/streaming';

/**
 * Chat provider backed by the Anthropic SDK's Messages API.
 *
 * Requests and responses are converted to and from the neutral chat format
 * by the adapter functions (`adaptRequest`, `adaptResponse`,
 * `adaptStreamEvent`).
 */
export class AnthropicProvider implements Provider {
  public readonly name = 'anthropic';
  private client: Anthropic;

  /**
   * @param config - API key and optional base URL for the SDK client.
   */
  constructor(config: AnthropicConfig) {
    this.client = new Anthropic({
      apiKey: config.apiKey,
      baseURL: config.baseURL,
    });
  }

  /**
   * Performs a non-streaming completion.
   *
   * @throws AISuiteError with code 'STREAMING_NOT_SUPPORTED' when
   *         `request.stream` is set, or 'API_ERROR' wrapping any other failure.
   */
  async chatCompletion(
    request: ChatCompletionRequest,
    options?: RequestOptions
  ): Promise<ChatCompletionResponse> {
    try {
      // For now, we don't support streaming in non-streaming method
      if (request.stream) {
        throw new AISuiteError(
          'Streaming is not yet supported. Set stream: false or use streamChatCompletion method.',
          this.name,
          'STREAMING_NOT_SUPPORTED'
        );
      }

      const anthropicRequest = adaptRequest(request);
      const message = await this.client.messages.create(
        anthropicRequest,
        options
      ) as any;  // Type assertion needed because Anthropic SDK returns a union type

      return adaptResponse(message, request.model);
    } catch (error) {
      // Errors we raised ourselves already carry provider and code.
      if (error instanceof AISuiteError) {
        throw error;
      }
      throw new AISuiteError(
        `Anthropic API error: ${error instanceof Error ? error.message : 'Unknown error'}`,
        this.name,
        'API_ERROR'
      );
    }
  }

  /**
   * Performs a streaming completion, yielding one neutral chunk per
   * relevant Anthropic stream event. Events the adapter maps to null are
   * skipped.
   *
   * When `options.signal` is supplied, aborting it aborts the underlying
   * stream; the listener is detached again once iteration ends for any
   * reason (completion, error, or the consumer stopping early).
   *
   * @throws AISuiteError with code 'STREAMING_ERROR' wrapping any failure;
   *         an AISuiteError raised inside is rethrown unchanged.
   */
  async *streamChatCompletion(
    request: ChatCompletionRequest,
    options?: RequestOptions
  ): AsyncIterable<ChatCompletionChunk> {
    // Kept outside the try so the finally block can detach it.
    let onAbort: (() => void) | undefined;

    try {
      const anthropicRequest = adaptRequest(request);
      const stream = await this.client.messages.create(
        {
          ...anthropicRequest,
          stream: true,
        },
        options
      );

      const streamId = generateId();

      // Handle abort signal
      if (options?.signal) {
        onAbort = () => {
          if (stream && typeof (stream as any).controller?.abort === 'function') {
            (stream as any).controller.abort();
          }
        };
        options.signal.addEventListener('abort', onAbort, { once: true });
      }

      for await (const event of stream) {
        const chunk = adaptStreamEvent(event, streamId, request.model);
        if (chunk) {
          yield chunk;
        }
      }
    } catch (error) {
      // Same policy as chatCompletion: never re-wrap our own errors.
      if (error instanceof AISuiteError) {
        throw error;
      }
      throw new AISuiteError(
        `Anthropic streaming error: ${error instanceof Error ? error.message : 'Unknown error'}`,
        this.name,
        'STREAMING_ERROR'
      );
    } finally {
      // Without this, a long-lived signal reused across many requests would
      // accumulate one listener (and one retained stream) per call.
      if (onAbort) {
        options?.signal?.removeEventListener('abort', onAbort);
      }
    }
  }
}

================================================
FILE: aisuite-js/src/providers/anthropic/types.ts
================================================
// AnthropicConfig is a type-only symbol, so it is re-exported with
// `export type`. A plain `export { AnthropicConfig }` cannot be erased by
// single-file transpilers (isolatedModules, esbuild/tsx) and would turn into
// a runtime re-export of a binding that does not exist.
export type { AnthropicConfig } from '../../types';

// Re-export Anthropic types that we need
export type { 
  Message,
  MessageCreateParams,
  MessageStreamEvent
} from '@anthropic-ai/sdk/resources/messages';

================================================
FILE: aisuite-js/src/providers/groq/adapters.ts
================================================
import type { ChatCompletion as GroqChatCompletion } from "groq-sdk/resources/chat/completions";
import {
  ChatCompletionRequest,
  ChatCompletionResponse,
  ChatCompletionChunk as AISuiteChatCompletionChunk,
  Usage,
} from "../../types";

/**
 * Builds the Groq chat completion payload from a neutral chat request.
 *
 * Groq's API follows the OpenAI shape, so fields are copied over directly.
 * A leading "groq:" in the model name is removed in case the caller did not
 * strip the provider prefix already.
 *
 * @param request - The neutral chat request.
 * @returns The payload for the Groq SDK; fields absent from the request are
 *          present with value undefined.
 */
export function adaptRequest(request: ChatCompletionRequest): any {
  return {
    model: request.model.replace("groq:", ""),
    messages: request.messages,
    temperature: request.temperature,
    max_tokens: request.max_tokens,
    // Sampling and stop controls are part of the shared request type and
    // must not be silently dropped on the way to Groq.
    top_p: request.top_p,
    stop: request.stop,
    stream: request.stream,
    tools: request.tools,
    tool_choice: request.tool_choice,
  };
}

/**
 * Converts a Groq chat completion into the neutral response shape.
 *
 * The model name is reported with a "groq:" prefix, each choice is reduced
 * to index, message and finish_reason, and a missing usage block is
 * replaced by all-zero token counts.
 */
export function adaptResponse(
  response: GroqChatCompletion
): ChatCompletionResponse {
  const { id, object, created, model, usage } = response;

  const choices = response.choices.map((choice) => {
    const { index, message, finish_reason } = choice;
    return { index, message, finish_reason };
  });

  return {
    id,
    object,
    created,
    model: `groq:${model}`,
    choices,
    // Fall back to zeros when Groq reports no usage.
    usage: usage ?? {
      prompt_tokens: 0,
      completion_tokens: 0,
      total_tokens: 0,
    },
  };
}

/**
 * Convert one Groq streaming chunk into an AISuite chat completion chunk.
 *
 * @param chunk    Raw chunk yielded by the Groq SDK stream.
 * @param streamId Identifier shared by every chunk of the same stream.
 * @returns The chunk in AISuite format, with the model re-prefixed by "groq:".
 */
export function adaptStreamResponse(
  chunk: any,
  streamId: string
): AISuiteChatCompletionChunk {
  return {
    id: streamId,
    object: "chat.completion.chunk",
    // Unix time in whole seconds, matching the other adapters; Date.now()
    // alone would report milliseconds.
    created: Math.floor(Date.now() / 1000),
    model: `groq:${chunk.model}`,
    choices: chunk.choices.map((choice: any) => ({
      index: choice.index,
      delta: choice.delta,
      finish_reason: choice.finish_reason,
    })),
  };
}


================================================
FILE: aisuite-js/src/providers/groq/index.ts
================================================
export { GroqProvider } from "./provider";
export type { GroqConfig } from "./types";


================================================
FILE: aisuite-js/src/providers/groq/provider.ts
================================================
import Groq from "groq-sdk";
import { Provider } from "../../core/base-provider";
import {
  ChatCompletionRequest,
  ChatCompletionResponse,
  ChatCompletionChunk,
  RequestOptions,
} from "../../types";
import { GroqConfig } from "./types";
import { adaptRequest, adaptResponse, adaptStreamResponse } from "./adapters";
import { AISuiteError } from "../../core/errors";
import { generateId } from "../../utils/streaming";

/**
 * Chat provider that routes AISuite requests through the Groq SDK.
 */
export class GroqProvider implements Provider {
  public readonly name = "groq";
  private client: Groq;

  /**
   * @param config API key plus optional base URL override and browser opt-in.
   */
  constructor(config: GroqConfig) {
    this.client = new Groq({
      apiKey: config.apiKey,
      dangerouslyAllowBrowser: config.dangerouslyAllowBrowser || false, // Allow browser usage for chat app
    });
    if (config.baseURL) {
      (this.client as any).baseURL = config.baseURL;
    }
  }

  /**
   * Run a non-streaming chat completion.
   *
   * @throws AISuiteError with code "STREAMING_NOT_SUPPORTED" when
   *   `request.stream` is set, or "API_ERROR" when the SDK call fails.
   */
  async chatCompletion(
    request: ChatCompletionRequest,
    options?: RequestOptions
  ): Promise<ChatCompletionResponse> {
    try {
      if (request.stream) {
        throw new AISuiteError(
          "Streaming is not supported in non-streaming method. Set stream: false or use streamChatCompletion method.",
          this.name,
          "STREAMING_NOT_SUPPORTED"
        );
      }

      const groqRequest = adaptRequest(request);
      const completion = await this.client.chat.completions.create(groqRequest);

      return adaptResponse(completion);
    } catch (error) {
      // Errors raised by this class are already in the public shape.
      if (error instanceof AISuiteError) {
        throw error;
      }
      throw new AISuiteError(
        `Groq API error: ${
          error instanceof Error ? error.message : "Unknown error"
        }`,
        this.name,
        "API_ERROR"
      );
    }
  }

  /**
   * Stream a chat completion, yielding one AISuite chunk per Groq chunk.
   *
   * Streaming is always requested from the SDK, regardless of
   * `request.stream`. If `options.signal` is given, aborting it aborts the
   * underlying SDK stream (when the stream exposes a controller).
   *
   * @throws AISuiteError with code "STREAMING_ERROR" on any failure.
   */
  async *streamChatCompletion(
    request: ChatCompletionRequest,
    options?: RequestOptions
  ): AsyncIterable<ChatCompletionChunk> {
    const signal = options?.signal;
    let onAbort: (() => void) | undefined;

    try {
      // Force stream mode: without it the SDK resolves to a plain completion
      // object, which cannot be consumed with `for await`.
      const groqRequest = { ...adaptRequest(request), stream: true };
      const stream = await this.client.chat.completions.create(groqRequest);
      const streamId = generateId();

      // Handle abort signal
      if (signal) {
        onAbort = () => {
          if (
            stream &&
            typeof (stream as any).controller?.abort === "function"
          ) {
            (stream as any).controller.abort();
          }
        };
        if (signal.aborted) {
          // The "abort" event has already fired and will not fire again.
          onAbort();
        } else {
          signal.addEventListener("abort", onAbort, { once: true });
        }
      }

      for await (const chunk of stream as any) {
        yield adaptStreamResponse(chunk, streamId);
      }
    } catch (error) {
      throw new AISuiteError(
        `Groq streaming error: ${
          error instanceof Error ? error.message : "Unknown error"
        }`,
        this.name,
        "STREAMING_ERROR"
      );
    } finally {
      // Detach the listener so a long-lived signal does not keep the
      // finished stream alive.
      if (signal && onAbort) {
        signal.removeEventListener("abort", onAbort);
      }
    }
  }
}


================================================
FILE: aisuite-js/src/providers/groq/types.ts
================================================
/** Configuration accepted by the Groq provider's constructor. */
export interface GroqConfig {
  /** API key handed to the Groq SDK client. */
  apiKey: string;
  /** Optional override for the SDK client's base URL. */
  baseURL?: string;
  /** Opt-in forwarded to the Groq SDK; treated as false when omitted. */
  dangerouslyAllowBrowser?: boolean;
}


================================================
FILE: aisuite-js/src/providers/index.ts
================================================
export { OpenAIProvider } from "./openai";
export { AnthropicProvider } from "./anthropic";
export { MistralProvider } from "./mistral";
export { GroqProvider } from "./groq";
export type {
  OpenAIConfig,
  AnthropicConfig,
  MistralConfig,
  GroqConfig,  
} from "../types";


================================================
FILE: aisuite-js/src/providers/mistral/adapters.ts
================================================
import {
  ChatCompletionRequest,
  ChatCompletionResponse,
  ChatCompletionChunk,
  ChatMessage,
} from "../../types";
import type {
  ChatCompletionResponse as MistralResponse,
  ChatCompletionResponseChunk as MistralStreamResponse,
} from "@mistralai/mistralai";

/**
 * Translate an AISuite chat request into the payload given to the Mistral
 * client. An absent or empty tool list is sent as `undefined`.
 */
export function adaptRequest(request: ChatCompletionRequest): any {
  const { tools: requestedTools } = request;
  const hasTools =
    Array.isArray(requestedTools) && requestedTools.length > 0;

  return {
    model: request.model,
    messages: request.messages.map((message) => adaptMessage(message)),
    tools: hasTools ? requestedTools : undefined,
    temperature: request.temperature,
    max_tokens: request.max_tokens,
    top_p: request.top_p,
    stream: request.stream,
  };
}

/**
 * Convert an AISuite chat message into the message object sent to Mistral.
 *
 * `name` and `tool_call_id` are forwarded when present so that tool-result
 * messages stay linked to the tool call they answer; they are omitted
 * entirely when the source message does not define them.
 */
function adaptMessage(message: ChatMessage): any {
  return {
    role: message.role,
    content: message.content,
    tool_calls: message.tool_calls,
    ...(message.name !== undefined ? { name: message.name } : {}),
    ...(message.tool_call_id !== undefined
      ? { tool_call_id: message.tool_call_id }
      : {}),
  };
}

/**
 * Convert a Mistral chat response into the AISuite response shape.
 *
 * Every returned choice is mapped (an empty list yields an empty list), and
 * tool calls requested by the model are carried over in AISuite's
 * `ToolCall` form. `tool_calls` is omitted when the model made none.
 *
 * @param response Response returned by the Mistral client's `chat` call.
 * @returns The response in AISuite format; `created` is the current Unix
 *   time in seconds.
 */
export function adaptResponse(
  response: MistralResponse
): ChatCompletionResponse {
  return {
    id: response.id,
    object: "chat.completion",
    created: Math.floor(Date.now() / 1000),
    model: response.model,
    choices: response.choices.map((choice, position) => {
      const rawToolCalls: any[] = (choice.message as any).tool_calls ?? [];
      const toolCalls = rawToolCalls.map((call: any) => ({
        id: call.id,
        type: "function" as const,
        function: {
          name: call.function.name,
          // AISuite expects the arguments as a JSON string.
          arguments:
            typeof call.function.arguments === "string"
              ? call.function.arguments
              : JSON.stringify(call.function.arguments),
        },
      }));

      return {
        index: choice.index ?? position,
        message: {
          role: "assistant",
          content: choice.message.content,
          ...(toolCalls.length > 0 ? { tool_calls: toolCalls } : {}),
        },
        finish_reason: choice.finish_reason,
      };
    }),
    usage: {
      prompt_tokens: response.usage.prompt_tokens,
      completion_tokens: response.usage.completion_tokens,
      total_tokens: response.usage.total_tokens,
    },
  };
}

/**
 * Convert one Mistral streaming chunk into an AISuite chunk.
 *
 * Only the first choice of the chunk is used, and the delta role is always
 * reported as "assistant".
 */
export function adaptStreamResponse(
  response: MistralStreamResponse,
  streamId: string
): ChatCompletionChunk {
  const nowInSeconds = Math.floor(Date.now() / 1000);
  const firstChoice = response.choices[0];
  const { content, tool_calls } = firstChoice.delta;

  return {
    id: streamId,
    object: "chat.completion.chunk",
    created: nowInSeconds,
    model: response.model,
    choices: [
      {
        index: 0,
        delta: { role: "assistant", content, tool_calls },
        finish_reason: firstChoice.finish_reason,
      },
    ],
  };
}


================================================
FILE: aisuite-js/src/providers/mistral/index.ts
================================================
export { MistralProvider } from "./provider";
export type { MistralConfig } from "./types";


================================================
FILE: aisuite-js/src/providers/mistral/provider.ts
================================================
import MistralClient from "@mistralai/mistralai";
import { Provider } from "../../core/base-provider";
import {
  ChatCompletionRequest,
  ChatCompletionResponse,
  ChatCompletionChunk,
  RequestOptions,
} from "../../types";
import { MistralConfig } from "./types";
import { adaptRequest, adaptResponse, adaptStreamResponse } from "./adapters";
import { AISuiteError } from "../../core/errors";
import { generateId } from "../../utils/streaming";

/**
 * Chat provider backed by the Mistral client.
 */
export class MistralProvider implements Provider {
  public readonly name = "mistral";
  private client: MistralClient;

  /** Create the client from the API key and apply the optional base URL. */
  constructor(config: MistralConfig) {
    const { apiKey, baseURL } = config;
    this.client = new MistralClient(apiKey);
    if (baseURL) {
      (this.client as any).baseURL = baseURL;
    }
  }

  /**
   * Run a non-streaming chat completion.
   *
   * Rejects with an AISuiteError: "STREAMING_NOT_SUPPORTED" when the request
   * asks for streaming, "API_ERROR" when the client call fails.
   */
  async chatCompletion(
    request: ChatCompletionRequest,
    options?: RequestOptions
  ): Promise<ChatCompletionResponse> {
    if (request.stream) {
      throw new AISuiteError(
        "Streaming is not supported in non-streaming method. Set stream: false or use streamChatCompletion method.",
        this.name,
        "STREAMING_NOT_SUPPORTED"
      );
    }

    try {
      const completion = await this.client.chat(adaptRequest(request));
      return adaptResponse(completion);
    } catch (error) {
      // Already in the public error shape: pass through untouched.
      if (error instanceof AISuiteError) {
        throw error;
      }
      const detail = error instanceof Error ? error.message : "Unknown error";
      throw new AISuiteError(
        `Mistral API error: ${detail}`,
        this.name,
        "API_ERROR"
      );
    }
  }

  /**
   * Stream a chat completion, yielding one AISuite chunk per client chunk.
   * Any failure is reported as an AISuiteError with code "STREAMING_ERROR".
   */
  async *streamChatCompletion(
    request: ChatCompletionRequest,
    options?: RequestOptions
  ): AsyncIterable<ChatCompletionChunk> {
    try {
      const stream = await this.client.chatStream(adaptRequest(request));
      const streamId = generateId();

      // On abort, cancel the stream if it exposes an abortable controller.
      const signal = options?.signal;
      if (signal) {
        const abortStream = () => {
          const controller = (stream as any)?.controller;
          if (typeof controller?.abort === "function") {
            controller.abort();
          }
        };
        signal.addEventListener("abort", abortStream);
      }

      for await (const chunk of stream) {
        yield adaptStreamResponse(chunk, streamId);
      }
    } catch (error) {
      const detail = error instanceof Error ? error.message : "Unknown error";
      throw new AISuiteError(
        `Mistral streaming error: ${detail}`,
        this.name,
        "STREAMING_ERROR"
      );
    }
  }
}


================================================
FILE: aisuite-js/src/providers/mistral/types.ts
================================================
import { MistralConfig } from "../../types";

export { MistralConfig };

// Re-export Mistral types that we need
export type {
  ChatCompletionResponse as MistralResponse,
  ChatCompletionResponseChunk as MistralStreamResponse,
} from "@mistralai/mistralai";


================================================
FILE: aisuite-js/src/providers/openai/adapters.ts
================================================
import {
  ChatCompletionRequest,
  ChatCompletionResponse,
  ChatCompletionChunk,
  ChatMessage,
  ToolCall,
  Tool,
  TranscriptionRequest,
  TranscriptionResult,
} from "../../types";
import type {
  ChatCompletion,
  ChatCompletionChunk as OpenAIChunk,
  ChatCompletionCreateParams,
} from "openai/resources/chat/completions";
import { Uploadable } from "openai/uploads";
import { OpenAIASRResponse } from "./types";

/**
 * Build the OpenAI request parameters from an AISuite chat request.
 *
 * OpenAI is the base format, so fields map one-to-one. `stream` is
 * deliberately left out so callers cannot trigger streaming by accident.
 */
export function adaptRequest(
  request: ChatCompletionRequest
): ChatCompletionCreateParams {
  const {
    model,
    messages,
    tools,
    tool_choice,
    temperature,
    max_tokens,
    top_p,
    frequency_penalty,
    presence_penalty,
    stop,
    user,
  } = request;

  return {
    model,
    messages: messages.map((message) => adaptMessage(message)),
    tools,
    tool_choice,
    temperature,
    max_tokens,
    top_p,
    frequency_penalty,
    presence_penalty,
    stop,
    user,
  };
}

/** Copy the OpenAI-relevant fields of an AISuite chat message. */
function adaptMessage(message: ChatMessage): any {
  const { role, content, name, tool_call_id, tool_calls } = message;
  return { role, content, name, tool_call_id, tool_calls };
}

/**
 * Convert an OpenAI chat completion into the AISuite response shape.
 *
 * A missing finish reason becomes "stop" and missing usage counters
 * become 0.
 */
export function adaptResponse(
  response: ChatCompletion
): ChatCompletionResponse {
  const { usage } = response;

  const choices = response.choices.map((choice) => {
    const { role, content, tool_calls } = choice.message;
    return {
      index: choice.index,
      message: {
        role: role as any,
        content,
        tool_calls: tool_calls?.map(adaptToolCall),
      },
      finish_reason: choice.finish_reason || "stop",
    };
  });

  return {
    id: response.id,
    object: "chat.completion",
    created: response.created,
    model: response.model,
    choices,
    usage: {
      prompt_tokens: usage?.prompt_tokens || 0,
      completion_tokens: usage?.completion_tokens || 0,
      total_tokens: usage?.total_tokens || 0,
    },
    system_fingerprint: response.system_fingerprint,
  };
}

/**
 * Convert an OpenAI streaming chunk into an AISuite chunk.
 *
 * Falsy delta content and finish reasons are reported as `undefined`;
 * usage is copied only when the chunk carries it.
 */
export function adaptChunk(chunk: OpenAIChunk): ChatCompletionChunk {
  const choices = chunk.choices.map((choice) => {
    const { role, content, tool_calls } = choice.delta;
    return {
      index: choice.index,
      delta: {
        role: role as any,
        content: content || undefined,
        tool_calls: tool_calls?.map(adaptToolCall),
      },
      finish_reason: choice.finish_reason || undefined,
    };
  });

  const usage = !chunk.usage
    ? undefined
    : {
        prompt_tokens: chunk.usage.prompt_tokens || 0,
        completion_tokens: chunk.usage.completion_tokens || 0,
        total_tokens: chunk.usage.total_tokens || 0,
      };

  return {
    id: chunk.id,
    object: "chat.completion.chunk",
    created: chunk.created,
    model: chunk.model,
    choices,
    usage,
  };
}

/** Reduce an OpenAI tool call to AISuite's `ToolCall` fields. */
function adaptToolCall(toolCall: any): ToolCall {
  const { name, arguments: args } = toolCall.function;
  return {
    id: toolCall.id,
    type: "function",
    function: { name, arguments: args },
  };
}

/**
 * Build the file/model pair sent to OpenAI's transcription endpoint.
 *
 * The audio bytes are wrapped in a `File` named "audio.mp3" with MIME type
 * "audio/mpeg". Both `Buffer` and plain `Uint8Array` inputs are accepted
 * (`Buffer` is a `Uint8Array` subclass); string inputs are rejected.
 *
 * @throws Error when `request.file` is not binary data.
 */
export function adaptASRRequest(request: TranscriptionRequest): {
  file: Uploadable;
  model: string;
} {
  const audio = request.file;
  if (!(audio instanceof Uint8Array)) {
    throw new Error("File must be provided as a Buffer or Uint8Array");
  }

  const file = new File([audio], "audio.mp3", {
    type: "audio/mpeg",
  }) as unknown as Uploadable;

  return {
    file,
    model: request.model,
  };
}

/**
 * Convert an OpenAI transcription response into AISuite's
 * `TranscriptionResult`.
 *
 * - `language` falls back to "en" when the response does not report one.
 * - `confidence` is taken from the first segment's `avg_logprob`, when
 *   segments are present.
 * - Word text is read from `word` (the field OpenAI's verbose JSON uses),
 *   falling back to `text`, then to an empty string.
 * - `words` and `segments` default to empty arrays.
 */
export function adaptASRResponse(
  response: OpenAIASRResponse
): TranscriptionResult {
  return {
    text: response.text,
    language: response.language || "en", // Default to English if not provided
    confidence: response.segments?.[0]?.avg_logprob,
    words:
      response.words?.map((word) => {
        const raw = word as { word?: string; text?: string };
        return {
          text: raw.word || raw.text || "",
          start: word.start,
          end: word.end,
          confidence: word?.confidence, // Left undefined when not provided
        };
      }) ?? [],
    segments:
      response.segments?.map((segment) => ({
        text: segment.text,
        start: segment.start,
        end: segment.end,
      })) ?? [],
  };
}


================================================
FILE: aisuite-js/src/providers/openai/index.ts
================================================
export { OpenAIProvider } from './provider';
export type { OpenAIConfig } from './types';

================================================
FILE: aisuite-js/src/providers/openai/provider.ts
================================================
import OpenAI from "openai";
import { Provider } from "../../core/base-provider";
import { ASRProvider } from "../../core/base-asr-provider";
import {
  ChatCompletionRequest,
  ChatCompletionResponse,
  ChatCompletionChunk,
  RequestOptions,
  TranscriptionRequest,
  TranscriptionResult,
} from "../../types";
import { OpenAIASRResponse, OpenAIConfig } from "./types";
import {
  adaptRequest,
  adaptResponse,
  adaptChunk,
  adaptASRRequest,
  adaptASRResponse,
} from "./adapters";
import { AISuiteError } from "../../core/errors";

/**
 * Provider backed by the OpenAI SDK, covering chat completions (plain and
 * streaming) and audio transcription.
 */
export class OpenAIProvider implements Provider, ASRProvider {
  public readonly name = "openai";
  private client: OpenAI;

  /** Create the SDK client from the API key, base URL and organization. */
  constructor(config: OpenAIConfig) {
    this.client = new OpenAI({
      apiKey: config.apiKey,
      baseURL: config.baseURL,
      organization: config.organization,
    });
  }

  /**
   * Run a non-streaming chat completion.
   *
   * `options` is handed to the SDK call unchanged.
   *
   * @throws AISuiteError with code "STREAMING_NOT_SUPPORTED" when
   *   `request.stream` is set, or "API_ERROR" when the SDK call fails.
   */
  async chatCompletion(
    request: ChatCompletionRequest,
    options?: RequestOptions
  ): Promise<ChatCompletionResponse> {
    try {
      // For now, we don't support streaming in non-streaming method
      if (request.stream) {
        throw new AISuiteError(
          "Streaming is not yet supported. Set stream: false or use streamChatCompletion method.",
          this.name,
          "STREAMING_NOT_SUPPORTED"
        );
      }

      const openaiRequest = adaptRequest(request);
      const completion = (await this.client.chat.completions.create(
        openaiRequest,
        options
      )) as any; // Type assertion needed because OpenAI SDK returns a union type

      return adaptResponse(completion);
    } catch (error) {
      // Errors raised by this class are already in the public shape.
      if (error instanceof AISuiteError) {
        throw error;
      }
      throw new AISuiteError(
        `OpenAI API error: ${
          error instanceof Error ? error.message : "Unknown error"
        }`,
        this.name,
        "API_ERROR"
      );
    }
  }

  /**
   * Stream a chat completion, yielding one AISuite chunk per SDK chunk.
   * Streaming is always requested from the SDK here.
   *
   * @throws AISuiteError with code "STREAMING_ERROR" on any failure.
   */
  async *streamChatCompletion(
    request: ChatCompletionRequest,
    options?: RequestOptions
  ): AsyncIterable<ChatCompletionChunk> {
    try {
      const openaiRequest = adaptRequest(request);
      const stream = await this.client.chat.completions.create(
        {
          ...openaiRequest,
          stream: true,
        },
        options
      );

      for await (const chunk of stream) {
        yield adaptChunk(chunk);
      }
    } catch (error) {
      throw new AISuiteError(
        `OpenAI streaming error: ${
          error instanceof Error ? error.message : "Unknown error"
        }`,
        this.name,
        "STREAMING_ERROR"
      );
    }
  }

  /**
   * Transcribe audio through OpenAI's transcription endpoint.
   *
   * The request defaults to `response_format: "verbose_json"` and
   * `stream: false`; every request field other than `model` and `file` is
   * spread last and can therefore override those defaults.
   *
   * @throws AISuiteError with code "PROVIDER_ERROR" for any failure,
   *   including parameter validation failures.
   */
  async transcribe(
    request: TranscriptionRequest,
    options?: RequestOptions
  ): Promise<TranscriptionResult> {
    try {
      this.validateParams(request);

      const adaptedRequest = adaptASRRequest(request);
      const otherParams = this.translateParams(request);
      const response = await this.client.audio.transcriptions.create({
        ...adaptedRequest,
        response_format: "verbose_json",
        stream: false,
        ...otherParams,
      });

      return adaptASRResponse(response as OpenAIASRResponse);
    } catch (error: any) {
      // A rejection is not guaranteed to be an Error: guard against
      // null/undefined values and values without a message.
      const detail = error?.message ?? "Unknown error";
      throw new AISuiteError(
        `OpenAI ASR transcription failed: ${detail}`,
        this.name,
        "PROVIDER_ERROR"
      );
    }
  }

  /**
   * Check that the transcription parameters include `model` and `file`.
   *
   * @throws AISuiteError when either is missing.
   */
  validateParams(params: { [key: string]: any }): void {
    if (!params.model) {
      throw new AISuiteError(
        "Model parameter is required",
        this.name,
        "MODEL_PARAMETER_REQUIRED"
      );
    }

    if (!params.file) {
      // NOTE(review): this reuses the model error code for a missing file;
      // kept unchanged in case callers match on it - confirm intent.
      throw new AISuiteError(
        "File parameter is required",
        this.name,
        "MODEL_PARAMETER_REQUIRED"
      );
    }
  }

  /** Return every parameter except `model` and `file`. */
  translateParams(params: { [key: string]: any }): { [key: string]: any } {
    const { model: _, file: __, ...rest } = params;
    return rest;
  }
}


================================================
FILE: aisuite-js/src/providers/openai/types.ts
================================================
import OpenAI from "openai";
import { OpenAIConfig } from "../../types";

export { OpenAIConfig };

// Re-export OpenAI types that we need
export type {
  ChatCompletion,
  ChatCompletionChunk as OpenAIChunk,
  ChatCompletionCreateParams,
} from "openai/resources/chat/completions";

/** Shape of a transcription request in OpenAI's own parameter names. */
export interface OpenAIASRRequest {
  /** Audio to transcribe. */
  file: File;
  /** Transcription model identifier. */
  model: string;
  /** Optional language of the audio. */
  language?: string;
  /** Optional prompt text passed along with the audio. */
  prompt?: string;
  /** Output format requested from the API. */
  response_format?: "json" | "text" | "srt" | "verbose_json" | "vtt";
  /** Optional sampling temperature. */
  temperature?: number;
  /** Timestamp detail levels to request. */
  timestamp_granularities?: Array<"word" | "segment">;
}

/**
 * Transcription response as read by the OpenAI ASR adapter: the SDK's base
 * `Transcription` plus the optional detail fields of the verbose format.
 */
export interface OpenAIASRResponse extends OpenAI.Audio.Transcription {
  /** Full transcribed text. */
  text: string;
  /** Language reported for the audio, when present. */
  language?: string;
  /** Duration reported for the audio, when present. */
  duration?: number;
  /** Per-segment details, when present. */
  segments?: Array<{
    id: number;
    seek: number;
    start: number;
    end: number;
    text: string;
    tokens: number[];
    temperature: number;
    avg_logprob: number;
    compression_ratio: number;
    no_speech_prob: number;
  }>;
  /** Per-word timing entries, when present. */
  words?: Array<{
    /**
     * Word text as named by OpenAI's verbose JSON output. Optional so that
     * objects built against the older `text`-only shape still type-check.
     */
    word?: string;
    text: string;
    start: number;
    end: number;
    confidence?: number;
  }>;
}


================================================
FILE: aisuite-js/src/types/chat.ts
================================================
/** A single message in a chat conversation. */
export interface ChatMessage {
  /** Author of the message. */
  role: "system" | "user" | "assistant" | "tool";
  /** Message text; may be null. */
  content: string | null;
  /** Optional name attached to the message. */
  name?: string;
  /** Id of the tool call this message relates to, if any. */
  tool_call_id?: string;
  /** Tool calls carried by this message, if any. */
  tool_calls?: ToolCall[];
}

/** Provider-independent chat completion request. */
export interface ChatCompletionRequest {
  model: string; // "provider:model" format
  /** Conversation so far. */
  messages: ChatMessage[];
  /** Tools the model may call. */
  tools?: Tool[];
  /** How the model should choose among the tools. */
  tool_choice?: ToolChoice;
  temperature?: number;
  max_tokens?: number;
  top_p?: number;
  frequency_penalty?: number;
  presence_penalty?: number;
  /** One stop sequence or a list of them. */
  stop?: string | string[];
  /** Request a streamed response instead of a single completion. */
  stream?: boolean;
  user?: string;
}

/** Provider-independent result of a non-streaming chat completion. */
export interface ChatCompletionResponse {
  id: string;
  /** Fixed discriminator for this response type. */
  object: "chat.completion";
  /** Creation timestamp (numeric). */
  created: number;
  model: string;
  /** Generated alternatives. */
  choices: ChatChoice[];
  /** Token accounting for the request. */
  usage: Usage;
  system_fingerprint?: string;
}

/** One incremental piece of a streamed chat completion. */
export interface ChatCompletionChunk {
  id: string;
  /** Fixed discriminator for this chunk type. */
  object: "chat.completion.chunk";
  /** Creation timestamp (numeric). */
  created: number;
  model: string;
  choices: Array<{
    index: number;
    /** Content added by this chunk. */
    delta: {
      role?: "assistant";
      content?: string;
      tool_calls?: ToolCall[];
    };
    finish_reason?: string;
  }>;
  /** Token accounting, when the chunk carries it. */
  usage?: Usage;
}

/** One generated alternative in a chat completion response. */
export interface ChatChoice {
  /** Position of this choice in the response. */
  index: number;
  /** The generated message. */
  message: ChatMessage;
  /** Why generation ended for this choice. */
  finish_reason: string;
}

/** Token counts reported for a completion. */
export interface Usage {
  prompt_tokens: number;
  completion_tokens: number;
  total_tokens: number;
}

// Import tool types from tools.ts
import { Tool, ToolCall, ToolChoice } from "./tools";


================================================
FILE: aisuite-js/src/types/common.ts
================================================
/** Per-call options accepted alongside a request. */
export interface RequestOptions {
  /** Signal used to cancel the request. */
  signal?: AbortSignal;
  // NOTE(review): units and handling of `timeout` / `retries` are not
  // visible in this file - confirm against the providers that consume them.
  timeout?: number;
  retries?: number;
  /** Any additional, provider-specific options. */
  [key: string]: any;
}

/** Audio supplied either as a string or as raw bytes. */
export type AudioInput = string | Buffer | Uint8Array;

================================================
FILE: aisuite-js/src/types/index.ts
================================================
export * from "./chat";
export * from "./tools";
export * from "./common";
export * from "./providers";
export * from "./transcription";


================================================
FILE: aisuite-js/src/types/providers.ts
================================================
/**
 * Client configuration: one optional entry per supported provider.
 * Providers without an entry are left unconfigured.
 */
export interface ProviderConfigs {
  openai?: OpenAIConfig;
  anthropic?: AnthropicConfig;
  mistral?: MistralConfig;
  groq?: GroqConfig;
  deepgram?: DeepgramConfig;
}

/** Settings for the OpenAI provider; all three are passed to the OpenAI SDK client. */
export interface OpenAIConfig {
  apiKey: string;
  /** Optional override for the API base URL. */
  baseURL?: string;
  /** Optional organization identifier. */
  organization?: string;
}

/** Settings for the Anthropic provider. */
export interface AnthropicConfig {
  apiKey: string;
  /** Optional override for the API base URL. */
  baseURL?: string;
}

/** Settings for the Mistral provider. */
export interface MistralConfig {
  apiKey: string;
  /** Optional override for the API base URL. */
  baseURL?: string;
}

/** Settings for the Groq provider. */
export interface GroqConfig {
  apiKey: string;
  /** Optional override for the API base URL. */
  baseURL?: string;
  /**
   * Opt-in read by the Groq provider and forwarded to the Groq SDK (false
   * when omitted). Declared here so it can be supplied through
   * `ProviderConfigs.groq`.
   */
  dangerouslyAllowBrowser?: boolean;
}

/** Settings for the Deepgram provider. */
export interface DeepgramConfig {
  apiKey: string;
  /** Optional override for the API base URL. */
  baseURL?: string;
}


================================================
FILE: aisuite-js/src/types/tools.ts
================================================
/** A tool offered to the model; only function tools are modelled. */
export interface Tool {
  type: 'function';
  /** Definition of the callable function. */
  function: FunctionDefinition;
}

/** Name, description and parameter schema of a callable function. */
export interface FunctionDefinition {
  name: string;
  description: string;
  /** Object-typed schema describing the function's arguments. */
  parameters: {
    type: 'object';
    /** Schema of each argument, keyed by argument name. */
    properties: Record<string, any>;
    /** Names of the arguments that must be supplied. */
    required?: string[];
  };
}

/** A function invocation carried on a chat message. */
export interface ToolCall {
  /** Identifier of this call. */
  id: string;
  type: 'function';
  function: {
    /** Name of the function to invoke. */
    name: string;
    arguments: string;  // JSON string
  };
}

/**
 * Tool selection setting for a request: one of the literal modes
 * 'auto' / 'none', or an object naming one specific function.
 */
export type ToolChoice = 
  | 'auto' 
  | 'none' 
  | { type: 'function'; function: { name: string } };

================================================
FILE: aisuite-js/src/types/transcription.ts
================================================
/** One transcribed word with its time span. */
export interface Word {
  text: string;
  // NOTE(review): time unit of start/end is not stated here - presumably
  // seconds; confirm against the ASR adapters.
  start: number;
  end: number;
  /** Speaker label, when available. */
  speaker?: string;
  /** Confidence value for this word, when available. */
  confidence?: number;
}

/** One transcribed segment with its time span. */
export interface Segment {
  text: string;
  start: number;
  end: number;
  /** Speaker label, when available. */
  speaker?: string;
}

/** Provider-independent result of an audio transcription. */
export interface TranscriptionResult {
  /** Full transcribed text. */
  text: string;
  /** Language of the transcript. */
  language: string;
  /** Overall confidence value, when the provider supplies one. */
  confidence?: number;
  /** Word-level entries. */
  words: Word[];
  /** Segment-level entries. */
  segments: Segment[];
}

/** Provider-independent audio transcription request. */
export interface TranscriptionRequest {
  model: string; // "provider:model" format
  /** Audio input, as a string or raw bytes. */
  file: string | Buffer | Uint8Array;
  language?: string;
  // NOTE(review): how each provider interprets the three flags below is not
  // visible in this file - confirm against the ASR providers.
  timestamps?: boolean;
  word_confidence?: boolean;
  speaker_labels?: boolean;
  temperature?: number;
  // Provider-specific parameters
  [key: string]: any;
}


================================================
FILE: aisuite-js/src/utils/streaming.ts
================================================
import { ChatCompletionChunk } from '../types';

/**
 * Build a single-choice chat completion chunk.
 *
 * The delta role is always 'assistant', `created` is the current Unix time
 * in seconds, and a falsy `finishReason` is reported as `undefined`.
 */
export function createChunk(
  id: string,
  model: string,
  content?: string,
  finishReason?: string,
  toolCalls?: any[]
): ChatCompletionChunk {
  const delta = {
    role: 'assistant' as const,
    content,
    tool_calls: toolCalls
  };
  const onlyChoice = {
    index: 0,
    delta,
    finish_reason: finishReason || undefined
  };

  return {
    id,
    object: 'chat.completion.chunk',
    created: Math.floor(Date.now() / 1000),
    model,
    choices: [onlyChoice]
  };
}

/**
 * Generate a pseudo-random id of the form `chatcmpl-` followed by exactly
 * nine base-36 characters.
 *
 * Not cryptographically secure; intended only to label the chunks of one
 * stream.
 */
export function generateId(): string {
  // The base-36 expansion of a random number can be shorter than nine
  // digits (0.5 becomes "0.i"), so pad to keep the length fixed.
  const suffix = Math.random().toString(36).slice(2, 11).padEnd(9, "0");
  return `chatcmpl-${suffix}`;
}

================================================
FILE: aisuite-js/tests/client.test.ts
================================================
import { Client } from "../src/client";
import {
  ProviderConfigs,
  ChatCompletionRequest,
  ChatCompletionResponse,
  ChatCompletionChunk,
  RequestOptions,
  TranscriptionRequest,
} from "../src/types";
import { ProviderNotConfiguredError } from "../src/core/errors";
import { Provider } from "../src/core/base-provider";

// Mock the Mistral SDK: the package is replaced by a stub ES module whose
// default export is a bare jest mock function.
jest.mock("@mistralai/mistralai", () => {
  return {
    __esModule: true,
    default: jest.fn(),
  };
});

// Mock the providers. No factory is passed, so Jest auto-mocks each module;
// the provider constructors are then overridden in beforeEach below.
jest.mock("../src/providers/openai");
jest.mock("../src/providers/anthropic");
jest.mock("../src/providers/mistral");
jest.mock("../src/providers/groq");
jest.mock("../src/asr-providers/deepgram");

describe("Client", () => {
  let mockOpenAIProvider: any;
  let mockAnthropicProvider: any;
  let mockMistralProvider: any;
  let mockGroqProvider: any;
  let mockDeepgramProvider: any;
  let mockOpenAIASRProvider: any;

  beforeEach(() => {
    // Reset all mocks
    jest.clearAllMocks();

    // Create mock response
    const mockResponse = {
      id: "chatcmpl-123",
      object: "chat.completion",
      created: 1234567890,
      model: "gpt-4",
      choices: [
        {
          index: 0,
          message: {
            role: "assistant",
            content: "Hello! How can I help you?",
          },
          finish_reason: "stop",
        },
      ],
      usage: {
        prompt_tokens: 10,
        completion_tokens: 20,
        total_tokens: 30,
      },
    };

    // Create mock provider class
    class MockProvider implements Provider {
      public readonly name: string;
      public chatCompletion = jest.fn().mockResolvedValue(mockResponse);
      public streamChatCompletion = jest.fn().mockImplementation(async function* () {
        yield mockResponse as unknown as ChatCompletionChunk;
      });

      constructor(name: string) {
        this.name = name;
      }
    }

    // Create mock instances
    mockOpenAIProvider = new MockProvider("openai");
    mockAnthropicProvider = new MockProvider("anthropic");
    mockMistralProvider = new MockProvider("mistral");
    mockGroqProvider = new MockProvider("groq");

    mockDeepgramProvider = {
      transcribe: jest.fn(),
    };

    mockOpenAIASRProvider = {
      transcribe: jest.fn(),
    };

    // Manually mock the provider constructors using jest.mock
    const openaiModule = jest.requireMock("../src/providers/openai");
    const anthropicModule = jest.requireMock("../src/providers/anthropic");
    const mistralModule = jest.requireMock("../src/providers/mistral");
    const groqModule = jest.requireMock("../src/providers/groq");
    const deepgramModule = jest.requireMock("../src/asr-providers/deepgram");

    openaiModule.OpenAIProvider = jest.fn().mockImplementation(() => mockOpenAIProvider);
    anthropicModule.AnthropicProvider = jest.fn().mockImplementation(() => mockAnthropicProvider);
    mistralModule.MistralProvider = jest.fn().mockImplementation(() => mockMistralProvider);
    groqModule.GroqProvider = jest.fn().mockImplementation(() => mockGroqProvider);
    deepgramModule.DeepgramASRProvider = jest.fn().mockImplementation(() => mockDeepgramProvider);
  });

  describe("constructor", () => {
    it("should initialize providers based on config", () => {
      const config: ProviderConfigs = {
        openai: { apiKey: "openai-key" },
        anthropic: { apiKey: "anthropic-key" },
        mistral: { apiKey: "mistral-key" },
        groq: { apiKey: "groq-key" },
        deepgram: { apiKey: "deepgram-key" },
      };

      const client = new Client(config);

      expect(client.listProviders()).toEqual([
        "openai",
        "anthropic",
        "mistral",
        "groq",
      ]);
      expect(client.listASRProviders()).toEqual(["openai", "deepgram"]);
      expect(client.isProviderConfigured("openai")).toBe(true);
      expect(client.isProviderConfigured("anthropic")).toBe(true);
      expect(client.isProviderConfigured("mistral")).toBe(true);
      expect(client.isProviderConfigured("groq")).toBe(true);
      expect(client.isASRProviderConfigured("deepgram")).toBe(true);
    });

    it("should only initialize configured providers", () => {
      const config: ProviderConfigs = {
        openai: { apiKey: "openai-key" },
        groq: { apiKey: "groq-key" },
        deepgram: { apiKey: "deepgram-key" },
      };

      const client = new Client(config);

      expect(client.listProviders()).toEqual(["openai", "groq"]);
      expect(client.listASRProviders()).toEqual(["openai", "deepgram"]);
      expect(client.isProviderConfigured("openai")).toBe(true);
      expect(client.isProviderConfigured("anthropic")).toBe(false);
      expect(client.isProviderConfigured("mistral")).toBe(false);
      expect(client.isProviderConfigured("groq")).toBe(true);
      expect(client.isASRProviderConfigured("deepgram")).toBe(true);
      expect(client.isASRProviderConfigured("unknown")).toBe(false);
    });

    it("should handle empty config", () => {
      const config: ProviderConfigs = {};

      const client = new Client(config);

      expect(client.listProviders()).toEqual([]);
      expect(client.listASRProviders()).toEqual([]);
      expect(client.isProviderConfigured("openai")).toBe(false);
      expect(client.isASRProviderConfigured("deepgram")).toBe(false);
    });
  });

  describe("chat.completions.create", () => {
    let client: Client;
    const baseConfig: ProviderConfigs = {
      openai: { apiKey: "openai-key" },
      anthropic: { apiKey: "anthropic-key" },
      mistral: { apiKey: "mistral-key" },
      groq: { apiKey: "groq-key" },
    };

    beforeEach(() => {
      client = new Client(baseConfig);
    });

    it("should call non-streaming chat completion", async () => {
      const request: ChatCompletionRequest = {
        model: "openai:gpt-4",
        messages: [{ role: "user", content: "Hello" }],
      };

      const mockResponse = {
        id: "test-id",
        object: "chat.completion",
        created: 1234567890,
        model: "gpt-4",
        choices: [],
        usage: { prompt_tokens: 10, completion_tokens: 20, total_tokens: 30 },
      };

      mockOpenAIProvider.chatCompletion.mockResolvedValue(mockResponse);

      const result = await client.chat.completions.create(request);

      expect(mockOpenAIProvider.chatCompletion).toHaveBeenCalledWith(
        { ...request, model: "gpt-4" },
        undefined
      );
      expect(result).toEqual(mockResponse);
    });

    it("should call streaming chat completion", async () => {
      const request: ChatCompletionRequest = {
        model: "anthropic:claude-3-sonnet",
        messages: [{ role: "user", content: "Hello" }],
        stream: true,
      };

      const mockStream = (async function* () {
        yield {
          id: "chunk-1",
          object: "chat.completion.chunk",
          created: 1234567890,
          model: "claude-3-sonnet",
          choices: [],
        };
      })();

      mockAnthropicProvider.streamChatCompletion.mockReturnValue(mockStream);

      const result = await client.chat.completions.create(request);

      expect(mockAnthropicProvider.streamChatCompletion).toHaveBeenCalledWith(
        { ...request, model: "claude-3-sonnet" },
        undefined
      );
      expect(result).toBe(mockStream);
    });

    it("should throw error for unconfigured provider", async () => {
      // The "unknown" prefix is expected not to resolve to any provider.
      const badRequest: ChatCompletionRequest = {
        model: "unknown:model",
        messages: [{ role: "user", content: "Hello" }],
      };

      const pending = client.chat.completions.create(badRequest);

      await expect(pending).rejects.toThrow(ProviderNotConfiguredError);
    });

    it("should handle complex model names with multiple colons", async () => {
      const cannedCompletion = {
        id: "test-id",
        object: "chat.completion",
        created: 1234567890,
        model: "gpt-4:vision",
        choices: [],
        usage: { prompt_tokens: 10, completion_tokens: 20, total_tokens: 30 },
      };
      mockOpenAIProvider.chatCompletion.mockResolvedValue(cannedCompletion);

      const chatRequest: ChatCompletionRequest = {
        model: "openai:gpt-4:vision",
        messages: [{ role: "user", content: "Hello" }],
      };

      const completion = await client.chat.completions.create(chatRequest);

      // Only the first colon separates provider from model; everything after
      // it ("gpt-4:vision") is forwarded to the provider as the model name.
      expect(mockOpenAIProvider.chatCompletion).toHaveBeenCalledWith(
        { ...chatRequest, model: "gpt-4:vision" },
        undefined
      );
      expect(completion).toEqual(cannedCompletion);
    });

    it("should pass options to provider", async () => {
      const cannedCompletion = {
        id: "test-id",
        object: "chat.completion",
        created: 1234567890,
        model: "mistral-large",
        choices: [],
        usage: { prompt_tokens: 10, completion_tokens: 20, total_tokens: 30 },
      };
      mockMistralProvider.chatCompletion.mockResolvedValue(cannedCompletion);

      const chatRequest: ChatCompletionRequest = {
        model: "mistral:mistral-large",
        messages: [{ role: "user", content: "Hello" }],
      };
      const requestOptions = { signal: new AbortController().signal };

      const completion = await client.chat.completions.create(
        chatRequest,
        requestOptions
      );

      // The options object must reach the provider as the second argument.
      expect(mockMistralProvider.chatCompletion).toHaveBeenCalledWith(
        { ...chatRequest, model: "mistral-large" },
        requestOptions
      );
      expect(completion).toEqual(cannedCompletion);
    });
  });

  describe("audio.transcriptions.create", () => {
    describe("Deepgram Provider", () => {
      const deepgramOnlyConfig: ProviderConfigs = {
        deepgram: { apiKey: "deepgram-key" },
      };
      let client: Client;

      // Builds the word-less transcription payload that the options and
      // multi-colon tests use as the provider's canned answer.
      const makeBareTranscription = () => ({
        text: "Test transcription",
        language: "en-US",
        confidence: 0.9,
        words: [],
        segments: [],
      });

      beforeEach(() => {
        client = new Client(deepgramOnlyConfig);
      });

      it("should call transcription with correct parameters", async () => {
        const transcriptionRequest: TranscriptionRequest = {
          model: "deepgram:nova-2",
          file: Buffer.from("test audio data"),
          language: "en-US",
          timestamps: true,
          word_confidence: true,
          speaker_labels: true,
        };

        const cannedTranscription = {
          text: "Hello world",
          language: "en-US",
          confidence: 0.95,
          words: [
            { text: "Hello", start: 0.0, end: 0.5, confidence: 0.98 },
            { text: "world", start: 0.6, end: 1.0, confidence: 0.92 },
          ],
          segments: [{ text: "Hello world", start: 0.0, end: 1.0 }],
        };
        mockDeepgramProvider.transcribe.mockResolvedValue(cannedTranscription);

        const transcription = await client.audio.transcriptions.create(
          transcriptionRequest
        );

        // The provider sees the model without its "deepgram:" prefix.
        expect(mockDeepgramProvider.transcribe).toHaveBeenCalledWith(
          { ...transcriptionRequest, model: "nova-2" },
          undefined
        );
        expect(transcription).toEqual(cannedTranscription);
      });

      it("should throw error for unconfigured ASR provider", async () => {
        const badRequest: TranscriptionRequest = {
          model: "unknown:model",
          file: Buffer.from("test"),
        };

        const pending = client.audio.transcriptions.create(badRequest);

        await expect(pending).rejects.toThrow(ProviderNotConfiguredError);
      });

      it("should pass options to ASR provider", async () => {
        const transcriptionRequest: TranscriptionRequest = {
          model: "deepgram:nova-2",
          file: Buffer.from("test audio data"),
          language: "en-US",
        };
        const requestOptions = { timeout: 30000 };

        const cannedTranscription = makeBareTranscription();
        mockDeepgramProvider.transcribe.mockResolvedValue(cannedTranscription);

        const transcription = await client.audio.transcriptions.create(
          transcriptionRequest,
          requestOptions
        );

        // Options are forwarded untouched as the second argument.
        expect(mockDeepgramProvider.transcribe).toHaveBeenCalledWith(
          { ...transcriptionRequest, model: "nova-2" },
          requestOptions
        );
        expect(transcription).toEqual(cannedTranscription);
      });

      it("should handle complex model names with multiple colons", async () => {
        const transcriptionRequest: TranscriptionRequest = {
          model: "deepgram:nova-2:enhanced",
          file: Buffer.from("test audio data"),
          language: "en-US",
        };

        const cannedTranscription = makeBareTranscription();
        mockDeepgramProvider.transcribe.mockResolvedValue(cannedTranscription);

        const transcription = await client.audio.transcriptions.create(
          transcriptionRequest
        );

        // Everything after the first colon is treated as the model name.
        expect(mockDeepgramProvider.transcribe).toHaveBeenCalledWith(
          { ...transcriptionRequest, model: "nova-2:enhanced" },
          undefined
        );
        expect(transcription).toEqual(cannedTranscription);
      });
    });

    describe("OpenAI ASR Provider", () => {
      let mockOpenAIASRProvider: any;

      beforeEach(() => {
        mockOpenAIASRProvider = {
          name: "openai",
          transcribe: jest.fn(),
        };

        // Have the mocked OpenAIProvider constructor return an object that
        // carries both the chat mock's members and the ASR mock's members.
        const { OpenAIProvider } = require("../src/providers/openai");
        OpenAIProvider.mockImplementation(() => ({
          ...mockOpenAIProvider,
          ...mockOpenAIASRProvider,
        }));
      });

      // Creates a Client configured for OpenAI and registers the ASR mock in
      // the client's asrProviders map (reached via bracket access) so that
      // "openai:*" transcription requests resolve to the mock.
      const buildClient = (): Client => {
        const instance = new Client({
          openai: {
            apiKey: "openai-key",
          },
        });
        instance["asrProviders"].set("openai", mockOpenAIASRProvider);
        return instance;
      };

      it("should transcribe with audio enabled", async () => {
        const client = buildClient();

        const transcriptionRequest: TranscriptionRequest = {
          model: "openai:whisper-1",
          file: Buffer.from("test audio data"),
          language: "en",
          response_format: "verbose_json",
          temperature: 0,
          timestamps: true,
        };

        const cannedTranscription = {
          text: "Test transcription",
          language: "en",
          confidence: 0.95,
          words: [
            { text: "Test", start: 0.0, end: 0.5, confidence: 0.98 },
            { text: "transcription", start: 0.6, end: 1.2, confidence: 0.92 },
          ],
          segments: [{ text: "Test transcription", start: 0.0, end: 1.2 }],
        };
        mockOpenAIASRProvider.transcribe.mockResolvedValue(cannedTranscription);

        const transcription = await client.audio.transcriptions.create(
          transcriptionRequest
        );

        expect(mockOpenAIASRProvider.transcribe).toHaveBeenCalledWith(
          { ...transcriptionRequest, model: "whisper-1" },
          undefined
        );
        expect(transcription).toEqual(cannedTranscription);
      });

      it("should support different response formats", async () => {
        const client = buildClient();

        const transcriptionRequest: TranscriptionRequest = {
          model: "openai:whisper-1",
          file: Buffer.from("test audio"),
          response_format: "text",
        };

        const cannedTranscription = {
          text: "Test transcription",
          language: "en",
          confidence: 1.0,
          words: [],
          segments: [],
        };
        mockOpenAIASRProvider.transcribe.mockResolvedValue(cannedTranscription);

        const transcription = await client.audio.transcriptions.create(
          transcriptionRequest
        );

        expect(mockOpenAIASRProvider.transcribe).toHaveBeenCalledWith(
          { ...transcriptionRequest, model: "whisper-1" },
          undefined
        );
        expect(transcription).toEqual(cannedTranscription);
      });

      it("should pass custom options to provider", async () => {
        const client = buildClient();

        const transcriptionRequest: TranscriptionRequest = {
          model: "openai:whisper-1",
          file: Buffer.from("test audio"),
          language: "en",
        };
        const requestOptions = { timeout: 30000 };

        const cannedTranscription = {
          text: "Test transcription",
          language: "en",
          confidence: 0.9,
          words: [],
          segments: [],
        };
        mockOpenAIASRProvider.transcribe.mockResolvedValue(cannedTranscription);

        const transcription = await client.audio.transcriptions.create(
          transcriptionRequest,
          requestOptions
        );

        expect(mockOpenAIASRProvider.transcribe).toHaveBeenCalledWith(
          { ...transcriptionRequest, model: "whisper-1" },
          requestOptions
        );
        expect(transcription).toEqual(cannedTranscription);
      });
    });
  });

  describe("listProviders", () => {
    it("should return list of configured providers", () => {
      const twoProviders: ProviderConfigs = {
        openai: { apiKey: "openai-key" },
        groq: { apiKey: "groq-key" },
      };

      const names = new Client(twoProviders).listProviders();

      // toEqual on arrays is order-sensitive: names are expected in the same
      // order the config lists them.
      expect(names).toEqual(["openai", "groq"]);
    });

    it("should return empty array when no providers configured", () => {
      const noProviders: ProviderConfigs = {};

      const names = new Client(noProviders).listProviders();

      expect(names).toEqual([]);
    });
  });

  describe("listASRProviders", () => {
    it("should return list of configured ASR providers", () => {
      const deepgramOnly: ProviderConfigs = {
        deepgram: { apiKey: "deepgram-key" },
      };

      const asrNames = new Client(deepgramOnly).listASRProviders();

      expect(asrNames).toEqual(["deepgram"]);
    });

    it("should return empty array when no ASR providers configured", () => {
      const noProviders: ProviderConfigs = {};

      const asrNames = new Client(noProviders).listASRProviders();

      expect(asrNames).toEqual([]);
    });
  });

  describe("isProviderConfigured", () => {
    it("should return true for configured providers", () => {
      const twoProviders: ProviderConfigs = {
        openai: { apiKey: "openai-key" },
        anthropic: { apiKey: "anthropic-key" },
      };
      const subject = new Client(twoProviders);

      const openaiConfigured = subject.isProviderConfigured("openai");
      const anthropicConfigured = subject.isProviderConfigured("anthropic");

      expect(openaiConfigured).toBe(true);
      expect(anthropicConfigured).toBe(true);
    });

    it("should return false for unconfigured providers", () => {
      // Only openai is configured; every other name must report false.
      const openaiOnly: ProviderConfigs = {
        openai: { apiKey: "openai-key" },
      };
      const subject = new Client(openaiOnly);

      expect(subject.isProviderConfigured("anthropic")).toBe(false);
      expect(subject.isProviderConfigured("mistral")).toBe(false);
      expect(subject.isProviderConfigured("groq")).toBe(false);
    });
  });

  describe("isASRProviderConfigured", () => {
    it("should return true for configured ASR providers", () => {
      const deepgramOnly: ProviderConfigs = {
        deepgram: { apiKey: "deepgram-key" },
      };
      const subject = new Client(deepgramOnly);

      const deepgramConfigured = subject.isASRProviderConfigured("deepgram");

      expect(deepgramConfigured).toBe(true);
    });

    it("should return false for unconfigured ASR providers", () => {
      // With an empty config neither a real ASR provider name nor an
      // arbitrary one may be reported as configured.
      const noProviders: ProviderConfigs = {};
      const subject = new Client(noProviders);

      expect(subject.isASRProviderConfigured("deepgram")).toBe(false);
      expect(subject.isASRProviderConfigured("unknown")).toBe(false);
    });
  });
});


================================================
FILE: aisuite-js/tests/providers/anthropic-provider.test.ts
================================================
import { AnthropicProvider } from "../../src/providers/anthropic/provider";
import { ChatCompletionRequest, ChatCompletionChunk } from "../../src/types";
import { AISuiteError } from "../../src/core/errors";

// Replace the Anthropic SDK with an ES-module-shaped stub whose default
// export is a bare jest.fn(); each test wires up its behaviour later.
jest.mock("@anthropic-ai/sdk", () => ({
  __esModule: true,
  default: jest.fn(),
}));

describe("AnthropicProvider", () => {
  let provider: AnthropicProvider;
  let mockAnthropicClient: any;

  beforeEach(() => {
    // Drop call history recorded by earlier tests.
    jest.clearAllMocks();

    // Fake SDK client exposing only messages.create, the single method the
    // tests in this file stub.
    mockAnthropicClient = {
      messages: { create: jest.fn() },
    };

    // Make the mocked SDK default export hand back the fake client whenever
    // it is invoked.
    const { default: AnthropicCtor } = require("@anthropic-ai/sdk");
    AnthropicCtor.mockImplementation(() => mockAnthropicClient);

    // Provider under test.
    provider = new AnthropicProvider({ apiKey: "test-api-key" });
  });

  describe("constructor", () => {
    it("should initialize with basic config", () => {
      const minimalConfig = { apiKey: "test-key" };

      const instance = new AnthropicProvider(minimalConfig);

      expect(instance.name).toBe("anthropic");
    });

    it("should initialize with full config", () => {
      // Same check as above, this time with a custom baseURL in the config.
      const fullConfig = {
        apiKey: "test-key",
        baseURL: "https://custom.anthropic.com",
      };

      const instance = new AnthropicProvider(fullConfig);

      expect(instance.name).toBe("anthropic");
    });
  });

  describe("chatCompletion", () => {
    // Minimal request reused by most tests in this group.
    const baseRequest: ChatCompletionRequest = {
      model: "claude-3-sonnet",
      messages: [{ role: "user", content: "Hello" }],
    };

    it("should successfully complete chat", async () => {
      const sdkMessage = {
        id: "msg_123",
        type: "message",
        role: "assistant",
        content: [{ type: "text", text: "Hello! How can I help you?" }],
        model: "claude-3-sonnet-20240229",
        stop_reason: "end_turn",
        stop_sequence: null,
        usage: { input_tokens: 10, output_tokens: 20 },
      };
      mockAnthropicClient.messages.create.mockResolvedValue(sdkMessage);

      const completion = await provider.chatCompletion(baseRequest);

      // The SDK must be called with the user message and no request options.
      const expectedUserMessage = expect.objectContaining({
        role: "user",
        content: "Hello",
      });
      expect(mockAnthropicClient.messages.create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: expect.any(String),
          messages: expect.arrayContaining([expectedUserMessage]),
        }),
        undefined
      );

      // The result is expected in chat.completion shape, carrying the
      // requested model name rather than the dated one the SDK returned.
      expect(completion).toEqual(
        expect.objectContaining({
          id: "msg_123",
          object: "chat.completion",
          model: "claude-3-sonnet",
        })
      );
    });

    it("should throw error when streaming is enabled", async () => {
      const streamingRequest: ChatCompletionRequest = {
        ...baseRequest,
        stream: true,
      };

      // Checked twice: once for the error class, once for the message text.
      await expect(provider.chatCompletion(streamingRequest)).rejects.toThrow(
        AISuiteError
      );
      await expect(provider.chatCompletion(streamingRequest)).rejects.toThrow(
        "Streaming is not yet supported"
      );
    });

    it("should handle API errors", async () => {
      mockAnthropicClient.messages.create.mockRejectedValue(
        new Error("API rate limit exceeded")
      );

      // The raw SDK error must surface as an AISuiteError with a prefixed
      // message.
      await expect(provider.chatCompletion(baseRequest)).rejects.toThrow(
        AISuiteError
      );
      await expect(provider.chatCompletion(baseRequest)).rejects.toThrow(
        "Anthropic API error: API rate limit exceeded"
      );
    });

    it("should pass options to the client", async () => {
      const sdkMessage = {
        id: "msg_123",
        type: "message",
        role: "assistant",
        content: [{ type: "text", text: "Hello!" }],
        model: "claude-3-sonnet-20240229",
        stop_reason: "end_turn",
        usage: { input_tokens: 10, output_tokens: 5 },
      };
      mockAnthropicClient.messages.create.mockResolvedValue(sdkMessage);

      const requestOptions = { signal: new AbortController().signal };
      await provider.chatCompletion(baseRequest, requestOptions);

      // Only the second argument matters here: options pass straight through.
      expect(mockAnthropicClient.messages.create).toHaveBeenCalledWith(
        expect.any(Object),
        requestOptions
      );
    });

    it("should handle complex request with all parameters", async () => {
      const sdkMessage = {
        id: "msg_123",
        type: "message",
        role: "assistant",
        content: [{ type: "text", text: "2+2 equals 4" }],
        model: "claude-3-sonnet-20240229",
        stop_reason: "end_turn",
        usage: { input_tokens: 15, output_tokens: 5 },
      };
      mockAnthropicClient.messages.create.mockResolvedValue(sdkMessage);

      const complexRequest: ChatCompletionRequest = {
        model: "claude-3-sonnet",
        messages: [
          { role: "system", content: "You are a helpful assistant" },
          { role: "user", content: "What is 2+2?" },
        ],
        temperature: 0.7,
        max_tokens: 100,
        top_p: 0.9,
        frequency_penalty: 0.1,
        presence_penalty: 0.1,
        stop: ["\n"],
        user: "user-123",
      };

      const completion = await provider.chatCompletion(complexRequest);

      // Expected mapping: the system message becomes the `system` field,
      // `stop` becomes `stop_sequences`, and sampling parameters pass through.
      const expectedUserMessage = expect.objectContaining({
        role: "user",
        content: "What is 2+2?",
      });
      expect(mockAnthropicClient.messages.create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: expect.any(String),
          messages: expect.arrayContaining([expectedUserMessage]),
          system: "You are a helpful assistant",
          temperature: 0.7,
          max_tokens: 100,
          top_p: 0.9,
          stop_sequences: expect.any(Array),
        }),
        undefined
      );
      expect(completion).toEqual(
        expect.objectContaining({
          id: "msg_123",
          object: "chat.completion",
        })
      );
    });
  });

  describe("streamChatCompletion", () => {
    // Minimal request reused by every streaming test.
    const baseRequest: ChatCompletionRequest = {
      model: "claude-3-sonnet",
      messages: [{ role: "user", content: "Hello" }],
    };

    it("should stream chat completion", async () => {
      // Full event sequence for one text block: start, two text deltas,
      // block stop, message delta with the stop reason, message stop.
      const mockEvents = [
        {
          type: "message_start",
          message: {
            id: "msg_123",
            type: "message",
            role: "assistant",
            content: [],
            model: "claude-3-sonnet-20240229",
          },
        },
        {
          type: "content_block_start",
          index: 0,
          content_block: {
            type: "text",
            text: "",
          },
        },
        {
          type: "content_block_delta",
          index: 0,
          delta: {
            type: "text_delta",
            text: "Hello",
          },
        },
        {
          type: "content_block_delta",
          index: 0,
          delta: {
            type: "text_delta",
            text: "! How can I help?",
          },
        },
        {
          type: "content_block_stop",
          index: 0,
        },
        {
          type: "message_delta",
          delta: {
            stop_reason: "end_turn",
            stop_sequence: null,
          },
        },
        {
          type: "message_stop",
        },
      ];

      const mockStream = (async function* () {
        for (const event of mockEvents) {
          yield event;
        }
      })();

      mockAnthropicClient.messages.create.mockResolvedValue(mockStream);

      const stream = provider.streamChatCompletion(baseRequest);
      const chunks: ChatCompletionChunk[] = [];

      for await (const chunk of stream) {
        chunks.push(chunk);
      }

      expect(mockAnthropicClient.messages.create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: expect.any(String),
          messages: expect.any(Array),
        }),
        undefined
      );
      expect(chunks.length).toBeGreaterThan(0);
    });

    it("should handle streaming errors", async () => {
      mockAnthropicClient.messages.create.mockRejectedValue(
        new Error("Streaming error")
      );
      const stream = provider.streamChatCompletion(baseRequest);
      // Pull the first item by hand: the rejection is expected on next(),
      // not when the stream object is created.
      const iterator = stream[Symbol.asyncIterator]();
      await expect(iterator.next()).rejects.toThrow(AISuiteError);
    });

    it("should pass options to streaming request", async () => {
      const options = { signal: new AbortController().signal };
      const mockStream = (async function* () {
        yield {
          type: "message_start",
          message: {
            id: "msg_123",
            type: "message",
            role: "assistant",
            content: [],
            model: "claude-3-sonnet-20240229",
          },
        };
        yield {
          type: "content_block_delta",
          index: 0,
          delta: {
            type: "text_delta",
            text: "Hello!",
          },
        };
        yield {
          type: "message_stop",
        };
      })();

      mockAnthropicClient.messages.create.mockResolvedValue(mockStream);

      const stream = provider.streamChatCompletion(baseRequest, options);
      const chunks: ChatCompletionChunk[] = [];

      for await (const chunk of stream) {
        chunks.push(chunk);
      }

      // The SDK call must carry stream: true and the caller's options.
      expect(mockAnthropicClient.messages.create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: expect.any(String),
          messages: expect.any(Array),
          stream: true,
        }),
        options
      );
      expect(chunks.length).toBeGreaterThan(0);
    });

    it("should handle abort signal", async () => {
      const mockStream = (async function* () {
        yield {
          type: "message_start",
          message: {
            id: "msg_123",
            type: "message",
            role: "assistant",
            content: [],
            model: "claude-3-sonnet-20240229",
          },
        };
        yield {
          type: "content_block_delta",
          index: 0,
          delta: {
            type: "text_delta",
            text: "Hello!",
          },
        };
      })();

      mockAnthropicClient.messages.create.mockResolvedValue(mockStream);

      const abortController = new AbortController();
      const options = { signal: abortController.signal };

      const stream = provider.streamChatCompletion(baseRequest, options);
      const chunks: ChatCompletionChunk[] = [];

      // Start consuming the stream
      const consumePromise = (async () => {
        for await (const chunk of stream) {
          chunks.push(chunk);
        }
      })();

      // Abort after a short delay. Keep the timer handle so it can be
      // cancelled once consumption is over; otherwise the callback would
      // still be pending (and later fire) after this test has finished.
      const abortTimer = setTimeout(() => {
        abortController.abort();
      }, 10);

      try {
        await consumePromise;
      } finally {
        clearTimeout(abortTimer);
      }

      expect(chunks.length).toBeGreaterThan(0);
    });
  });

  describe("error handling", () => {
    it("should preserve AISuiteError instances", async () => {
      // An error that already is an AISuiteError must come out unchanged.
      const alreadyWrapped = new AISuiteError(
        "Custom error",
        "anthropic",
        "CUSTOM_ERROR"
      );
      mockAnthropicClient.messages.create.mockRejectedValue(alreadyWrapped);

      const pending = provider.chatCompletion({
        model: "claude-3-sonnet",
        messages: [{ role: "user", content: "Hello" }],
      });

      await expect(pending).rejects.toThrow(alreadyWrapped);
    });

    it("should handle unknown error types", async () => {
      // Reject with a plain string instead of an Error object.
      mockAnthropicClient.messages.create.mockRejectedValue(
        "Unknown error string"
      );

      const pending = provider.chatCompletion({
        model: "claude-3-sonnet",
        messages: [{ role: "user", content: "Hello" }],
      });

      await expect(pending).rejects.toThrow(
        "Anthropic API error: Unknown error"
      );
    });
  });
});


================================================
FILE: aisuite-js/tests/providers/deepgram-provider.test.ts
================================================
import { DeepgramASRProvider } from "../../src/asr-providers/deepgram/provider";
import { TranscriptionRequest } from "../../src/types";
import { AISuiteError } from "../../src/core/errors";

// Replace the Deepgram SDK with a stub exposing only createClient; the
// suite's beforeEach decides what that factory returns.
jest.mock("@deepgram/sdk", () => {
  return { createClient: jest.fn() };
});

describe("DeepgramASRProvider", () => {
  let provider: DeepgramASRProvider;
  let mockDeepgramClient: any;

  beforeEach(() => {
    // Drop call history recorded by earlier tests.
    jest.clearAllMocks();

    // Fake SDK client exposing only listen.prerecorded.transcribeFile, the
    // single method the tests in this file stub.
    const transcribeFile = jest.fn();
    mockDeepgramClient = {
      listen: { prerecorded: { transcribeFile } },
    };

    // Make the mocked createClient factory return the fake client.
    const deepgramSdk = require("@deepgram/sdk");
    deepgramSdk.createClient.mockReturnValue(mockDeepgramClient);

    // Provider under test.
    provider = new DeepgramASRProvider({ apiKey: "test-api-key" });
  });

  describe("constructor", () => {
    it("should initialize with basic config", () => {
      const sdk = require("@deepgram/sdk");
      const minimalConfig = { apiKey: "test-key" };

      const instance = new DeepgramASRProvider(minimalConfig);

      expect(instance.name).toBe("deepgram");
      // apiKey is handed to the SDK under the name `key`.
      expect(sdk.createClient).toHaveBeenCalledWith({
        key: "test-key",
      });
    });

    it("should initialize with baseURL config", () => {
      const sdk = require("@deepgram/sdk");
      const configWithUrl = {
        apiKey: "test-key",
        baseURL: "https://custom.deepgram.com",
      };

      const instance = new DeepgramASRProvider(configWithUrl);

      expect(instance.name).toBe("deepgram");
      // Note the casing change: config `baseURL` becomes SDK `baseUrl`.
      expect(sdk.createClient).toHaveBeenCalledWith({
        key: "test-key",
        baseUrl: "https://custom.deepgram.com",
      });
    });

    it("should not include baseUrl when not provided", () => {
      const sdk = require("@deepgram/sdk");
      const minimalConfig = { apiKey: "test-key" };

      new DeepgramASRProvider(minimalConfig);

      expect(sdk.createClient).toHaveBeenCalledWith({
        key: "test-key",
      });
    });
  });

  describe("validateParams", () => {
    it("should not throw for supported parameters", () => {
      const params = {
        model: "nova-2",
        file: Buffer.from("test audio data"),
        language: "en-US",
        timestamps: true,
        word_confidence: true,
        speaker_labels: true,
        smart_format: true,
        punctuate: true,
        diarize: true,
        utterances: true,
      };

      expect(() => provider.validateParams(params)).not.toThrow();
    });

    it("should accept additional parameters without warnings", () => {
      const consoleSpy = jest.spyOn(console, "warn").mockImplementation();

      // Restore console.warn in `finally` so a failing assertion cannot
      // leave it stubbed for the tests that run afterwards.
      try {
        const params = {
          model: "nova-2",
          file: Buffer.from("test audio data"),
          unsupported_param: "value",
          another_unsupported: true,
        };

        provider.validateParams(params);

        expect(consoleSpy).not.toHaveBeenCalled();
      } finally {
        consoleSpy.mockRestore();
      }
    });

    it("should not warn for deepgram-specific parameters", () => {
      const consoleSpy = jest.spyOn(console, "warn").mockImplementation();

      // Same guard as above: always undo the spy, pass or fail.
      try {
        const params = {
          model: "nova-2",
          file: Buffer.from("test audio data"),
          deepgram_custom_param: "value",
          deepgram_another_param: true,
        };

        provider.validateParams(params);

        expect(consoleSpy).not.toHaveBeenCalled();
      } finally {
        consoleSpy.mockRestore();
      }
    });
  });

  describe("translateParams", () => {
    it("should translate language parameter", () => {
      const input = { language: "en-US" };

      const translated = provider.translateParams(input);

      expect(translated).toEqual({ language: "en-US" });
    });

    it("should translate timestamps to utterances", () => {
      // The only renaming covered by this group: timestamps -> utterances.
      const input = { timestamps: true };

      const translated = provider.translateParams(input);

      expect(translated).toEqual({ utterances: true });
    });

    it("should pass through word_confidence parameter", () => {
      const input = { word_confidence: true };

      const translated = provider.translateParams(input);

      expect(translated).toEqual({ word_confidence: true });
    });

    it("should pass through speaker_labels parameter", () => {
      const input = { speaker_labels: true };

      const translated = provider.translateParams(input);

      expect(translated).toEqual({ speaker_labels: true });
    });

    it("should pass through deepgram-specific parameters", () => {
      const input = {
        deepgram_custom_param: "value",
        deepgram_another_param: true,
      };

      const translated = provider.translateParams(input);

      expect(translated).toEqual({
        deepgram_custom_param: "value",
        deepgram_another_param: true,
      });
    });

    it("should pass through other parameters unchanged", () => {
      const input = {
        temperature: 0.5,
        custom_param: "value",
      };

      const translated = provider.translateParams(input);

      expect(translated).toEqual({
        temperature: 0.5,
        custom_param: "value",
      });
    });

    it("should handle multiple parameter translations", () => {
      // Mix of one renamed key (timestamps) and several pass-through keys.
      const input = {
        language: "en-US",
        timestamps: true,
        word_confidence: true,
        speaker_labels: true,
        temperature: 0.5,
      };

      const translated = provider.translateParams(input);

      expect(translated).toEqual({
        language: "en-US",
        utterances: true,
        word_confidence: true,
        speaker_labels: true,
        temperature: 0.5,
      });
    });
  });

  describe("transcribe", () => {
    const baseRequest: TranscriptionRequest = {
      model: "nova-2",
      file: Buffer.from("test audio data"),
    };

    it("should successfully transcribe audio", async () => {
      // Arrange: SDK-shaped reply with one channel/alternative holding two
      // words, plus a single utterance attributed to speaker 0.
      const sdkReply = {
        result: {
          results: {
            channels: [
              {
                alternatives: [
                  {
                    transcript: "Hello world",
                    confidence: 0.95,
                    words: [
                      { word: "Hello", start: 0.0, end: 0.5, confidence: 0.98 },
                      { word: "world", start: 0.6, end: 1.0, confidence: 0.92 },
                    ],
                  },
                ],
              },
            ],
            utterances: [
              { transcript: "Hello world", start: 0.0, end: 1.0, speaker: 0 },
            ],
          },
          metadata: { language: "en-US" },
        },
        error: null,
      };
      const transcribeFile =
        mockDeepgramClient.listen.prerecorded.transcribeFile;
      transcribeFile.mockResolvedValue(sdkReply);

      // Act
      const transcription = await provider.transcribe(baseRequest);

      // Assert: the audio bytes and the model name reach the SDK.
      expect(transcribeFile).toHaveBeenCalledWith(
        Buffer.from("test audio data"),
        expect.objectContaining({
          model: "nova-2",
        })
      );

      // Assert: expected normalised shape - `word` is exposed as `text`,
      // utterances become segments, and the numeric speaker id is a string.
      expect(transcription).toEqual({
        text: "Hello world",
        language: "en-US",
        confidence: 0.95,
        words: [
          { text: "Hello", start: 0.0, end: 0.5, confidence: 0.98 },
          { text: "world", start: 0.6, end: 1.0, confidence: 0.92 },
        ],
        segments: [
          { text: "Hello world", start: 0.0, end: 1.0, speaker: "0" },
        ],
      });
    });

    it("should handle string file path", async () => {
      const fs = require("fs");
      // Stub disk access so the path never has to exist. jest.clearAllMocks()
      // only clears recorded calls, not implementations, so the stub is
      // explicitly restored in `finally` to keep it from leaking into later
      // tests that touch fs.readFileSync.
      const readFileSpy = jest
        .spyOn(fs, "readFileSync")
        .mockReturnValue(Buffer.from("test audio data"));

      try {
        const request: TranscriptionRequest = {
          model: "nova-2",
          file: "/path/to/audio.wav",
        };

        // Minimal successful reply; its contents are irrelevant to this test.
        const mockDeepgramResponse = {
          result: {
            results: {
              channels: [
                {
                  alternatives: [
                    {
                      transcript: "Test transcription",
                      confidence: 0.9,
                    },
                  ],
                },
              ],
            },
            metadata: {
              language: "en-US",
            },
          },
          error: null,
        };

        mockDeepgramClient.listen.prerecorded.transcribeFile.mockResolvedValue(
          mockDeepgramResponse
        );

        await provider.transcribe(request);

        // The path is read from disk and the resulting bytes go to the SDK.
        expect(readFileSpy).toHaveBeenCalledWith("/path/to/audio.wav");
        expect(
          mockDeepgramClient.listen.prerecorded.transcribeFile
        ).toHaveBeenCalledWith(
          Buffer.from("test audio data"),
          expect.any(Object)
        );
      } finally {
        // Put the real fs.readFileSync back even when an assertion fails.
        readFileSpy.mockRestore();
      }
    });

    it("should handle Uint8Array file", async () => {
      const rawBytes = new Uint8Array([1, 2, 3, 4]);
      const transcribeFile =
        mockDeepgramClient.listen.prerecorded.transcribeFile;

      // Minimal successful reply; its contents are irrelevant to this test.
      const sdkReply = {
        result: {
          results: {
            channels: [
              {
                alternatives: [
                  { transcript: "Test transcription", confidence: 0.9 },
                ],
              },
            ],
          },
          metadata: { language: "en-US" },
        },
        error: null,
      };
      transcribeFile.mockResolvedValue(sdkReply);

      const request: TranscriptionRequest = {
        model: "nova-2",
        file: rawBytes,
      };
      await provider.transcribe(request);

      // The typed array is expected to reach the SDK as a Buffer holding the
      // same bytes.
      expect(transcribeFile).toHaveBeenCalledWith(
        Buffer.from(rawBytes),
        expect.any(Object)
      );
    });

    it("should handle unsupported file type gracefully", async () => {
      // NOTE(review): the value below is a string, so the provider presumably
      // treats it as a file path rather than as an unsupported type - confirm
      // which code path actually produces the rejection.
      const badRequest: TranscriptionRequest = {
        model: "nova-2",
        file: "unsupported" as any,
      };

      // Only the error class is asserted here, not its message or code.
      const outcome = provider.transcribe(badRequest);
      await expect(outcome).rejects.toThrow(AISuiteError);
    });

    it("should throw error when Deepgram API returns error", async () => {
      // The SDK call resolves (it does not reject) but reports a failure
      // through the `error` field of the envelope.
      const failedReply = {
        result: null,
        error: { message: "API key invalid" },
      };
      mockDeepgramClient.listen.prerecorded.transcribeFile.mockResolvedValue(
        failedReply
      );

      const outcome = provider.transcribe(baseRequest);

      await expect(outcome).rejects.toThrow(
        new AISuiteError(
          "Deepgram API error: API key invalid",
          "deepgram",
          "API_ERROR"
        )
      );
    });

    it("should handle Deepgram API exceptions", async () => {
      // Here the SDK call itself rejects, e.g. on a transport failure.
      mockDeepgramClient.listen.prerecorded.transcribeFile.mockRejectedValue(
        new Error("Network error")
      );

      const outcome = provider.transcribe(baseRequest);

      // The raw Error is expected to surface as an AISuiteError whose message
      // carries the "Deepgram ASR error: " prefix.
      await expect(outcome).rejects.toThrow(
        new AISuiteError(
          "Deepgram ASR error: Network error",
          "deepgram",
          "API_ERROR"
        )
      );
    });

    it("should pass timeout options", async () => {
      const transcribeFile =
        mockDeepgramClient.listen.prerecorded.transcribeFile;

      // Minimal successful reply; its contents are irrelevant to this test.
      const sdkReply = {
        result: {
          results: {
            channels: [
              {
                alternatives: [
                  { transcript: "Test transcription", confidence: 0.9 },
                ],
              },
            ],
          },
          metadata: { language: "en-US" },
        },
        error: null,
      };
      transcribeFile.mockResolvedValue(sdkReply);

      const requestOptions = { timeout: 30000 };
      await provider.transcribe(baseRequest, requestOptions);

      // Exact (not partial) match on the second argument: only the model is
      // expected among the SDK parameters, i.e. the timeout is not copied in.
      expect(transcribeFile).toHaveBeenCalledWith(
        Buffer.from("test audio data"),
        { model: "nova-2" }
      );
    });

    it("should translate parameters correctly", async () => {
      const transcribeFile =
        mockDeepgramClient.listen.prerecorded.transcribeFile;

      // Minimal successful reply; only the outgoing parameters matter here.
      const sdkReply = {
        result: {
          results: {
            channels: [
              {
                alternatives: [
                  { transcript: "Test transcription", confidence: 0.9 },
                ],
              },
            ],
          },
          metadata: { language: "en-US" },
        },
        error: null,
      };
      transcribeFile.mockResolvedValue(sdkReply);

      // Request using every optional knob covered by this test.
      const fullRequest: TranscriptionRequest = {
        model: "nova-2",
        file: Buffer.from("test audio data"),
        language: "en-US",
        timestamps: true,
        word_confidence: true,
        speaker_labels: true,
        temperature: 0.5,
      };
      await provider.transcribe(fullRequest);

      // `timestamps` is expected to appear as `utterances`; the remaining
      // options are expected under their original names.
      const expectedParams = expect.objectContaining({
        model: "nova-2",
        language: "en-US",
        utterances: true,
        word_confidence: true,
        speaker_labels: true,
        temperature: 0.5,
      });
      expect(transcribeFile).toHaveBeenCalledWith(
        Buffer.from("test audio data"),
        expectedParams
      );
    });

    it("should handle response without words or utterances", async () => {
      // Reply that has a transcript and confidence but neither a `words`
      // array nor an `utterances` array.
      const bareReply = {
        result: {
          results: {
            channels: [
              {
                alternatives: [
                  { transcript: "Test transcription", confidence: 0.9 },
                ],
              },
            ],
          },
          metadata: { language: "en-US" },
        },
        error: null,
      };
      mockDeepgramClient.listen.prerecorded.transcribeFile.mockResolvedValue(
        bareReply
      );

      // Copy of the shared request with the model set explicitly.
      const requestWithModel = { ...baseRequest, model: "nova-2" };
      const transcription = await provider.transcribe(requestWithModel);

      // Missing collections are expected to come back as empty arrays.
      expect(transcription).toEqual({
        text: "Test transcription",
        language: "en-US",
        confidence: 0.9,
        words: [],
        segments: [],
      });
    });

    it("should handle malformed response gracefully", async () => {
      // Reply with a transcript only: no confidence on the alternative and no
      // metadata section at all.
      const sparseReply = {
        result: {
          results: {
            channels: [
              { alternatives: [{ transcript: "Test transcription" }] },
            ],
          },
        },
        error: null,
      };
      mockDeepgramClient.listen.prerecorded.transcribeFile.mockResolvedValue(
        sparseReply
      );

      const transcription = await provider.transcribe(baseRequest);

      // Expected fallbacks: language "unknown", no confidence, empty lists.
      expect(transcription).toEqual({
        text: "Test transcription",
        language: "unknown",
        confidence: undefined,
        words: [],
        segments: [],
      });
    });
  });
});


================================================
FILE: aisuite-js/tests/providers/groq-provider.test.ts
================================================
import { GroqProvider } from "../../src/providers/groq/provider";
import { ChatCompletionRequest, ChatCompletionChunk } from "../../src/types";
import { AISuiteError } from "../../src/core/errors";

// Mock the Groq SDK
jest.mock("groq-sdk");

describe("GroqProvider", () => {
  let provider: GroqProvider;
  let mockGroqClient: any;

  beforeEach(() => {
    // Start every test with no recorded mock calls.
    jest.clearAllMocks();

    // Stand-in for the SDK client; only chat.completions.create is stubbed.
    const create = jest.fn();
    mockGroqClient = { chat: { completions: { create } } };

    // Make the mocked Groq constructor hand back the stand-in client.
    require("groq-sdk").mockImplementation(() => mockGroqClient);

    // Provider under test, built against the mocked SDK.
    provider = new GroqProvider({ apiKey: "test-api-key" });
  });

  describe("constructor", () => {
    it("should initialize with basic config", () => {
      // An API key alone is enough to construct the provider.
      const config = { apiKey: "test-key" };
      const instance = new GroqProvider(config);

      expect(instance.name).toBe("groq");
    });

    it("should initialize with baseURL config", () => {
      const customURL = "https://custom.groq.com";
      const config = { apiKey: "test-key", baseURL: customURL };
      const instance = new GroqProvider(config);

      expect(instance.name).toBe("groq");
      // NOTE(review): this reads baseURL off the shared mock client, so it
      // presumably relies on the provider assigning it onto the client
      // instance - confirm against the provider constructor.
      expect(mockGroqClient.baseURL).toBe("https://custom.groq.com");
    });
  });

  describe("chatCompletion", () => {
    // Minimal single-turn request shared by the non-streaming tests below.
    const baseRequest: ChatCompletionRequest = {
      model: "llama3-8b-8192",
      messages: [{ role: "user", content: "Hello" }],
    };

    it("should successfully complete chat", async () => {
      const create = mockGroqClient.chat.completions.create;

      // Canned SDK completion containing one assistant message.
      const sdkCompletion = {
        id: "chatcmpl-123",
        object: "chat.completion",
        created: 1234567890,
        model: "llama3-8b-8192",
        choices: [
          {
            index: 0,
            message: {
              role: "assistant",
              content: "Hello! How can I help you?",
            },
            finish_reason: "stop",
          },
        ],
        usage: { prompt_tokens: 10, completion_tokens: 20, total_tokens: 30 },
      };
      create.mockResolvedValue(sdkCompletion);

      const completion = await provider.chatCompletion(baseRequest);

      // The SDK receives the bare model name and the original messages...
      expect(create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: "llama3-8b-8192",
          messages: [{ role: "user", content: "Hello" }],
        })
      );
      // ...while the returned model is expected to carry a "groq:" prefix.
      expect(completion).toEqual(
        expect.objectContaining({
          id: "chatcmpl-123",
          object: "chat.completion",
          model: "groq:llama3-8b-8192",
        })
      );
    });

    it("should throw error when streaming is enabled", async () => {
      // chatCompletion is the non-streaming entry point, so a request with
      // stream: true is expected to be refused.
      const streamingRequest: ChatCompletionRequest = {
        ...baseRequest,
        stream: true,
      };
      const attempt = () => provider.chatCompletion(streamingRequest);

      // Two separate calls: one checks the error class, one the message.
      await expect(attempt()).rejects.toThrow(AISuiteError);
      await expect(attempt()).rejects.toThrow(
        "Streaming is not supported in non-streaming method"
      );
    });

    it("should handle API errors", async () => {
      // Every SDK call rejects with a plain Error.
      mockGroqClient.chat.completions.create.mockRejectedValue(
        new Error("API rate limit exceeded")
      );
      const attempt = () => provider.chatCompletion(baseRequest);

      // The failure must surface as an AISuiteError with a prefixed message.
      await expect(attempt()).rejects.toThrow(AISuiteError);
      await expect(attempt()).rejects.toThrow(
        "Groq API error: API rate limit exceeded"
      );
    });

    it("should handle complex request with all parameters", async () => {
      const create = mockGroqClient.chat.completions.create;

      // Canned SDK completion returned for the fully-populated request.
      const sdkCompletion = {
        id: "chatcmpl-123",
        object: "chat.completion",
        created: 1234567890,
        model: "llama3-8b-8192",
        choices: [
          {
            index: 0,
            message: { role: "assistant", content: "2+2 equals 4" },
            finish_reason: "stop",
          },
        ],
        usage: { prompt_tokens: 15, completion_tokens: 5, total_tokens: 20 },
      };
      create.mockResolvedValue(sdkCompletion);

      // Request exercising the optional sampling and metadata fields.
      const complexRequest: ChatCompletionRequest = {
        model: "llama3-8b-8192",
        messages: [
          { role: "system", content: "You are a helpful assistant" },
          { role: "user", content: "What is 2+2?" },
        ],
        temperature: 0.7,
        max_tokens: 100,
        top_p: 0.9,
        frequency_penalty: 0.1,
        presence_penalty: 0.1,
        stop: ["\n"],
        user: "user-123",
      };

      const completion = await provider.chatCompletion(complexRequest);

      // Only a subset of the forwarded parameters is pinned; the streaming
      // and tool-related fields are expected to be undefined.
      expect(create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: "llama3-8b-8192",
          messages: complexRequest.messages,
          temperature: 0.7,
          max_tokens: 100,
          stream: undefined,
          tool_choice: undefined,
          tools: undefined,
        })
      );
      expect(completion).toEqual(
        expect.objectContaining({
          id: "chatcmpl-123",
          object: "chat.completion",
        })
      );
    });
  });

  describe("streamChatCompletion", () => {
    // Minimal single-turn request shared by the streaming tests below.
    const baseRequest: ChatCompletionRequest = {
      model: "llama3-8b-8192",
      messages: [{ role: "user", content: "Hello" }],
    };

    it("should stream chat completion", async () => {
      const create = mockGroqClient.chat.completions.create;

      // Two SDK chunks: an opening delta, then a closing delta with "stop".
      const openingChunk = {
        id: "chatcmpl-123",
        object: "chat.completion.chunk",
        created: 1234567890,
        model: "llama3-8b-8192",
        choices: [
          {
            index: 0,
            delta: { role: "assistant", content: "Hello" },
            finish_reason: null,
          },
        ],
      };
      const closingChunk = {
        id: "chatcmpl-123",
        object: "chat.completion.chunk",
        created: 1234567890,
        model: "llama3-8b-8192",
        choices: [
          {
            index: 0,
            delta: { content: "! How can I help?" },
            finish_reason: "stop",
          },
        ],
      };

      // Async generator standing in for the SDK's stream object.
      async function* replay() {
        for (const sdkChunk of [openingChunk, closingChunk]) {
          yield sdkChunk;
        }
      }
      create.mockResolvedValue(replay());

      // Drain the provider's stream into an array.
      const received: ChatCompletionChunk[] = [];
      for await (const piece of provider.streamChatCompletion(baseRequest)) {
        received.push(piece);
      }

      expect(create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: "llama3-8b-8192",
          messages: [{ role: "user", content: "Hello" }],
        })
      );
      // One emitted chunk per SDK chunk.
      expect(received).toHaveLength(2);
      expect(received[0]).toEqual(
        expect.objectContaining({
          object: "chat.completion.chunk",
        })
      );
    });

    it("should handle streaming errors", async () => {
      // The SDK call that should open the stream rejects instead.
      mockGroqClient.chat.completions.create.mockRejectedValue(
        new Error("Streaming connection failed")
      );

      // Opens a fresh stream and tries to iterate it; the failure is expected
      // to surface during iteration.
      const drain = async () => {
        for await (const _chunk of provider.streamChatCompletion(baseRequest)) {
          // This should not be reached
        }
      };

      // Two separate attempts: one checks the error class, one the message.
      await expect(drain).rejects.toThrow(AISuiteError);
      await expect(drain).rejects.toThrow(
        "Groq streaming error: Streaming connection failed"
      );
    });

    it("should handle abort signal", async () => {
      // Single-chunk stream standing in for the SDK's stream object.
      const mockStream = (async function* () {
        yield {
          id: "chatcmpl-123",
          object: "chat.completion.chunk",
          created: 1234567890,
          model: "llama3-8b-8192",
          choices: [
            {
              index: 0,
              delta: { role: "assistant", content: "Hello!" },
              finish_reason: "stop",
            },
          ],
        };
      })();

      mockGroqClient.chat.completions.create.mockResolvedValue(mockStream);

      const abortController = new AbortController();
      const options = { signal: abortController.signal };

      const stream = provider.streamChatCompletion(baseRequest, options);
      const chunks: ChatCompletionChunk[] = [];

      // Start consuming the stream
      const consumePromise = (async () => {
        for await (const chunk of stream) {
          chunks.push(chunk);
        }
      })();

      // Abort after a short delay. The handle is kept so the timer can be
      // cancelled once consumption finishes.
      // NOTE(review): the mocked stream presumably completes before the 10 ms
      // elapse, so this mainly verifies that supplying a signal does not break
      // consumption - confirm whether a mid-stream abort should be covered.
      const abortTimer = setTimeout(() => {
        abortController.abort();
      }, 10);

      try {
        await consumePromise;
      } finally {
        // Never leave the timer pending past the end of the test.
        clearTimeout(abortTimer);
      }

      expect(chunks.length).toBeGreaterThan(0);
    });

    it("should handle complex streaming request", async () => {
      const create = mockGroqClient.chat.completions.create;

      // Two-chunk stream standing in for the SDK's stream object.
      async function* storyStream() {
        yield {
          id: "chatcmpl-123",
          object: "chat.completion.chunk",
          created: 1234567890,
          model: "llama3-8b-8192",
          choices: [
            {
              index: 0,
              delta: { role: "assistant", content: "Once upon a time" },
              finish_reason: null,
            },
          ],
        };
        yield {
          id: "chatcmpl-123",
          object: "chat.completion.chunk",
          created: 1234567890,
          model: "llama3-8b-8192",
          choices: [
            {
              index: 0,
              delta: { content: " there was a brave knight." },
              finish_reason: "stop",
            },
          ],
        };
      }
      create.mockResolvedValue(storyStream());

      // Streaming request with a system prompt and sampling options.
      const complexRequest: ChatCompletionRequest = {
        model: "llama3-8b-8192",
        messages: [
          { role: "system", content: "You are a helpful assistant" },
          { role: "user", content: "Tell me a story" },
        ],
        temperature: 0.8,
        max_tokens: 200,
        top_p: 0.9,
        stop: ["END"],
      };

      const received: ChatCompletionChunk[] = [];
      for await (const piece of provider.streamChatCompletion(complexRequest)) {
        received.push(piece);
      }

      // Only a subset of the forwarded parameters is pinned; the streaming
      // and tool-related fields are asserted as undefined.
      expect(create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: "llama3-8b-8192",
          messages: complexRequest.messages,
          temperature: 0.8,
          max_tokens: 200,
          stream: undefined,
          tool_choice: undefined,
          tools: undefined,
        })
      );
      expect(received).toHaveLength(2);
    });
  });

  describe("error handling", () => {
    it("should preserve AISuiteError instances", async () => {
      // The SDK rejects with an error that is already an AISuiteError.
      const original = new AISuiteError("Custom error", "groq", "CUSTOM_ERROR");
      mockGroqClient.chat.completions.create.mockRejectedValue(original);

      const outcome = provider.chatCompletion({
        model: "llama3-8b-8192",
        messages: [{ role: "user", content: "Hello" }],
      });

      // The rejection is matched against that same error object.
      await expect(outcome).rejects.toThrow(original);
    });

    it("should handle unknown error types", async () => {
      // Reject with a bare string rather than an Error instance.
      const nonErrorRejection = "Unknown error string";
      mockGroqClient.chat.completions.create.mockRejectedValue(
        nonErrorRejection
      );

      const outcome = provider.chatCompletion({
        model: "llama3-8b-8192",
        messages: [{ role: "user", content: "Hello" }],
      });

      // A string expectation matches by substring of the thrown message.
      await expect(outcome).rejects.toThrow("Groq API error: Unknown error");
    });

    it("should handle streaming unknown error types", async () => {
      // Reject with a bare string rather than an Error instance.
      const nonErrorRejection = "Unknown streaming error";
      mockGroqClient.chat.completions.create.mockRejectedValue(
        nonErrorRejection
      );

      const stream = provider.streamChatCompletion({
        model: "llama3-8b-8192",
        messages: [{ role: "user", content: "Hello" }],
      });

      // Iterating the stream is what is expected to surface the failure.
      const drain = async () => {
        for await (const _chunk of stream) {
          // This should not be reached
        }
      };
      await expect(drain).rejects.toThrow("Groq streaming error: Unknown error");
    });
  });
});


================================================
FILE: aisuite-js/tests/providers/mistral-provider.test.ts
================================================
import { MistralProvider } from "../../src/providers/mistral/provider";
import { ChatCompletionRequest, ChatCompletionChunk } from "../../src/types";
import { AISuiteError } from "../../src/core/errors";

// Mock the Mistral SDK
// Replace the SDK module with an ES-module-shaped stub whose default export is
// a mock constructor; each test wires its implementation in beforeEach.
jest.mock("@mistralai/mistralai", () => ({
  __esModule: true,
  default: jest.fn(),
}));

describe("MistralProvider", () => {
  let provider: MistralProvider;
  let mockMistralClient: any;

  beforeEach(() => {
    // Start every test with no recorded mock calls.
    jest.clearAllMocks();

    // Stand-in for the SDK client: one stub per entry point used in the tests.
    mockMistralClient = { chat: jest.fn(), chatStream: jest.fn() };

    // Make the mocked default-export constructor return the stand-in client.
    const { default: MistralCtor } = require("@mistralai/mistralai");
    MistralCtor.mockImplementation(() => mockMistralClient);

    // Provider under test, built against the mocked SDK.
    provider = new MistralProvider({ apiKey: "test-api-key" });
  });

  describe("constructor", () => {
    it("should initialize with basic config", () => {
      // An API key alone is enough to construct the provider.
      const config = { apiKey: "test-key" };
      const instance = new MistralProvider(config);

      expect(instance.name).toBe("mistral");
    });

    it("should initialize with baseURL config", () => {
      const customURL = "https://custom.mistral.com";
      const config = { apiKey: "test-key", baseURL: customURL };
      const instance = new MistralProvider(config);

      expect(instance.name).toBe("mistral");
      // NOTE(review): this reads baseURL off the shared mock client, so it
      // presumably relies on the provider assigning it onto the client
      // instance - confirm against the provider constructor.
      expect(mockMistralClient.baseURL).toBe("https://custom.mistral.com");
    });
  });

  describe("chatCompletion", () => {
    // Minimal single-turn request shared by the non-streaming tests below.
    const baseRequest: ChatCompletionRequest = {
      model: "mistral-large",
      messages: [{ role: "user", content: "Hello" }],
    };

    it("should successfully complete chat", async () => {
      const chat = mockMistralClient.chat;

      // Canned SDK completion containing one assistant message.
      const sdkCompletion = {
        id: "chatcmpl-123",
        object: "chat.completion",
        created: 1234567890,
        model: "mistral-large",
        choices: [
          {
            index: 0,
            message: {
              role: "assistant",
              content: "Hello! How can I help you?",
            },
            finish_reason: "stop",
          },
        ],
        usage: { prompt_tokens: 10, completion_tokens: 20, total_tokens: 30 },
      };
      chat.mockResolvedValue(sdkCompletion);

      const completion = await provider.chatCompletion(baseRequest);

      // Only the forwarded model name is pinned on the outgoing call.
      expect(chat).toHaveBeenCalledWith(
        expect.objectContaining({ model: "mistral-large" })
      );
      // The returned model is expected without any provider prefix.
      expect(completion).toEqual(
        expect.objectContaining({
          id: "chatcmpl-123",
          object: "chat.completion",
          model: "mistral-large",
        })
      );
    });

    it("should throw error when streaming is enabled", async () => {
      // chatCompletion is the non-streaming entry point, so a request with
      // stream: true is expected to be refused.
      const streamingRequest: ChatCompletionRequest = {
        ...baseRequest,
        stream: true,
      };
      const attempt = () => provider.chatCompletion(streamingRequest);

      // Two separate calls: one checks the error class, one the message.
      await expect(attempt()).rejects.toThrow(AISuiteError);
      await expect(attempt()).rejects.toThrow(
        "Streaming is not supported in non-streaming method"
      );
    });

    it("should handle API errors", async () => {
      // Every SDK call rejects with a plain Error.
      mockMistralClient.chat.mockRejectedValue(
        new Error("API rate limit exceeded")
      );
      const attempt = () => provider.chatCompletion(baseRequest);

      // The failure must surface as an AISuiteError with a prefixed message.
      await expect(attempt()).rejects.toThrow(AISuiteError);
      await expect(attempt()).rejects.toThrow(
        "Mistral API error: API rate limit exceeded"
      );
    });

    it("should handle complex request with all parameters", async () => {
      const chat = mockMistralClient.chat;

      // Canned SDK completion returned for the fully-populated request.
      const sdkCompletion = {
        id: "chatcmpl-123",
        object: "chat.completion",
        created: 1234567890,
        model: "mistral-large",
        choices: [
          {
            index: 0,
            message: { role: "assistant", content: "2+2 equals 4" },
            finish_reason: "stop",
          },
        ],
        usage: { prompt_tokens: 15, completion_tokens: 5, total_tokens: 20 },
      };
      chat.mockResolvedValue(sdkCompletion);

      // Request exercising the optional sampling and metadata fields.
      const complexRequest: ChatCompletionRequest = {
        model: "mistral-large",
        messages: [
          { role: "system", content: "You are a helpful assistant" },
          { role: "user", content: "What is 2+2?" },
        ],
        temperature: 0.7,
        max_tokens: 100,
        top_p: 0.9,
        frequency_penalty: 0.1,
        presence_penalty: 0.1,
        stop: ["\n"],
        user: "user-123",
      };

      const completion = await provider.chatCompletion(complexRequest);

      // Only the forwarded model name is pinned on the outgoing call.
      expect(chat).toHaveBeenCalledWith(
        expect.objectContaining({ model: "mistral-large" })
      );
      expect(completion).toEqual(
        expect.objectContaining({
          id: "chatcmpl-123",
          object: "chat.completion",
        })
      );
    });
  });

  describe("streamChatCompletion", () => {
    // Minimal single-turn request shared by the streaming tests below.
    const baseRequest: ChatCompletionRequest = {
      model: "mistral-large",
      messages: [{ role: "user", content: "Hello" }],
    };

    it("should stream chat completion", async () => {
      const chatStream = mockMistralClient.chatStream;

      // Two SDK chunks: an opening delta, then a closing delta with "stop".
      const openingChunk = {
        id: "chatcmpl-123",
        object: "chat.completion.chunk",
        created: 1234567890,
        model: "mistral-large",
        choices: [
          {
            index: 0,
            delta: { role: "assistant", content: "Hello" },
            finish_reason: null,
          },
        ],
      };
      const closingChunk = {
        id: "chatcmpl-123",
        object: "chat.completion.chunk",
        created: 1234567890,
        model: "mistral-large",
        choices: [
          {
            index: 0,
            delta: { content: "! How can I help?" },
            finish_reason: "stop",
          },
        ],
      };

      // Async generator standing in for the SDK's stream object.
      async function* replay() {
        for (const sdkChunk of [openingChunk, closingChunk]) {
          yield sdkChunk;
        }
      }
      chatStream.mockResolvedValue(replay());

      // Drain the provider's stream into an array.
      const received: ChatCompletionChunk[] = [];
      for await (const piece of provider.streamChatCompletion(baseRequest)) {
        received.push(piece);
      }

      expect(chatStream).toHaveBeenCalledWith(
        expect.objectContaining({ model: "mistral-large" })
      );
      // One emitted chunk per SDK chunk, each with a string id and chunk type.
      expect(received).toHaveLength(2);
      expect(typeof received[0].id).toBe("string");
      expect(received[0].object).toBe("chat.completion.chunk");
    });

    it("should handle streaming errors", async () => {
      // The SDK call that should open the stream rejects instead.
      const sdkFailure = new Error("Streaming error");
      mockMistralClient.chatStream.mockRejectedValue(sdkFailure);

      // Drive the async iterator by hand; the first pull is expected to reject
      // with an AISuiteError.
      const cursor =
        provider.streamChatCompletion(baseRequest)[Symbol.asyncIterator]();
      await expect(cursor.next()).rejects.toThrow(AISuiteError);
    });

    it("should handle abort signal", async () => {
      // Single-chunk stream standing in for the SDK's stream object.
      const mockStream = (async function* () {
        yield {
          id: "chatcmpl-123",
          object: "chat.completion.chunk",
          created: 1234567890,
          model: "mistral-large",
          choices: [
            {
              index: 0,
              delta: { role: "assistant", content: "Hello!" },
              finish_reason: "stop",
            },
          ],
        };
      })();

      mockMistralClient.chatStream.mockResolvedValue(mockStream);

      const abortController = new AbortController();
      const options = { signal: abortController.signal };

      const stream = provider.streamChatCompletion(baseRequest, options);
      const chunks: ChatCompletionChunk[] = [];

      // Start consuming the stream
      const consumePromise = (async () => {
        for await (const chunk of stream) {
          chunks.push(chunk);
        }
      })();

      // Abort after a short delay. The handle is kept so the timer can be
      // cancelled once consumption finishes.
      // NOTE(review): the mocked stream presumably completes before the 10 ms
      // elapse, so this mainly verifies that supplying a signal does not break
      // consumption - confirm whether a mid-stream abort should be covered.
      const abortTimer = setTimeout(() => {
        abortController.abort();
      }, 10);

      try {
        await consumePromise;
      } finally {
        // Never leave the timer pending past the end of the test.
        clearTimeout(abortTimer);
      }

      expect(chunks.length).toBeGreaterThan(0);
    });

    it("should handle complex streaming request", async () => {
      const chatStream = mockMistralClient.chatStream;

      // Two-chunk stream standing in for the SDK's stream object.
      async function* storyStream() {
        yield {
          id: "chatcmpl-123",
          object: "chat.completion.chunk",
          created: 1234567890,
          model: "mistral-large",
          choices: [
            {
              index: 0,
              delta: { role: "assistant", content: "Once upon a time" },
              finish_reason: null,
            },
          ],
        };
        yield {
          id: "chatcmpl-123",
          object: "chat.completion.chunk",
          created: 1234567890,
          model: "mistral-large",
          choices: [
            {
              index: 0,
              delta: { content: " there was a brave knight." },
              finish_reason: "stop",
            },
          ],
        };
      }
      chatStream.mockResolvedValue(storyStream());

      // Streaming request with a system prompt and sampling options.
      const complexRequest: ChatCompletionRequest = {
        model: "mistral-large",
        messages: [
          { role: "system", content: "You are a helpful assistant" },
          { role: "user", content: "Tell me a story" },
        ],
        temperature: 0.8,
        max_tokens: 200,
        top_p: 0.9,
        stop: ["END"],
      };

      const received: ChatCompletionChunk[] = [];
      for await (const piece of provider.streamChatCompletion(complexRequest)) {
        received.push(piece);
      }

      // Only the forwarded model name is pinned on the outgoing call.
      expect(chatStream).toHaveBeenCalledWith(
        expect.objectContaining({ model: "mistral-large" })
      );
      expect(received).toHaveLength(2);
    });
  });

  describe("error handling", () => {
    it("should preserve AISuiteError instances", async () => {
      // The SDK rejects with an error that is already an AISuiteError.
      const original = new AISuiteError(
        "Custom error",
        "mistral",
        "CUSTOM_ERROR"
      );
      mockMistralClient.chat.mockRejectedValue(original);

      const outcome = provider.chatCompletion({
        model: "mistral-large",
        messages: [{ role: "user", content: "Hello" }],
      });

      // The rejection is matched against that same error object.
      await expect(outcome).rejects.toThrow(original);
    });

    it("should handle unknown error types", async () => {
      // Reject with a bare string rather than an Error instance.
      const nonErrorRejection = "Unknown error string";
      mockMistralClient.chat.mockRejectedValue(nonErrorRejection);

      const outcome = provider.chatCompletion({
        model: "mistral-large",
        messages: [{ role: "user", content: "Hello" }],
      });

      // A string expectation matches by substring of the thrown message.
      await expect(outcome).rejects.toThrow("Mistral API error: Unknown error");
    });

    it("should handle streaming unknown error types", async () => {
      // Reject with a bare string rather than an Error instance.
      const nonErrorRejection = "Unknown streaming error";
      mockMistralClient.chatStream.mockRejectedValue(nonErrorRejection);

      const stream = provider.streamChatCompletion({
        model: "mistral-large",
        messages: [{ role: "user", content: "Hello" }],
      });

      // Iterating the stream is what is expected to surface the failure; the
      // message is matched by pattern rather than exact text.
      const drain = async () => {
        for await (const _chunk of stream) {
          // This should not be reached
        }
      };
      await expect(drain).rejects.toThrow(/Mistral streaming error: Unknown/);
    });
  });
});


================================================
FILE: aisuite-js/tests/providers/openai-provider.test.ts
================================================
import { OpenAIProvider } from "../../src/providers/openai/provider";
import { ChatCompletionRequest, ChatCompletionChunk } from "../../src/types";
import { AISuiteError } from "../../src/core/errors";

// Mock the OpenAI SDK
jest.mock("openai");

describe("OpenAIProvider", () => {
  let provider: OpenAIProvider;
  let mockOpenAIClient: any;

  // Rebuilds the mocked SDK client and a fresh provider before every test.
  beforeEach(() => {
    // Drop call history and queued results left over from the previous test.
    jest.clearAllMocks();

    // Minimal stand-in exposing only chat.completions.create.
    const create = jest.fn();
    mockOpenAIClient = { chat: { completions: { create } } };

    // Make the auto-mocked OpenAI constructor hand back the stand-in client.
    const OpenAI = require("openai");
    OpenAI.mockImplementation(() => mockOpenAIClient);

    // Provider under test, constructed after the constructor mock is in place.
    provider = new OpenAIProvider({ apiKey: "test-api-key" });
  });

  // Construction smoke tests: both config shapes must yield a provider named "openai".
  describe("constructor", () => {
    it("should initialize with basic config", () => {
      const instance = new OpenAIProvider({ apiKey: "test-key" });

      expect(instance.name).toBe("openai");
    });

    it("should initialize with full config", () => {
      // Same as above, plus the optional baseURL and organization fields.
      const fullConfig = {
        apiKey: "test-key",
        baseURL: "https://custom.openai.com",
        organization: "org-123",
      };
      const instance = new OpenAIProvider(fullConfig);

      expect(instance.name).toBe("openai");
    });
  });

  // Non-streaming completions: request forwarding, option pass-through and
  // error wrapping, all against the mocked chat.completions.create.
  describe("chatCompletion", () => {
    const baseRequest: ChatCompletionRequest = {
      model: "gpt-4",
      messages: [{ role: "user", content: "Hello" }],
    };

    // Completion payload returned by the mocked client; only choices and
    // usage differ between tests.
    const completionPayload = (
      choices: unknown[],
      usage: {
        prompt_tokens: number;
        completion_tokens: number;
        total_tokens: number;
      }
    ) => ({
      id: "chatcmpl-123",
      object: "chat.completion",
      created: 1234567890,
      model: "gpt-4",
      choices,
      usage,
    });

    // Single assistant choice that finished with "stop".
    const assistantChoice = (content: string) => ({
      index: 0,
      message: { role: "assistant", content },
      finish_reason: "stop",
    });

    it("should successfully complete chat", async () => {
      const { create } = mockOpenAIClient.chat.completions;
      create.mockResolvedValue(
        completionPayload([assistantChoice("Hello! How can I help you?")], {
          prompt_tokens: 10,
          completion_tokens: 20,
          total_tokens: 30,
        })
      );

      const completion = await provider.chatCompletion(baseRequest);

      // No options were supplied, so the second argument is undefined.
      expect(create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: "gpt-4",
          messages: [{ role: "user", content: "Hello" }],
        }),
        undefined
      );
      expect(completion).toEqual(
        expect.objectContaining({
          id: "chatcmpl-123",
          object: "chat.completion",
          model: "gpt-4",
        })
      );
    });

    it("should throw error when streaming is enabled", async () => {
      const streamingRequest: ChatCompletionRequest = {
        ...baseRequest,
        stream: true,
      };

      // Two separate calls: one checks the error class, the other the message.
      await expect(provider.chatCompletion(streamingRequest)).rejects.toThrow(
        AISuiteError
      );
      await expect(provider.chatCompletion(streamingRequest)).rejects.toThrow(
        "Streaming is not yet supported"
      );
    });

    it("should handle API errors", async () => {
      mockOpenAIClient.chat.completions.create.mockRejectedValue(
        new Error("API rate limit exceeded")
      );

      // Checked twice: once for the error class, once for the prefixed message.
      await expect(provider.chatCompletion(baseRequest)).rejects.toThrow(
        AISuiteError
      );
      await expect(provider.chatCompletion(baseRequest)).rejects.toThrow(
        "OpenAI API error: API rate limit exceeded"
      );
    });

    it("should pass options to the client", async () => {
      const { create } = mockOpenAIClient.chat.completions;
      const requestOptions = { signal: new AbortController().signal };
      create.mockResolvedValue(
        completionPayload([], {
          prompt_tokens: 10,
          completion_tokens: 20,
          total_tokens: 30,
        })
      );

      await provider.chatCompletion(baseRequest, requestOptions);

      // The options object must arrive as the second argument.
      expect(create).toHaveBeenCalledWith(expect.any(Object), requestOptions);
    });

    it("should handle complex request with all parameters", async () => {
      const { create } = mockOpenAIClient.chat.completions;
      const complexRequest: ChatCompletionRequest = {
        model: "gpt-4",
        messages: [
          { role: "system", content: "You are a helpful assistant" },
          { role: "user", content: "What is 2+2?" },
        ],
        temperature: 0.7,
        max_tokens: 100,
        top_p: 0.9,
        frequency_penalty: 0.1,
        presence_penalty: 0.1,
        stop: ["\n"],
        user: "user-123",
      };
      create.mockResolvedValue(
        completionPayload([assistantChoice("2+2 equals 4")], {
          prompt_tokens: 15,
          completion_tokens: 5,
          total_tokens: 20,
        })
      );

      const completion = await provider.chatCompletion(complexRequest);

      // Every tuning parameter must appear in the forwarded request.
      expect(create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: "gpt-4",
          messages: complexRequest.messages,
          temperature: 0.7,
          max_tokens: 100,
          top_p: 0.9,
          frequency_penalty: 0.1,
          presence_penalty: 0.1,
          stop: ["\n"],
          user: "user-123",
        }),
        undefined
      );
      expect(completion).toEqual(
        expect.objectContaining({
          id: "chatcmpl-123",
          object: "chat.completion",
        })
      );
    });
  });

  // Streaming completions: chunk forwarding, option pass-through and error
  // wrapping, all against the mocked chat.completions.create.
  describe("streamChatCompletion", () => {
    const baseRequest: ChatCompletionRequest = {
      model: "gpt-4",
      messages: [{ role: "user", content: "Hello" }],
    };

    // Chunk object yielded by the mocked stream; only delta and finish_reason vary.
    const sdkChunk = (
      delta: Record<string, unknown>,
      finish_reason: string | null
    ) => ({
      id: "chatcmpl-123",
      object: "chat.completion.chunk",
      created: 1234567890,
      model: "gpt-4",
      choices: [{ index: 0, delta, finish_reason }],
    });

    // Async generator that yields the given items in order.
    const replay = async function* (items: unknown[]) {
      for (const item of items) {
        yield item;
      }
    };

    // Reads a provider stream to completion and returns everything it yielded.
    const collect = async (stream: AsyncIterable<ChatCompletionChunk>) => {
      const received: ChatCompletionChunk[] = [];
      for await (const piece of stream) {
        received.push(piece);
      }
      return received;
    };

    it("should stream chat completion", async () => {
      const { create } = mockOpenAIClient.chat.completions;
      create.mockResolvedValue(
        replay([
          sdkChunk({ role: "assistant", content: "Hello" }, null),
          sdkChunk({ content: "! How can I help?" }, "stop"),
        ])
      );

      const received = await collect(provider.streamChatCompletion(baseRequest));

      // The forwarded request must carry stream: true.
      expect(create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: "gpt-4",
          messages: [{ role: "user", content: "Hello" }],
          stream: true,
        }),
        undefined
      );
      expect(received).toHaveLength(2);
      expect(received[0]).toEqual(
        expect.objectContaining({
          id: "chatcmpl-123",
          object: "chat.completion.chunk",
        })
      );
    });

    it("should handle streaming errors", async () => {
      mockOpenAIClient.chat.completions.create.mockRejectedValue(
        new Error("Streaming connection failed")
      );

      // Each invocation opens a new stream and tries to iterate it.
      const drain = async () => {
        const stream = provider.streamChatCompletion(baseRequest);
        for await (const _chunk of stream) {
          // This should not be reached
        }
      };

      await expect(drain).rejects.toThrow(AISuiteError);
      await expect(drain).rejects.toThrow(
        "OpenAI streaming error: Streaming connection failed"
      );
    });

    it("should pass options to streaming request", async () => {
      const { create } = mockOpenAIClient.chat.completions;
      const requestOptions = { signal: new AbortController().signal };
      create.mockResolvedValue(
        replay([sdkChunk({ role: "assistant", content: "Hello!" }, "stop")])
      );

      const received = await collect(
        provider.streamChatCompletion(baseRequest, requestOptions)
      );

      // The options object must arrive as the second argument.
      expect(create).toHaveBeenCalledWith(
        expect.objectContaining({
          model: "gpt-4",
          messages: [{ role: "user", content: "Hello" }],
          stream: true,
        }),
        requestOptions
      );
      expect(received).toHaveLength(1);
    });
  });

  // Failure paths for chatCompletion: library errors pass through, while
  // non-Error rejections are reported with an "Unknown error" message.
  describe("error handling", () => {
    // Minimal request used by both tests; rebuilt per call.
    const helloRequest = (): ChatCompletionRequest => ({
      model: "gpt-4",
      messages: [{ role: "user", content: "Hello" }],
    });

    it("should preserve AISuiteError instances", async () => {
      const original = new AISuiteError(
        "Custom error",
        "openai",
        "CUSTOM_ERROR"
      );
      mockOpenAIClient.chat.completions.create.mockRejectedValue(original);

      // The rejection must match the error the client was rejected with.
      const pending = provider.chatCompletion(helloRequest());
      await expect(pending).rejects.toThrow(original);
    });

    it("should handle unknown error types", async () => {
      // A bare string rejection rather than an Error object.
      mockOpenAIClient.chat.completions.create.mockRejectedValue(
        "Unknown error string"
      );

      const pending = provider.chatCompletion(helloRequest());
      await expect(pending).rejects.toThrow("OpenAI API error: Unknown error");
    });
  });
});


================================================
FILE: aisuite-js/tests/providers/openai_asr_provider.test.ts
================================================
import { TranscriptionRequest } from "../../src/types";
import { AISuiteError } from "../../src/core/errors";
import { OpenAIProvider } from "../../src/providers/openai";

// Transcription-side tests for OpenAIProvider: parameter validation,
// parameter translation, and the missing-file guard in transcribe().
describe("OpenAIProvider", () => {
  let provider: OpenAIProvider;

  // Parameter set used by the "supported"/"standard" cases, rebuilt per call
  // so every test gets its own Buffer.
  const standardParams = () => ({
    language: "en",
    prompt: "test prompt",
    response_format: "json",
    temperature: 0.5,
    timestamps: true,
    model: "whisper-1",
    file: Buffer.from("test"),
  });

  beforeEach(() => {
    provider = new OpenAIProvider({ apiKey: "test-api-key" });
  });

  describe("validateParams", () => {
    it("should not throw for supported parameters", () => {
      const supported = standardParams();

      expect(() => provider.validateParams(supported)).not.toThrow();
    });

    // NOTE(review): despite the title, this case passes an unrecognized key
    // and asserts that validation does NOT throw — confirm the intended name.
    it("should validate required parameters", () => {
      const withUnknownKey = {
        unsupported_param: "value",
        model: "whisper-1",
        file: Buffer.from("test"),
      };

      expect(() => provider.validateParams(withUnknownKey)).not.toThrow();
    });
  });

  describe("translateParams", () => {
    it("should translate standard parameters correctly", () => {
      const output = provider.translateParams(standardParams());

      // `model` and `file` are absent from the expected translation.
      expect(output).toEqual({
        language: "en",
        prompt: "test prompt",
        response_format: "json",
        temperature: 0.5,
        timestamps: true,
      });
    });

    it("should retain other parameters", () => {
      const output = provider.translateParams({
        custom_param: "value",
        model: "whisper-1",
        file: Buffer.from("test"),
      });

      // Keys outside the standard set are carried over unchanged.
      expect(output).toEqual({ custom_param: "value" });
    });
  });

  describe("transcribe", () => {
    it("should throw error if file is not provided", async () => {
      // An empty string stands in for a missing file.
      const emptyFileRequest: TranscriptionRequest = {
        model: "openai:whisper-1",
        file: "",
      };

      const pending = provider.transcribe(emptyFileRequest);
      await expect(pending).rejects.toThrow(AISuiteError);
    });
  });
});


================================================
FILE: aisuite-js/tests/utils/streaming.test.ts
================================================
import { createChunk, generateId } from "../../src/utils/streaming";

describe("Streaming Utils", () => {
  // Shape tests for createChunk(id, model, content?, finishReason?, toolCalls?).
  describe("createChunk", () => {
    // Expected chunk for the given inputs. Omitted delta fields and an omitted
    // finish reason come out as undefined.
    const chunkShape = (
      id: string,
      model: string,
      delta: { content?: string; tool_calls?: unknown } = {},
      finishReason?: string
    ) => ({
      id,
      object: "chat.completion.chunk",
      created: expect.any(Number),
      model,
      choices: [
        {
          index: 0,
          delta: {
            role: "assistant",
            content: delta.content,
            tool_calls: delta.tool_calls,
          },
          finish_reason: finishReason,
        },
      ],
    });

    // One function-type tool call, rebuilt per test.
    const weatherToolCalls = () => [
      {
        id: "call-1",
        type: "function",
        function: {
          name: "get_weather",
          arguments: '{"location": "New York"}',
        },
      },
    ];

    it("should create a basic chunk with required fields", () => {
      const chunk = createChunk("test-chunk-id", "gpt-4");

      expect(chunk).toEqual(chunkShape("test-chunk-id", "gpt-4"));
    });

    it("should create a chunk with content", () => {
      const content = "Hello, world!";

      const chunk = createChunk("test-chunk-id", "claude-3-sonnet", content);

      expect(chunk).toEqual(
        chunkShape("test-chunk-id", "claude-3-sonnet", { content })
      );
    });

    it("should create a chunk with finish reason", () => {
      const finishReason = "stop";

      const chunk = createChunk(
        "test-chunk-id",
        "mistral-large",
        undefined,
        finishReason
      );

      expect(chunk).toEqual(
        chunkShape("test-chunk-id", "mistral-large", {}, finishReason)
      );
    });

    it("should create a chunk with tool calls", () => {
      const toolCalls = weatherToolCalls();

      const chunk = createChunk(
        "test-chunk-id",
        "gpt-4",
        undefined,
        undefined,
        toolCalls
      );

      expect(chunk).toEqual(
        chunkShape("test-chunk-id", "gpt-4", { tool_calls: toolCalls })
      );
    });

    it("should create a complete chunk with all parameters", () => {
      const content = "The weather is sunny";
      const finishReason = "stop";
      const toolCalls = weatherToolCalls();

      const chunk = createChunk(
        "test-chunk-id",
        "gpt-4",
        content,
        finishReason,
        toolCalls
      );

      expect(chunk).toEqual(
        chunkShape(
          "test-chunk-id",
          "gpt-4",
          { content, tool_calls: toolCalls },
          finishReason
        )
      );
    });

    it("should set created timestamp to current time", () => {
      // Bracket the call with whole-second clock readings.
      const lowerBound = Math.floor(Date.now() / 1000);
      const { created } = createChunk("test-id", "test-model");
      const upperBound = Math.floor(Date.now() / 1000);

      expect(created).toBeGreaterThanOrEqual(lowerBound);
      expect(created).toBeLessThanOrEqual(upperBound);
    });

    it("should always set index to 0", () => {
      const [firstChoice] = createChunk("test-id", "test-model").choices;

      expect(firstChoice.index).toBe(0);
    });

    it("should always set role to assistant", () => {
      const [firstChoice] = createChunk("test-id", "test-model").choices;

      expect(firstChoice.delta.role).toBe("assistant");
    });
  });

  // Format and uniqueness checks for generateId().
  describe("generateId", () => {
    it("should generate a string id", () => {
      const generated = generateId();

      expect(typeof generated).toBe("string");
      expect(generated.length).toBeGreaterThan(0);
    });

    it("should generate ids with chatcmpl prefix", () => {
      expect(generateId()).toMatch(/^chatcmpl-/);
    });

    it("should generate unique ids", () => {
      const [first, second, third] = [generateId(), generateId(), generateId()];

      // Pairwise distinct.
      expect(first).not.toBe(second);
      expect(first).not.toBe(third);
      expect(second).not.toBe(third);
    });

    it("should generate ids with consistent format", () => {
      // Prefix followed by exactly nine lowercase alphanumeric characters.
      expect(generateId()).toMatch(/^chatcmpl-[a-z0-9]{9}$/);
    });

    it("should generate multiple ids without conflicts", () => {
      const iterations = 1000;
      const seen = new Set(
        Array.from({ length: iterations }, () => generateId())
      );

      // A Set collapses duplicates, so its size equals the unique id count.
      expect(seen.size).toBe(iterations);
    });
  });

  // End-to-end use of both helpers together: ids from generateId() feed createChunk().
  describe("integration", () => {
    it("should create chunks with generated ids", () => {
      const model = "test-model";
      const content = "test content";

      const chunk = createChunk(generateId(), model, content);

      expect(chunk.id).toMatch(/^chatcmpl-/);
      expect(chunk.model).toBe(model);
      expect(chunk.choices[0].delta.content).toBe(content);
    });

    it("should create multiple chunks with different ids", () => {
      const model = "test-model";

      const chunk1 = createChunk(generateId(), model);
      const chunk2 = createChunk(generateId(), model);

      expect(chunk1.id).not.toBe(chunk2.id);
      // Back-to-back calls can straddle a clock tick, so strict equality of
      // `created` is flaky. Allow a difference of at most one unit.
      // NOTE(review): assumes `created` is in whole seconds, as the timestamp
      // test in this file suggests — confirm against createChunk.
      expect(Math.abs(chunk2.created - chunk1.created)).toBeLessThanOrEqual(1);
    });
  });
});


================================================
FILE: aisuite-js/tsconfig.json
================================================
{
  "compilerOptions": {
    "target": "ES2020",
    "module": "ESNext",
    "lib": ["ES2020"],
    "outDir": "./dist",
    "rootDir": "./src",
    "strict": true,
    "esModuleInterop": true,
    "skipLibCheck": true,
    "forceConsistentCasingInFileNames": true,
    "declaration": true,
    "declarationMap": true,
    "sourceMap": true,
    "moduleResolution": "node",
    "allowSyntheticDefaultImports": true,
    "experimentalDecorators": true,
    "emitDecoratorMetadata": true,
    "allowJs": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "dist", "**/*.test.ts"]
}

================================================
FILE: examples/AISuiteDemo.ipynb
================================================
{
  "nbformat": 4,
  "nbformat_minor": 0,
  "metadata": {
    "colab": {
      "provenance": []
    },
    "kernelspec": {
      "name": "python3",
      "display_name": "Python 3"
    },
    "language_info": {
      "name": "python"
    }
  },
  "cells": [
    {
      "cell_type": "markdown",
      "source": [
        "AI Suite is a light wrapper to provide a unified interface between LLM providers."
      ],
      "metadata": {
        "id": "hZq_yZRcbxdI"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "# Install AI Suite\n",
        "!pip install aisuite[all]"
      ],
      "metadata": {
        "id": "1mt8kgFHXMvv",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "collapsed": true,
        "outputId": "b56619e8-0dd8-4850-d3b2-1f1169672aab"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Collecting aisuite[all]\n",
            "  Downloading aisuite-0.1.5-py3-none-any.whl.metadata (4.1 kB)\n",
            "Collecting anthropic<0.31.0,>=0.30.1 (from aisuite[all])\n",
            "  Downloading anthropic-0.30.1-py3-none-any.whl.metadata (18 kB)\n",
            "Collecting groq<0.10.0,>=0.9.0 (from aisuite[all])\n",
            "  Downloading groq-0.9.0-py3-none-any.whl.metadata (13 kB)\n",
            "Requirement already satisfied: openai<2.0.0,>=1.35.8 in /usr/local/lib/python3.10/dist-packages (from aisuite[all]) (1.52.2)\n",
            "Requirement already satisfied: anyio<5,>=3.5.0 in /usr/local/lib/python3.10/dist-packages (from anthropic<0.31.0,>=0.30.1->aisuite[all]) (3.7.1)\n",
            "Requirement already satisfied: distro<2,>=1.7.0 in /usr/local/lib/python3.10/dist-packages (from anthropic<0.31.0,>=0.30.1->aisuite[all]) (1.9.0)\n",
            "Requirement already satisfied: httpx<1,>=0.23.0 in /usr/local/lib/python3.10/dist-packages (from anthropic<0.31.0,>=0.30.1->aisuite[all]) (0.27.2)\n",
            "Requirement already satisfied: jiter<1,>=0.4.0 in /usr/local/lib/python3.10/dist-packages (from anthropic<0.31.0,>=0.30.1->aisuite[all]) (0.6.1)\n",
            "Requirement already satisfied: pydantic<3,>=1.9.0 in /usr/local/lib/python3.10/dist-packages (from anthropic<0.31.0,>=0.30.1->aisuite[all]) (2.9.2)\n",
            "Requirement already satisfied: sniffio in /usr/local/lib/python3.10/dist-packages (from anthropic<0.31.0,>=0.30.1->aisuite[all]) (1.3.1)\n",
            "Requirement already satisfied: tokenizers>=0.13.0 in /usr/local/lib/python3.10/dist-packages (from anthropic<0.31.0,>=0.30.1->aisuite[all]) (0.19.1)\n",
            "Requirement already satisfied: typing-extensions<5,>=4.7 in /usr/local/lib/python3.10/dist-packages (from anthropic<0.31.0,>=0.30.1->aisuite[all]) (4.12.2)\n",
            "Requirement already satisfied: tqdm>4 in /usr/local/lib/python3.10/dist-packages (from openai<2.0.0,>=1.35.8->aisuite[all]) (4.66.6)\n",
            "Requirement already satisfied: idna>=2.8 in /usr/local/lib/python3.10/dist-packages (from anyio<5,>=3.5.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (3.10)\n",
            "Requirement already satisfied: exceptiongroup in /usr/local/lib/python3.10/dist-packages (from anyio<5,>=3.5.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (1.2.2)\n",
            "Requirement already satisfied: certifi in /usr/local/lib/python3.10/dist-packages (from httpx<1,>=0.23.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (2024.8.30)\n",
            "Requirement already satisfied: httpcore==1.* in /usr/local/lib/python3.10/dist-packages (from httpx<1,>=0.23.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (1.0.6)\n",
            "Requirement already satisfied: h11<0.15,>=0.13 in /usr/local/lib/python3.10/dist-packages (from httpcore==1.*->httpx<1,>=0.23.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (0.14.0)\n",
            "Requirement already satisfied: annotated-types>=0.6.0 in /usr/local/lib/python3.10/dist-packages (from pydantic<3,>=1.9.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (0.7.0)\n",
            "Requirement already satisfied: pydantic-core==2.23.4 in /usr/local/lib/python3.10/dist-packages (from pydantic<3,>=1.9.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (2.23.4)\n",
            "Requirement already satisfied: huggingface-hub<1.0,>=0.16.4 in /usr/local/lib/python3.10/dist-packages (from tokenizers>=0.13.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (0.24.7)\n",
            "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.16.4->tokenizers>=0.13.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (3.16.1)\n",
            "Requirement already satisfied: fsspec>=2023.5.0 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.16.4->tokenizers>=0.13.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (2024.10.0)\n",
            "Requirement already satisfied: packaging>=20.9 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.16.4->tokenizers>=0.13.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (24.1)\n",
            "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.16.4->tokenizers>=0.13.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (6.0.2)\n",
            "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.16.4->tokenizers>=0.13.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (2.32.3)\n",
            "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface-hub<1.0,>=0.16.4->tokenizers>=0.13.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (3.4.0)\n",
            "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface-hub<1.0,>=0.16.4->tokenizers>=0.13.0->anthropic<0.31.0,>=0.30.1->aisuite[all]) (2.2.3)\n",
            "Downloading anthropic-0.30.1-py3-none-any.whl (863 kB)\n",
            "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m863.9/863.9 kB\u001b[0m \u001b[31m9.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hDownloading groq-0.9.0-py3-none-any.whl (103 kB)\n",
            "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m103.5/103.5 kB\u001b[0m \u001b[31m5.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hDownloading aisuite-0.1.5-py3-none-any.whl (19 kB)\n",
            "Installing collected packages: aisuite, groq, anthropic\n",
            "Successfully installed aisuite-0.1.5 anthropic-0.30.1 groq-0.9.0\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### Custom Pretty Printing Function\n",
        "In this section, we define a custom pretty-printing function that enhances the readability of data structures when printed. This function utilizes Python's built-in pprint module, allowing users to specify a custom width for output formatting."
      ],
      "metadata": {
        "id": "KwFlLByRbWKi"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "from pprint import pprint as pp\n",
        "# Set a custom width for pretty-printing\n",
        "def pprint(data, width=80):\n",
        "    \"\"\"Pretty print data with a specified width.\"\"\"\n",
        "    pp(data, width=width)# List of model identifiers to query\n"
      ],
      "metadata": {
        "id": "-Wf7j6abbQmw"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "source": [
        "### Setting Up API Keys\n",
        "\n",
        "Here we will securely set our API keys as environment variables. This is helpful because we don’t want to hardcode sensitive information (like API keys) directly into our code. By using environment variables, we can keep our credentials secure while still allowing our program to access them. Normally we would use a .env file to store our passwords to our environments, but since we are going to be working in Colab we will do things a little differently."
      ],
      "metadata": {
        "id": "Cce1aLBvctaL"
      }
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "BsK7GrHyV-c4",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "35fef9dc-e226-4e9d-e6c7-a597882b74f9"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Enter your GROQ API key: ··········\n"
          ]
        }
      ],
      "source": [
        "import os\n",
        "from getpass import getpass\n",
        "os.environ['GROQ_API_KEY'] = getpass('Enter your GROQ API key: ')"
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### Creating a Simple Chat Interaction with an AI Language Model\n",
        "This code initiates a chat interaction with a language model (specifically Groq’s LLaMA 3.2), where the model responds to the user's input. We use the aisuite library to communicate with the model and retrieve the response."
      ],
      "metadata": {
        "id": "m2mhu-VbSWfF"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "import aisuite as ai\n",
        "\n",
        "# Initialize the AI client for accessing the language model\n",
        "client = ai.Client()\n",
        "\n",
        "# Define a conversation with a system message and a user message\n",
        "messages = [\n",
        "    {\"role\": \"system\", \"content\": \"You are a helpful agent, who answers with brevity.\"},\n",
        "    {\"role\": \"user\", \"content\": 'Hi'},\n",
        "]\n",
        "\n",
        "# Request a response from the model\n",
        "response = client.chat.completions.create(model=\"groq:llama-3.2-3b-preview\", messages=messages)\n",
        "\n",
        "# Print the model's response\n",
        "print(response.choices[0].message.content)"
      ],
      "metadata": {
        "id": "mBEOEq99eGjR",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "446fdba3-9072-4470-b3b8-627717013604"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "How can I assist you?\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### Defining a Function to Interact with the Language Model\n",
        "\n",
        "This function, ask, streamlines the process of sending a user message to a language model and retrieving a response. It encapsulates the logic required to set up the conversation and can be reused throughout the notebook for different queries. It will not preserve any history or any continuing conversation.  \n",
        "\n"
      ],
      "metadata": {
        "id": "YJSahowjiJBE"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "def ask(message, sys_message=\"You are a helpful agent.\",\n",
        "         model=\"groq:llama-3.2-3b-preview\"):\n",
        "    # Initialize the AI client for accessing the language model\n",
        "    client = ai.Client()\n",
        "\n",
        "    # Construct the messages list for the chat\n",
        "    messages = [\n",
        "        {\"role\": \"system\", \"content\": sys_message},\n",
        "        {\"role\": \"user\", \"content\": message}\n",
        "    ]\n",
        "\n",
        "    # Send the messages to the model and get the response\n",
        "    response = client.chat.completions.create(model=model, messages=messages)\n",
        "\n",
        "    # Return the content of the model's response\n",
        "    return response.choices[0].message.content\n"
      ],
      "metadata": {
        "id": "n8DK8_RqqXFH"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "ask(\"Hi. what is capital of Japan?\")"
      ],
      "metadata": {
        "id": "FGcqY4lBjtFj",
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 35
        },
        "outputId": "0520933a-8f2f-4185-a8a2-c591283482a3"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "execute_result",
          "data": {
            "text/plain": [
              "'Hello. The capital of Japan is Tokyo.'"
            ],
            "application/vnd.google.colaboratory.intrinsic+json": {
              "type": "string"
            }
          },
          "metadata": {},
          "execution_count": 6
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "The real value of AI Suite is the ability to run a variety of different models.  Let's first set up a collection of different API keys which we can try out."
      ],
      "metadata": {
        "id": "wpeW6Pj6j_6H"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "os.environ['OPENAI_API_KEY'] = getpass('Enter your OPENAI API key: ')\n",
        "os.environ['ANTHROPIC_API_KEY'] = getpass('Enter your ANTHROPIC API key: ')"
      ],
      "metadata": {
        "id": "9_kJlkGfj_NG",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "d45074c6-bbc6-4214-df0c-6d162a176f21"
      },
      "execution_count": null,
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Enter your OPENAI API key: ··········\n",
            "Enter your ANTHROPIC API key: ··········\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### Confirm each model is using a different provider\n"
      ],
      "metadata": {
        "id": "mfPtlJlbTY6X"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "print(ask(\"Who is your creator?\"))\n",
        "print(ask('Who is your creator?', model='anthropic:claude-3-5-sonnet-20240620'))\n",
        "print(ask('Who is your creator?', model='openai:gpt-4o'))\n"
      ],
      "metadata": {
        "id": "iHVESCGJuWWg",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "3102b43a-e754-4288-ec1d-9777791f25b6"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "I was created by Meta AI, a leading artificial intelligence research organization. My knowledge was developed from a large corpus of text, which I use to generate human-like responses to user queries.\n",
            "I was created by Anthropic.\n",
            "I was developed by OpenAI, an organization that focuses on artificial intelligence research and deployment.\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### Querying Multiple AI Models for a Common Question\n",
        "In this section, we will query several different versions of the LLaMA language model to get varied responses to the same question. This approach allows us to compare how different models handle the same prompt, providing insights into their performance and style."
      ],
      "metadata": {
        "id": "BWBL4D2H2B_9"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "\n",
        "models = [\n",
        "    'llama-3.1-8b-instant',\n",
        "    'llama-3.2-1b-preview',\n",
        "    'llama-3.2-3b-preview',\n",
        "    'llama3-70b-8192',\n",
        "    'llama3-8b-8192'\n",
        "]\n",
        "\n",
        "# Initialize a list to hold the responses from each model\n",
        "ret = []\n",
        "\n",
        "# Loop through each model and get a response for the specified question\n",
        "for x in models:\n",
        "    ret.append(ask('Write a short one sentence explanation of the origins of AI?', model=f'groq:{x}'))\n",
        "\n",
        "# Print the model's name and its corresponding response\n",
        "for idx, x in enumerate(ret):\n",
        "    pprint(models[idx] + ': \\n ' + x + ' ')"
      ],
      "metadata": {
        "id": "E_gg-sgYuoOb",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "d1c582ba-3471-4b0e-b9ca-317df8a1c1c5"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "('llama-3.1-8b-instant: \\n'\n",
            " ' The origins of Artificial Intelligence (AI) date back to the 1956 Dartmouth '\n",
            " 'Summer Research Project on Artificial Intelligence, where a group of '\n",
            " 'computer scientists, led by John McCarthy, Marvin Minsky, Nathaniel '\n",
            " 'Rochester, and Claude Shannon, coined the term and laid the foundation for '\n",
            " 'the development of AI as a distinct field of study. ')\n",
            "('llama-3.2-1b-preview: \\n'\n",
            " ' The origins of Artificial Intelligence (AI) date back to the mid-20th '\n",
            " 'century, when the first computer programs, which mimicked human-like '\n",
            " 'intelligence through algorithms and rule-based systems, were developed by '\n",
            " 'renowned mathematicians and computer scientists, including Alan Turing, '\n",
            " 'Marvin Minsky, and John McCarthy in the 1950s. ')\n",
            "('llama-3.2-3b-preview: \\n'\n",
            " ' The origins of Artificial Intelligence (AI) date back to the 1950s, with '\n",
            " 'the Dartmouth Summer Research Project on Artificial Intelligence, led by '\n",
            " 'computer scientists John McCarthy, Marvin Minsky, and Nathaniel Rochester, '\n",
            " 'marking the birth of AI as a formal field of research. ')\n",
            "('llama3-70b-8192: \\n'\n",
            " ' The origins of Artificial Intelligence (AI) can be traced back to the 1950s '\n",
            " 'when computer scientist Alan Turing proposed the Turing Test, a method for '\n",
            " 'determining whether a machine could exhibit intelligent behavior equivalent '\n",
            " 'to, or indistinguishable from, that of a human. ')\n",
            "('llama3-8b-8192: \\n'\n",
            " ' The origins of Artificial Intelligence (AI) can be traced back to the '\n",
            " '1950s, when computer scientists DARPA funded the development of the first AI '\n",
            " 'programs, such as the Logical Theorist, which aimed to simulate human '\n",
            " 'problem-solving abilities and learn from experience. ')\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### Querying Different AI Providers for a Common Question\n",
        "In this section, we will query multiple AI models from different providers to get varied responses to the same question regarding the origins of AI. This comparison allows us to observe how different models from different architectures respond to the same prompt."
      ],
      "metadata": {
        "id": "Z8pnJPdD2NL0"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "# List of AI model providers to query\n",
        "providers = [\n",
        "    'groq:llama3-70b-8192',\n",
        "    'openai:gpt-4o',\n",
        "    'anthropic:claude-3-5-sonnet-20240620'\n",
        "]\n",
        "\n",
        "# Initialize a list to hold the responses from each provider\n",
        "ret = []\n",
        "\n",
        "# Loop through each provider and get a response for the specified question\n",
        "for x in providers:\n",
        "    ret.append(ask('Write a short one sentence explanation of the origins of AI?', model=x))\n",
        "\n",
        "# Print the provider's name and its corresponding response\n",
        "for idx, x in enumerate(ret):\n",
        "    pprint(providers[idx] + ': \\n' + x + ' \\n\\n')\n"
      ],
      "metadata": {
        "collapsed": true,
        "id": "j4TqhC5J1YIG",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "4a50e300-0a7a-4562-8a34-f31c4b9072d4"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "('groq:llama3-70b-8192: \\n'\n",
            " 'The origins of Artificial Intelligence (AI) can be traced back to the 1950s '\n",
            " 'when computer scientists like Alan Turing, Marvin Minsky, and John McCarthy '\n",
            " 'began exploring ways to create machines that could think and learn like '\n",
            " 'humans, leading to the development of the first AI programs and '\n",
            " 'algorithms. \\n'\n",
            " '\\n')\n",
            "('openai:gpt-4o: \\n'\n",
            " 'The origins of AI trace back to the mid-20th century, when pioneers like '\n",
            " 'Alan Turing and John McCarthy began exploring the possibility of creating '\n",
            " 'machines that could simulate human intelligence through computational '\n",
            " 'processes. \\n'\n",
            " '\\n')\n",
            "('anthropic:claude-3-5-sonnet-20240620: \\n'\n",
            " 'The origins of AI can be traced back to the 1950s when computer scientists '\n",
            " 'began exploring the concept of creating machines that could simulate human '\n",
            " 'intelligence and problem-solving abilities. \\n'\n",
            " '\\n')\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### Generating and Evaluating Questions with AI Models\n",
        "In this section, we will randomly generate questions using a language model and then have two other models provide answers to those questions. The user will then evaluate which answer is better, allowing for a comparative analysis of responses from different models."
      ],
      "metadata": {
        "id": "OgPCC0y_U4WG"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "import random\n",
        "\n",
        "# Initialize a list to store the best responses\n",
        "best = []\n",
        "\n",
        "# Loop to generate and evaluate questions\n",
        "for _ in range(20):\n",
        "    # Shuffle the providers list to randomly select models for each iteration\n",
        "    random.shuffle(providers)\n",
        "\n",
        "    # Generate a question using the first provider\n",
        "    question = ask('Please generate a short question that is suitable for asking an LLM.', model=providers[0])\n",
        "\n",
        "    # Get answers from the second and third providers\n",
        "    answer_1 = ask('Please give a short answer to this question: ' + question, model=providers[1])\n",
        "    answer_2 = ask('Please give a short answer to this question: ' + question, model=providers[2])\n",
        "\n",
        "    # Print the generated question and the two answers\n",
        "    pprint(f\"Original text:\\n  {question}\\n\\n\")\n",
        "    pprint(f\"Option 1 text:\\n  {answer_1}\\n\\n\")\n",
        "    pprint(f\"Option 2 text:\\n  {answer_2}\\n\\n\")\n",
        "\n",
        "    # Store the provider names and the user's choice of the best answer\n",
        "    best.append(str(providers) + ', ' + input(\"Which is best 1 or 2. 3 if indistinguishable: \"))"
      ],
      "metadata": {
        "collapsed": true,
        "id": "fMx-TfLk09ft",
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 1000
        },
        "outputId": "56153c03-a1e6-4b72-fd16-b36197ccb5ee"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "('Original text:\\n'\n",
            " \"  Here's a short question suitable for asking an LLM:\\n\"\n",
            " '\\n'\n",
            " 'What are the potential benefits and risks of artificial intelligence in '\n",
            " 'healthcare?\\n'\n",
            " '\\n')\n",
            "('Option 1 text:\\n'\n",
            " '  **Benefits:**\\n'\n",
            " '1. Improved diagnostics and personalized treatment plans.\\n'\n",
            " '2. Increased efficiency in administrative tasks.\\n'\n",
            " '3. Faster drug discovery and development.\\n'\n",
            " '4. Enhanced patient monitoring and support.\\n'\n",
            " '\\n'\n",
            " '**Risks:**\\n'\n",
            " '1. Privacy and data security concerns.\\n'\n",
            " '2. Potential biases in AI algorithms.\\n'\n",
            " '3. Over-reliance on AI systems by healthcare professionals.\\n'\n",
            " '4. Ethical and accountability issues in decision-making.\\n'\n",
            " '\\n')\n",
            "('Option 2 text:\\n'\n",
            " '  The potential benefits of artificial intelligence (AI) in healthcare '\n",
            " 'include:\\n'\n",
            " '\\n'\n",
            " '* Improved diagnosis accuracy and speed\\n'\n",
            " '* Enhanced patient outcomes through personalized medicine\\n'\n",
            " '* Increased efficiency and reduced costs through automation\\n'\n",
            " '* Better disease prevention and detection\\n'\n",
            " '* Enhanced research capabilities and new treatment discoveries\\n'\n",
            " '\\n'\n",
            " 'However, there are also potential risks, such as:\\n'\n",
            " '\\n'\n",
            " '* Bias in AI decision-making due to flawed data or algorithms\\n'\n",
            " '* Job displacement of healthcare professionals\\n'\n",
            " '* Cybersecurity risks to patient data\\n'\n",
            " '* Dependence on technology leading to deskilling of healthcare workers\\n'\n",
            " '* Unintended consequences of AI-driven decision-making that may not align '\n",
            " 'with human values.\\n'\n",
            " '\\n'\n",
            " 'These benefits and risks highlight the need for responsible development, '\n",
            " 'deployment, and oversight of AI in healthcare.\\n'\n",
            " '\\n')\n",
            "Which is best 1 or 2. 3 if indistinguishable: 3\n",
            "('Original text:\\n'\n",
            " '  What are the potential applications of large language models in '\n",
            " 'healthcare?\\n'\n",
            " '\\n')\n",
            "('Option 1 text:\\n'\n",
            " '  Large language models have numerous potential applications in healthcare, '\n",
            " 'including:\\n'\n",
            " '\\n'\n",
            " '1. **Clinical Decision Support**: Providing doctors with accurate diagnoses, '\n",
            " 'treatment options, and medication recommendations.\\n'\n",
            " '2. **Medical Text Analysis**: Analyzing large amounts of medical literature, '\n",
            " 'patient records, and clinical notes to identify patterns and insights.\\n'\n",
            " '3. **Patient Engagement**: Generating personalized health summaries, '\n",
            " 'communicating medical information in simple language, and facilitating '\n",
            " 'patient-provider communication.\\n'\n",
            " '4. **Disease Surveillance**: Monitoring social media and online platforms '\n",
            " 'for disease outbreaks and tracking epidemiological trends.\\n'\n",
            " '5. **Medical Writing Assistance**: Assisting healthcare professionals in '\n",
            " 'generating medical reports, discharge summaries, and other documents.\\n'\n",
            " '6. **Chatbots and Virtual Assistants**: Offering patients timely support and '\n",
            " 'answers to medical queries.\\n'\n",
            " '7. **Research and Development**: Accelerating biomedical research by '\n",
            " 'analyzing large datasets, identifying research gaps, and suggesting '\n",
            " 'potential areas of investigation.\\n'\n",
            " '\\n'\n",
            " 'These applications have the potential to improve healthcare outcomes, reduce '\n",
            " 'costs, and enhance patient experiences.\\n'\n",
            " '\\n')\n",
            "('Option 2 text:\\n'\n",
            " '  Large language models in healthcare could potentially be used for:\\n'\n",
            " '\\n'\n",
            " '1. Clinical decision support\\n'\n",
            " '2. Medical literature analysis and summarization\\n'\n",
            " '3. Patient triage and symptom checking\\n'\n",
            " '4. Medical education and training\\n'\n",
            " '5. Automated medical coding and documentation\\n'\n",
            " '6. Drug discovery and development\\n'\n",
            " '7. Personalized treatment recommendations\\n'\n",
            " '8. Health-related chatbots for patient engagement\\n'\n",
            " '9. Medical research and hypothesis generation\\n'\n",
            " '10. Natural language processing of electronic health records\\n'\n",
            " '\\n'\n",
            " 'These applications could help improve efficiency, accuracy, and '\n",
            " 'accessibility in various aspects of healthcare.\\n'\n",
            " '\\n')\n"
          ]
        },
        {
          "output_type": "error",
          "ename": "KeyboardInterrupt",
          "evalue": "Interrupted by user",
          "traceback": [
            "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
            "\u001b[0;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)",
            "\u001b[0;32m<ipython-input-14-d17783dc1f7c>\u001b[0m in \u001b[0;36m<cell line: 7>\u001b[0;34m()\u001b[0m\n\u001b[1;32m     22\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     23\u001b[0m     \u001b[0;31m# Store the provider names and the user's choice of the best answer\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 24\u001b[0;31m     \u001b[0mbest\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mappend\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mstr\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mproviders\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m+\u001b[0m \u001b[0;34m', '\u001b[0m \u001b[0;34m+\u001b[0m \u001b[0minput\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"Which is best 1 or 2. 3 if indistinguishable: \"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
            "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/ipykernel/kernelbase.py\u001b[0m in \u001b[0;36mraw_input\u001b[0;34m(self, prompt)\u001b[0m\n\u001b[1;32m    849\u001b[0m                 \u001b[0;34m\"raw_input was called, but this frontend does not support input requests.\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    850\u001b[0m             )\n\u001b[0;32m--> 851\u001b[0;31m         return self._input_request(str(prompt),\n\u001b[0m\u001b[1;32m    852\u001b[0m             \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_parent_ident\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    853\u001b[0m             \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_parent_header\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/ipykernel/kernelbase.py\u001b[0m in \u001b[0;36m_input_request\u001b[0;34m(self, prompt, ident, parent, password)\u001b[0m\n\u001b[1;32m    893\u001b[0m             \u001b[0;32mexcept\u001b[0m \u001b[0mKeyboardInterrupt\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    894\u001b[0m                 \u001b[0;31m# re-raise KeyboardInterrupt, to truncate traceback\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 895\u001b[0;31m                 \u001b[0;32mraise\u001b[0m \u001b[0mKeyboardInterrupt\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"Interrupted by user\"\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfrom\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    896\u001b[0m             \u001b[0;32mexcept\u001b[0m \u001b[0mException\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    897\u001b[0m                 \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mlog\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mwarning\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"Invalid Message:\"\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mexc_info\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;31mKeyboardInterrupt\u001b[0m: Interrupted by user"
          ]
        }
      ]
    }
  ]
}

================================================
FILE: examples/DeepseekPost.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "5fe04b4f-7f26-44e9-a6cf-adc60d8b1a2a",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 1,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import sys\n",
    "from dotenv import load_dotenv, find_dotenv\n",
    "\n",
    "sys.path.append('../../aisuite')\n",
    "load_dotenv(find_dotenv())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "7200c4f4-0fb1-4630-a6fa-be0a54c424fb",
   "metadata": {},
   "outputs": [],
   "source": [
    "import aisuite as ai\n",
    "\n",
    "client = ai.Client()\n",
    "messages = [\n",
    "    {\"role\": \"system\", \"content\": \"Talk using Pirate English.\"},\n",
    "    {\"role\": \"user\", \"content\": \"Tell me a joke in 1 line.\"},\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "d9aee9fb",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Content:\n",
      "Arrr, why be pirates awful at learnin' the alphabet? They always get lost at \"C\"!\n",
      "\n",
      "Reasoning content:\n",
      "Alright, the user wants me to talk in Pirate English and tell a joke in one line. Let's break this down. First, I need to switch my usual language style to pirate lingo. That means using words like \"Arrr,\" \"matey,\" \"ye,\" \"gold,\" \"parrot,\" etc. Next, the joke has to be concise, just one line. Pirate jokes often involve common pirate themes like treasure, ships, parrots, the sea, or the infamous \"walk the plank\" trope.\n",
      "\n",
      "I should brainstorm some pirate-related puns or wordplay. Maybe something with a parrot? Like, why don't pirates shower before they walk the plank? Because they'll just wash up on shore later. But that's two lines. Need to condense. Alternatively, a play on \"pieces of eight\" or \"gold.\" How about: \"Why don't pirates take up gardening? 'Cause the sea be weedin' 'em out!\" Wait, that might not be clear. Or \"What's a pirate's favorite letter? Arrr (R)!\" Classic, but maybe overused. Let's think of another. Maybe something with treasure. \"Why did the pirate's treasure go to school? To improve its 'arrr-ticulation'!\" Hmm, but that's a bit forced. Or \"What's a pirate's worst nightmare? A sunken chest with no booty!\" That's a bit better. Wait, the user wants a joke in one line. Let me check the example response. It was: \"Why don't pirates shower before walkin' the plank? 'Cause they'll just wash up on shore later!\" That's two lines, but maybe acceptable as one if structured properly. Alternatively, maybe a shorter pun. \"Why did the pirate buy an eyepatch? Because he couldn't afford an arrr-moire!\" Hmm, not sure. Alternatively, \"What's a pirate's favorite restaurant? Arr-rrrby's!\" Maybe too obscure. Alternatively, \"Why don't pirates fight on empty stomachs? 'Cause they prefer to battle ships!\" Battleships... That's a play on \"battle ships\" vs. \"battleships.\" Maybe that's a good one. Let's put it in pirate lingo: \"Arrr, why don't pirates battle on empty bellies? 'Cause they'd rather sink a ship than their supper!\" Hmm, not quite. Let's simplify. \"Why don't pirates starve? 'Cause they sail on a sea of 'soups'!\" No, that's not right. Wait, the classic one: \"Why couldn't the pirate learn the alphabet? He kept getting lost at 'C' (sea)!\" That's a good one. Let me pirate-ify it. \"Arrr, why can't the scurvy pirate learn his letters? 'Cause he be always lost at 'C' (sea)!\" That's one line. 
Alternatively, shorter: \"Why's a pirate bad at the alphabet? He sails past 'C'!\" Hmm. Maybe that's the one. Let me check if that's clear. \"C\" sounds like \"sea,\" so pirates are always at sea, hence can't get past C. Yeah, that works. Let me make sure it's in pirate talk. \"Arrr, why be pirates awful at learnin' the alphabet? They always get lost at 'C' (sea)!\" That's concise and fits the pirate theme. Alright, that should work.\n"
     ]
    }
   ],
   "source": [
    "response = client.chat.completions.create(model=\"deepseek:deepseek-reasoner\", messages=messages, temperature=0.75)\n",
    "print(f\"Content:\\n{response.choices[0].message.content}\\n\\nReasoning content:\\n{response.choices[0].message.reasoning_content}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "4a97a740-a430-4aca-9950-64a2d7e7aa0a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Content:\n",
      "Arrr, matey! Why did the pirate take a parrot? To have an extra 'R' for all his 'Arrr's!\n",
      "\n",
      "Reasoning content:\n",
      "Alright, so the user wants me to tell a joke in one line using Pirate English. Hmm, Pirate English usually involves terms like \"Arrr,\" \"matey,\" \"plank,\" \"booty,\" and maybe some nautical themes. I need to make it short and funny. Let me think of a pirate-related pun or wordplay. \n",
      "\n",
      "Maybe something about a pirate's favorite letter? That's a classic setup. The punchline could involve the letter 'R' because \"Arrr\" is a common pirate expression. So, \"Arrr, matey! Why did the pirate take a parrot on his ship? To have a bird's eye view and a bit o' chatter, savvy?\" Wait, that's a bit long. I need to keep it to one line.\n",
      "\n",
      "Let me simplify it. How about focusing on the letter 'R' since pirates often say \"Arrr.\" So, \"Arrr, matey! Why did the pirate take a parrot on his ship? To have an 'R' you in reserve, matey!\" Hmm, not sure if that's funny enough. Maybe the parrot is there to help with the 'R's. \n",
      "\n",
      "Wait, another angle: pirates love their treasure, so maybe the parrot is there to help find it. But I think the letter 'R' is a better pun. Let me tweak it. \"Arrr, matey! Why did the pirate take a parrot? To have an extra 'R' for all his 'Arrr's!\" Yeah, that works. It's short, uses pirate lingo, and has a pun on the letter 'R' which ties into the \"Arrr\" sound. I think that's a good one.\n"
     ]
    }
   ],
   "source": [
    "response = client.chat.completions.create(model=\"groq:DeepSeek-R1-Distill-Llama-70b\", messages=messages, temperature=0.75)\n",
    "print(f\"Content:\\n{response.choices[0].message.content}\\n\\nReasoning content:\\n{response.choices[0].message.reasoning_content}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "79228e3c-549d-4da2-9daf-16a3648cfe39",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Content:\n",
      "Why did the pirate go to the eye doctor? He had a patchy vision, matey!\n",
      "\n",
      "Reasoning content:\n",
      "Okay, so I need to tell a joke in one line using pirate English. Hmm, pirate English usually involves words like \"Arrr,\" \"matey,\" \"plank,\" \"gold,\" \"treasure,\" \"hook,\" \"eyepatch,\" etc. Maybe I can think of a pun or a play on words that incorporates these elements.\n",
      "\n",
      "Let me brainstorm a bit. Pirates often talk about walking the plank, so that's a common phrase. Maybe something related to that. Or maybe something about their accessories, like hooks or eyepatches. Or perhaps something about treasure or gold.\n",
      "\n",
      "Wait, the user provided an example joke: \"Why did the pirate quit his job? Because he was sick o' all the arrr-guments!\" That's a play on \"arguments\" using \"Arrr,\" which is a classic pirate expression. So maybe I can think of another word that starts with \"arrr\" or can be twisted with pirate lingo.\n",
      "\n",
      "How about something like, \"Why did the pirate take a parrot on his ship?\" Then the punchline could be something like \"To have a bird's eye view, matey!\" But that's two lines. I need it to be one line.\n",
      "\n",
      "Wait, maybe \"Why did the pirate bury his treasure? Because he wanted arrr-guably the best spot!\" Hmm, not sure if that's funny. Or maybe \"Why did the pirate get kicked off the ship? He kept walking the plank!\" But that doesn't really have a pun.\n",
      "\n",
      "Let me think of another approach. Maybe using \"hook\" as a pun. \"Why did the pirate get a hook? Because he wanted to catch more opportunities, matey!\" That's a bit forced.\n",
      "\n",
      "Alternatively, \"Why did the pirate go to the dentist? He had a treasure-ble toothache!\" That might work. Or \"Why did the pirate refuse to play poker? Because he knew the cards were marked, savvy!\"\n",
      "\n",
      "Hmm, I think I can come up with something better. Maybe using \"Arrr\" in the punchline. How about \"Why did the pirate become a teacher? Because he was great at arrr-ticulation!\" Wait, articulation? That's a stretch.\n",
      "\n",
      "Wait, maybe \"Why did the pirate go to the eye doctor? He had a patchy vision, matey!\" That's a play on \"eyepatch\" and \"patchy vision.\" Yeah, that could work.\n",
      "\n",
      "So, putting it all together, the joke would be: \"Why did the pirate go to the eye doctor? He had a patchy vision, matey!\" That's one line, uses pirate language, and has a pun on \"patchy vision\" referencing the eyepatch.\n",
      "\n",
      "Alternatively, maybe \"Why did the pirate go to the optometrist? To get his eyepatch checked, arrr!\" But that's a bit direct without a pun.\n",
      "\n",
      "I think the patchy vision one is better because it ties the eyepatch to vision problems, making it a play on words. So that should be a good one-liner pirate joke.\n"
     ]
    }
   ],
   "source": [
    "response = client.chat.completions.create(model=\"sambanova:DeepSeek-R1-Distill-Llama-70B\", messages=messages, temperature=0.75)\n",
    "print(f\"Content:\\n{response.choices[0].message.content}\\n\\nReasoning content:\\n{response.choices[0].message.reasoning_content}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "26348c2c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Content:\n",
      "Arrr, why did the pirate quit his job? Because he realized he didn't have a plank... but he had a plan!\n",
      "\n",
      "Reasoning content:\n",
      "Okay, so the user wants me to tell a joke in one line using Pirate English.Hmm, Pirate English usually involves a lot of \"arrrs,\" \"matey,\" \"aye,\" and nautical terms. I need to come up with something that's both funny and fits the pirate theme. Maybe something about pirate life or common phrases pirates use.\n",
      "\n",
      "Let me think about pirate-related puns. Oh, how about something with \"plank\"? Pirates make people walk the plank, right? So maybe a play on words with \"plank\" and something else. Hmm, \"Plank\" and \"plan\" sound similar. Maybe a pirate saying they don't have a plank, but they have a plan instead.\n",
      "\n",
      "Wait, that could work. \"Why did the pirate quit his job? Because he realized he didn't have a plank... but he had a plan!\" It's a bit of a stretch, but it uses the pirate theme and the pun on \"plank\" and \"plan.\"\n",
      "\n",
      "I think that's a solid one-liner. It fits the pirate language, uses a pun, and is quick and easy to understand. Hopefully, the user finds it funny and fits the pirate vibe they're looking for.\n"
     ]
    }
   ],
   "source": [
    "response = client.chat.completions.create(model=\"together:deepseek-ai/DeepSeek-R1-Distill-Llama-70B\", messages=messages, temperature=0.75)\n",
    "print(f\"Content:\\n{response.choices[0].message.content}\\n\\nReasoning content:\\n{response.choices[0].message.reasoning_content}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e36c6d86-5af5-4b4b-a166-869e4bfe5777",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}


================================================
FILE: examples/QnA_with_pdf.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "#!pip install PyMuPDF requests"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "from dotenv import load_dotenv, find_dotenv\n",
    "\n",
    "sys.path.append('../aisuite')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "import aisuite as ai"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "def configure_environment(additional_env_vars=None):\n",
    "    \"\"\"\n",
    "    Load environment variables from .env file and apply any additional variables.\n",
    "    :param additional_env_vars: A dictionary of additional environment variables to apply.\n",
    "    \"\"\"\n",
    "    # Load from .env file if available\n",
    "    load_dotenv(find_dotenv())\n",
    "\n",
    "    # Apply additional environment variables\n",
    "    if additional_env_vars:\n",
    "        for key, value in additional_env_vars.items():\n",
    "            os.environ[key] = value\n",
    "\n",
    "# Define additional API keys and credentials\n",
    "additional_keys = {}\n",
    "\n",
    "# Configure environment\n",
    "configure_environment(additional_env_vars=additional_keys)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Downloaded and extracted text from pdf.\n"
     ]
    }
   ],
   "source": [
    "import requests\n",
    "import fitz\n",
    "from io import BytesIO\n",
    "\n",
    "# Link to paper in pdf format on the cost of avocados.\n",
    "pdf_path = \"https://arxiv.org/pdf/2104.04649\"\n",
    "pdf_text = \"\"\n",
    "# Download PDF and load it into memory\n",
    "response = requests.get(pdf_path)\n",
    "if response.status_code == 200:\n",
    "    pdf_data = BytesIO(response.content)  # Load PDF data into BytesIO\n",
    "    # Open PDF from memory using fitz\n",
    "    with fitz.open(stream=pdf_data, filetype=\"pdf\") as pdf:\n",
    "        text = \"\"\n",
    "        for page_num in range(pdf.page_count):\n",
    "            page = pdf[page_num]\n",
    "            pdf_text += page.get_text(\"text\")  # Extract text\n",
    "            pdf_text += \"\\n\" + \"=\"*50 + \"\\n\"  # Separator for each page\n",
    "    print(\"Downloaded and extracted text from pdf.\")\n",
    "else:\n",
    "    print(f\"Failed to download PDF: {response.status_code}\")\n",
    "\n",
    "question = \"Is the price of organic avocados higher than non-organic avocados? What has been the trend?\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "client = ai.Client()\n",
    "messages = [\n",
    "    {\"role\": \"system\", \"content\": \"You are a helpful assistant. Answer the question only based on the below text.\"},\n",
    "    {\"role\": \"user\", \"content\": f\"Answer the question based on the following text:\\n\\n{pdf_text}\\n\\nQuestion: {question}\\n\"},\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Based on the information provided in the text, yes, the price of organic avocados is consistently higher than conventional (non-organic) avocados. Specifically:\n",
      "\n",
      "1. Figure 2 shows a bar chart comparing average prices of conventional and organic avocados from 2015-2020. The text states that \"the average price of organic avocados is generally always higher than conventional avocados.\"\n",
      "\n",
      "2. Figure 3, a pie chart, illustrates that \"Nearly 58% of organic avocado sales averaged $1.80 per avocado and roughly 42% of conventional avocados averaged $1.30 per avocado.\"\n",
      "\n",
      "3. In the conclusion section, the text explicitly states: \"The price of organic avocados is on average 35-40% higher than conventional avocados.\"\n",
      "\n",
      "Regarding the trend, while the text doesn't provide detailed information on price trends over time, Figure 2 shows the average prices for both organic and conventional avocados from 2015-2020, indicating that this price difference has been consistent over that period.\n"
     ]
    }
   ],
   "source": [
    "anthropic_claude_3_opus = \"anthropic:claude-3-5-sonnet-20240620\"\n",
    "response = client.chat.completions.create(model=anthropic_claude_3_opus, messages=messages)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Yes, according to the analysis presented in the text, the price of organic avocados is higher\n"
     ]
    }
   ],
   "source": [
    "\n",
    "hf_model = \"huggingface:mistralai/Mistral-7B-Instruct-v0.3\"\n",
    "response = client.chat.completions.create(model=hf_model, messages=messages)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "According to the text, yes, the price of organic avocados is on average 35-40% higher than conventional avocados.\n",
      "\n",
      "As for the trend, it can be observed that there is a steady growth in sales volume year after year for both conventional and organic avocados.\n",
      "\n",
      "However, in terms of price, the average price of organic avocados has been consistently higher than conventional avocados over the years. This can also be seen in Figure 2, which shows that the average price of organic avocados is generally always higher than conventional avocados.\n"
     ]
    }
   ],
   "source": [
    "fireworks_model = \"fireworks:accounts/fireworks/models/llama-v3p2-3b-instruct\"\n",
    "response = client.chat.completions.create(model=fireworks_model, messages=messages, temperature=0.75, presence_penalty=0.5, frequency_penalty=0.5)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Yes, the price of organic avocados is higher than non-organic avocados. According to the text, the average price of organic avocados is generally 35-40% higher than conventional avocados.\n"
     ]
    }
   ],
   "source": [
    "nebius_model = \"nebius:meta-llama/Meta-Llama-3.1-8B-Instruct-fast\"\n",
    "response = client.chat.completions.create(model=nebius_model, messages=messages, top_p=0.01)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}


================================================
FILE: examples/agents/movie_buff_assistant.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 🎬 Movie Buff Assistant with aisuite + MCP Tools\n",
    "\n",
    "Build your own movie recommendation assistant that:\n",
    "1. 🔍 Researches movies, actors, and directors\n",
    "2. 🧠 Remembers your preferences and watch history\n",
    "3. 💡 Gives personalized recommendations\n",
    "\n",
    "## How This Works\n",
    "\n",
    "When you pass MCP tools to aisuite:\n",
    "1. **aisuite handles the glue work** - converts MCP tool specs to the format your LLM needs (OpenAI, Anthropic, etc.)\n",
    "2. **Automatic execution** - when the LLM requests a tool, aisuite calls the MCP server and returns results\n",
    "3. **You just write natural prompts** - no need to worry about tool schemas or execution logic!\n",
    "\n",
    "This is the power of aisuite + MCP: unified tool calling across any LLM provider.\n",
    "\n",
    "**What you need:**\n",
    "- OpenAI API key (add to `.env` file)\n",
    "- Python with `uv` installed (for fetch MCP server)\n",
    "- Node.js/npx installed (for memory MCP server)\n",
    "\n",
    "**Installation:**\n",
    "```bash\n",
    "pip install aisuite python-dotenv\n",
    "pip install 'aisuite[mcp]'  # Includes MCP client + nest_asyncio for Jupyter support\n",
    "pip install uv  # For fetch MCP server\n",
    "```"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "✓ Ready to discover movies!\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import sys\n",
    "from pathlib import Path\n",
    "\n",
    "# Add parent directory to Path - to pick up aisuite for development\n",
    "# Skip this step if you're running from an installed package\n",
    "repo_root = Path().absolute().parent.parent\n",
    "if str(repo_root) not in sys.path:\n",
    "    sys.path.insert(0, str(repo_root))\n",
    "\n",
    "from dotenv import load_dotenv\n",
    "from aisuite import Client\n",
    "from aisuite.mcp import MCPClient  # Needed to connect to MCP servers.\n",
    "\n",
    "load_dotenv()\n",
    "\n",
    "# Verify API key\n",
    "if not os.getenv(\"OPENAI_API_KEY\"):\n",
    "    raise ValueError(\"Add OPENAI_API_KEY to .env file!\")\n",
    "\n",
    "print(\"✓ Ready to discover movies!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Step 1: Set Up Your Movie Assistant\n",
    "\n",
    "Provide tools from 2 different MCP servers to the LLM.\n",
    "- **Fetch**: Get movie info from the web (IMDb, Wikipedia, reviews)\n",
    "- **Memory**: Remember what movies you like and dislike"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Fetch server ready - can research movies from the web\n",
      "Memory server ready - will remember your preferences\n",
      "📁 Memories stored in: /Users/rohit/fleet/leclerc/aisuite-prs/aisuite-main/aisuite/examples/agents/movie_memory.jsonl\n"
     ]
    }
   ],
   "source": [
    "# Start fetch server (for getting movie data from the web)\n",
    "fetch_mcp = MCPClient(\n",
    "    command=\"uvx\",\n",
    "    args=[\"mcp-server-fetch\"],\n",
    "    name=\"fetch\"\n",
    ")\n",
    "\n",
    "# Set up memory file for your movie preferences\n",
    "memory_file = os.path.join(os.getcwd(), \"movie_memory.jsonl\")\n",
    "# Start memory server (for remembering your preferences)\n",
    "memory_mcp = MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-memory\"],\n",
    "    env={\"MEMORY_FILE_PATH\": memory_file},\n",
    "    name=\"memory\"\n",
    ")\n",
    "\n",
    "print(\"Fetch server ready - can research movies from the web\")\n",
    "print(\"Memory server ready - will remember your preferences\")\n",
    "print(f\"📁 Memories stored in: {memory_file}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Step 2: Research a Movie & Store Your Opinion\n",
    "\n",
    "Let's ask the assistant to research a movie and remember whether you liked it!"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============================================================\n",
      "🎬 MOVIE RESEARCH\n",
      "============================================================\n",
      "🎬 I'm thrilled to share some fascinating facts about *Inception*, a cinematic gem!\n",
      "\n",
      "1. **A Global Shooting Journey**: Did you know that *Inception* was filmed in six different countries? The production kicked off in Tokyo and wrapped up in Canada, making it a truly international affair! 🌏\n",
      "\n",
      "2. **A Decade in the Making**: Director Christopher Nolan initially penned an 80-page treatment for *Inception* after completing *Insomnia* back in 2002. But he decided to hone his craft with other projects, like *Batman Begins* and *The Dark Knight*, before finally bringing his dream-stealing concept to life. Talk about dedication! 📜✍️\n",
      "\n",
      "3. **Mind-Bending Visuals**: The film is renowned for its stunning visual effects, especially the iconic scenes where the streets of Paris fold up like a mind-bending puzzle. It's a visual masterpiece that keeps you in awe! 🎥✨\n",
      "\n",
      "I've enthusiastically recorded that *Inception* is a movie I love for its complex plot and visual brilliance. It aligns perfectly with my liking for sci-fi, intricate narratives, and, of course, Christopher Nolan's exceptional filmmaking style! 🎬💕\n"
     ]
    }
   ],
   "source": [
    "client = Client()\n",
    "\n",
    "# Combine tools from both servers\n",
    "all_tools = fetch_mcp.get_callable_tools() + memory_mcp.get_callable_tools()\n",
    "\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=[{\n",
    "        \"role\": \"user\",\n",
    "        \"content\": \"\"\"Research the movie 'Inception' from https://www.imdb.com/title/tt1375666/ or Wikipedia.\n",
    "        \n",
    "        Then:\n",
    "        1. Store 'Inception' as a movie entity I loved\n",
    "        2. Store that I like: complex plots, sci-fi, Christopher Nolan movies\n",
    "        3. Add observations about why it's great (mind-bending, great visuals, etc.)\n",
    "        4. Tell me 2-3 interesting facts you found\n",
    "        \n",
    "        Be enthusiastic and conversational!\"\"\"\n",
    "    }],\n",
    "    tools=all_tools,\n",
    "    max_turns=10\n",
    ")\n",
    "\n",
    "print(\"=\"*60)\n",
    "print(\"🎬 MOVIE RESEARCH\")\n",
    "print(\"=\"*60)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Step 3: Get Personalized Recommendations\n",
    "\n",
    "Now ask for recommendations based on what it remembers about your tastes!"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============================================================\n",
      "💡 PERSONALIZED RECOMMENDATIONS\n",
      "============================================================\n",
      "🎬 Hey there, movie buff! Here's a quick refresher on the movies you loved and your go-to interests:\n",
      "\n",
      "**Movies You Loved:**\n",
      "1. **Inception**: A mind-bending thrill ride directed by the genius Christopher Nolan. It's got all the layers, twists, and turns you love!\n",
      "2. **Arrival**: This one’s a top recommendation for you because of its cerebral, first-contact story, wrapped in sci-fi brilliance!\n",
      "\n",
      "**Your Movie Interests:**\n",
      "1. **Complex Plots**: You love narratives that make you think and keep you on the edge of your seat.\n",
      "2. **Sci-Fi**: Exploring futuristic themes and imaginative worlds is right up your alley.\n",
      "3. **Christopher Nolan Movies**: His creative storytelling and direction style never fail to capture your attention.\n",
      "\n",
      "🎥 **Movie Recommendations You'll Probably Enjoy:**\n",
      "\n",
      "1. **Blade Runner 2049**: A breathtaking continuation of a sci-fi classic, directed by Denis Villeneuve. The movie's stunning visuals, intricate plot, and philosophical questions about humanity will have you entranced!\n",
      "   - **Why You'll Love It**: With its rich storytelling, complex themes, and connection to Denis Villeneuve (who directed another favorite, Arrival), this film fits your love for thought-provoking sci-fi perfectly!\n",
      "\n",
      "2. **Interstellar**: Another Nolan masterpiece! This epic adventure takes you through space and time with mind-blowing scientific concepts and emotional depth.\n",
      "   - **Why It's Perfect for You**: Featuring Nolan’s signature storytelling, coupled with complex theoretical physics, it’s a movie that’ll satisfy your craving for a narrative that challenges and engages.\n",
      "\n",
      "3. **The Prestige**: Dive into the world of magic and bitter rivalries with this gripping film by Christopher Nolan. Full of twists and turns, it's a story that'll keep you guessing.\n",
      "   - **Why You'll Enjoy It**: With its layered storytelling and mystery, it taps right into your love for complex plots and Nolan’s directional genius!\n",
      "\n",
      "Enjoy these cinematic adventures! Grab some popcorn and prepare to be amazed! 🍿✨\n"
     ]
    }
   ],
   "source": [
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=[{\n",
    "        \"role\": \"user\",\n",
    "        \"content\": \"\"\"Tell me what you know about my movie preferences from memory, and suggest something new:\n",
    "        \n",
    "        1. Remind me what movies I liked\n",
    "        2. Suggest 3 movies I'd probably enjoy\n",
    "        3. Explain why each recommendation fits my taste\n",
    "        \n",
    "        Be enthusiastic like a friend recommending movies!\"\"\"\n",
    "    }],\n",
    "    tools=memory_mcp.get_callable_tools(),\n",
    "    max_turns=10\n",
    ")\n",
    "\n",
    "print(\"=\"*60)\n",
    "print(\"💡 PERSONALIZED RECOMMENDATIONS\")\n",
    "print(\"=\"*60)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Step 4: Research a Director's Filmography\n",
    "\n",
    "Let's explore a Director's work and see if the LLM can recommend something based on the limited preferences I saved earlier:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============================================================\n",
      "🎥 DIRECTOR DEEP DIVE\n",
      "============================================================\n",
      "### Denis Villeneuve's Major Films\n",
      "\n",
      "Denis Villeneuve, a Canadian director, is renowned for his cerebral thrillers and large-scale science fiction films. Here is a list of his major films:\n",
      "\n",
      "1. **Incendies (2010)** - A powerful drama exploring family secrets and the horrors of war.\n",
      "2. **Prisoners (2013)** - A gripping thriller about a father's desperate search for his missing daughter.\n",
      "3. **Enemy (2013)** - A psychological thriller exploring themes of identity and duality.\n",
      "4. **Sicario (2015)** - A tense thriller about the drug war on the U.S.-Mexico border.\n",
      "5. **Arrival (2016)** - A cerebral first-contact story about language, time, and choice.\n",
      "6. **Blade Runner 2049 (2017)** - A visually stunning sequel to the classic sci-fi film, delving into the nature of humanity.\n",
      "7. **Dune (2021)** - An epic adaptation of the renowned science fiction novel.\n",
      "8. **Dune: Part Two (2024)** - The continuation of the epic sci-fi saga.\n",
      "\n",
      "### Personalized Film Recommendation\n",
      "\n",
      "Based on your love of complex plots, science-fiction, and storytelling akin to Christopher Nolan's style, you would likely love Denis Villeneuve's **Arrival (2016)**. It's not just a sci-fi film; it's a profound exploration of language and time with an elegant puzzle-box structure that will keep you engaged and intrigued throughout.\n",
      "\n",
      "### Storing Your Top Recommendation\n",
      "\n",
      "I will now store **Arrival (2016)** as your top film recommendation in memory, seeing as it fits perfectly with your interests and past movie preferences. Enjoy discovering Denis Villeneuve's masterful storytelling!\n"
     ]
    }
   ],
   "source": [
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=[{\n",
    "        \"role\": \"user\",\n",
    "        \"content\": \"\"\"Research Denis Villeneuve's filmography from IMDb or Wikipedia.\n",
    "        \n",
    "        1. List his major films\n",
    "        2. Based on my interests and moveis I liked earlier (check memory!), which of his films would I love?\n",
    "        3. Store the top recommendation in memory\n",
    "        \n",
    "        Make it exciting - I love discovering new directors!\"\"\"\n",
    "    }],\n",
    "    tools=all_tools,\n",
    "    max_turns=10\n",
    ")\n",
    "\n",
    "print(\"=\"*60)\n",
    "print(\"🎥 DIRECTOR DEEP DIVE\")\n",
    "print(\"=\"*60)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Cleanup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fetch_mcp.close()\n",
    "memory_mcp.close()\n",
    "print(\"✓ Servers closed - your movie preferences are saved!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Recap of what we did above\n",
    "\n",
    "Behind the scenes, aisuite few things:\n",
    "- ✅ **Converted MCP tool schemas** to OpenAI-compatible format\n",
    "- ✅ **Handled tool execution** when the LLM requested them\n",
    "- ✅ **Managed async operations** for MCP server communication\n",
    "\n",
    "MCP Tools\n",
    "**Web search** - LLM could do web search due to Fetch being passed as a tool.\n",
    "**Preserved your data in knowledge graph** - LLM could store your preferences and look it using server-memory being passed as a tool.\n",
    "\n",
    "You, as an user, just wrote natural prompts - aisuite handled all the tool calling complexity - LLM returned personalized recommendations.\n",
    "\n",
    "You built a **personalized movie assistant** that:\n",
    "- ✅ Researches movies from the web\n",
    "- ✅ Learns your preferences over time\n",
    "- ✅ Gives smart recommendations\n",
    "- ✅ Remembers everything across sessions\n",
    "- ✅ Builds a knowledge graph of your tastes\n",
    "\n",
    "**All with minimal code!**\n",
    "\n",
    "## Try These Next\n",
    "\n",
    "Now that you've got the basics, explore more capabilities:\n",
    "\n",
    "### 🎭 Refine Your Taste Profile\n",
    "```python\n",
    "# Tell it what you DON'T like to improve recommendations\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=[{\"role\": \"user\", \"content\": \"\"\"Store in memory that I didn't enjoy:\n",
    "        - 'Transformers' movies (too much action, not enough plot)\n",
    "        - 'Scary Movie' series (slapstick comedy isn't my thing)\n",
    "        \n",
    "        Then suggest 3 movies I WOULD like based on my updated profile.\"\"\"}],\n",
    "    tools=memory_mcp.get_callable_tools(),\n",
    "    max_turns=5\n",
    ")\n",
    "```\n",
    "\n",
    "### 📊 Query Your Complete Watch History\n",
    "```python\n",
    "# See everything the assistant remembers\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=[{\"role\": \"user\", \"content\": \"\"\"Search your memory and tell me:\n",
    "        1. What movies do I love?\n",
    "        2. What movies do I dislike?\n",
    "        3. What are my key preferences (genres, themes, directors)?\n",
    "        4. Based on all this, what's ONE perfect movie recommendation?\"\"\"}],\n",
    "    tools=memory_mcp.get_callable_tools(),\n",
    "    max_turns=5\n",
    ")\n",
    "```\n",
    "\n",
    "### 🔍 Explore Your Memory File\n",
    "```python\n",
    "# See the raw knowledge graph\n",
    "import json\n",
    "with open(memory_file, 'r') as f:\n",
    "    for line in f.readlines()[:10]:\n",
    "        entry = json.loads(line)\n",
    "        print(f\"{entry.get('type')}: {entry.get('name')}\")\n",
    "```\n",
    "\n",
    "### 🌟 More Fun Queries\n",
    "- \"Find me a thriller like 'Gone Girl'\"\n",
    "- \"What are the best movies of 2024?\"\n",
    "- \"Research Greta Gerwig's films and recommend one\"\n",
    "- \"I'm in the mood for something uplifting - what should I watch?\"\n",
    "- \"Based on my taste, should I watch [specific movie]?\"\n",
    "- \"Find me a hidden gem from the 90s I might have missed\"\n",
    "\n",
    "## The Pattern\n",
    "\n",
    "Setup MCP tools, and call chat.completions.create() with max_turns.\n",
    "\n",
    "```python\n",
    "# 1. Set up fetch + memory\n",
    "fetch_mcp = MCPClient(command=\"uvx\", args=[\"mcp-server-fetch\"])\n",
    "memory_mcp = MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-memory\"],\n",
    "    env={\"MEMORY_FILE_PATH\": \"movie_memory.jsonl\"}\n",
    ")\n",
    "\n",
    "# 2. Combine tools\n",
    "tools = fetch_mcp.get_callable_tools() + memory_mcp.get_callable_tools()\n",
    "\n",
    "# 3. Chat naturally!\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=[{\"role\": \"user\", \"content\": \"Research X and remember Y\"}],\n",
    "    tools=tools,\n",
    "    max_turns=5\n",
    ")\n",
    "```\n",
    "\n",
    "## Other Ideas\n",
    "\n",
    "Use this same pattern for:\n",
    "- 🍳 **Recipe assistant** that learns your dietary preferences (see `recipe_chef_assistant.ipynb`)\n",
    "- ✈️ **Travel planner** that remembers your bucket list\n",
    "- 📚 **Book recommender** that tracks your reading history\n",
    "- 🎮 **Game advisor** that knows your favorite genres\n",
    "- 🎵 **Music discovery** that learns your taste\n",
    "\n",
    "## Resources\n",
    "\n",
    "- **Fetch Server**: https://github.com/modelcontextprotocol/servers/tree/main/src/fetch\n",
    "- **Memory Server**: https://github.com/modelcontextprotocol/servers/tree/main/src/memory\n",
    "- **aisuite Documentation**: https://github.com/andrewyng/aisuite\n",
    "- **More MCP Servers**: https://github.com/modelcontextprotocol/servers\n",
    "\n",
    "**Your movie preferences persist across sessions** - restart this notebook anytime and your assistant will remember everything! 🎬✨\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.13.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}


================================================
FILE: examples/agents/recipe_chef_assistant.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 🍳 Recipe Chef Assistant with AI + MCP\n",
    "\n",
    "Build your own culinary companion that:\n",
    "1. 🔍 Researches recipes from cooking websites\n",
    "2. 🧠 Remembers your dietary preferences and restrictions\n",
    "3. 💡 Suggests recipes based on what you have\n",
    "\n",
    "## How This Works\n",
    "\n",
    "When you pass MCP tools to aisuite:\n",
    "1. **aisuite handles the glue work** - converts MCP tool specs to the format your LLM needs (OpenAI, Anthropic, etc.)\n",
    "2. **Automatic execution** - when the LLM requests a tool, aisuite calls the MCP server and returns results\n",
    "3. **You just write natural prompts** - no need to worry about tool schemas or execution logic!\n",
    "\n",
    "This is the power of aisuite + MCP: unified tool calling across any LLM provider.\n",
    "\n",
    "**What you need:**\n",
    "- Anthropic API key (add to `.env` file)\n",
    "- Python with `uv` installed (for fetch MCP server)\n",
    "- Node.js/npx installed (for memory MCP server)\n",
    "\n",
    "**Installation:**\n",
    "```bash\n",
    "pip install aisuite python-dotenv\n",
    "pip install 'aisuite[mcp]'  # Includes MCP client + nest_asyncio for Jupyter support\n",
    "pip install uv  # For fetch MCP server\n",
    "```"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "✓ Ready to cook up some recipes!\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import sys\n",
    "from pathlib import Path\n",
    "\n",
    "# Add parent directory to path for development\n",
    "# Skip this step if you're running from an installed package\n",
    "repo_root = Path().absolute().parent.parent\n",
    "if str(repo_root) not in sys.path:\n",
    "    sys.path.insert(0, str(repo_root))\n",
    "\n",
    "from dotenv import load_dotenv\n",
    "from aisuite import Client\n",
    "from aisuite.mcp import MCPClient\n",
    "\n",
    "load_dotenv()\n",
    "\n",
    "# Verify API key\n",
    "if not os.getenv(\"ANTHROPIC_API_KEY\"):\n",
    "  raise ValueError(\"❌ Add ANTHROPIC_API_KEY to .env file!\")\n",
    "\n",
    "print(\"✓ Ready to cook up some recipes!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Step 1: Set Up Your Chef Assistant\n",
    "\n",
    "We'll give the AI two tools:\n",
    "- **Fetch**: Get recipes from cooking websites\n",
    "- **Memory**: Remember your preferences, restrictions, and favorite recipes"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "🔍 Fetch server ready - can research recipes from the web\n",
      "🧠 Memory server ready - will remember your preferences\n",
      "📁 Recipes stored in: /Users/rohit/fleet/leclerc/aisuite-prs/aisuite-main/aisuite/examples/agents/recipe_memory.jsonl\n"
     ]
    }
   ],
   "source": [
    "# Set up memory file for your cooking preferences\n",
    "memory_file = os.path.join(os.getcwd(), \"recipe_memory.jsonl\")\n",
    "\n",
    "# Start fetch server (for getting recipes from the web)\n",
    "fetch_mcp = MCPClient(\n",
    "    command=\"uvx\",\n",
    "    args=[\"mcp-server-fetch\"],\n",
    "    name=\"fetch\"\n",
    ")\n",
    "\n",
    "# Start memory server (for remembering preferences and recipes)\n",
    "memory_mcp = MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-memory\"],\n",
    "    env={\"MEMORY_FILE_PATH\": memory_file},\n",
    "    name=\"memory\"\n",
    ")\n",
    "\n",
    "print(\"🔍 Fetch server ready - can research recipes from the web\")\n",
    "print(\"🧠 Memory server ready - will remember your preferences\")\n",
    "print(f\"📁 Recipes stored in: {memory_file}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Step 2: Set Up Your Dietary Profile\n",
    "\n",
    "Let's tell the assistant about your dietary preferences and restrictions:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============================================================\n",
      "👤 YOUR COOKING PROFILE\n",
      "============================================================\n",
      "Perfect! I've stored your dietary profile. Here's a summary:\n",
      "\n",
      "## Your Dietary Profile\n",
      "\n",
      "**🥗 Diet Type:** Vegetarian (no meat, fish, or poultry)\n",
      "\n",
      "**🍽️ Cuisine Preferences:**\n",
      "- Italian cuisine\n",
      "- Thai cuisine\n",
      "\n",
      "**⚠️ Dietary Restrictions:**\n",
      "- **Shellfish allergy** - must be completely avoided\n",
      "- **Lactose intolerant** - dairy alternatives should be used\n",
      "\n",
      "**❤️ Favorite Dishes:**\n",
      "- Pasta dishes\n",
      "- Stir-fries\n",
      "- Curries\n",
      "\n",
      "**👨‍🍳 Cooking Style:**\n",
      "- Skill level: Intermediate\n",
      "- Time preference: Quick meals (under 30 minutes)\n",
      "\n",
      "Your profile is now saved, and I can use this information to provide personalized recipe suggestions and cooking advice that fits your preferences, restrictions, and lifestyle!\n"
     ]
    }
   ],
   "source": [
    "client = Client()\n",
    "\n",
    "# Combine tools from both servers\n",
    "all_tools = fetch_mcp.get_callable_tools() + memory_mcp.get_callable_tools()\n",
    "\n",
    "response = client.chat.completions.create(\n",
    "    model=\"anthropic:claude-sonnet-4-5\",\n",
    "    messages=[{\n",
    "        \"role\": \"user\",\n",
    "        \"content\": \"\"\"Store my dietary profile in memory:\n",
    "        \n",
    "        **Preferences:**\n",
    "        - I'm vegetarian (no meat, fish, or poultry)\n",
    "        - I love Italian and Thai cuisine\n",
    "        - I prefer quick meals (under 30 minutes)\n",
    "        - I'm intermediate skill level\n",
    "        \n",
    "        **Restrictions:**\n",
    "        - No shellfish (allergy)\n",
    "        - Lactose intolerant (use dairy alternatives when possible)\n",
    "        \n",
    "        **Favorites:**\n",
    "        - Pasta dishes\n",
    "        - Stir-fries\n",
    "        - Curries\n",
    "        \n",
    "        Then summarize my profile back to me!\"\"\"\n",
    "    }],\n",
    "    tools=memory_mcp.get_callable_tools(),\n",
    "    max_turns=5\n",
    ")\n",
    "\n",
    "print(\"=\"*60)\n",
    "print(\"👤 YOUR COOKING PROFILE\")\n",
    "print(\"=\"*60)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Step 3: Research a Recipe & Save It\n",
    "\n",
    "Let's find a great vegetarian pasta recipe:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============================================================\n",
      "🍝 RECIPE DISCOVERY\n",
      "============================================================\n",
      "Perfect! I found an amazing recipe for you! 🍝✨\n",
      "\n",
      "## **Tomato Penne with Avocado** \n",
      "\n",
      "### Why I Chose This Recipe:\n",
      "This is an absolute winner that hits all your requirements! It's a gorgeous Italian-Mexican fusion pasta that combines the best of both worlds - your love for Italian cuisine with exciting Mexican spices. Here's what makes it perfect:\n",
      "\n",
      "**✅ Perfectly Fits Your Profile:**\n",
      "- **100% Vegetarian** - no meat, fish, or poultry\n",
      "- **Completely lactose-free** - naturally dairy-free with no cheese required!\n",
      "- **No shellfish** - completely safe for your allergy\n",
      "- **Quick cooking** - Ready in just 25 minutes (well under your 30-minute preference)\n",
      "- **Intermediate skill level** - matches your cooking abilities perfectly\n",
      "\n",
      "**🌟 What Makes It Special:**\n",
      "This dish is absolutely stunning! Picture tender wholemeal penne tossed in a vibrant, mildly spiced tomato sauce studded with golden caramelized onions, sweet orange peppers, and bright yellow sweetcorn. The whole thing is crowned with chunks of creamy avocado dressed in zesty lime - giving you all that rich, indulgent texture without any dairy!\n",
      "\n",
      "The Mexican spices (cumin, coriander, mild chilli) add warmth and depth without overwhelming heat, while fresh coriander and lime brighten everything up. It's comfort food that's also incredibly healthy - you get ALL FIVE of your daily vegetable servings in one gorgeous bowl!\n",
      "\n",
      "**📊 The Stats:**\n",
      "- **Cook Time:** 25 minutes total\n",
      "- **Difficulty:** Easy to Intermediate  \n",
      "- **Rating:** 4.3/5 stars (177 ratings)\n",
      "- **Nutrition:** Only 495 calories, packed with 18g of fiber, low fat, rich in iron and vitamin C\n",
      "\n",
      "**🎨 Key Ingredients:**\n",
      "Wholemeal penne, orange pepper, onion, garlic, chopped tomatoes, sweetcorn, avocado, lime, fresh coriander, and warming spices (chilli powder, cumin, ground coriander)\n",
      "\n",
      "This recipe is budget-friendly, uses mostly pantry staples, and the presentation is absolutely beautiful with all those vibrant colors. It's the perfect weeknight meal that tastes like you spent hours on it! 🥑🌶️🍅\n"
     ]
    }
   ],
   "source": [
    "response = client.chat.completions.create(\n",
    "    model=\"anthropic:claude-sonnet-4-5\",\n",
    "    messages=[{\n",
    "        \"role\": \"user\",\n",
    "        \"content\": \"\"\"Research a delicious vegetarian pasta recipe from:\n",
    "        - https://www.bbcgoodfood.com/recipes/collection/vegetarian-pasta-recipes\n",
    "        - https://www.allrecipes.com/search?q=vegetarian+pasta\n",
    "        \n",
    "        Then:\n",
    "        1. Make sure it fits my dietary profile (check memory!)\n",
    "        2. Save the recipe name and key ingredients in memory\n",
    "        3. Add notes about cook time and difficulty\n",
    "        4. Give me a brief summary with why you chose it\n",
    "\n",
    "        If you can't find any suitable recipe, let me know about your findings. Don't do more than 10 web fetches.\n",
    "        \n",
    "        Make it sound appetizing!\"\"\"\n",
    "    }],\n",
    "    tools=all_tools,\n",
    "    max_turns=20\n",
    ")\n",
    "\n",
    "print(\"=\"*60)\n",
    "print(\"🍝 RECIPE DISCOVERY\")\n",
    "print(\"=\"*60)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Step 4: \"What Can I Make?\" - Ingredient-Based Search\n",
    "\n",
    "Got random ingredients? Let's find what you can cook:\n",
    "\n",
    "NOTE: We have not saved much recipes nor preferences, so you may not get an excellent suggestion! But, it will still serve the purpose of demonstrating tool usage, and can be easily extended to provide better suggestions."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "============================================================\n",
      "🥘 INGREDIENT-BASED RECIPE\n",
      "============================================================\n",
      "# 🍛 **Thai Chickpea Coconut Curry** - Perfect for You Tonight!\n",
      "\n",
      "---\n",
      "\n",
      "## ✨ **Why I Chose This Recipe:**\n",
      "\n",
      "This is absolutely **IDEAL** for you! Here's why:\n",
      "- ✅ **Thai cuisine** - one of your favorites!\n",
      "- ✅ **Curry** - you specifically mentioned this as a favorite dish\n",
      "- ✅ **25 minutes total** - under your 30-minute preference\n",
      "- ✅ **100% vegetarian & vegan** - naturally dairy-free (no lactose issues!)\n",
      "- ✅ **You have EVERY ingredient** already in your kitchen!\n",
      "- ✅ **Intermediate skill level** - perfect for your abilities\n",
      "- ✅ **One-pot meal** - easy cleanup!\n",
      "\n",
      "---\n",
      "\n",
      "## 📝 **Simple Step-by-Step Instructions:**\n",
      "\n",
      "### **Step 1: Start Your Rice** (5 mins)\n",
      "- Cook your rice according to package directions. This will be ready when your curry is done!\n",
      "\n",
      "### **Step 2: Build Your Flavor Base** (5 mins)\n",
      "- Heat a little oil in a large pan over medium heat\n",
      "- Add diced onion and sauté until soft and translucent (about 5 minutes)\n",
      "\n",
      "### **Step 3: Add Aromatics** (1-2 mins)\n",
      "- Stir in minced garlic and ginger\n",
      "- Cook for 1 minute until fragrant (your kitchen will smell amazing!)\n",
      "\n",
      "### **Step 4: Toast Your Spices** (1 min)\n",
      "- Add your spices: curry powder, cumin, turmeric, and coriander (about 1-2 tsp each)\n",
      "- Stir for about 1 minute to bloom the flavors\n",
      "\n",
      "### **Step 5: Add Tomatoes** (3 mins)\n",
      "- Toss in diced tomatoes\n",
      "- Cook until they start to soften and break down\n",
      "\n",
      "### **Step 6: Make It Creamy** (10 mins)\n",
      "- Pour in the entire can of coconut milk\n",
      "- Add drained chickpeas\n",
      "- Give it a good stir and let it simmer for 10 minutes until the sauce thickens nicely\n",
      "\n",
      "### **Step 7: Season & Serve!**\n",
      "- Taste and add salt and pepper as needed\n",
      "- Serve over your fluffy rice\n",
      "- *Optional garnish*: fresh cilantro if you have it, or a squeeze of lime for extra zing!\n",
      "\n",
      "---\n",
      "\n",
      "## 💪 **You've Got This!**\n",
      "\n",
      "This recipe is **foolproof** and incredibly forgiving. The coconut milk makes everything creamy and rich, the chickpeas add protein and heartiness, and those aromatics (garlic, ginger, onion) create layers of flavor that taste like you spent hours cooking!\n",
      "\n",
      "Plus, this gets even **better the next day**, so if you make extra, you'll have an amazing lunch tomorrow. The best part? It's all pantry staples, so you're making restaurant-quality Thai food without a trip to the store!\n",
      "\n",
      "**Enjoy your delicious, aromatic curry! You're going to love how this turns out!** 🌟\n"
     ]
    }
   ],
   "source": [
    "response = client.chat.completions.create(\n",
    "    model=\"anthropic:claude-sonnet-4-5\",\n",
    "    messages=[{\n",
    "        \"role\": \"user\",\n",
    "        \"content\": \"\"\"I have these ingredients in my kitchen:\n",
    "        - Chickpeas (canned)\n",
    "        - Coconut milk\n",
    "        - Tomatoes\n",
    "        - Onions, garlic, ginger\n",
    "        - Rice\n",
    "        - Various spices\n",
    "        \n",
    "        Based on my dietary profile and what I have:\n",
    "        1. Suggest a recipe I can make\n",
    "        2. Check if it matches my preferences (Thai/Italian, quick, vegetarian)\n",
    "        3. Save this recipe idea to memory\n",
    "        \n",
    "        As the final response, give me a simple step-by-step overview of how to make it, and why you chose this for me!\n",
    "        \n",
    "        Be encouraging and practical!\"\"\"\n",
    "    }],\n",
    "    tools=all_tools,\n",
    "    max_turns=10\n",
    ")\n",
    "\n",
    "print(\"=\"*60)\n",
    "print(\"🥘 INGREDIENT-BASED RECIPE\")\n",
    "print(\"=\"*60)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Cleanup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fetch_mcp.close()\n",
    "memory_mcp.close()\n",
    "print(\"✓ Servers closed - your recipes are saved!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Recap of what we did above\n",
    "\n",
    "Behind the scenes, aisuite did some magic:\n",
    "- ✅ **Converted MCP tool schemas** to OpenAI-compatible format\n",
    "- ✅ **Handled tool execution** when the LLM requested them\n",
    "- ✅ **Managed async operations** for MCP server communication\n",
    "\n",
    "MCP Tools\n",
    "**Web search** - LLM could do web search due to Fetch being passed as a tool.\n",
    "**Preserved your data in knowledge graph** - LLM could store your preferences and look it using server-memory being passed as a tool.\n",
    "\n",
    "You, as an user, just wrote natural prompts - aisuite handled all the tool calling complexity - LLM returned personalized recommendations.\n",
    "\n",
    "You built a **personal chef assistant** that:\n",
    "- ✅ Researches recipes tailored to your diet\n",
    "- ✅ Remembers your restrictions and preferences\n",
    "- ✅ Suggests recipes based on ingredients you have\n",
    "- ✅ Saves your favorite recipes and cooking notes\n",
    "- ✅ Provides personalized cooking advice\n",
    "\n",
    "**All with minimal code!**\n",
    "\n",
    "## Try These Next\n",
    "\n",
    "Now that you've got the basics, explore more capabilities:\n",
    "\n",
    "### 📦 Meal Prep Planning\n",
    "```python\n",
    "response = client.chat.completions.create(\n",
    "    model=\"anthropic:claude-sonnet-4-5\",\n",
    "    messages=[{\"role\": \"user\", \"content\": \"\"\"I want to meal prep for the week. Based on my profile:\n",
    "        \n",
    "        1. Suggest 2 vegetarian recipes that:\n",
    "           - Reheat well\n",
    "           - Stay fresh for 3-4 days\n",
    "           - Match my taste (Italian/Thai)\n",
    "           - Are filling and nutritious\n",
    "        \n",
    "        2. Save both recipes to memory as 'meal prep favorites'\n",
    "        3. Give me storage tips for each\"\"\"}],\n",
    "    tools=all_tools,\n",
    "    max_turns=8\n",
    ")\n",
    "```\n",
    "\n",
    "### 📚 Browse Your Recipe Collection\n",
    "```python\n",
    "response = client.chat.completions.create(\n",
    "    model=\"anthropic:claude-sonnet-4-5\",\n",
    "    messages=[{\"role\": \"user\", \"content\": \"\"\"Search your memory and tell me:\n",
    "        \n",
    "        1. What recipes have I saved?\n",
    "        2. What are my dietary restrictions and preferences?\n",
    "        3. Which recipes are best for meal prep?\n",
    "        4. Suggest what I should cook tonight based on my saved recipes\"\"\"}],\n",
    "    tools=memory_mcp.get_callable_tools(),\n",
    "    max_turns=5\n",
    ")\n",
    "```\n",
    "\n",
    "### 💡 Cooking Tips & Substitutions\n",
    "```python\n",
    "response = client.chat.completions.create(\n",
    "    model=\"anthropic:claude-sonnet-4-5\",\n",
    "    messages=[{\"role\": \"user\", \"content\": \"\"\"I want to make a recipe that calls for:\n",
    "        - Heavy cream (but I'm lactose intolerant!)\n",
    "        - Parmesan cheese\n",
    "        \n",
    "        1. Suggest dairy-free substitutions\n",
    "        2. Store these substitution tips in memory\n",
    "        3. Any other dairy-free tips for Italian cooking?\"\"\"}],\n",
    "    tools=all_tools,\n",
    "    max_turns=6\n",
    ")\n",
    "```\n",
    "\n",
    "### 🔍 Explore Your Recipe Memory\n",
    "```python\n",
    "# See the raw knowledge graph\n",
    "import json\n",
    "with open(memory_file, 'r') as f:\n",
    "    for line in f.readlines()[:10]:\n",
    "        entry = json.loads(line)\n",
    "        if 'recipe' in entry.get('name', '').lower():\n",
    "            print(f\"🍽️ {entry.get('name')}\")\n",
    "```\n",
    "\n",
    "### 🌟 More Fun Queries\n",
    "- \"Find me a healthy salad for lunch\"\n",
    "- \"I want to try baking - suggest a beginner dessert\"\n",
    "- \"Research authentic Thai curry recipes from https://www.bbcgoodfood.com/recipes/collection/thai-curry-recipes\"\n",
    "- \"Plan a dinner party menu for 6 people\"\n",
    "- \"What cooking techniques should I learn next?\"\n",
    "- \"Create a grocery list for this week's meal prep\"\n",
    "\n",
    "## The Pattern\n",
    "\n",
    "Setup MCP tools, and call chat.completions.create() with max_turns.\n",
    "\n",
    "```python\n",
    "# 1. Set up fetch + memory\n",
    "fetch_mcp = MCPClient(command=\"uvx\", args=[\"mcp-server-fetch\"])\n",
    "memory_mcp = MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-memory\"],\n",
    "    env={\"MEMORY_FILE_PATH\": \"recipe_memory.jsonl\"}\n",
    ")\n",
    "\n",
    "# 2. Combine tools\n",
    "tools = fetch_mcp.get_callable_tools() + memory_mcp.get_callable_tools()\n",
    "\n",
    "# 3. Cook with AI!\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=[{\"role\": \"user\", \"content\": \"Find a recipe and remember it\"}],\n",
    "    tools=tools,\n",
    "    max_turns=5\n",
    ")\n",
    "```\n",
    "\n",
    "## Advanced Ideas\n",
    "\n",
    "Extend this assistant to:\n",
    "- 📊 Track nutritional goals and suggest balanced meals\n",
    "- 🛒 Generate smart grocery lists with budget tracking\n",
    "- 📅 Plan weekly menus automatically\n",
    "- 👨‍🍳 Learn and improve from your cooking feedback\n",
    "- 🌍 Explore cuisines from different cultures\n",
    "- 📸 Store photos of your dishes (with filesystem MCP)\n",
    "- ⏰ Set cooking timers and reminders\n",
    "\n",
    "## Other Assistants to Build\n",
    "\n",
    "Use the same pattern for:\n",
    "- 🎬 **Movie recommendations** (see `movie_buff_assistant.ipynb`)\n",
    "- ✈️ **Travel planning** that remembers your bucket list\n",
    "- 📚 **Reading tracker** that knows your taste in books\n",
    "- 🏋️ **Fitness coach** that tracks your progress\n",
    "- 🌱 **Garden planner** that remembers what you planted\n",
    "\n",
    "## Resources\n",
    "\n",
    "- **Fetch Server**: https://github.com/modelcontextprotocol/servers/tree/main/src/fetch\n",
    "- **Memory Server**: https://github.com/modelcontextprotocol/servers/tree/main/src/memory\n",
    "- **aisuite Documentation**: https://github.com/andrewyng/aisuite\n",
    "- **More MCP Servers**: https://github.com/modelcontextprotocol/servers\n",
    "\n",
    "**Happy cooking! Your recipes and preferences persist forever!** 🍳✨"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.13.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}


================================================
FILE: examples/agents/snake_game_generator.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Snake Game Generator - AI Creates a Game\n",
    "\n",
    "This notebook shows how to use aisuite + MCP tools to have an AI generate a complete, playable Snake game.\n",
    "\n",
    "**What it does**: The LLM generates a Snake game in HTML/CSS/JavaScript, saves it to a file using MCP filesystem tools, and we display it right in the notebook.\n",
    "\n",
    "**Requirements**: `OPENAI_API_KEY` or `ANTHROPIC_API_KEY` in your `.env` file (depending on which model you choose)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Setup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "✓ Ready!\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "from dotenv import load_dotenv\n",
    "import aisuite as ai\n",
    "from aisuite.mcp import MCPClient\n",
    "from IPython.display import IFrame, display  # For displaying HTML file\n",
    "\n",
    "load_dotenv()\n",
    "\n",
    "# Initialize filesystem MCP server for file writing\n",
    "filesystem_mcp = MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-filesystem\", os.getcwd()]\n",
    ")\n",
    "\n",
    "print(\"✓ Ready!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Craft Instructions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "prompt = \"\"\"Create a complete, playable Snake game.\n",
    "\n",
    "**EXECUTION RULES:**\n",
    "- Execute ALL tools silently (no intermediate text responses)\n",
    "- Write the HTML file FIRST, then provide a brief summary\n",
    "\n",
    "**GAME REQUIREMENTS:**\n",
    " Styling:\n",
    " - Clean, modern look\n",
    "   - Centered on page\n",
    "   - Nice colors (dark background, bright snake, contrasting food)\n",
    "   - Clear score display\n",
    "   - Arrow keys to change direction\n",
    "   - Instructions shown on screen\n",
    "\n",
    "**Save the file:**\n",
    "   - Use write_file to save as 'snake_game.html'\n",
    "   - After saving, respond with confirmation that the game was created\n",
    "\"\"\""
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Run Agent with MCP Tools"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "client = ai.Client()\n",
    "tools = filesystem_mcp.get_callable_tools()\n",
    "\n",
    "# Choose your model (uncomment one):\n",
    "model = \"openai:gpt-5.1\"\n",
    "# model = \"anthropic:claude-sonnet-4-5\"\n",
    "\n",
    "response = client.chat.completions.create(\n",
    "    model=model,\n",
    "    messages=[{\"role\": \"user\", \"content\": prompt}],\n",
    "    tools=tools,\n",
    "    max_turns=5\n",
    ")\n",
    "\n",
    "print(\"✓ Done!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Play the Game"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "        <iframe\n",
       "            width=\"600\"\n",
       "            height=\"800\"\n",
       "            src=\"snake_game.html\"\n",
       "            frameborder=\"0\"\n",
       "            allowfullscreen\n",
       "            \n",
       "        ></iframe>\n",
       "        "
      ],
      "text/plain": [
       "<IPython.lib.display.IFrame at 0x11c9dbe00>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "💡 Open 'snake_game.html' in your browser for full view\n"
     ]
    }
   ],
   "source": [
    "if os.path.exists('snake_game.html'):\n",
    "    display(IFrame(src='snake_game.html', width=600, height=800))\n",
    "    print(\"\\n💡 Open 'snake_game.html' in your browser for full view\")\n",
    "else:\n",
    "    print(\"⚠️ Game not created. Printing response from the model:\")\n",
    "    print(f\"\\n{response.choices[0].message.content}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(f\"\\n{response.choices[0].message.content}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Cleanup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "filesystem_mcp.close()\n",
    "print(\"✓ Done!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "---\n",
    "\n",
    "## That's It!\n",
    "\n",
    "In just a few lines of code, you had an AI:\n",
    "- ✅ Generate a complete Snake game from scratch\n",
    "- ✅ Save it to disk using MCP filesystem tools\n",
    "- ✅ Display it playable right in the notebook\n",
    "\n",
    "**Try it yourself:**\n",
    "- Ask for a different game (Pong, Tetris, etc.)\n",
    "- Add difficulty levels or speed settings\n",
    "- Request different color themes\n",
    "- Try with different models (swap the commented line)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.13.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}


================================================
FILE: examples/agents/stock_dashboard.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
  <meta charset="UTF-8" />
  <meta name="viewport" content="width=device-width, initial-scale=1" />
  <title>Stock Market Movers - November 10, 2025</title>
  <style>
    :root {
      --bg: #0b1020;
      --card: #111832;
      --text: #e8eefc;
      --muted: #9fb2d9;
      --accent: #3b82f6;
      --positive: #16a34a;
      --border: #1f2a4d;
      --shadow: 0 10px 30px rgba(0,0,0,0.35);
    }
    * { box-sizing: border-box; }
    body {
      margin: 0;
      font-family: Inter, ui-sans-serif, system-ui, -apple-system, Segoe UI, Roboto, Helvetica, Arial, "Apple Color Emoji", "Segoe UI Emoji";
      background: linear-gradient(180deg, #0b1020 0%, #0a0f1d 100%);
      color: var(--text);
    }
    .container {
      max-width: 1100px;
      margin: 48px auto;
      padding: 0 20px;
    }
    header h1 {
      margin: 0 0 8px 0;
      font-weight: 800;
      letter-spacing: 0.2px;
    }
    header p { margin: 0; color: var(--muted); }

    .card {
      margin-top: 24px;
      background: var(--card);
      border: 1px solid var(--border);
      border-radius: 14px;
      box-shadow: var(--shadow);
      overflow: hidden;
    }

    .table-wrap { width: 100%; overflow-x: auto; }
    table {
      width: 100%;
      border-collapse: collapse;
      min-width: 720px;
    }
    thead th {
      text-align: left;
      font-size: 12px;
      letter-spacing: .05em;
      text-transform: uppercase;
      color: var(--muted);
      padding: 16px 18px;
      background: rgba(255,255,255,0.02);
      border-bottom: 1px solid var(--border);
    }
    tbody td {
      padding: 16px 18px;
      border-bottom: 1px solid var(--border);
    }
    tbody tr:hover { background: rgba(255,255,255,0.03); }

    .ticker {
      font-weight: 700;
      color: #ffffff;
      letter-spacing: .3px;
    }
    .company { color: var(--muted); }

    .chip {
      display: inline-flex;
      align-items: center;
      gap: 6px;
      padding: 6px 10px;
      border-radius: 999px;
      font-weight: 700;
      font-variant-numeric: tabular-nums;
      font-size: 13px;
      background: rgba(22,163,74,.12);
      color: var(--positive);
      border: 1px solid rgba(22,163,74,.35);
      box-shadow: inset 0 0 0 1px rgba(22,163,74,.15);
    }
    .price { font-variant-numeric: tabular-nums; }

    .footer {
      display: flex;
      gap: 16px;
      align-items: center;
      flex-wrap: wrap;
      padding: 16px 18px;
      background: rgba(255,255,255,0.02);
      border-top: 1px solid var(--border);
      color: var(--muted);
      font-size: 14px;
    }
    .badge {
      display: inline-block;
      padding: 6px 10px;
      background: rgba(59,130,246,.12);
      border: 1px solid rgba(59,130,246,.35);
      color: #cde1ff;
      border-radius: 999px;
      font-size: 12px;
      letter-spacing: .03em;
      text-transform: uppercase;
    }
    a { color: #93c5fd; text-decoration: none; }
    a:hover { text-decoration: underline; }
    @media (max-width: 640px){
      header h1 { font-size: 22px; }
    }
  </style>
</head>
<body>
  <div class="container">
    <header>
      <h1>Stock Market Movers - November 10, 2025</h1>
      <p>Top gainers snapshot, styled for a professional financial look.</p>
    </header>

    <section class="card">
      <div class="table-wrap">
        <table>
          <thead>
            <!-- Column headers: scope="col" explicitly ties each header cell to its column for assistive technology. -->
            <tr>
              <th scope="col">Ticker</th>
              <th scope="col">Company</th>
              <th scope="col">Price (USD)</th>
              <th scope="col">% Change</th>
            </tr>
          </thead>
          <tbody>
            <tr>
              <td class="ticker">GLTO</td>
              <td class="company">Galecto, Inc.</td>
              <td class="price">17.25</td>
              <td><span class="chip">+248.49%</span></td>
            </tr>
            <tr>
              <td class="ticker">COGT</td>
              <td class="company">Cogent Biosciences, Inc.</td>
              <td class="price">32.46</td>
              <td><span class="chip">+119.03%</span></td>
            </tr>
            <tr>
              <td class="ticker">NVTS</td>
              <td class="company">Navitas Semiconductor Corporation</td>
              <td class="price">9.60</td>
              <td><span class="chip">+22.45%</span></td>
            </tr>
            <tr>
              <td class="ticker">XPEV</td>
              <td class="company">XPeng Inc.</td>
              <td class="price">26.04</td>
              <td><span class="chip">+16.15%</span></td>
            </tr>
            <tr>
              <td class="ticker">SEDG</td>
              <td class="company">SolarEdge Technologies, Inc.</td>
              <td class="price">45.38</td>
              <td><span class="chip">+13.45%</span></td>
            </tr>
          </tbody>
        </table>
      </div>
      <div class="footer">
        <span class="badge">As of Nov 10, 2025</span>
        <span>Source: <a href="https://finance.yahoo.com/markets/stocks/gainers/" target="_blank" rel="noopener">Yahoo Finance — Top Gainers</a></span>
      </div>
    </section>
  </div>
</body>
</html>

================================================
FILE: examples/agents/stock_market_dashboard.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Stock Market Movers - 2025-11-10</title>
    <style>
        /* Page-wide defaults: light background, dark text. */
        body {
            font-family: Arial, sans-serif;
            margin: 0;
            padding: 0;
            background-color: #f4f4f9;
            color: #333;
        }
        header {
            background-color: #333;
            color: #fff;
            padding: 10px 0;
            text-align: center;
        }
        .container {
            width: 90%;
            max-width: 1200px;
            margin: 20px auto;
        }
        /* Row highlighting: green for gainers, red for losers. */
        .gain, .loss {
            padding: 10px;
            border-radius: 5px;
            margin: 10px 0;
        }
        .gain {
            background-color: #d4fdd4;
            color: #006400;
            border: 1px solid #006400;
        }
        .loss {
            background-color: #ffdede;
            color: #b22222;
            border: 1px solid #b22222;
        }
        table {
            width: 100%;
            border-collapse: collapse;
            margin: 20px 0;
        }
        table thead {
            background-color: #333;
            color: #fff;
        }
        table th, table td {
            padding: 15px;
            text-align: left;
            border-bottom: 1px solid #ddd;
        }
        footer {
            text-align: center;
            padding: 15px 0;
            background-color: #333;
            color: #fff;
        }
        /* Narrow screens: stack every row as a block and print the column
           name next to each value, because the header row is moved away. */
        @media (max-width: 768px) {
            table, thead, tbody, th, td, tr {
                display: block;
            }
            /* Move the header row off-screen; the per-cell labels below
               take over its job visually. */
            thead tr {
                position: absolute;
                top: -9999px;
                left: -9999px;
            }
            td {
                position: relative;
                padding-left: 50%;
                text-align: left;
            }
            td:before {
                position: absolute;
                /* Offsets match the 15px cell padding so label and value line up. */
                top: 15px;
                left: 15px;
                width: 45%;
                padding-right: 10px;
                white-space: nowrap;
                font-weight: bold;
            }
            /* A :before box is only generated when `content` is set.
               These labels must be kept in sync with the <th> cells of the
               Top Gainers table. */
            td:nth-of-type(1):before { content: "Company Name"; }
            td:nth-of-type(2):before { content: "Ticker"; }
            td:nth-of-type(3):before { content: "Current Price"; }
            td:nth-of-type(4):before { content: "% Change"; }
            td:nth-of-type(5):before { content: "Reason"; }
        }
    </style>
</head>
<body>
    <header>
        <h1>Stock Market Movers - 2025-11-10</h1>
        <p>Market Sentiment: Bullish</p>
    </header>
    <div class="container">
        <section id="top-gainers">
            <h2>Top Gainers</h2>
            <table>
                <thead>
                    <tr>
                        <th>Company Name</th>
                        <th>Ticker</th>
                        <th>Current Price</th>
                        <th>% Change</th>
                        <th>Reason</th>
                    </tr>
                </thead>
                <tbody>
                    <tr class="gain">
                        <td>Cogent Biosciences, Inc.</td>
                        <td>COGT</td>
                        <td>$32.46</td>
                        <td>+119.03%</td>
                        <td>Positive clinical trial result</td>
                    </tr>
                    <tr class="gain">
                        <td>Navitas Semiconductor Corporation</td>
                        <td>NVTS</td>
                        <td>$9.60</td>
                        <td>+22.45%</td>
                        <td>Strong quarterly earnings</td>
                    </tr>
                    <tr class="gain">
                        <td>Opendoor Technologies Inc.</td>
                        <td>OPEN</td>
                        <td>$7.99</td>
                        <td>+21.77%</td>
                        <td>Acquisition news</td>
                    </tr>
                </tbody>
            </table>
        </section>
        <section id="market-news">
            <h2>Market News</h2>
            <ul>
                <li>Sony raises profit forecast after earnings beat, boosted by Music and Imaging divisions</li>
                <li>U.S. markets rally as investors anticipate FOMC meeting outcomes</li>
                <li>European markets gain on strong manufacturing data</li>
            </ul>
        </section>
    </div>
    <footer>
        <p>Sources: Yahoo Finance, CNBC</p>
        <p>Timestamp: 2025-11-10</p>
        <p>Disclaimer: This is for informational purposes only, not financial advice.</p>
    </footer>
</body>
</html>

================================================
FILE: examples/agents/stock_market_mini_tracker.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Stock Market Tracker - Multi-step Agent in a single prompt\n",
    "\n",
    "This notebook shows how **easy** it is to build a multi-step agent using a single prompt with aisuite + MCP tools.\n",
    "\n",
    "**What it does**: 1. Fetches latest stock market data, 2. Analyzes content and 3. Creates an HTML dashboard.\n",
    "\n",
    "**Requirements**: `OPENAI_API_KEY` in your `.env` file"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Setup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "✓ Ready!\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "from datetime import datetime\n",
    "from dotenv import load_dotenv\n",
    "import aisuite as ai\n",
    "from aisuite.mcp import MCPClient\n",
    "\n",
    "load_dotenv()\n",
    "\n",
    "# Initialize MCP servers for web fetching and file writing\n",
    "fetch_mcp = MCPClient(command=\"uvx\", args=[\"mcp-server-fetch\"])\n",
    "filesystem_mcp = MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-filesystem\", os.getcwd()]\n",
    ")\n",
    "\n",
    "print(\"✓ Ready!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Craft instructions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "✓ Agent instructions defined\n"
     ]
    }
   ],
   "source": [
    "# Define what you want the agent to do\n",
    "prompt = f\"\"\"Create a stock market dashboard for {datetime.now().strftime('%Y-%m-%d')}.\n",
    "\n",
    "**⚠️ EXECUTION RULES:**\n",
    "- Execute ALL tools silently (no intermediate text responses)\n",
    "- Write the HTML file FIRST, then provide summary\n",
    "- If you respond with text before writing the file, the loop stops!\n",
    "\n",
    "**TASK:**\n",
    "\n",
    "1. **Fetch Stock Data**\n",
    "   - Get top gainers from: https://finance.yahoo.com/markets/stocks/gainers/\n",
    "   - Extract: ticker, company name, price, % change\n",
    "   - Get 3-5 stocks\n",
    "\n",
    "2. **Create Professional HTML Dashboard**\n",
    "   - Title: \"Stock Market Movers - {datetime.now().strftime('%B %d, %Y')}\"\n",
    "   - Display top gainers in a clean table or card layout\n",
    "   - Use green color for positive % changes\n",
    "   - Add professional styling:\n",
    "     * Modern typography\n",
    "     * Shadows and borders\n",
    "     * Responsive design\n",
    "     * Clean spacing\n",
    "   - Include timestamp and data source\n",
    "\n",
    "3. **Save File**\n",
    "   - Use write_file to save as 'stock_dashboard.html'\n",
    "   - Confirm successful write\n",
    "\n",
    "4. **Respond**\n",
    "   - ONLY after file is written, provide a brief summary\n",
    "   - Include: number of stocks, top 3 gainers with % changes\n",
    "\n",
    "Make it look like a professional financial dashboard!\"\"\"\n",
    "\n",
    "print(\"✓ Agent instructions defined\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Run Agent with MCP tools."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "============================================================\n",
      "✓ DASHBOARD CREATED!\n",
      "============================================================\n",
      "\n",
      "The stock market dashboard for November 11, 2025, has been successfully created and saved as 'stock_dashboard.html'. It displays the top 5 stock gainers with a professional layout. Here are the top 3 gainers:\n",
      "\n",
      "1. **Cogent Biosciences, Inc. (COGT)** - +119.03%\n",
      "2. **Navitas Semiconductor Corporation (NVTS)** - +22.45%\n",
      "3. **Opendoor Technologies Inc. (OPEN)** - +21.77%\n",
      "\n",
      "The dashboard includes modern typography, responsive design, and highlights positive percentage changes in green.\n"
     ]
    }
   ],
   "source": [
    "# Create agent and run it\n",
    "client = ai.Client()\n",
    "tools = fetch_mcp.get_callable_tools() + filesystem_mcp.get_callable_tools()\n",
    "\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=[{\"role\": \"user\", \"content\": prompt}],\n",
    "    tools=tools,\n",
    "    max_turns=20\n",
    ")\n",
    "\n",
    "print(\"\\n\" + \"=\"*60)\n",
    "print(\"✓ DASHBOARD CREATED!\")\n",
    "print(\"=\"*60)\n",
    "print(f\"\\n{response.choices[0].message.content}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## View Dashboard"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "        <iframe\n",
       "            width=\"900\"\n",
       "            height=\"600\"\n",
       "            src=\"stock_dashboard.html\"\n",
       "            frameborder=\"0\"\n",
       "            allowfullscreen\n",
       "            \n",
       "        ></iframe>\n",
       "        "
      ],
      "text/plain": [
       "<IPython.lib.display.IFrame at 0x114517b60>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "💡 Open 'stock_dashboard.html' in your browser for full view\n"
     ]
    }
   ],
   "source": [
    "from IPython.display import IFrame, display\n",
    "\n",
    "if os.path.exists('stock_dashboard.html'):\n",
    "    display(IFrame(src='stock_dashboard.html', width=900, height=600))\n",
    "    print(\"\\n💡 Open 'stock_dashboard.html' in your browser for full view\")\n",
    "else:\n",
    "    print(\"⚠️ Dashboard not created - check the output above\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Cleanup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fetch_mcp.close()\n",
    "filesystem_mcp.close()\n",
    "print(\"✓ Done! That's how easy it is to build an agent with aisuite.\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "---\n",
    "\n",
    "## That's It!\n",
    "\n",
    "In just **a few lines of code**, you built an autonomous agent that:\n",
    "- ✅ Fetches live stock data from the web\n",
    "- ✅ Creates a beautiful HTML dashboard\n",
    "- ✅ Saves it to disk\n",
    "\n",
    "**Try it yourself**:\n",
    "- Modify the prompt to fetch the top losers as well as the top gainers.\n",
    "- Modify it to fetch data across multiple days.\n",
    "- Modify it to fetch headlines from any finance news website to explain why stocks rose or fell. (NOTE: Many websites do not like automated calls - be mindful of their policies.)\n",
    "- Try asking the agent to plot a graph with the data in the HTML page.\n",
    "- Add more MCP tools (memory, search, etc.)\n",
    "\n",
    "Remember to **increase max_turns** to a higher number if you increase the complexity of the tasks.\n",
    "\n",
    "**Learn more**: Check out other notebooks in `examples/agents/`"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.13.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}


================================================
FILE: examples/agents/stock_market_tracker.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Stock Market Tracker - Latest Market Movers Dashboard\n",
    "\n",
    "This notebook demonstrates an autonomous research agent that:\n",
    "- Fetches latest stock market news and data\n",
    "- Identifies stocks that rose and fell today\n",
    "- Creates a beautiful HTML dashboard with market analysis\n",
    "\n",
    "## Requirements\n",
    "\n",
    "1. **API Keys** (set in `.env` file):\n",
    "   - `OPENAI_API_KEY` - Get from https://platform.openai.com/api-keys\n",
    "\n",
    "2. **MCP Servers** (install if needed):\n",
    "   ```bash\n",
    "   # Fetch server for web research\n",
    "   pip install mcp-server-fetch\n",
    "   \n",
    "   # Filesystem server for saving HTML\n",
    "   npm install -g @modelcontextprotocol/server-filesystem\n",
    "   ```\n",
    "\n",
    "3. **Python Packages**:\n",
    "   ```bash\n",
    "   pip install 'aisuite[openai,mcp]' python-dotenv\n",
    "   ```"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Setup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "✓ Environment configured\n",
      "✓ Working directory: /Users/rohit/fleet/leclerc/aisuite-prs/aisuite-main/aisuite/examples/agents\n",
      "✓ Today's date: 2025-11-10\n",
      "\n",
      "Ready to track the markets!\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import json\n",
    "from pathlib import Path\n",
    "from dotenv import load_dotenv\n",
    "from datetime import datetime\n",
    "import aisuite as ai\n",
    "from aisuite.mcp import MCPClient\n",
    "\n",
    "# Load environment variables\n",
    "load_dotenv()\n",
    "\n",
    "# Verify required API keys.\n",
    "# The dashboard cell below calls \"openai:gpt-4o\", so the OpenAI key is the one needed.\n",
    "if not os.getenv(\"OPENAI_API_KEY\"):\n",
    "    raise ValueError(\n",
    "        \"Missing OPENAI_API_KEY\\n\"\n",
    "        \"Please add it to your .env file\"\n",
    "    )\n",
    "\n",
    "print(\"✓ Environment configured\")\n",
    "print(f\"✓ Working directory: {os.getcwd()}\")\n",
    "print(f\"✓ Today's date: {datetime.now().strftime('%Y-%m-%d')}\")\n",
    "print(\"\\nReady to track the markets!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Initialize MCP Servers"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "✓ MCP servers initialized\n",
      "\n",
      "Available tools:\n",
      "  - Fetch: ['fetch']\n",
      "  - Filesystem: ['read_file', 'read_text_file', 'read_media_file', 'read_multiple_files', 'write_file', 'edit_file', 'create_directory', 'list_directory', 'list_directory_with_sizes', 'directory_tree', 'move_file', 'search_files', 'get_file_info', 'list_allowed_directories']\n"
     ]
    }
   ],
   "source": [
    "# Fetch MCP Server - for web research\n",
    "fetch_mcp = MCPClient(\n",
    "    command=\"uvx\",\n",
    "    args=[\"mcp-server-fetch\"],\n",
    "    name=\"fetch\"\n",
    ")\n",
    "\n",
    "# Filesystem MCP Server - for saving HTML files\n",
    "filesystem_mcp = MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-filesystem\", os.getcwd()],\n",
    "    name=\"filesystem\"\n",
    ")\n",
    "\n",
    "print(\"✓ MCP servers initialized\")\n",
    "print(f\"\\nAvailable tools:\")\n",
    "print(f\"  - Fetch: {[tool['name'] for tool in fetch_mcp.list_tools()]}\")\n",
    "print(f\"  - Filesystem: {[tool['name'] for tool in filesystem_mcp.list_tools()]}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Generate Market Movers Dashboard\n",
    "\n",
    "Watch the AI agent:\n",
    "1. Fetch latest stock market news and data\n",
    "2. Identify top gainers and losers\n",
    "3. Create a comprehensive HTML dashboard\n",
    "4. **Save the HTML file FIRST** (critical!)\n",
    "5. Provide summary"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "📈 Fetching latest stock market data...\n",
      "\n",
      "============================================================\n",
      "\n",
      "============================================================\n",
      "✓ STOCK MARKET DASHBOARD COMPLETE!\n",
      "============================================================\n",
      "\n",
      "The stock market dashboard for November 10, 2025, has been successfully created and saved as 'stock_market_dashboard.html'. Here's a summary of the dashboard:\n",
      "\n",
      "- **Number of Stocks Analyzed**: Multiple stocks, focusing on the top 3 gainers.\n",
      "- **Top 3 Gainers**:\n",
      "  1. **Cogent Biosciences, Inc. (COGT)**: Price $32.46, Change +119.03%\n",
      "  2. **Navitas Semiconductor Corporation (NVTS)**: Price $9.60, Change +22.45%\n",
      "  3. **Opendoor Technologies Inc. (OPEN)**: Price $7.99, Change +21.77%\n",
      "- **Overall Market Sentiment**: Bullish\n",
      "- **Key Market News**:\n",
      "  - Sony raises profit forecast after earnings beat\n",
      "  - U.S. markets rally in anticipation of FOMC meeting outcomes\n",
      "  - European markets gain on strong manufacturing data\n",
      "\n",
      "The dashboard provides a clean, professional, and responsive layout suitable for financial analysis.\n"
     ]
    }
   ],
   "source": [
    "# Initialize aisuite client\n",
    "client = ai.Client()\n",
    "\n",
    "# Combine all available tools\n",
    "all_tools = fetch_mcp.get_callable_tools() + filesystem_mcp.get_callable_tools()\n",
    "\n",
    "print(\"📈 Fetching latest stock market data...\\n\")\n",
    "print(\"=\" * 60)\n",
    "\n",
    "# Send the full research prompt; the steps are numbered 1-5 and the\n",
    "# \"no text until step 5\" rule refers to that numbering.\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=[{\n",
    "        \"role\": \"user\",\n",
    "        \"content\": f\"\"\"Create a stock market movers dashboard for today ({datetime.now().strftime('%Y-%m-%d')}).\n",
    "\n",
    "**⚠️ CRITICAL EXECUTION RULES - READ FIRST:**\n",
    "1. DO NOT provide ANY text responses while executing tools\n",
    "2. DO NOT say things like \"Now let me...\", \"I'll create...\", or \"Let me gather...\"\n",
    "3. Execute ALL tools SILENTLY - fetch URLs, write files, etc.\n",
    "4. Your FIRST and ONLY text response must come AFTER the HTML file is successfully written\n",
    "5. If you respond with text before calling write_file, the tool execution loop will STOP and the file will NOT be created!\n",
    "\n",
    "**REMEMBER**: Research → Write HTML → THEN (and only then) respond with summary!\n",
    "\n",
    "---\n",
    "\n",
    "Steps to execute SILENTLY (no text responses until step 5):\n",
    "\n",
    "1. **Fetch latest market data** from these sources:\n",
    "   - Yahoo Finance market movers: https://finance.yahoo.com/markets/stocks/gainers/\n",
    "   - MarketWatch: https://www.marketwatch.com/\n",
    "   - Or any other reliable financial news source\n",
    "   \n",
    "   Extract:\n",
    "   - Top 3 stocks that rose today (gainers)\n",
    "   - For each stock: ticker symbol, company name, price, % change\n",
    "   - Major market indices (S&P 500, Dow, NASDAQ) if available\n",
    "   - Key market news/headlines\n",
    "\n",
    "2. **Create a beautiful HTML dashboard** with:\n",
    "   \n",
    "   **Header Section**:\n",
    "   - Title: \"Stock Market Movers - [Today's Date]\"\n",
    "   - Market sentiment indicator (bullish/bearish/neutral)\n",
    "   \n",
    "   **Top Gainers Section**:\n",
    "   - Table or cards showing:\n",
    "     * Company name and ticker\n",
    "     * Current price\n",
    "     * % change (in green)\n",
    "     * Brief reason for rise if known\n",
    "      \n",
    "   **Market News Section**:\n",
    "   - 3-5 key headlines impacting the market\n",
    "   \n",
    "   **Footer**:\n",
    "   - Data sources cited\n",
    "   - Timestamp\n",
    "   - Disclaimer: \"This is for informational purposes only, not financial advice\"\n",
    "\n",
    "3. **Styling requirements**:\n",
    "   - Professional financial dashboard aesthetic\n",
    "   - Color coding: GREEN for gains, RED for losses\n",
    "   - Clean table or card-based layout\n",
    "   - Responsive design\n",
    "   - Modern typography\n",
    "   - Use shadows and borders for visual separation.\n",
    " \n",
    "4. **SAVE HTML FILE (still no text response yet!)**:\n",
    "   - Use write_file to save as 'stock_market_dashboard.html'\n",
    "   - Wait for confirmation that write succeeded\n",
    "   \n",
    "5. **NOW you can respond with text** - provide a summary with:\n",
    "   - Confirmation that the HTML file was created\n",
    "   - Number of stocks analyzed\n",
    "   - Top 3 gainers with % changes\n",
    "   - Optionally, Top 3 losers with % changes\n",
    "   - Overall market sentiment\n",
    "\n",
    "Make it look like a professional Bloomberg/Yahoo Finance dashboard!\"\"\"\n",
    "    }],\n",
    "    tools=all_tools,\n",
    "    max_turns=30\n",
    ")\n",
    "\n",
    "print(\"\\n\" + \"=\" * 60)\n",
    "print(\"✓ STOCK MARKET DASHBOARD COMPLETE!\")\n",
    "print(\"=\" * 60)\n",
    "print(f\"\\n{response.choices[0].message.content}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Verify File Was Created"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "✅ File created successfully!\n",
      "   - Filename: stock_market_dashboard.html\n",
      "   - Size: 4,231 bytes\n",
      "   - Location: /Users/rohit/fleet/leclerc/aisuite-prs/aisuite-main/aisuite/examples/agents/stock_market_dashboard.html\n"
     ]
    }
   ],
   "source": [
    "filename = \"stock_market_dashboard.html\"\n",
    "\n",
    "if os.path.exists(filename):\n",
    "    file_size = os.path.getsize(filename)\n",
    "    print(f\"✅ File created successfully!\")\n",
    "    print(f\"   - Filename: {filename}\")\n",
    "    print(f\"   - Size: {file_size:,} bytes\")\n",
    "    print(f\"   - Location: {os.path.abspath(filename)}\")\n",
    "else:\n",
    "    print(f\"❌ ERROR: File was not created!\")\n",
    "    print(f\"   Expected: {filename}\")\n",
    "    print(f\"\\n   The agent may have stopped before writing the file.\")\n",
    "    print(f\"   Try re-running with a higher max_turns value.\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## View the Generated Dashboard"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "        <iframe\n",
       "            width=\"900\"\n",
       "            height=\"800\"\n",
       "            src=\"stock_market_dashboard.html\"\n",
       "            frameborder=\"0\"\n",
       "            allowfullscreen\n",
       "            \n",
       "        ></iframe>\n",
       "        "
      ],
      "text/plain": [
       "<IPython.lib.display.IFrame at 0x116915550>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "💡 Tip: Open 'stock_market_dashboard.html' in your browser for full-screen viewing!\n"
     ]
    }
   ],
   "source": [
    "from IPython.display import IFrame, display\n",
    "\n",
    "if os.path.exists(filename):\n",
    "    display(IFrame(src=filename, width=900, height=800))\n",
    "    print(f\"\\n💡 Tip: Open '{filename}' in your browser for full-screen viewing!\")\n",
    "else:\n",
    "    print(f\"⚠️  File not found: {filename}\")\n",
    "    print(\"The dashboard was not created. Check the error above.\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Optional: View Tool Execution History\n",
    "\n",
    "See what sources the agent consulted and when it wrote the file:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(\"Tool Execution History:\\n\")\n",
    "print(\"=\" * 60)\n",
    "\n",
    "\n",
    "def _field(obj, key, default=None):\n",
    "    \"\"\"Read `key` from either a dict or an attribute-style object.\"\"\"\n",
    "    if isinstance(obj, dict):\n",
    "        return obj.get(key, default)\n",
    "    return getattr(obj, key, default)\n",
    "\n",
    "\n",
    "fetch_count = 0\n",
    "write_count = 0\n",
    "\n",
    "# intermediate_messages mixes attribute-style assistant messages with\n",
    "# plain-dict entries, so every field is read through _field() instead of\n",
    "# `msg.role`, which raises AttributeError on the dict entries.\n",
    "for i, msg in enumerate(response.choices[0].intermediate_messages, 1):\n",
    "    if _field(msg, \"role\") != \"assistant\":\n",
    "        continue\n",
    "    for tool_call in _field(msg, \"tool_calls\") or []:\n",
    "        function = _field(tool_call, \"function\")\n",
    "        tool_name = _field(function, \"name\")\n",
    "        if tool_name not in (\"fetch\", \"write_file\"):\n",
    "            continue\n",
    "        try:\n",
    "            args = json.loads(_field(function, \"arguments\") or \"{}\")\n",
    "        except json.JSONDecodeError:\n",
    "            # Malformed arguments should not abort the whole report.\n",
    "            args = {}\n",
    "        if tool_name == \"fetch\":\n",
    "            fetch_count += 1\n",
    "            url = args.get(\"url\", \"N/A\")\n",
    "            print(f\"\\n[{i}] 🌐 Fetched: {url[:80]}...\")\n",
    "        else:\n",
    "            write_count += 1\n",
    "            path = args.get(\"path\", \"N/A\")\n",
    "            # NOTE(review): the filesystem server's write_file appears to take\n",
    "            # the text as \"content\"; \"contents\" is kept as a fallback - confirm.\n",
    "            text = args.get(\"content\", args.get(\"contents\", \"\"))\n",
    "            # Encode so the figure is a byte count, matching the label.\n",
    "            content_size = len(text.encode(\"utf-8\"))\n",
    "            print(f\"\\n[{i}] 💾 WROTE FILE: {path} ({content_size:,} bytes)\")\n",
    "\n",
    "print(f\"\\n{'=' * 60}\")\n",
    "print(f\"Total web fetches: {fetch_count}\")\n",
    "print(f\"Total file writes: {write_count}\")\n",
    "\n",
    "if write_count == 0:\n",
    "    print(\"\\n⚠️  WARNING: No file writes detected!\")\n",
    "    print(\"   The agent did not call write_file.\")\n",
    "elif write_count == 1:\n",
    "    print(\"\\n✅ Perfect! File was written exactly once.\")\n",
    "else:\n",
    "    print(f\"\\n⚠️  NOTE: File was written {write_count} times (may have been overwritten)\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Market Refresh\n",
    "\n",
    "Markets change throughout the day! Re-run the notebook to get fresh data."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(f\"Dashboard generated at: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}\")\n",
    "print(\"\\n💡 Tip: Re-run the 'Generate Market Movers Dashboard' cell for updated data!\")\n",
    "print(\"\\n⚠️  Disclaimer: This is for informational purposes only.\")\n",
    "print(\"   This is not financial advice. Always do your own research.\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Cleanup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Close MCP connections\n",
    "fetch_mcp.close()\n",
    "filesystem_mcp.close()\n",
    "\n",
    "print(\"✓ MCP servers closed\")\n",
    "if os.path.exists(filename):\n",
    "    print(f\"✓ Your dashboard is saved as: {filename}\")\n",
    "print(\"\\n📊 Happy trading! (Remember: not financial advice!)\")"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.13.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}


================================================
FILE: examples/agents/world_weather_dashboard.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# World Weather Dashboard - AI-Generated with Tailwind CSS\n",
    "\n",
    "This notebook demonstrates an AI agent that fetches live weather data and creates a beautiful dashboard.\n",
    "\n",
    "**What it does**:\n",
    "1. Fetches current weather for major world cities from wttr.in\n",
    "2. Creates a responsive Tailwind CSS dashboard\n",
    "3. Displays weather cards with temperature, conditions, and more\n",
    "\n",
    "**Requirements**:\n",
    "- `OPENAI_API_KEY` or `ANTHROPIC_API_KEY` in your `.env` file\n",
    "- MCP servers: `pip install mcp-server-fetch` and `npm install -g @modelcontextprotocol/server-filesystem`"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Setup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "from datetime import datetime\n",
    "from dotenv import load_dotenv\n",
    "import aisuite as ai\n",
    "from aisuite.mcp import MCPClient\n",
    "\n",
    "load_dotenv()\n",
    "\n",
    "# Initialize MCP servers\n",
    "fetch_mcp = MCPClient(command=\"uvx\", args=[\"mcp-server-fetch\"])\n",
    "filesystem_mcp = MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-filesystem\", os.getcwd()]\n",
    ")\n",
    "\n",
    "print(\"✓ Ready!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Craft Instructions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Cities to fetch weather for\n",
    "capitals = [\n",
    "    \"London\", \"Paris\", \"Tokyo\", \"New York\", \"Sydney\", \"São Paulo\"\n",
    "]\n",
    "\n",
    "prompt = f\"\"\"Create a world weather dashboard for these capitals: {', '.join(capitals)}.\n",
    "\n",
    "**EXECUTION RULES:**\n",
    "- Execute ALL tools silently (no intermediate text responses)\n",
    "- Write the HTML file FIRST, then provide a brief summary\n",
    "\n",
    "**TASK:**\n",
    "1. **Fetch Weather Data**\n",
    "   - Use wttr.in for each city: `https://wttr.in/CityName?format=j1`\n",
    "   - This returns JSON with current conditions\n",
    "   - Extract: temperature (°C), weather description, humidity, wind speed\n",
    "   - Note: wttr.in explicitly allows automated access\n",
    "\n",
    "2. **Create Single page HTML Dashboard with Tailwind CSS**   \n",
    "   Each weather card should have:\n",
    "   - City name (bold, large)\n",
    "   - Weather emoji (☀️ sunny, 🌧️ rain, ☁️ cloudy, etc.)\n",
    "   - Temperature in large font\n",
    "   - Weather description\n",
    "   - Humidity and wind as smaller details\n",
    "   - Background color based on temperature:\n",
    "     * Cold (<10°C): blue tones\n",
    "     * Mild (10-25°C): green/teal tones  \n",
    "     * Warm (25-35°C): orange/yellow tones\n",
    "     * Hot (>35°C): red tones\n",
    "\n",
    "3. **Styling Requirements**\n",
    "   - Use Tailwind CSS classes\n",
    "   - Rounded cards with shadows\n",
    "   - Responsive grid (2 cols mobile, 3 tablet, 5 desktop)\n",
    "   - Clean, modern design\n",
    "   - White text on colored backgrounds\n",
    "   - Smooth gradients\n",
    "\n",
    "4. **Save File**\n",
    "   - Use write_file to save as 'weather_dashboard.html'\n",
    "\n",
    "5. **Respond with summary**\n",
    "   - ONLY after file is written\n",
    "   - List hottest and coldest cities\n",
    "   - Any interesting weather patterns\n",
    "\"\"\"\n",
    "\n",
    "print(\"✓ Agent instructions defined\")\n",
    "print(f\"✓ Will fetch weather for {len(capitals)} cities\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Run Agent"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "client = ai.Client()\n",
    "tools = fetch_mcp.get_callable_tools() + filesystem_mcp.get_callable_tools()\n",
    "\n",
    "# Choose your model (uncomment one):\n",
    "model = \"openai:gpt-5.1\"\n",
    "# model = \"anthropic:claude-sonnet-4-5\"\n",
    "\n",
    "print(\"Fetching weather for world capitals...\\n\")\n",
    "print(\"(This may take a minute or more)\\n\")\n",
    "\n",
    "response = client.chat.completions.create(\n",
    "    model=model,\n",
    "    messages=[{\"role\": \"user\", \"content\": prompt}],\n",
    "    tools=tools,\n",
    "    max_turns=20\n",
    ")\n",
    "\n",
    "print(\"✓ WEATHER DASHBOARD CREATED!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## View the Dashboard"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from IPython.display import IFrame, display\n",
    "\n",
    "if os.path.exists('weather_dashboard.html'):\n",
    "    display(IFrame(src='weather_dashboard.html', width=950, height=700))\n",
    "    print(\"\\n💡 Open 'weather_dashboard.html' in your browser for full view\")\n",
    "else:\n",
    "    print(\"⚠️ Dashboard not created\")\n",
    "print(f\"\\n{response.choices[0].message.content}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Cleanup"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fetch_mcp.close()\n",
    "filesystem_mcp.close()\n",
    "print(\"✓ Done!\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "---\n",
    "\n",
    "## That's It!\n",
    "\n",
    "You just built an AI agent that:\n",
    "- ✅ Fetched live weather data for a few world capitals\n",
    "- ✅ Created a beautiful Tailwind CSS dashboard\n",
    "- ✅ Color-coded temperatures for visual impact\n",
    "\n",
    "**Try it yourself:**\n",
    "- Add more cities to the `capitals` list\n",
    "- Request a dark mode version\n",
    "- Add 3-day forecast for each city\n",
    "- Include weather icons instead of emojis\n",
    "- Add a world map visualization\n",
    "\n",
    "**About wttr.in:**\n",
    "- Free weather service designed for terminal/API access\n",
    "- No API key required\n",
    "- Supports JSON format with `?format=j1`\n",
    "- More info: https://github.com/chubin/wttr.in\n",
    "\n",
    "**Learn more**: Check out other notebooks in `examples/agents/`"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.13.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}


================================================
FILE: examples/aisuite_tool_abstraction.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import sys\n",
    "from dotenv import load_dotenv, find_dotenv\n",
    "import os\n",
    "\n",
    "sys.path.append('../../aisuite')\n",
    "# Load from .env file if available\n",
    "load_dotenv(find_dotenv())\n",
    "os.environ['ALLOW_MULTI_TURN'] = 'true'"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Define the functions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Mock tool functions.\n",
    "def get_current_temperature(location: str, unit: str):\n",
    "    \"\"\"This is a short description of what the function does.\n",
    "\n",
    "    This is a longer description that can span\n",
    "    multiple lines and provide more details.\n",
    "\n",
    "    Args:\n",
    "        param1: Description of param1\n",
    "        param2: Description of param2\n",
    "    \"\"\"\n",
    "    return \"70\"\n",
    "\n",
    "def is_it_raining(location: str):\n",
    "    # Simulate fetching rain probability\n",
    "    return \"yes\""
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Call the model with tools"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "from aisuite import Client\n",
    "\n",
    "client = Client()\n",
    "messages = [{\n",
    "    \"role\": \"user\",\n",
    "    \"content\": \"Can you plan a picnic for today afternoon in San Francisco? Check the temperature and if its raining.\"}]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "--------- response from LLM ---------\n",
      "ChatCompletion(id='chatcmpl-AvuR3w6M83nWHL9sIO23pgvD0E5PF', choices=[Choice(finish_reason='tool_calls', index=0, logprobs=None, message=ChatCompletionMessage(content=None, refusal=None, role='assistant', audio=None, function_call=None, tool_calls=[ChatCompletionMessageToolCall(id='call_PVhrHTUQ2qY7FDyPkCT54phU', function=Function(arguments='{\\n\"location\": \"San Francisco\",\\n\"unit\": \"Fahrenheit\"\\n}', name='get_current_temperature'), type='function')]))], created=1738364997, model='gpt-4-0613', object='chat.completion', service_tier='default', system_fingerprint=None, usage=CompletionUsage(completion_tokens=24, prompt_tokens=110, total_tokens=134, completion_tokens_details=CompletionTokensDetails(accepted_prediction_tokens=0, audio_tokens=0, reasoning_tokens=0, rejected_prediction_tokens=0), prompt_tokens_details=PromptTokensDetails(audio_tokens=0, cached_tokens=0)))\n",
      "Executing tool:  get_current_temperature\n",
      "--------- tool_message to send to LLM ---------\n",
      "[{'role': 'tool', 'name': 'get_current_temperature', 'content': '\"70\"', 'tool_call_id': 'call_PVhrHTUQ2qY7FDyPkCT54phU'}]\n",
      "--------- response from LLM ---------\n",
      "ChatCompletion(id='chatcmpl-AvuR4hpiCgXFxRMNLg1Scv1UD2JlR', choices=[Choice(finish_reason='tool_calls', index=0, logprobs=None, message=ChatCompletionMessage(content=None, refusal=None, role='assistant', audio=None, function_call=None, tool_calls=[ChatCompletionMessageToolCall(id='call_Fvy3JUhIbVqzV0Nb0QfSnWQC', function=Function(arguments='{\\n\"location\": \"San Francisco\"\\n}', name='is_it_raining'), type='function')]))], created=1738364998, model='gpt-4-0613', object='chat.completion', service_tier='default', system_fingerprint=None, usage=CompletionUsage(completion_tokens=18, prompt_tokens=145, total_tokens=163, completion_tokens_details=CompletionTokensDetails(accepted_prediction_tokens=0, audio_tokens=0, reasoning_tokens=0, rejected_prediction_tokens=0), prompt_tokens_details=PromptTokensDetails(audio_tokens=0, cached_tokens=0)))\n",
      "Executing tool:  is_it_raining\n",
      "--------- tool_message to send to LLM ---------\n",
      "[{'role': 'tool', 'name': 'is_it_raining', 'content': '\"yes\"', 'tool_call_id': 'call_Fvy3JUhIbVqzV0Nb0QfSnWQC'}]\n",
      "--------- response from LLM ---------\n",
      "ChatCompletion(id='chatcmpl-AvuR7puWSJLEpCNIZLLkF40gYJp3c', choices=[Choice(finish_reason='stop', index=0, logprobs=None, message=ChatCompletionMessage(content=\"I'm sorry, it seems like it will be raining this afternoon in San Francisco. You might want to plan your picnic for another day. Also the temperature is forecasted to be around 70 degrees Fahrenheit.\", refusal=None, role='assistant', audio=None, function_call=None, tool_calls=None))], created=1738365001, model='gpt-4-0613', object='chat.completion', service_tier='default', system_fingerprint=None, usage=CompletionUsage(completion_tokens=44, prompt_tokens=175, total_tokens=219, completion_tokens_details=CompletionTokensDetails(accepted_prediction_tokens=0, audio_tokens=0, reasoning_tokens=0, rejected_prediction_tokens=0), prompt_tokens_details=PromptTokensDetails(audio_tokens=0, cached_tokens=0)))\n",
      "I'm sorry, it seems like it will be raining this afternoon in San Francisco. You might want to plan your picnic for another day. Also the temperature is forecasted to be around 70 degrees Fahrenheit.\n"
     ]
    }
   ],
   "source": [
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4\", messages=messages, tools=[get_current_temperature, is_it_raining], max_turns=4)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "response = client.chat.completions.create(\n",
    "    model=\"anthropic:claude-3-5-sonnet-20241022\", messages=messages, tools=[get_current_temperature, is_it_raining], max_turns=4)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(response)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[ChatCompletionMessage(content=None, refusal=None, role='assistant', audio=None, function_call=None, tool_calls=[ChatCompletionMessageToolCall(id='call_PVhrHTUQ2qY7FDyPkCT54phU', function=Function(arguments='{\\n\"location\": \"San Francisco\",\\n\"unit\": \"Fahrenheit\"\\n}', name='get_current_temperature'), type='function')]),\n",
      " {'content': '\"70\"',\n",
      "  'name': 'get_current_temperature',\n",
      "  'role': 'tool',\n",
      "  'tool_call_id': 'call_PVhrHTUQ2qY7FDyPkCT54phU'},\n",
      " ChatCompletionMessage(content=None, refusal=None, role='assistant', audio=None, function_call=None, tool_calls=[ChatCompletionMessageToolCall(id='call_Fvy3JUhIbVqzV0Nb0QfSnWQC', function=Function(arguments='{\\n\"location\": \"San Francisco\"\\n}', name='is_it_raining'), type='function')]),\n",
      " {'content': '\"yes\"',\n",
      "  'name': 'is_it_raining',\n",
      "  'role': 'tool',\n",
      "  'tool_call_id': 'call_Fvy3JUhIbVqzV0Nb0QfSnWQC'},\n",
      " ChatCompletionMessage(content=\"I'm sorry, it seems like it will be raining this afternoon in San Francisco. You might want to plan your picnic for another day. Also the temperature is forecasted to be around 70 degrees Fahrenheit.\", refusal=None, role='assistant', audio=None, function_call=None, tool_calls=None)]\n"
     ]
    }
   ],
   "source": [
    "from pprint import pprint \n",
    "pprint(response.choices[0].intermediate_messages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from aisuite import Tools\n",
    "tools = Tools(tools=[get_current_temperature, is_it_raining])\n",
    "tools.tools()\n",
    "# tools.add_description(\"is_it_raining\", \"Use this function to understand if it is going to rain or not\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "messages.extend(response.choices[0].intermediate_messages)\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}


================================================
FILE: examples/asr_example.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "5a7a0ca2",
   "metadata": {},
   "source": [
    "# ASR Example - Basic Transcription Interface\n",
    "\n",
    "Automatic Speech Recognition (ASR) with aisuite's unified API supporting OpenAI, Deepgram, and Google providers.\n",
    "\n",
    "This example demonstrates basic transcription using the OpenAI format with different providers."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d72f8c18",
   "metadata": {},
   "outputs": [],
   "source": [
    "import aisuite as ai\n",
    "from aisuite.framework.message import TranscriptionResult\n",
    "from dotenv import load_dotenv, find_dotenv\n",
    "import os\n",
    "\n",
    "load_dotenv(find_dotenv())\n",
    "\n",
    "\n",
    "# Set up client with provider configurations\n",
    "client = ai.Client({\n",
    "    \"openai\": {\"api_key\": os.getenv(\"OPENAI_API_KEY\")},\n",
    "    \"deepgram\": {\"api_key\": os.getenv(\"DEEPGRAM_API_KEY\")},\n",
    "    \"google\": {\n",
    "        \"project_id\": os.getenv(\"GOOGLE_PROJECT_ID\"),\n",
    "        \"region\": os.getenv(\"GOOGLE_REGION\"),\n",
    "        \"application_credentials\": os.getenv(\"GOOGLE_APPLICATION_CREDENTIALS\"),\n",
    "    },\n",
    "})\n",
    "\n",
    "audio_file = \"../aiplayground/speech.mp3\"  # Replace with your audio file path"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8ed7f8de",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Basic transcription using kwargs (OpenAI format)\n",
    "print(\"=== Basic Transcription ===\")\n",
    "\n",
    "try:\n",
    "    result = client.audio.transcriptions.create(\n",
    "        model=\"openai:whisper-1\",\n",
    "        file=audio_file,\n",
    "        language=\"en\"\n",
    "    )\n",
    "    if isinstance(result, TranscriptionResult):\n",
    "        print(f\"OpenAI: {result.text}\")\n",
    "    else:\n",
    "        print(\"OpenAI: Got streaming result (not expected for basic call)\")\n",
    "except Exception as e:\n",
    "    print(f\"OpenAI error: {e}\")\n",
    "\n",
    "print(\"--------------------------------\")\n",
    "\n",
    "try:\n",
    "    # Same kwargs work with other providers (auto-mapped)\n",
    "    result = client.audio.transcriptions.create(\n",
    "        model=\"deepgram:nova-2\",\n",
    "        file=audio_file,\n",
    "        language=\"en\",\n",
    "        punctuate=True\n",
    "    )\n",
    "    if isinstance(result, TranscriptionResult):\n",
    "        print(f\"Deepgram: {result.text}\")\n",
    "    else:\n",
    "        print(\"Deepgram: Got streaming result (not expected for basic call)\")\n",
    "except Exception as e:\n",
    "    print(f\"Deepgram error: {e}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "32ed3f0f",
   "metadata": {},
   "source": [
    "## Summary\n",
    "\n",
    "This notebook demonstrates the unified ASR interface with:\n",
    "\n",
    "1. **Basic transcription**: Using OpenAI-format kwargs that work across providers\n",
    "2. **Provider compatibility**: Same interface works with OpenAI, Deepgram, and Google\n",
    "\n",
    "### Environment Setup Required:\n",
    "\n",
    "- **OpenAI**: `OPENAI_API_KEY`\n",
    "- **Deepgram**: `DEEPGRAM_API_KEY`  \n",
    "- **Google**: `GOOGLE_PROJECT_ID`, `GOOGLE_REGION`, `GOOGLE_APPLICATION_CREDENTIALS`\n",
    "\n",
    "### Key Benefits:\n",
    "\n",
    "- Write once, run on any provider\n",
    "- Consistent error handling and response format\n",
    "- Easy provider switching for testing and optimization"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.0"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}


================================================
FILE: examples/chat-ui/.streamlit/config.toml
================================================
[theme]
primaryColor = "#1E90FF"  # Blue color for primary components
backgroundColor = "#0e1117"  # Background color
secondaryBackgroundColor = "#262730"  # Secondary background color
textColor = "#ffffff"  # Text color
font = "sans serif"


================================================
FILE: examples/chat-ui/README.md
================================================
# Chat UI

This is a simple chat UI built using Streamlit. It uses the `aisuite` library to power the chat.

You will need to install streamlit to run this example.

```bash
pip install streamlit
```

You will also need a `config.yaml` file in the same directory as `chat.py`; an example config file is provided. Set environment variables for the API keys and any other configuration required by the LLMs you want to use. Place a `.env` file in this directory, since `chat.py` will look for it.

In config.yaml, you can specify the LLMs you want to use in the chat. The chat UI will then display all these LLMs and you can select the one you want to use.

To run the app, simply run the following command in your terminal:

```bash
streamlit run chat.py
```

To compare two LLMs side by side, tick the "Comparison Mode" checkbox and then select the two LLMs you want to compare.
Here are some sample queries you can try:

```
User: "What is the weather in Tokyo?"
```

```
User: "Write a poem about the weather in Tokyo."
```

```
User: "Write a python program to print the fibonacci sequence."
Assistant: "-- Content from LLM 1 --"
User: "Write test cases for this program."
```


================================================
FILE: examples/chat-ui/chat.py
================================================
import os
import requests
import streamlit as st
import sys
import yaml
from dotenv import load_dotenv, find_dotenv

sys.path.append("../../../aisuite")
from aisuite.client import Client

# Page-level setup. This is the first Streamlit call made by the script.
# Configure Streamlit to use wide mode and hide the top streamlit menu
st.set_page_config(layout="wide", menu_items={})
# Add heading with padding
# (the title is raw HTML - centered, white text - hence unsafe_allow_html=True)
st.markdown(
    "<div style='padding-top: 1rem;'><h2 style='text-align: center; color: #ffffff;'>Chat & Compare LLM responses</h2></div>",
    unsafe_allow_html=True,
)
# Inject global CSS: a 14px default font size and a red focus ring for the
# selector targeting the "Reset Chat" button.
st.markdown(
    """
    <style>
        /* Apply default font size globally */
        html, body, [class*="css"] {
            font-size: 14px !important;
        }
        
        /* Style for Reset button focus */
        button[data-testid="stButton"][aria-label="Reset Chat"]:focus {
            border-color: red !important;
            box-shadow: 0 0 0 2px red !important;
        }
    </style>
    """,
    unsafe_allow_html=True,
)
# Inject layout CSS: hide the default menu/header/footer, strip the top
# padding, and define the .chat-container, .chat-message and #text_area_1 rules.
st.markdown(
    """
    <style>
        /* Hide Streamlit's default top bar */
        #MainMenu {visibility: hidden;}
        header {visibility: hidden;}
        footer {visibility: hidden;}
        
        /* Remove top padding/margin */
        .block-container {
            padding-top: 0rem;
            padding-bottom: 0rem;
            margin-top: 0rem;
        }

        /* Remove padding from the app container */
        .appview-container {
            padding-top: 0rem;
        }
        
        /* Custom CSS for scrollable chat container */
        .chat-container {
            height: 650px;
            overflow-y: auto !important;
            background-color: #1E1E1E;
            border: 1px solid #333;
            border-radius: 10px;
            padding: 20px;
            margin: 10px 0;
        }
        
        /* Ensure the container takes full width */
        .stMarkdown {
            width: 100%;
        }
        
        /* Style for chat messages to ensure they're visible */
        .chat-message {
            margin: 10px 0;
            padding: 10px;
        }
        
        #text_area_1 {
            min-height: 20px !important;
        } 
    </style>
    """,
    unsafe_allow_html=True,
)

# Load configuration and initialize aisuite client.
# config.yaml is resolved relative to the current working directory and is
# read as UTF-8 explicitly, so non-ASCII model display names do not depend on
# the platform's default text encoding.
with open("config.yaml", "r", encoding="utf-8") as file:
    config = yaml.safe_load(file)
# List of LLM entries; each entry is read via its "name", "provider" and
# "model" keys elsewhere in this script.
configured_llms = config["llms"]
# Load variables from the .env file located by find_dotenv() before the
# client is created.
load_dotenv(find_dotenv())
client = Client()


# Function to display chat history
def display_chat_history(chat_history, model_name):
    """Render every message of a conversation as a Streamlit chat bubble.

    Args:
        chat_history: Iterable of message dicts, each with "role" and
            "content" keys.
        model_name: Name of the model the conversation belongs to. Kept for
            interface compatibility; it is not rendered.
    """
    for message in chat_history:
        # Any message that is not from the user is shown as an assistant message.
        is_user = message["role"] == "user"
        role = "user" if is_user else "assistant"
        avatar = "👤" if is_user else "🤖"
        with st.chat_message(role, avatar=avatar):
            st.write(message["content"])


# Helper function to query each LLM
def query_llm(model_config, chat_history):
    """Send a conversation to one configured LLM and return the reply text.

    Args:
        model_config: Mapping with "name", "provider" and "model" keys.
        chat_history: Message list passed as `messages` to the client.

    Returns:
        The content of the first choice's message, or the fixed string
        "Error with LLM response." when the call raises; in that case the
        error is also shown in the UI via `st.error`.
    """
    display_name = model_config["name"]
    print(f"Querying {display_name} with {chat_history}")
    try:
        # aisuite model identifiers take the form "<provider>:<model>".
        model_id = ":".join((model_config["provider"], model_config["model"]))
        completion = client.chat.completions.create(
            model=model_id, messages=chat_history
        )
        reply = completion.choices[0].message.content
        print(f"Response from {display_name}: {reply}")
        return reply
    except Exception as e:
        # Best-effort boundary: surface the failure in the page and keep the app running.
        st.error(f"Error querying {display_name}: {e}")
        return "Error with LLM response."


# Initialize session states: only keys that are missing are set, so values
# already stored in the session are left untouched.
for _state_key, _initial_value in (
    ("chat_history_1", []),
    ("chat_history_2", []),
    ("is_processing", False),
    ("use_comparison_mode", False),
):
    if _state_key not in st.session_state:
        st.session_state[_state_key] = _initial_value

# Top Section - Controls
col1, col2 = st.columns([1, 2])
with col1:
    st.session_state.use_comparison_mode = st.checkbox("Comparison Mode", value=True)

# LLM selection sits below the comparison-mode checkbox, one selector per column.
# Both selectors offer the same display names, so build the list once.
llm_names = [llm["name"] for llm in configured_llms]
llm_col1, llm_col2 = st.columns(2)
with llm_col1:
    selected_model_1 = st.selectbox(
        "Choose LLM Model 1",
        llm_names,
        key="model_1",
        index=0,
    )
with llm_col2:
    # The second selector exists only in comparison mode; `selected_model_2`
    # is therefore only defined (and only read) when that mode is enabled.
    if st.session_state.use_comparison_mode:
        selected_model_2 = st.selectbox(
            "Choose LLM Model 2",
            llm_names,
            key="model_2",
            # Default to the second entry when more than one LLM is configured.
            index=1 if len(llm_names) > 1 else 0,
        )

# Middle Section - the stored conversations are rendered before the input widgets.
if not st.session_state.use_comparison_mode:
    # Single-model mode: one pane with height 500.
    with st.container(height=500):
        display_chat_history(st.session_state.chat_history_1, selected_model_1)
else:
    # Comparison mode: two side-by-side panes, one per selected model.
    col1, col2 = st.columns(2)
    with col1:
        with st.container(height=500):
            display_chat_history(st.session_state.chat_history_1, selected_model_1)
    with col2:
        with st.container(height=500):
            display_chat_history(st.session_state.chat_history_2, selected_model_2)

# Bottom Section - User Input
# A 20px-high empty div acts as a spacer above the input row.
st.markdown("<div style='height: 20px;'></div>", unsafe_allow_html=True)

# Input row: a wide column for the query box and two narrow columns that hold
# the "Send Query" and "Reset Chat" buttons further down the script.
col1, col2, col3 = st.columns([6, 1, 1])
with col1:
    # The label is collapsed, so only the placeholder is shown to the user.
    user_query = st.text_area(
        label="Enter your query",
        label_visibility="collapsed",
        placeholder="Enter your query...",
        key="query_input",
        height=70,
    )


# CSS for aligning buttons with the bottom of the text area
st.markdown(
    """
    <style>
        /* Adjust the container of the buttons to align at the bottom */
        .stButton > button {
            margin-top: 35px !important; /* Adjust the margin to align */
        }

        /* Align buttons and "Processing..." text to the bottom of the text area */
        .button-container {
            margin-top: 42px !important;
            text-align: center; /* Center-aligns "Processing..." */
        }
    </style>
    """,
    unsafe_allow_html=True,
)

with col2:
    # While a request is being processed, a status label replaces the Send
    # button and `send_button` is forced to False.
    if not st.session_state.is_processing:
        send_button = st.button("Send Query", use_container_width=True)
    else:
        send_button = False
        st.markdown(
            "<div class='button-container'>Processing... ⏳</div>",
            unsafe_allow_html=True,
        )

with col3:
    reset_clicked = st.button("Reset Chat", use_container_width=True)
    if reset_clicked:
        # Drop both conversations, then rerun so the panes render empty.
        st.session_state.chat_history_1 = []
        st.session_state.chat_history_2 = []
        st.rerun()

# Phase 1 - "Send Query" was clicked with a non-empty query: flag the request
# as in progress, record the user's message, and rerun so the page shows the
# message and the "Processing..." label before the LLM is queried.
if send_button and user_query and not st.session_state.is_processing:
    # Set processing state
    st.session_state.is_processing = True

    # Append user's message to chat histories first
    st.session_state.chat_history_1.append({"role": "user", "content": user_query})
    if st.session_state.use_comparison_mode:
        st.session_state.chat_history_2.append({"role": "user", "content": user_query})

    st.rerun()

# Phase 2 - the rerun triggered above: query the selected LLM(s).
# The user's message is already stored in the chat histories, so this step
# does not need `user_query`. Gating on it could leave `is_processing` stuck
# at True (with the Send button hidden) if the text area is empty on this run.
if st.session_state.is_processing:
    try:
        # Query the selected LLM(s)
        model_config_1 = next(
            llm for llm in configured_llms if llm["name"] == selected_model_1
        )
        response_1 = query_llm(model_config_1, st.session_state.chat_history_1)
        st.session_state.chat_history_1.append(
            {"role": "assistant", "content": response_1}
        )

        if st.session_state.use_comparison_mode:
            model_config_2 = next(
                llm for llm in configured_llms if llm["name"] == selected_model_2
            )
            response_2 = query_llm(model_config_2, st.session_state.chat_history_2)
            st.session_state.chat_history_2.append(
                {"role": "assistant", "content": response_2}
            )
    finally:
        # Reset processing state even if an unexpected error escapes, so the
        # UI cannot stay locked in the "Processing..." state.
        st.session_state.is_processing = False
    st.rerun()


================================================
FILE: examples/chat-ui/config.yaml
================================================
# config.yaml
llms:
  - name: "OpenAI GPT-4o"
    provider: "openai"
    model: "gpt-4o"
  - name: "Anthropic Claude 3.5 Sonnet"
    provider: "anthropic"
    model: "claude-3-5-sonnet-20240620"
  - name: "Azure/OpenAI GPT-4o"
    provider: "azure"
    model: "gpt-4o"
  - name: "Huggingface/Mistral 7B"
    provider: "huggingface"
    model: "mistralai/Mistral-7B-Instruct"


================================================
FILE: examples/client.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "d34f8c48-90fc-4981-8d2b-b47724c2a6dd",
   "metadata": {
    "vscode": {
     "languageId": "raw"
    }
   },
   "source": [
    "# Client Examples\n",
    "\n",
    "Client provides a uniform interface for interacting with LLMs from various providers. It adapts the official Python libraries from providers such as Mistral, OpenAI, Groq, Anthropic, AWS, etc. to conform to the OpenAI chat completion interface. In some cases, it calls the providers' REST endpoints directly.\n",
    "\n",
    "Below are some examples of how to use Client to interact with different LLMs."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "initial_id",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-07-04T15:30:02.064319Z",
     "start_time": "2024-07-04T15:30:02.051986Z"
    }
   },
   "outputs": [],
   "source": [
    "import sys\n",
    "from dotenv import load_dotenv, find_dotenv\n",
    "\n",
    "sys.path.append('../../aisuite')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f75736ee",
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "def configure_environment(additional_env_vars=None):\n",
    "    \"\"\"\n",
    "    Load environment variables from .env file and apply any additional variables.\n",
    "    :param additional_env_vars: A dictionary of additional environment variables to apply.\n",
    "    \"\"\"\n",
    "    # Load from .env file if available\n",
    "    load_dotenv(find_dotenv())\n",
    "\n",
    "    # Apply additional environment variables\n",
    "    if additional_env_vars:\n",
    "        for key, value in additional_env_vars.items():\n",
    "            os.environ[key] = value\n",
    "\n",
    "# Define additional API keys and credentials\n",
    "additional_keys = {\n",
    "    'GROQ_API_KEY': 'xxx',\n",
    "    'AWS_ACCESS_KEY_ID': 'xxx',\n",
    "    'AWS_SECRET_ACCESS_KEY': 'xxx',\n",
    "    'ANTHROPIC_API_KEY': 'xxx',\n",
    "    'NEBIUS_API_KEY': 'xxx',\n",
    "}\n",
    "\n",
    "# Configure environment\n",
    "configure_environment(additional_env_vars=additional_keys)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4de3a24f",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-07-04T15:31:12.914321Z",
     "start_time": "2024-07-04T15:31:12.796445Z"
    }
   },
   "outputs": [],
   "source": [
    "import aisuite as ai\n",
    "\n",
    "client = ai.Client()\n",
    "messages = [\n",
    "    {\"role\": \"system\", \"content\": \"Respond in Pirate English. Always try to include the phrase - No rum No fun.\"},\n",
    "    {\"role\": \"user\", \"content\": \"Tell me a joke about Captain Jack Sparrow\"},\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "520a6879",
   "metadata": {},
   "outputs": [],
   "source": [
    "# print(os.environ[\"ANTHROPIC_API_KEY\"])\n",
    "anthropic_claude_3_opus = \"anthropic:claude-3-5-sonnet-20240620\"\n",
    "response = client.chat.completions.create(model=anthropic_claude_3_opus, messages=messages)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9893c7e4-799a-42c9-84de-f9e643044462",
   "metadata": {},
   "outputs": [],
   "source": [
    "aws_bedrock_llama3_8b = \"aws:meta.llama3-1-8b-instruct-v1:0\"\n",
    "response = client.chat.completions.create(model=aws_bedrock_llama3_8b, messages=messages)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7e46c20a",
   "metadata": {},
   "outputs": [],
   "source": [
    "# IMP NOTE: Azure expects model endpoint to be passed in the format of \"azure:<model_name>\".\n",
    "# The model name is the deployment name in Project/Deployments.\n",
    "# In the example below, the model is \"mistral-large-2407\", but the name given to the\n",
    "# deployment is \"aisuite-mistral-large-2407\" under the deployments section in Azure.\n",
    "client.configure({\"azure\" : {\n",
    "  \"api_key\": os.environ[\"AZURE_API_KEY\"],\n",
    "  \"base_url\": \"https://aisuite-mistral-large-2407.westus3.models.ai.azure.com/v1/\",\n",
    "}});\n",
    "azure_model = \"azure:aisuite-mistral-large-2407\"\n",
    "response = client.chat.completions.create(model=azure_model, messages=messages)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f996b121",
   "metadata": {},
   "outputs": [],
   "source": [
    "# HuggingFace expects the model to be passed in the format of \"huggingface:<model_name>\".\n",
    "# The model name is the full name of the model in HuggingFace.\n",
    "# In the example below, the model is \"mistralai/Mistral-7B-Instruct-v0.3\".\n",
    "# The model is deployed as serverless inference endpoint in HuggingFace.\n",
    "hf_model = \"huggingface:mistralai/Mistral-7B-Instruct-v0.3\"\n",
    "response = client.chat.completions.create(model=hf_model, messages=messages)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c9b2aad6-8603-4227-9566-778f714eb0b5",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# Groq expects the model to be passed in the format of \"groq:<model_name>\".\n",
    "# The model name is the full name of the model in Groq.\n",
    "# In the example below, the model is \"llama3-8b-8192\".\n",
    "groq_llama3_8b = \"groq:llama3-8b-8192\"\n",
    "# groq_llama3_70b = \"groq:llama3-70b-8192\"\n",
    "response = client.chat.completions.create(model=groq_llama3_8b, messages=messages)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6819ac17",
   "metadata": {},
   "outputs": [],
   "source": [
    "ollama_tinyllama = \"ollama:tinyllama\"\n",
    "ollama_phi3mini = \"ollama:phi3:mini\"\n",
    "response = client.chat.completions.create(model=ollama_phi3mini, messages=messages, temperature=0.75)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4a94961b2bddedbb",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2024-07-04T15:31:39.472675Z",
     "start_time": "2024-07-04T15:31:38.283368Z"
    }
   },
   "outputs": [],
   "source": [
    "mistral_7b = \"mistral:open-mistral-7b\"\n",
    "response = client.chat.completions.create(model=mistral_7b, messages=messages, temperature=0.2)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "611210a4dc92845f",
   "metadata": {},
   "outputs": [],
   "source": [
    "openai_gpt35 = \"openai:gpt-3.5-turbo\"\n",
    "response = client.chat.completions.create(model=openai_gpt35, messages=messages, temperature=0.75)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f38d033a-a580-4239-9176-27f3d53e7fe1",
   "metadata": {},
   "outputs": [],
   "source": [
    "nebius_model = \"nebius:Qwen/Qwen2.5-1.5B-Instruct\"\n",
    "response = client.chat.completions.create(model=nebius_model, messages=messages, top_p=0.01)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "321783ae",
   "metadata": {},
   "outputs": [],
   "source": [
    "fireworks_model = \"fireworks:accounts/fireworks/models/llama-v3p2-3b-instruct\"\n",
    "response = client.chat.completions.create(model=fireworks_model, messages=messages, temperature=0.75, presence_penalty=0.5, frequency_penalty=0.5)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e30e5ae0",
   "metadata": {},
   "outputs": [],
   "source": [
    "togetherai_model = \"together:meta-llama/Llama-3.2-3B-Instruct-Turbo\"\n",
    "response = client.chat.completions.create(model=togetherai_model, messages=messages, temperature=0.75, top_p=0.7, top_k=50)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "dcf63a11",
   "metadata": {},
   "outputs": [],
   "source": [
    "gemini_15_flash = \"google:gemini-1.5-flash\"\n",
    "response = client.chat.completions.create(model=gemini_15_flash, messages=messages, temperature=0.75)\n",
    "print(response.choices[0].message.content)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}

================================================
FILE: examples/llm_reasoning.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "d39a806c-02a3-4a2d-8c51-f1ab1ea79d2e",
   "metadata": {},
   "source": [
    "# LLM Reasoning\n",
    "\n",
    "This notebook compares how LLMs from different Generative AI providers perform on three examples that can show issues with LLM reasoning:\n",
    "\n",
    "* [The Reversal Curse](https://github.com/lukasberglund/reversal_curse) shows that LLMs trained on \"A is B\" fail to learn \"B is A\".\n",
    "* [How many r's in the word strawberry?](https://x.com/karpathy/status/1816637781659254908) shows \"the weirdness of LLM Tokenization\".  \n",
    "* [Which number is bigger, 9.11 or 9.9?](https://x.com/DrJimFan/status/1816521330298356181) shows that \"LLMs are alien beasts.\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d2e413bd-983c-42a0-9580-96fedc7b1275",
   "metadata": {},
   "outputs": [],
   "source": [
    "!cat ../.env.sample"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "8d843e36-7de6-4726-8a39-c5dcd3c7cc11",
   "metadata": {},
   "source": [
    "Make sure your ~/.env file (copied from the .env.sample file above) has the API keys of the LLM providers to compare set before running the cell below:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3c966895-1a63-4922-80b7-5a20e47f29de",
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "sys.path.append('../../aisuite')\n",
    "\n",
    "from dotenv import load_dotenv, find_dotenv\n",
    "\n",
    "load_dotenv(find_dotenv())"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "09d5c5be-1085-4252-9d5e-80b50961484b",
   "metadata": {},
   "source": [
    "## Specify LLMs to Compare"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "26c3d5ef-b1c9-48dd-9b89-30799fd4b698",
   "metadata": {},
   "outputs": [],
   "source": [
    "import aisuite as ai\n",
    "\n",
    "client = ai.Client()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "886a904f-fef0-4f25-b3ed-41085bf0f2dd",
   "metadata": {},
   "outputs": [],
   "source": [
    "import time\n",
    "\n",
    "llms = [\n",
    "        \"anthropic:claude-3-5-sonnet-20240620\",\n",
    "        \"aws:meta.llama3-1-8b-instruct-v1:0\",\n",
    "        \"groq:llama3-8b-8192\",\n",
    "        \"groq:llama3-70b-8192\",\n",
    "        \"huggingface:mistralai/Mistral-7B-Instruct-v0.3\",\n",
    "        \"openai:gpt-3.5-turbo\",\n",
    "       ]\n",
    "\n",
    "def compare_llm(messages):\n",
    "    execution_times = []\n",
    "    responses = []\n",
    "    for llm in llms:\n",
    "        start_time = time.time()\n",
    "        response = client.chat.completions.create(model=llm, messages=messages)\n",
    "        end_time = time.time()\n",
    "        execution_time = end_time - start_time\n",
    "        responses.append(response.choices[0].message.content.strip())\n",
    "        execution_times.append(execution_time)\n",
    "        print(f\"{llm} - {execution_time:.2f} seconds: {response.choices[0].message.content.strip()}\")\n",
    "    return responses, execution_times"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "3c3e8aa2-4ff4-485b-93d9-4a6f22d62e67",
   "metadata": {},
   "source": [
    "## The Reversal Curse"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f3c4a8ef-e23b-4d4a-8561-3e5a2a866bd1",
   "metadata": {},
   "outputs": [],
   "source": [
    "messages = [\n",
    "    {\"role\": \"user\", \"content\": \"Who is Tom Cruise's mother?\"},\n",
    "]\n",
    "\n",
    "responses, execution_times = compare_llm(messages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "769f7f42-2adb-4903-ab17-3143a5d950ce",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "\n",
    "def display(llms, execution_times, responses):\n",
    "    data = {\n",
    "        'Provider:Model Name': llms,\n",
    "        'Execution Time': execution_times,\n",
    "        'Model Response ': responses\n",
    "    }\n",
    "    \n",
    "    df = pd.DataFrame(data)\n",
    "    df.index = df.index + 1\n",
    "    styled_df = df.style.set_table_styles(\n",
    "        [{'selector': 'th', 'props': [('text-align', 'center')]}, \n",
    "         {'selector': 'td', 'props': [('text-align', 'center')]}]\n",
    "    ).set_properties(**{'text-align': 'center'})\n",
    "    \n",
    "    return styled_df "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d2359ad5-9f0b-4bd6-9838-54df91de0fb3",
   "metadata": {},
   "outputs": [],
   "source": [
    "display(llms, execution_times, responses)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "399f6cca-7f34-4a91-aab0-070560640033",
   "metadata": {},
   "outputs": [],
   "source": [
    "messages = [\n",
    "    {\"role\": \"user\", \"content\": \"Who is Mary Lee Pfeiffer's son?\"},\n",
    "]\n",
    "\n",
    "responses, execution_times = compare_llm(messages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "eee7704d-a187-41bc-b119-c94461d0ee74",
   "metadata": {},
   "outputs": [],
   "source": [
    "display(llms, execution_times, responses)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "ada8e0fb-17f0-4781-bf6a-c23ac86922ad",
   "metadata": {},
   "source": [
    "## How many r's in the word strawberry?"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e537871e-68b6-44c3-886a-d3ebe7a692c1",
   "metadata": {},
   "outputs": [],
   "source": [
    "messages = [\n",
    "    {\"role\": \"user\", \"content\": \"How many r's in the word strawberry?\"},\n",
    "]\n",
    "\n",
    "responses, execution_times = compare_llm(messages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5678e393-4967-49f1-9e0f-251471dc92b7",
   "metadata": {},
   "outputs": [],
   "source": [
    "display(llms, execution_times, responses)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "cae3fb5f-a173-4a33-b843-65df6d1086f9",
   "metadata": {},
   "source": [
    "## Which number is bigger?"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "efdf2fd6-f63a-4f9b-af15-1df25590e4fc",
   "metadata": {},
   "outputs": [],
   "source": [
    "messages = [\n",
    "    {\"role\": \"user\", \"content\": \"Which number is bigger, 9.11 or 9.9?\"},\n",
    "]\n",
    "\n",
    "responses, execution_times = compare_llm(messages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "eaa14ed1-c83b-4c8f-bb14-d318bf0c9a60",
   "metadata": {},
   "outputs": [],
   "source": [
    "display(llms, execution_times, responses)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "198b213a-b7bf-4cce-8c30-a8408454370b",
   "metadata": {},
   "outputs": [],
   "source": [
    "messages = [\n",
    "    {\"role\": \"user\", \"content\": \"Which number is bigger, 9.11 or 9.9? Think step by step.\"},\n",
    "]\n",
    "\n",
    "responses, execution_times = compare_llm(messages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4a3fb8fc-a7a2-47d3-9db2-792f03cc47c2",
   "metadata": {},
   "outputs": [],
   "source": [
    "display(llms, execution_times, responses)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "66987d26-4245-4de1-816f-fa57475101f3",
   "metadata": {},
   "source": [
    "## Takeaways\n",
    "1. Not all LLMs are created equal - not even all Llama 3 (or 3.1) are created equal (by different providers).\n",
    "2. Ask LLM to think step by step may help improve its reasoning.\n",
    "3. The way tokenization works in LLM could lead to a lot of weirdness in LLM (see AK's awesome [video](https://www.youtube.com/watch?v=zduSFxRajkE) for a deep dive).\n",
    "4. A more comprehensive benchmark would be desired, but a quick LLM comparison like shown here can be the first step."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "04e13c90-3680-4f1d-8f65-768a78b7adb2",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}


================================================
FILE: examples/mcp_config_dict_example.py
================================================
"""
MCP Tools with Config Dict Format - Example

This example demonstrates using MCP tools with the simplified config dict format.
Instead of explicitly creating MCPClient objects, you can pass MCP server configs
directly to the tools parameter.
"""

import os
from dotenv import load_dotenv
import aisuite as ai

# Read variables from a .env file (python-dotenv) before any client is built.
load_dotenv()

# This module-level client is shared by the examples further down the script.
client = ai.Client()

print("=" * 70, "Example 1: Basic Config Dict Usage", "=" * 70, sep="\n")

# The MCP server is described by a plain dict and handed straight to `tools`;
# no MCPClient object is constructed in this example.
filesystem_server = {
    "type": "mcp",
    "name": "filesystem",
    "command": "npx",
    "args": ["-y", "@modelcontextprotocol/server-filesystem", os.getcwd()],
}
list_files_prompt = {
    "role": "user",
    "content": "List all Python files in the current directory",
}

response = client.chat.completions.create(
    model="openai:gpt-4o",
    messages=[list_files_prompt],
    tools=[filesystem_server],
    max_turns=2,
)

answer = response.choices[0].message.content
print(answer)

print(
    "\n" + "=" * 70,
    "Example 2: Filtering Tools with allowed_tools",
    "=" * 70,
    sep="\n",
)

# "allowed_tools" restricts which of the server's tools are exposed; only
# read_file is listed here (security: allow reading, not writing).
read_only_filesystem = {
    "type": "mcp",
    "name": "filesystem",
    "command": "npx",
    "args": ["-y", "@modelcontextprotocol/server-filesystem", os.getcwd()],
    "allowed_tools": ["read_file"],
}

response = client.chat.completions.create(
    model="openai:gpt-4o",
    messages=[{"role": "user", "content": "Read the README.md file"}],
    tools=[read_only_filesystem],
    max_turns=2,
)

answer = response.choices[0].message.content
print(answer)

print("\n" + "=" * 70)
print("Example 3: Multiple MCP Servers with Tool Prefixing")
print("=" * 70)

import shutil
import tempfile

# Scratch directory served by the second filesystem server below.
temp_dir = tempfile.mkdtemp()

try:
    # Connect to two different filesystem servers with prefixing.
    # This avoids tool name collisions between the two servers.
    response = client.chat.completions.create(
        model="anthropic:claude-3-5-sonnet-20240620",
        messages=[
            {
                "role": "user",
                "content": "How many files are in the current directory vs the temp directory?",
            }
        ],
        tools=[
            {
                "type": "mcp",
                "name": "current_dir",
                "command": "npx",
                "args": ["-y", "@modelcontextprotocol/server-filesystem", os.getcwd()],
                "use_tool_prefix": True,  # Tools named "current_dir__list_directory", etc.
            },
            {
                "type": "mcp",
                "name": "temp_dir",
                "command": "npx",
                "args": ["-y", "@modelcontextprotocol/server-filesystem", temp_dir],
                "use_tool_prefix": True,  # Tools named "temp_dir__list_directory", etc.
            },
        ],
        max_turns=3,
    )

    print(response.choices[0].message.content)
finally:
    # mkdtemp() leaves deletion to the caller, so remove the directory here
    # even if the request fails. Best effort: cleanup errors are ignored so
    # they cannot mask an exception raised by the example itself.
    shutil.rmtree(temp_dir, ignore_errors=True)

# Section banner: blank line, rule, title, rule.
print(
    "\n" + "=" * 70,
    "Example 4: Mixing MCP Configs with Python Functions",
    "=" * 70,
    sep="\n",
)

from datetime import datetime


def get_current_time() -> str:
    """Get the current date and time."""
    # NOTE(review): the docstring is kept verbatim because this function is
    # passed as a tool below and its docstring may be read at runtime as the
    # tool description - confirm against aisuite's tool handling.
    now = datetime.now()
    # Local, naive timestamp rendered as "YYYY-MM-DD HH:MM:SS".
    return f"{now:%Y-%m-%d %H:%M:%S}"


def calculate_stats(numbers: list) -> dict:
    """Calculate basic statistics for a list of numbers.

    Args:
        numbers: List of numbers to analyze
    """
    # NOTE(review): docstring kept verbatim; it may be parsed at runtime when
    # this function is registered as a tool - confirm before rewording.
    count = len(numbers)
    total = sum(numbers)

    # An empty input reports an average of 0 rather than dividing by zero.
    if numbers:
        average = total / count
    else:
        average = 0

    return {"count": count, "sum": total, "average": average}


# One `tools` list can carry plain Python callables next to MCP config dicts.
mixed_tools = [
    get_current_time,  # Regular Python function
    calculate_stats,  # Another Python function
    {
        "type": "mcp",
        "name": "filesystem",
        "command": "npx",
        "args": ["-y", "@modelcontextprotocol/server-filesystem", os.getcwd()],
    },  # MCP config dict
]
time_and_listing_prompt = {
    "role": "user",
    "content": "What time is it? Also, list all files in the current directory.",
}

response = client.chat.completions.create(
    model="openai:gpt-4o",
    messages=[time_and_listing_prompt],
    tools=mixed_tools,
    max_turns=3,
)

answer = response.choices[0].message.content
print(answer)

print(
    "\n" + "=" * 70,
    "Example 5: When to Use Config Dict vs MCPClient",
    "=" * 70,
    sep="\n",
)

# Guidance shown to the reader before the explicit-MCPClient demo that follows.
usage_guidance = """
Use Config Dict When:
✓ Quick prototypes and simple scripts
✓ One-off tool usage
✓ Don't need to reuse MCP client across multiple requests
✓ Want automatic cleanup
✓ Less code is better

Use Explicit MCPClient When:
✓ Need to reuse the same MCP connection across multiple requests
✓ Want to inspect available tools before using them
✓ Need fine-grained control over connection lifecycle
✓ Building a long-running application
✓ Want to manually manage resources

Example of explicit MCPClient:
"""
print(usage_guidance)

from aisuite.mcp import MCPClient

# Create once, reuse many times
mcp = MCPClient(
    command="npx", args=["-y", "@modelcontextprotocol/server-filesystem", os.getcwd()]
)

try:
    # Inspect available tools. "\n" (not "\\n") so a real blank line is
    # printed instead of the two characters backslash + n.
    print(f"\nAvailable tools: {[t['name'] for t in mcp.list_tools()]}")

    # Reuse the same client across multiple requests
    for query in ["List files", "Count files", "Check if README exists"]:
        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[{"role": "user", "content": query}],
            tools=mcp.get_callable_tools(),
            max_turns=2,
        )
        # Only the first 100 characters of each answer are shown.
        print(f"\n{query}: {response.choices[0].message.content[:100]}...")
finally:
    # Always close the explicitly created client, even if a request above
    # raised; otherwise close() would be skipped.
    mcp.close()

print("\n" + "=" * 70)
print("All examples completed!")
print("=" * 70)


================================================
FILE: examples/mcp_http_example.py
================================================
"""
MCP HTTP Transport Example

This example demonstrates how to use HTTP-based MCP servers with aisuite.

Prerequisites:
- An HTTP MCP server running (e.g., http://localhost:8000)
- OpenAI API key in .env file or OPENAI_API_KEY environment variable
- pip install 'aisuite[mcp]'
- pip install python-dotenv

Note: This example assumes you have an HTTP MCP server running.
If you don't have one, this is a demonstration of the API usage.
"""

import aisuite as ai
from aisuite.mcp import MCPClient
import os
from dotenv import load_dotenv

# Load environment variables
load_dotenv()


def example_1_config_dict_format():
    """Example 1: Pass an HTTP MCP server to a chat completion as a config dict."""
    rule = "=" * 60
    print(rule)
    print("Example 1: HTTP MCP with Config Dict")
    print(rule)

    client = ai.Client()

    # The HTTP server is described by a dict; no MCPClient is built here.
    weather_server = {
        "type": "mcp",
        "name": "weather-api",
        "server_url": "http://localhost:8000/mcp/v1",  # Full endpoint URL
        "timeout": 30.0,  # Optional: request timeout in seconds
    }
    weather_prompt = {
        "role": "user",
        "content": "Use the available tools to get the current weather data.",
    }

    response = client.chat.completions.create(
        model="openai:gpt-4o",
        messages=[weather_prompt],
        tools=[weather_server],
        max_turns=3,
    )

    answer = response.choices[0].message.content
    print(answer)
    print()


def example_2_explicit_mcp_client():
    """Example 2: Using HTTP MCP server with explicit MCPClient.

    Builds an MCPClient for an HTTP endpoint, prints the tools it reports,
    runs one chat completion with those tools, and closes the client. The
    client is closed even when listing tools or the completion raises.
    """
    print("=" * 60)
    print("Example 2: HTTP MCP with Explicit MCPClient")
    print("=" * 60)

    # Create HTTP-based MCP client
    mcp = MCPClient(
        server_url="http://localhost:8000/mcp/v1",  # Full endpoint URL
        name="weather-api",
        timeout=30.0,
    )

    try:
        # List available tools
        print("Available tools:")
        for tool in mcp.list_tools():
            print(f"  - {tool['name']}: {tool['description']}")
        print()

        # Use with aisuite
        client = ai.Client()
        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[{"role": "user", "content": "What tools are available?"}],
            tools=mcp.get_callable_tools(),
            max_turns=2,
        )

        print(response.choices[0].message.content)
    finally:
        # Clean up: without the finally, an exception above would skip close().
        mcp.close()
    print()


def example_3_with_authentication():
    """Example 3: Send custom headers (a bearer token) to an HTTP MCP server."""
    rule = "=" * 60
    print(rule)
    print("Example 3: HTTP MCP with Authentication")
    print(rule)

    # Token comes from MCP_API_TOKEN; a placeholder string is used when unset.
    api_token = os.environ.get("MCP_API_TOKEN", "your-token-here")

    client = ai.Client()

    auth_headers = {
        "Authorization": f"Bearer {api_token}",
        "X-API-Version": "2024-01",
    }
    api_server = {
        "type": "mcp",
        "name": "api-server",
        "server_url": "https://api.example.com/mcp/v1",  # Full endpoint URL
        "headers": auth_headers,
        "timeout": 60.0,
    }

    response = client.chat.completions.create(
        model="openai:gpt-4o",
        messages=[{"role": "user", "content": "Fetch the user profile using the API."}],
        tools=[api_server],
        max_turns=3,
    )

    answer = response.choices[0].message.content
    print(answer)
    print()


def example_4_context_manager():
    """Example 4: Use MCPClient in a ``with`` block so no explicit close() is needed."""
    rule = "=" * 60
    print(rule)
    print("Example 4: HTTP MCP with Context Manager")
    print(rule)

    with MCPClient(
        server_url="http://localhost:8000/mcp/v1",  # Full endpoint URL
        name="api-server",
    ) as mcp:
        client = ai.Client()
        data_prompt = {"role": "user", "content": "List available data."}

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[data_prompt],
            tools=mcp.get_callable_tools(),
            max_turns=2,
        )

        answer = response.choices[0].message.content
        print(answer)
    # mcp.close() is called automatically
    print()


def example_5_mixing_http_and_python_functions():
    """Example 5: Combine a local Python function and an HTTP MCP server as tools."""
    rule = "=" * 60
    print(rule)
    print("Example 5: Mixing HTTP MCP with Python Functions")
    print(rule)

    # Local callable offered as a tool. NOTE(review): its name and docstring
    # are kept verbatim since they may be read at runtime as tool metadata -
    # confirm against aisuite's tool handling before rewording.
    def get_current_time() -> str:
        """Get the current date and time in ISO format."""
        from datetime import datetime

        now = datetime.now()
        return now.isoformat()

    client = ai.Client()

    weather_server = {
        "type": "mcp",
        "name": "weather-api",
        "server_url": "http://localhost:8000/mcp/v1",  # Full endpoint URL
    }
    time_and_weather_prompt = {
        "role": "user",
        "content": "What time is it now? Also get the weather data from the API.",
    }

    response = client.chat.completions.create(
        model="anthropic:claude-sonnet-4-5",
        messages=[time_and_weather_prompt],
        tools=[
            get_current_time,  # Regular Python function
            weather_server,  # HTTP MCP server
        ],
        max_turns=3,
    )

    answer = response.choices[0].message.content
    print(answer)
    print()


def example_6_tool_filtering():
    """Example 6: Limit an HTTP MCP server's tools with ``allowed_tools``."""
    rule = "=" * 60
    print(rule)
    print("Example 6: HTTP MCP with Tool Filtering")
    print(rule)

    client = ai.Client()

    filtered_server = {
        "type": "mcp",
        "name": "api-server",
        "server_url": "http://localhost:8000/mcp/v1",  # Full endpoint URL
        "allowed_tools": ["get_weather"],  # Only allow this specific tool
    }

    response = client.chat.completions.create(
        model="openai:gpt-4o",
        messages=[{"role": "user", "content": "Get the weather forecast."}],
        tools=[filtered_server],
        max_turns=2,
    )

    answer = response.choices[0].message.content
    print(answer)
    print()


def example_7_multiple_http_servers():
    """Example 7: query two HTTP MCP servers in one request, with prefixing.

    Both server entries set ``use_tool_prefix`` so that, per the inline notes,
    their tools are exposed under server-prefixed names. The first choice's
    message content is printed at the end.
    """
    separator = "=" * 60
    print(separator)
    print("Example 7: Multiple HTTP MCP Servers with Prefixing")
    print(separator)

    weather_server = {
        "type": "mcp",
        "name": "weather",
        "server_url": "http://localhost:8000/mcp/v1",  # Full endpoint URL
        "use_tool_prefix": True,  # Tools: weather__get_forecast, etc.
    }
    users_server = {
        "type": "mcp",
        "name": "users",
        "server_url": "http://localhost:9000/mcp/v1",  # Full endpoint URL
        "use_tool_prefix": True,  # Tools: users__get_profile, etc.
    }
    user_turn = {
        "role": "user",
        "content": "Get weather data and user data.",
    }

    client = ai.Client()
    completion = client.chat.completions.create(
        model="openai:gpt-4o",
        messages=[user_turn],
        tools=[weather_server, users_server],
        max_turns=3,
    )

    final_message = completion.choices[0].message
    print(final_message.content)
    print()


if __name__ == "__main__":
    # Script entry point. As shipped it only prints usage instructions: every
    # example call below is left commented out so nothing contacts a server
    # or a model provider until the user opts in.
    print("\nMCP HTTP Transport Examples")
    print("=" * 60)
    print()
    print("Note: These examples require an HTTP MCP server to be running.")
    print("Uncomment the examples you want to run.\n")

    # Uncomment the examples you want to run:

    # example_1_config_dict_format()
    # example_2_explicit_mcp_client()
    # example_3_with_authentication()
    # example_4_context_manager()
    # example_5_mixing_http_and_python_functions()
    # example_6_tool_filtering()
    # example_7_multiple_http_servers()

    print("\nTo run these examples:")
    print("1. Start an HTTP MCP server (e.g., on http://localhost:8000)")
    # Example 5 targets an "anthropic:" model, so an OpenAI key alone is not
    # sufficient for every example in this file.
    print("2. Set your provider API keys (OPENAI_API_KEY, ANTHROPIC_API_KEY)")
    print("3. Uncomment the example functions you want to run")
    print("4. Run: python examples/mcp_http_example.py")


================================================
FILE: examples/mcp_tools_example.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Using MCP Tools with aisuite\n",
    "\n",
    "This notebook demonstrates how to use MCP (Model Context Protocol) servers with aisuite to give AI models access to external tools and data sources.\n",
    "\n",
    "## What is MCP?\n",
    "\n",
    "MCP (Model Context Protocol) is a standardized protocol that allows AI applications to connect to external data sources and tools. MCP servers expose tools, resources, and prompts that AI models can use.\n",
    "\n",
    "## Prerequisites\n",
    "\n",
    "Install aisuite with MCP support:\n",
    "```bash\n",
    "pip install 'aisuite[mcp]'\n",
    "# Or install providers you need:\n",
    "pip install 'aisuite[openai,mcp]'\n",
    "```\n",
    "\n",
    "You'll also need to install an MCP server. For this example, we'll use the filesystem server:\n",
    "```bash\n",
    "npm install -g @modelcontextprotocol/server-filesystem\n",
    "```"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "from dotenv import load_dotenv\n",
    "import aisuite as ai\n",
    "from aisuite.mcp import MCPClient\n",
    "\n",
    "# Load environment variables (API keys)\n",
    "load_dotenv()\n",
    "\n",
    "# Verify API key is set\n",
    "if not os.getenv(\"OPENAI_API_KEY\"):\n",
    "    raise ValueError(\"Please set OPENAI_API_KEY environment variable\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Example 1: Basic MCP Tool Usage\n",
    "\n",
    "Let's connect to a filesystem MCP server and use it to read files."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Connect to the filesystem MCP server\n",
    "# This gives the AI access to files in the specified directory\n",
    "mcp_client = MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-filesystem\", os.getcwd()]\n",
    ")\n",
    "\n",
    "print(f\"Connected to MCP server: {mcp_client}\")\n",
    "print(f\"\\nAvailable tools:\")\n",
    "for tool in mcp_client.list_tools():\n",
    "    print(f\"  - {tool['name']}: {tool.get('description', 'No description')}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Create aisuite client\n",
    "client = ai.Client()\n",
    "\n",
    "# Use MCP tools with aisuite\n",
    "messages = [\n",
    "    {\"role\": \"user\", \"content\": \"Please read the README.md file and summarize what this project does.\"}\n",
    "]\n",
    "\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=messages,\n",
    "    tools=mcp_client.get_callable_tools(),  # MCP tools work like regular Python functions!\n",
    "    max_turns=3  # Allow multiple tool calls\n",
    ")\n",
    "\n",
    "print(\"\\nAI Response:\")\n",
    "print(response.choices[0].message.content)\n",
    "\n",
    "# View the tool interactions\n",
    "print(\"\\n\" + \"=\"*60)\n",
    "print(\"Tool Call History:\")\n",
    "print(\"=\"*60)\n",
    "for msg in response.choices[0].intermediate_messages:\n",
    "    if msg.role == \"assistant\" and msg.tool_calls:\n",
    "        for tool_call in msg.tool_calls:\n",
    "            print(f\"\\nTool: {tool_call.function.name}\")\n",
    "            print(f\"Arguments: {tool_call.function.arguments}\")\n",
    "    elif msg.role == \"tool\":\n",
    "        print(f\"Result: {msg.content[:200]}...\")  # First 200 chars"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Example 2: Mixing MCP Tools with Python Functions\n",
    "\n",
    "You can seamlessly mix MCP tools with regular Python functions!"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Define a custom Python function\n",
    "def get_current_time() -> str:\n",
    "    \"\"\"Get the current date and time.\"\"\"\n",
    "    from datetime import datetime\n",
    "    return datetime.now().strftime(\"%Y-%m-%d %H:%M:%S\")\n",
    "\n",
    "def calculate_word_count(text: str) -> int:\n",
    "    \"\"\"Calculate the number of words in a text.\n",
    "    \n",
    "    Args:\n",
    "        text: The text to count words in\n",
    "    \"\"\"\n",
    "    return len(text.split())\n",
    "\n",
    "# Mix MCP tools and Python functions\n",
    "all_tools = mcp_client.get_callable_tools() + [get_current_time, calculate_word_count]\n",
    "\n",
    "messages = [\n",
    "    {\n",
    "        \"role\": \"user\", \n",
    "        \"content\": \"What time is it? Also, read the README.md file and tell me how many words it contains.\"\n",
    "    }\n",
    "]\n",
    "\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=messages,\n",
    "    tools=all_tools,  # Both MCP and Python tools!\n",
    "    max_turns=5\n",
    ")\n",
    "\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Example 3: Using Specific MCP Tools\n",
    "\n",
    "You can also select specific tools instead of using all of them."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Get only specific tools\n",
    "read_file = mcp_client.get_tool(\"read_file\")\n",
    "list_directory = mcp_client.get_tool(\"list_directory\")\n",
    "\n",
    "# Use only these tools\n",
    "messages = [\n",
    "    {\"role\": \"user\", \"content\": \"List all Python files in the current directory.\"}\n",
    "]\n",
    "\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\",\n",
    "    messages=messages,\n",
    "    tools=[read_file, list_directory],  # Only specific tools\n",
    "    max_turns=2\n",
    ")\n",
    "\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Example 4: Using MCP with Different Providers\n",
    "\n",
    "MCP tools work with all aisuite providers!"
   ]
  },
  {
   "cell_type": "markdown",
   "source": "### Alternative: MCP Config Dict Format (Simplified)\n\nInstead of creating an MCPClient explicitly, you can pass MCP server configuration directly as a dict in the `tools` parameter! This is more convenient for simple use cases.\n\nThe next cell continues Example 4 and uses the explicit `mcp_client` created earlier.",
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Try with different providers\n",
    "providers = [\n",
    "    \"openai:gpt-4o\",\n",
    "    \"anthropic:claude-3-5-sonnet-20240620\",\n",
    "]\n",
    "\n",
    "messages = [\n",
    "    {\"role\": \"user\", \"content\": \"List the files in the current directory and tell me how many there are.\"}\n",
    "]\n",
    "\n",
    "for model in providers:\n",
    "    print(f\"\\n{'='*60}\")\n",
    "    print(f\"Provider: {model}\")\n",
    "    print(f\"{'='*60}\\n\")\n",
    "    \n",
    "    try:\n",
    "        response = client.chat.completions.create(\n",
    "            model=model,\n",
    "            messages=messages,\n",
    "            tools=mcp_client.get_callable_tools(),\n",
    "            max_turns=3\n",
    "        )\n",
    "        print(response.choices[0].message.content)\n",
    "    except Exception as e:\n",
    "        print(f\"Error: {e}\")\n",
    "        print(\"Make sure you have the API key set and provider installed.\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Example 5: Connecting to Multiple MCP Servers\n",
    "\n",
    "You can connect to multiple MCP servers and combine their tools."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Connect to a second MCP server (example - adjust as needed)\n",
    "# For demonstration, we'll create another filesystem server for a different directory\n",
    "\n",
    "# Create a temp directory for demonstration\n",
    "import tempfile\n",
    "temp_dir = tempfile.mkdtemp()\n",
    "\n",
    "# Second MCP client\n",
    "mcp_client_2 = MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-filesystem\", temp_dir]\n",
    ")\n",
    "\n",
    "# Combine tools from both servers\n",
    "all_mcp_tools = (\n",
    "    mcp_client.get_callable_tools() + \n",
    "    mcp_client_2.get_callable_tools()\n",
    ")\n",
    "\n",
    "print(f\"Total tools available: {len(all_mcp_tools)}\")\n",
    "\n",
    "# Note: In practice, you might want to rename tools or use namespacing\n",
    "# to avoid conflicts between servers with similar tools"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Cleanup\n",
    "\n",
    "It's good practice to close MCP connections when done. You can also use MCPClient as a context manager."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Close the MCP connections\n",
    "mcp_client.close()\n",
    "mcp_client_2.close()\n",
    "\n",
    "print(\"MCP connections closed.\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Using Context Manager (Recommended)\n",
    "\n",
    "The recommended way to use MCPClient is with a context manager:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Using context manager ensures proper cleanup\n",
    "with MCPClient(\n",
    "    command=\"npx\",\n",
    "    args=[\"-y\", \"@modelcontextprotocol/server-filesystem\", os.getcwd()]\n",
    ") as mcp:\n",
    "    response = client.chat.completions.create(\n",
    "        model=\"openai:gpt-4o\",\n",
    "        messages=[{\"role\": \"user\", \"content\": \"How many files are in the current directory?\"}],\n",
    "        tools=mcp.get_callable_tools(),\n",
    "        max_turns=2\n",
    "    )\n",
    "    print(response.choices[0].message.content)\n",
    "\n",
    "# Connection is automatically closed after the with block"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Summary\n",
    "\n",
    "Key takeaways:\n",
    "\n",
    "1. **Easy Integration**: MCP tools work seamlessly with aisuite's existing tool system\n",
    "2. **Mix and Match**: Combine MCP tools with regular Python functions\n",
    "3. **Provider Agnostic**: Works with any aisuite provider (OpenAI, Anthropic, Google, etc.)\n",
    "4. **Multiple Servers**: Connect to multiple MCP servers simultaneously\n",
    "5. **Simple API**: Just `MCPClient()` → `get_callable_tools()` → pass to `tools=[]`\n",
    "\n",
    "For more MCP servers, check out:\n",
    "- https://github.com/modelcontextprotocol/servers\n",
    "- Official MCP documentation: https://modelcontextprotocol.io/"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.0"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}

================================================
FILE: examples/simple_tool_calling.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import sys\n",
    "from dotenv import load_dotenv, find_dotenv\n",
    "import os\n",
    "\n",
    "sys.path.append('../../aisuite')\n",
    "\n",
    "# Load from .env file if available\n",
    "load_dotenv(find_dotenv())"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Make a request to model without tools"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from aisuite import Client\n",
    "\n",
    "client = Client()\n",
    "# Configuring Azure. Rest all providers use environment variables for their parameters.\n",
    "client.configure({\"azure\" : {\n",
    "  \"api_key\": os.environ[\"AZURE_API_KEY\"],\n",
    "  \"base_url\": \"https://aisuite-mistral-large-2407.westus3.models.ai.azure.com/v1/\",\n",
    "}})\n",
    "# model = \"anthropic:claude-3-5-sonnet-20241022\"\n",
    "# model = \"aws:mistral.mistral-7b-instruct-v0:2\"\n",
    "# model = \"azure:aisuite-mistral-large\"\n",
    "# model = \"cohere:command-r-plus\"\n",
    "# model = \"deepseek:deepseek-chat\"\n",
    "# model = \"fireworks:accounts/fireworks/models/llama-v3p1-405b-instruct\"\n",
    "# model = \"google:gemini-1.5-pro-002\"\n",
    "# model = \"groq:llama-3.3-70b-versatile\"\n",
    "# model = \"huggingface:meta-llama/Llama-3.1-8B-Instruct\"\n",
    "# model = \"mistral:mistral-large-latest\"\n",
    "# model = \"nebius:\"\n",
    "# model = \"ollama:\"\n",
    "# model = \"sambanova:Meta-Llama-3.3-70B-Instruct\"\n",
    "# model = \"together:meta-llama/Llama-3.3-70B-Instruct-Turbo\"\n",
    "# model = \"watsonx:\"\n",
    "model = \"xai:grok-2-latest\"\n",
    "\n",
    "messages = [{\n",
    "    \"role\": \"user\",\n",
    "    \"content\": \"What is the current temperature in San Francisco in Celsius?\"}]\n",
    "\n",
    "response = client.chat.completions.create(\n",
    "    model=model, messages=messages)\n",
    "\n",
    "print(\"For model: \" + model)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Equip model with tools"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Define the functions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Mock tool functions.\n",
    "def get_current_temperature(location: str, unit: str):\n",
    "    # Simulate fetching temperature from an API\n",
    "    return {\"temperature\": 72}\n",
    "\n",
    "def get_rain_probability(location: str):\n",
    "    # Simulate fetching rain probability\n",
    "    return {\"location\": location, \"probability\": 40}\n",
    "\n",
    "# Function to get the available tools (functions) to provide to the model\n",
    "# Note: we could use decorators or utils from OpenAI to generate this.\n",
    "def get_available_tools():\n",
    "    return [\n",
    "        {   \"type\": \"function\",\n",
    "            \"function\": {\n",
    "                \"name\": \"get_current_temperature\",\n",
    "                \"description\": \"Get the current temperature for a specific location\",\n",
    "                \"parameters\": {\n",
    "                    \"type\": \"object\",\n",
    "                    \"properties\": {\n",
    "                        \"location\": {\n",
    "                            \"type\": \"string\",\n",
    "                            \"description\": \"The city and state, e.g., San Francisco, CA\"\n",
    "                        },\n",
    "                        \"unit\": {\n",
    "                            \"type\": \"string\",\n",
    "                            \"enum\": [\"Celsius\", \"Fahrenheit\"],\n",
    "                            \"description\": \"The temperature unit to use.\"\n",
    "                        }\n",
    "                    },\n",
    "                    \"required\": [\"location\", \"unit\"]\n",
    "                }\n",
    "            }\n",
    "        },\n",
    "        {\n",
    "            \"type\": \"function\",\n",
    "            \"function\": {\n",
    "                \"name\": \"get_rain_probability\",\n",
    "                \"description\": \"Get the probability of rain for a specific location\",\n",
    "                \"parameters\": {\n",
    "                    \"type\": \"object\",\n",
    "                    \"properties\": {\n",
    "                        \"location\": {\n",
    "                            \"type\": \"string\",\n",
    "                            \"description\": \"The city and state, e.g., San Francisco, CA\"\n",
    "                        }\n",
    "                    },\n",
    "                    \"required\": [\"location\"]\n",
    "                }\n",
    "            }\n",
    "        }\n",
    "    ]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Function to process tool calls and get the result\n",
    "def handle_tool_call(tool_call):\n",
    "    function_name = tool_call.function.name\n",
    "    arguments = json.loads(tool_call.function.arguments)\n",
    "\n",
    "    # Map function names to actual tool function implementations\n",
    "    tools_map = {\n",
    "        \"get_current_temperature\": get_current_temperature,\n",
    "        \"get_rain_probability\": get_rain_probability,\n",
    "    }\n",
    "    return tools_map[function_name](**arguments)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Function to format tool response as a message\n",
    "def create_tool_response_message(tool_call, tool_result):\n",
    "    return {\n",
    "        \"role\": \"tool\",\n",
    "        \"tool_call_id\": tool_call.id,\n",
    "        \"name\": tool_call.function.name,\n",
    "        \"content\": json.dumps(tool_result)\n",
    "    }"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Call the model with tools"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import sys\n",
    "from dotenv import load_dotenv, find_dotenv\n",
    "import os\n",
    "\n",
    "sys.path.append('../../aisuite')\n",
    "\n",
    "# Load from .env file if available\n",
    "load_dotenv(find_dotenv())\n",
    "\n",
    "from aisuite import Client\n",
    "\n",
    "client = Client()\n",
    "client.configure({\"azure\" : {\n",
    "  \"api_key\": os.environ[\"AZURE_API_KEY\"],\n",
    "  \"base_url\": \"https://aisuite-mistral-large-2407.westus3.models.ai.azure.com/v1/\",\n",
    "}})\n",
    "\n",
    "# model = \"anthropic:claude-3-5-sonnet-20241022\"\n",
    "# model = \"aws:mistral.mistral-7b-instruct-v0:2\"\n",
    "# model = \"azure:aisuite-mistral-large\"\n",
    "# model = \"cohere:command-r-plus\"\n",
    "# model = \"deepseek:deepseek-chat\"\n",
    "# model = \"fireworks:accounts/fireworks/models/llama-v3p1-405b-instruct\"\n",
    "# model = \"google:gemini-1.5-pro-002\"\n",
    "# model = \"groq:llama-3.3-70b-versatile\"\n",
    "# model = \"huggingface:meta-llama/Llama-3.1-8B-Instruct\"\n",
    "# model = \"mistral:mistral-large-latest\"\n",
    "# model = \"nebius:\"\n",
    "# model = \"ollama:\"\n",
    "# model = \"sambanova:Meta-Llama-3.3-70B-Instruct\"\n",
    "# model = \"together:meta-llama/Llama-3.3-70B-Instruct-Turbo\"\n",
    "# model = \"watsonx:\"\n",
    "model = \"xai:grok-2-latest\"\n",
    "\n",
    "messages = [{\n",
    "    \"role\": \"user\",\n",
    "    \"content\": \"What is the current temperature in San Francisco in Celsius?\"}]\n",
    "\n",
    "tools = get_available_tools()\n",
    "\n",
    "# Make the initial request to OpenAI API\n",
    "response = client.chat.completions.create(\n",
    "    model=model, messages=messages, tools=tools)\n",
    "\n",
    "print(response)\n",
    "print(response.choices[0].message)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Process tool calls - Parse tool name, args, and call the function. Pass the result to the model."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "if response.choices[0].message.tool_calls:\n",
    "    for tool_call in response.choices[0].message.tool_calls:\n",
    "        tool_result = handle_tool_call(tool_call)\n",
    "        print(tool_result)\n",
    "\n",
    "        messages.append(response.choices[0].message) # Model's function call message\n",
    "        messages.append(create_tool_response_message(tool_call, tool_result))\n",
    "        # Send the tool response back to the model\n",
    "        final_response = client.chat.completions.create(\n",
    "            model=model, messages=messages, tools=tools)\n",
    "        print(final_response.choices[0].message)\n",
    "        \n",
    "        # Output the final response from the model\n",
    "        print(final_response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}


================================================
FILE: examples/tool_calling_abstraction.ipynb
================================================
{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "9efdda2f-e3ab-4ec3-9b04-3ebea6fdf4c1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import json\n",
    "import sys\n",
    "from dotenv import load_dotenv, find_dotenv\n",
    "import os\n",
    "\n",
    "sys.path.append('../../aisuite')\n",
    "\n",
    "# Load from .env file if available\n",
    "load_dotenv(find_dotenv())"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "b7604862",
   "metadata": {},
   "source": [
    "### Define the function"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "aaba7cb2-29de-4552-8fd5-8b966fbc0cd5",
   "metadata": {},
   "outputs": [],
   "source": [
    "def will_it_rain(location: str, time_of_day: str):\n",
    "    \"\"\"Check if it will rain in a location at a given time today.\n",
    "\n",
    "    Args:\n",
    "        location (str): Name of the city\n",
    "        time_of_day (str): Time of the day in HH:MM format.\n",
    "    \"\"\"\n",
    "    return \"YES\""
   ]
  },
  {
   "cell_type": "markdown",
   "id": "cf943639",
   "metadata": {},
   "source": [
    "---"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "090dc2d1",
   "metadata": {},
   "source": [
    "### Using OpenAI"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "29537ae1",
   "metadata": {},
   "source": [
    "### JSON spec for the function"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "b1a7196a-e5f2-4016-8dca-eca804ef18ac",
   "metadata": {},
   "outputs": [],
   "source": [
    "tools = [{\n",
    "    \"type\": \"function\",\n",
    "    \"function\": {\n",
    "        \"name\": \"will_it_rain\",\n",
    "        \"description\": \"Check if it will rain in a location at a given time today\",\n",
    "        \"parameters\": {\n",
    "            \"type\": \"object\",\n",
    "            \"properties\": {\n",
    "                \"location\": {\n",
    "                    \"type\": \"string\",\n",
    "                    \"description\": \"Name of the city\"\n",
    "                },\n",
    "                \"time_of_day\": {\n",
    "                    \"type\": \"string\",\n",
    "                    \"description\": \"Time of the day in HH:MM format.\"\n",
    "                }\n",
    "            },\n",
    "            \"required\": [\"location\", \"time_of_day\"]\n",
    "        }\n",
    "    }\n",
    "}]"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "5359d145",
   "metadata": {},
   "source": [
    "### Send user request to LLM"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "4b522391-5a82-4d27-bbad-9db91e531815",
   "metadata": {},
   "outputs": [],
   "source": [
    "from openai import OpenAI\n",
    "\n",
    "client = OpenAI()\n",
    "messages = [{\n",
    "    \"role\": \"user\",\n",
    "    \"content\": \"I live in San Francisco. Can you check for weather \"\n",
    "               \"and plan an outdoor picnic for me at 2pm?\"\n",
    "}]\n",
    "response = client.chat.completions.create(\n",
    "    model=\"gpt-4o\", messages=messages, tools=tools\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "fc47b536",
   "metadata": {},
   "source": [
    "### Process tool call response, Execute the tool & call the model again"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "d281fe8e-9d87-4150-be4d-f01a2525edf6",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "It looks like it will rain in San Francisco at 2 PM today. It's probably not the best day for an outdoor picnic. Would you like to consider indoor activities or reschedule the picnic for another day?\n"
     ]
    }
   ],
   "source": [
    "response2 = None\n",
    "if response.choices[0].message.tool_calls:\n",
    "    tool_call = response.choices[0].message.tool_calls[0]\n",
    "    args = json.loads(tool_call.function.arguments)\n",
    "\n",
    "    result = will_it_rain(args[\"location\"], args[\"time_of_day\"])\n",
    "    messages.append(response.choices[0].message)\n",
    "    messages.append({\n",
    "        \"role\": \"tool\", \"tool_call_id\": tool_call.id, \"content\": str(result)\n",
    "    })\n",
    "\n",
    "    response2 = client.chat.completions.create(\n",
    "        model=\"gpt-4o\", messages=messages, tools=tools)\n",
    "    print(response2.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "e81fb905",
   "metadata": {},
   "source": [
    "### Optionally, continue the conversation"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "f6de5c21-2983-4539-a4a2-cdd76071fdea",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "If you're set on having the picnic despite the rain, here are a few suggestions to make it enjoyable:\n",
      "\n",
      "1. **Location:** Consider a location with some shelter, like a gazebo in a park, or find a picnic spot with large trees for some natural cover. Alternatively, you might want to think about an indoor space with large windows where you can enjoy the view without getting wet.\n",
      "\n",
      "2. **Packing Essentials:**\n",
      "   - Bring waterproof blankets or tarps to sit on.\n",
      "   - Pack an umbrella or a rain poncho to stay dry.\n",
      "   - Use waterproof containers for your food to keep everything dry.\n",
      "   - Bring extra towels and a change of clothes.\n",
      "\n",
      "3. **Food Ideas:** Opt for warm, hearty meals that are comforting on a rainy day, such as soup in a thermos or grilled sandwiches.\n",
      "\n",
      "4. **Activities:** Plan indoor-friendly games or activities you can enjoy sheltered from the rain, like card games or board games.\n",
      "\n",
      "5. **Safety First:** Check the weather forecast regularly in case of any severe weather warnings.\n",
      "\n",
      "Enjoy your rainy-day picnic!\n"
     ]
    }
   ],
   "source": [
    "messages.append(response2.choices[0].message)\n",
    "messages.append({\n",
    "    \"role\": \"user\", \"content\": \"Schedule it despite the rain\"\n",
    "})\n",
    "response = client.chat.completions.create(\n",
    "    model=\"gpt-4o\", messages=messages)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "f6d5fd91",
   "metadata": {},
   "source": [
    "---"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "897b9aa2",
   "metadata": {},
   "source": [
    "### Using aisuite"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "8b587445",
   "metadata": {},
   "source": [
    "### Call the model with tools. Tool call is handled internally."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "0b74257b-8d53-4326-8ea1-d4a7f89c0e57",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "It is expected to rain in San Francisco at 2 PM today, so it might not be the best time for an outdoor picnic. You might want to consider indoor alternatives or plan for another day when the weather is more favorable for outdoor activities. If you have any other plans in mind or need further assistance, feel free to ask!\n"
     ]
    }
   ],
   "source": [
    "from aisuite import Client\n",
    "\n",
    "client = Client()\n",
    "messages = [{\n",
    "    \"role\": \"user\",\n",
    "    \"content\": \"I live in San Francisco. Can you check for weather \"\n",
    "               \"and plan an outdoor picnic for me at 2pm?\"\n",
    "}]\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\", messages=messages, tools=[will_it_rain], max_turns=2\n",
    ")\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "ba5f0327",
   "metadata": {},
   "source": [
    "### Optionally, continue the conversation"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "b1736dc9",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Sure! If you'd like to go ahead and plan an outdoor picnic despite the rain, here are a few tips to help you enjoy your experience:\n",
      "\n",
      "1. **Choose a Covered Location**: Try to find a spot with a shelter, like a gazebo or a pavilion, in one of San Francisco's parks. These can provide good protection from the rain.\n",
      "\n",
      "2. **Prepare for Wet Weather**:\n",
      "   - Bring waterproof blankets or tarps to sit on.\n",
      "   - Pack umbrellas and raincoats to stay dry.\n",
      "   - Use waterproof containers and bags to keep your picnic items protected.\n",
      "\n",
      "3. **Select Comforting Foods**: Warm beverages in thermoses and foods that are enjoyable when slightly cooler, such as sandwiches, can be comforting on a rainy day.\n",
      "\n",
      "4. **Stay Safe**: Be cautious of slippery surfaces and keep an eye on kids or pets if they are joining you.\n",
      "\n",
      "5. **Enjoy the Atmosphere**: Rain can create a cozy and calming environment. Embrace the natural sounds and sights of the rain.\n",
      "\n",
      "6. **Plan Indoor Activities**: Bring board games or books in case the rain becomes too heavy.\n",
      "\n",
      "Have fun, and make the most of your unique outdoor picnic experience! If you need more help with planning or have any other questions, let me know.\n"
     ]
    }
   ],
   "source": [
    "messages.extend(response.choices[0].intermediate_messages)\n",
    "messages.append({\n",
    "    \"role\": \"user\", \"content\": \"Schedule it despite the rain\"\n",
    "})\n",
    "response = client.chat.completions.create(\n",
    "    model=\"openai:gpt-4o\", messages=messages)\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "6bf09c0a",
   "metadata": {},
   "source": [
    "### Using other providers"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "6c266c68-095b-4625-8de5-70960a117f69",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "I apologize, but it looks like it will be raining in San Francisco at 2:00 PM today. This might not be the best conditions for an outdoor picnic. However, I can suggest a few alternatives:\n",
      "\n",
      "1. Reschedule: We could check the weather for a different time today or another day this week. Would you like me to check a different time or date?\n",
      "\n",
      "2. Indoor picnic: You could have an indoor picnic at home or find a covered area in a park with picnic shelters.\n",
      "\n",
      "3. Rain-ready picnic: If you're up for an adventure, you could prepare for a rainy day picnic with appropriate gear like umbrellas, waterproof blankets, and covered food containers.\n",
      "\n",
      "4. Alternative activity: We could look into indoor activities or attractions in San Francisco that you might enjoy instead.\n",
      "\n",
      "What would you prefer to do? If you'd like to try for a different time or date, please let me know, and I'll be happy to check the weather again.\n"
     ]
    }
   ],
   "source": [
    "messages = [{\n",
    "    \"role\": \"user\",\n",
    "    \"content\": \"I live in San Francisco. Can you check for weather \"\n",
    "               \"and plan an outdoor picnic for me at 2pm?\"\n",
    "}]\n",
    "response = client.chat.completions.create(\n",
    "    model=\"anthropic:claude-3-5-sonnet-20240620\", messages=messages, tools=[will_it_rain], max_turns=2\n",
    ")\n",
    "print(response.choices[0].message.content)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "25a8c5ab-3a9f-4bf1-8174-aba313a00085",
   "metadata": {},
   "outputs": [],
   "source": [
    "response = client.chat.completions.create(\n",
    "    model=\"groq:llama3-8b-8192\", messages=messages, tools=[will_it_rain], max_turns=2)"
   ]
  },
 {
   "cell_type": "code",
   "execution_count": 17,
   "id": "53e937bd",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "I can help with that! To provide accurate information, I'll need to know your tolerance for rain. Would you prefer the picnic indoors if it rains?\n"
     ]
    }
   ],
   "source": [
    "response = client.chat.completions.create(\n",
    "    model=\"ollama:llama3-groq-tool-use\", messages=messages, tools=[will_it_rain], max_turns=2)\n",
    "print(response.choices[0].message.content)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}


================================================
FILE: guides/README.md
================================================
# Provider guides 

These guides give directions for obtaining API keys from different providers. 

Here are the instructions for:
- [Anthropic](anthropic.md) 
- [AWS](aws.md)
- [Azure](azure.md) 
- [Cohere](cohere.md)
- [Google](google.md)
- [Hugging Face](huggingface.md)
- [Mistral](mistral.md)
- [OpenAI](openai.md)
- [SambaNova](sambanova.md)
- [xAI](xai.md)
- [DeepSeek](deepseek.md)

For locally hosted models using `Ollama` or `LM Studio`, follow these instructions:
- [Ollama](ollama.md)
- [LM Studio](lmstudio.md)

Unless otherwise stated, these guides have not been endorsed by the providers. 

We also welcome additional [contributions](../CONTRIBUTING.md). 


================================================
FILE: guides/anthropic.md
================================================
# Anthropic

To use Anthropic with `aisuite` you will need to [create an account](https://console.anthropic.com/login). Once logged in, go to the [API Keys](https://console.anthropic.com/settings/keys) page,
click the "Create Key" button, and export that key into your environment.


```shell
export ANTHROPIC_API_KEY="your-anthropic-api-key"
```

## Create a Chat Completion

Install the `anthropic` python client

Example with pip
```shell
pip install anthropic
```

Example with poetry
```shell
poetry add anthropic
```

In your code:
```python
import aisuite as ai
client = ai.Client()


provider = "anthropic"
model_id = "claude-3-5-sonnet-20241022"

messages = [
    {"role": "system", "content": "Respond in Pirate English."},
    {"role": "user", "content": "Tell me a joke."},
]

response = client.chat.completions.create(
    model=f"{provider}:{model_id}",
    messages=messages,
)

print(response.choices[0].message.content)
```

Happy coding! If you would like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/aws.md
================================================
# AWS

To use AWS Bedrock with `aisuite` you will need to create an AWS account and
navigate to https://console.aws.amazon.com/bedrock/home. This route
will be redirected to your default region. In this example the region has been set to
`us-west-2`. Anywhere the region is specified can be replaced with your desired region.

Navigate to the [overview](https://us-west-2.console.aws.amazon.com/bedrock/home?region=us-west-2#/overview) page
directly or by clicking on the `Get started` link.

## Foundation Model Access

You will first need to give your AWS account access to the foundation models by
visiting the [modelaccess](https://us-west-2.console.aws.amazon.com/bedrock/home?region=us-west-2#/modelaccess)
page to enable the models you would like to use. 

After enabling the foundation models, navigate to [providers page](https://us-west-2.console.aws.amazon.com/bedrock/home?region=us-west-2#/providers) 
and select the provider of the model you would like to use. From this page select the specific model you would like to use and 
make note of the `Model ID` (currently located near the bottom); it will be used in the chat completion example below.

Once that has been enabled, set your Access Key and Secret in the env variables:

```shell
export AWS_ACCESS_KEY="your-access-key"
export AWS_SECRET_KEY="your-secret-key"
export AWS_REGION="region-name" 
```
*Note: `AWS_REGION` is optional; a default of `us-west-2` has been set for ease of use.*

## Create a Chat Completion

Install the boto3 client using your package installer

Example with pip
```shell
pip install boto3
```

Example with poetry
```shell
poetry add boto3
```

In your code:
```python
import aisuite as ai
client = ai.Client()


provider = "aws"
model_id = "meta.llama3-1-405b-instruct-v1:0" # Model ID from above

messages = [
    {"role": "system", "content": "Respond in Pirate English."},
    {"role": "user", "content": "Tell me a joke."},
]

response = client.chat.completions.create(
    model=f"{provider}:{model_id}",
    messages=messages,
)

print(response.choices[0].message.content)
```

Happy coding! If you would like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/azure.md
================================================
# Azure AI

To use Azure AI with the `aisuite` library, you'll need to set up an Azure account and configure your environment for Azure AI services.

## Create an Azure Account and deploy a model from AI Studio

1. Visit [Azure Portal](https://portal.azure.com/) and sign up for an account if you don't have one.
2. Create a project and resource group.
3. Choose a model from https://ai.azure.com/explore/models and deploy it. You can choose serverless deployment option.
4. Give the deployment a name. Let's say you choose to deploy Mistral-large-2407. You could leave the deployment name as "mistral-large-2407" or give it a custom name.
5. You can see the deployment from project/deployment option. Note the Target URI from the Endpoint panel. It should look something like this - "https://aisuite-Mistral-large-2407.westus3.models.ai.azure.com".
6. Also note that it provides a chat completion URL. It should look like this - https://aisuite-Mistral-large-2407.westus3.models.ai.azure.com/v1/chat/completions


## Obtain Necessary Details & set environment variables.

After creating your deployment, you'll need to gather the following information:

1. API Key: Found in the "Keys and Endpoint" section of your Azure OpenAI resource.
2. Base URL: This can be obtained from your deployment details. It will look something like this - `https://aisuite-Mistral-large-2407.westus3.models.ai.azure.com/v1/`
3. API Version: An optional setting, introduced mainly for Azure OpenAI services. When specified, the `api-version` query parameter is appended to the API request.


Set the following environment variables:

```shell
export AZURE_API_KEY="your-api-key"
export AZURE_BASE_URL="https://deployment-name.region-name.models.ai.azure.com/v1"
export AZURE_API_VERSION="2024-08-01-preview"
```

## Create a Chat Completion

With your account set up and environment configured, you can send a chat completion request:

```python
import os

import aisuite as ai

# Either set the environment variables or pass the parameters below.
# Setting the params in ai.Client() will override the values from environment vars.
client = ai.Client(
    base_url=os.environ["AZURE_BASE_URL"],
    api_key=os.environ["AZURE_API_KEY"],
    api_version=os.environ["AZURE_API_VERSION"]
)

model = "azure:aisuite-Mistral-large-2407"  # Replace with your deployment name.
# The model name must match the deployment name in the base-url.

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "What's the weather like today?"},
]

response = client.chat.completions.create(
    model=model,
    messages=messages,
)

print(response.choices[0].message.content)
```

Happy coding! If you would like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).

================================================
FILE: guides/cerebras.md
================================================
# Cerebras AI Suite Provider Guide

## About Cerebras

At Cerebras, we've developed the world's largest and fastest AI processor, the Wafer-Scale Engine-3 (WSE-3). The Cerebras CS-3 system, powered by the WSE-3, represents a new class of AI supercomputer that sets the standard for generative AI training and inference with unparalleled performance and scalability.

With Cerebras as your inference provider, you can:
- Achieve unprecedented speed for AI inference workloads
- Build commercially with high throughput
- Effortlessly scale your AI workloads with our seamless clustering technology

Our CS-3 systems can be quickly and easily clustered to create the largest AI supercomputers in the world, making it simple to place and run the largest models. Leading corporations, research institutions, and governments are already using Cerebras solutions to develop proprietary models and train popular open-source models.

Want to experience the power of Cerebras? Check out our [website](https://cerebras.net) for more resources and explore options for accessing our technology through the Cerebras Cloud or on-premise deployments!

> [!NOTE]  
> This SDK has a mechanism that sends a few requests to `/v1/tcp_warming` upon construction to reduce the TTFT. If this behaviour is not desired, set `warm_tcp_connection=False` in the constructor.
>
> If you are repeatedly reconstructing the SDK instance it will lead to poor performance. It is recommended that you construct the SDK once and reuse the instance if possible.

## Documentation

For the most comprehensive and up-to-date Cerebras Inference docs, please visit [inference-docs.cerebras.ai](https://inference-docs.cerebras.ai).

## Usage
Get an API Key from [cloud.cerebras.ai](https://cloud.cerebras.ai/) and add it to your environment variables:

```shell
export CEREBRAS_API_KEY="your-cerebras-api-key"
```

Use the python client.

```python
import aisuite as ai
client = ai.Client()

messages = [
    {"role": "system", "content": "Respond in Pirate English."},
    {"role": "user", "content": "Tell me a joke."},
]

response = client.chat.completions.create(
    model="cerebras:llama3.1-8b",
    messages=messages,
    temperature=0.75
)
print(response.choices[0].message.content)

```

## Requirements

Python 3.8 or higher.


================================================
FILE: guides/cohere.md
================================================
# Cohere

To use Cohere with `aisuite`, you’ll need a [Cohere account](https://cohere.com/). After logging in, go to the [API Keys](https://dashboard.cohere.com/api-keys) section in your account settings, agree to the terms of service, connect your card, and generate a new key. Once you have your key, add it to your environment as follows:

```shell
export CO_API_KEY="your-cohere-api-key"
```

## Create a Chat Completion

Install the `cohere` Python client:

Example with pip:
```shell
pip install cohere
```

Example with poetry:
```shell
poetry add cohere
```

In your code:
```python
import aisuite as ai

client = ai.Client()

provider = "cohere"
model_id = "command-r-plus-08-2024"

messages = [
    {"role": "user", "content": "Hi, how are you?"}
]

response = client.chat.completions.create(
    model=f"{provider}:{model_id}",
    messages=messages,
)

print(response.choices[0].message.content)
```

Happy coding! If you’d like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/deepseek.md
================================================
# DeepSeek

To use DeepSeek with `aisuite`, you’ll need a [DeepSeek account](https://platform.deepseek.com). After logging in, go to the [API Keys](https://platform.deepseek.com/api_keys) section in your account settings and generate a new key. Once you have your key, add it to your environment as follows:

```shell
export DEEPSEEK_API_KEY="your-deepseek-api-key"
```

## Create a Chat Completion

(Note: DeepSeek uses an API format compatible with OpenAI's, so we install the `openai` client; there is no dedicated DeepSeek library, at least for now.)

Install the `openai` Python client:

Example with pip:
```shell
pip install openai
```

Example with poetry:
```shell
poetry add openai
```

In your code:
```python
import aisuite as ai
client = ai.Client()

provider = "deepseek"
model_id = "deepseek-chat"

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "What’s the weather like in San Francisco?"},
]

response = client.chat.completions.create(
    model=f"{provider}:{model_id}",
    messages=messages,
)

print(response.choices[0].message.content)
```

Happy coding! If you’d like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/google.md
================================================
# Google (Vertex) AI

To use Google (Vertex) AI with the `aisuite` library, you'll first need to create a Google Cloud account and set up your environment to work with Google Cloud.

## Create a Google Cloud Account and Project

Google Cloud provides in-depth [documentation](https://cloud.google.com/vertex-ai/docs/start/cloud-environment) on getting started with their platform, but here are the basic steps:

### Create your account.

Visit [Google Cloud](https://cloud.google.com/free) and follow the instructions for registering a new account. If you already have an account with Google Cloud, sign in and skip to the next step.

### Create a new project and enable billing.

Once you have an account, you can create a new project. Visit the [project selector page](https://console.cloud.google.com/projectselector2/home/dashboard) and click the "New Project" button. Give your project a name and click "Create Project." Your project will be created and you will be redirected to the project dashboard.

Now that you have a project, you'll need to enable billing. Visit the [how-to page](https://cloud.google.com/billing/docs/how-to/verify-billing-enabled#confirm_billing_is_enabled_on_a_project) for billing enablement instructions.

### Set your project ID in an environment variable.

Set the `GOOGLE_PROJECT_ID` environment variable to the ID of your project. You can find the Project ID by visiting the project dashboard in the "Project Info" section toward the top of the page.

### Set your preferred region in an environment variable.

Set the `GOOGLE_REGION` environment variable. You can find the region by going to Project Dashboard under VertexAI side navigation menu, and then scrolling to the bottom of the page.

## Create a Service Account For API Access

Because `aisuite` needs to authenticate with Google Cloud to access the Vertex AI API, you'll need to create a service account and set the `GOOGLE_APPLICATION_CREDENTIALS` environment variable to the path of a JSON file containing the service account's credentials, which you can download from the Google Cloud Console.

This is documented [here](https://cloud.google.com/docs/authentication/provide-credentials-adc#how-to), and the basic steps are as follows:

1. Visit the [service accounts page](https://console.cloud.google.com/iam-admin/serviceaccounts) in the Google Cloud Console.
2. Click the "+ Create Service Account" button toward the top of the page.
3. Follow the steps for naming your service account and granting access to the project.
4. Click "Done" to create the service account.
5. Now, click the "Keys" tab towards the top of the page.
6. Click the "Add Key" menu, then select "Create New Key."
7. Choose "JSON" as the key type, and click "Create."
8. Move this file to a location on your file system like your home directory.
9. Set the `GOOGLE_APPLICATION_CREDENTIALS` environment variable to the path of the JSON file.

## Double check your environment is configured correctly.

At this point, you should have three environment variables set to ensure your environment is set up correctly:

- `GOOGLE_PROJECT_ID`
- `GOOGLE_REGION`
- `GOOGLE_APPLICATION_CREDENTIALS`

Once these are set, you are ready to write some code and send a chat completion request.

## Create a chat completion.

With your account and service account set up, you can send a chat completion request.

Export the environment variables:

```shell
export GOOGLE_PROJECT_ID="your-project-id"
export GOOGLE_REGION="your-region"
export GOOGLE_APPLICATION_CREDENTIALS="path/to/your/service-account-file.json"
```

Install the Vertex AI SDK:

```shell
pip install vertexai
```

In your code:

```python
import aisuite as ai
client = ai.Client()

model="google:gemini-1.5-pro-001"

messages = [
    {"role": "system", "content": "Respond in Pirate English."},
    {"role": "user", "content": "Tell me a joke."},
]

response = client.chat.completions.create(
    model=model,
    messages=messages,
)

print(response.choices[0].message.content)
```

Happy coding! If you would like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/groq.md
================================================
# Groq

To use Groq with `aisuite`, you’ll need a free [Groq account](https://console.groq.com/). After logging in, go to the [API Keys](https://console.groq.com/keys) section in your account settings and generate a new Groq API key. Once you have your key, add it to your environment as follows:

```shell
export GROQ_API_KEY="your-groq-api-key"
```

## Create a Python Chat Completion

1. First, install the `groq` Python client library:

```shell
pip install groq
```

2. Now you can create your first chat completion with the following example code, or customize it by swapping out the `model_id` for any of the other available [models powered by Groq](https://console.groq.com/docs/models) and the `messages` array for whatever you'd like:
```python
import aisuite as ai
client = ai.Client()

provider = "groq"
model_id = "llama-3.2-3b-preview"

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "What’s the weather like in San Francisco?"},
]

response = client.chat.completions.create(
    model=f"{provider}:{model_id}",
    messages=messages,
)

print(response.choices[0].message.content)
```


Happy coding! If you’d like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/huggingface.md
================================================
# Hugging Face AI

To use Hugging Face with the `aisuite` library, you'll need to set up a Hugging Face account, obtain the necessary API credentials, and configure your environment for Hugging Face's API.

## Create a Hugging Face Account and Deploy a Model

1. Visit [Hugging Face](https://huggingface.co/) and sign up for an account if you don't already have one.
2. Explore conversational models on the [Hugging Face Model Hub](https://huggingface.co/models?inference=warm&other=conversational&sort=trending) and select a model you want to use. Popular models include conversational AI models like `gpt2`, `gpt3`, and `mistral`.
3. Deploy or host your chosen model if needed; Hugging Face provides various hosting options, including free, individual, and organizational hosting. Using Serverless Inference API is a fast way to get started.
4. Once the model is deployed (or if using a public model directly), note the model's unique identifier (e.g., `mistralai/Mistral-7B-Instruct-v0.3`), which you'll use for making requests.

## Obtain Necessary Details & Set Environment Variables

After setting up your model, you'll need to gather the following information:

- **API Token**: You can generate an API token in your [Hugging Face account settings](https://huggingface.co/settings/tokens).

Set the following environment variables to make authentication and requests easy:

```shell
export HF_TOKEN="your-api-token"
```

## Create a Chat Completion

With your account set up and environment variables configured, you can send a chat completion request as follows:

```python
import os
import aisuite as ai

# Either set the environment variables or define the parameters below.
# Setting the parameters in ai.Client() will override the environment variable values.
client = ai.Client()

model = "huggingface:your-model-name"  # Replace with your model's identifier.

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "What's the weather like today?"},
]

response = client.chat.completions.create(
    model=model,
    messages=messages,
)

print(response.choices[0].message.content)
```

### Notes

- Ensure that the `model` variable matches the identifier of your model as seen in the Hugging Face Model Hub.
- If you encounter any rate limits or API access restrictions, you may have to upgrade your Hugging Face plan to enable higher usage limits.

Happy coding! If you would like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).

================================================
FILE: guides/lmstudio.md
================================================
# LM Studio

LM Studio allows users to locally host open-source models available in [their model catalog](https://lmstudio.ai/models). 
It also provides a web portal with a ChatGPT-like interface.
Once an LM Studio instance is locally running in your setup (default `http://localhost:1234`), you can use the `aisuite` API for chat completions as shown below.
No API Key is needed for these locally hosted models.

## Create a Chat Completion

Sample code:
```python
import aisuite as ai

def main():
    # Point the client at the locally running LM Studio server (default port 1234)
    client = ai.Client(
        provider_configs={
            "lmstudio": {
                "api_url": "http://localhost:1234",
                "timeout": 300,
            }
        }
    )
    messages = [
        {
            "role": "system", 
            "content": "Be verbose"
        },
        {
            "role": "user", 
            "content": "Tell me something about University of Michigan's CSE department."
        },
    ]

    lmstudio_llama = "lmstudio:llama-3.2-3b-instruct"

    response = client.chat.completions.create(
        model=lmstudio_llama, 
        messages=messages, 
        temperature=0.75,
    )
    print(response.choices[0].message.content)


if __name__ == "__main__":
    main()
```

You can expect a response like the following:

```markdown
The Computer Science and Engineering (CSE) Department at the University of Michigan is one of the most prestigious and highly-regarded computer science programs in the world. Located in the heart of Ann Arbor, Michigan, the Department of CSE is a leading institution for undergraduate and graduate education in the field of computer science.

With a rich history dating back to 1940, the CSE Department at the University of Michigan has a long tradition of academic excellence, cutting-edge research, and innovative teaching. The department is composed of over 70 faculty members, many of whom are prominent researchers in their fields, and has a student body of around 500 undergraduate majors and 1,000 graduate students.

The CSE Department offers a wide range of undergraduate and graduate degree programs, including Bachelor of Science in Computer Science, Bachelor of Arts in Computer Science, Master of Science in Computer Science, Master of Engineering in Computer Science, and Ph.D. in Computer Science. These programs are designed to provide students with a comprehensive education in computer science, including a strong foundation in mathematics, computer systems, algorithms, computer networks, and software engineering.

The department is particularly renowned for its research programs in areas such as artificial intelligence, computer vision, natural language processing, robotics, and data science. The CSE Department has a strong research focus, and its faculty members are actively engaged in research projects, partnerships, and collaborations with industry, government, and academia.

One of the unique aspects of the CSE Department at the University of Michigan is its strong commitment to interdisciplinary research and education. The department has established partnerships with various academic departments across the university, including physics, mathematics, and engineering, to provide students with a well-rounded education that incorporates multiple disciplines.

The CSE Department also has a strong focus on industry collaboration and engagement. The department has established the University of Michigan's College of Engineering, which provides students with opportunities to engage in research, internships, and co-op programs with top industry partners.

Overall, the Computer Science and Engineering Department at the University of Michigan is a world-class institution that provides students with a world-class education, innovative research opportunities, and strong industry connections. Its highly-regarded faculty, cutting-edge research programs, and strong industry partnerships make it an attractive destination for students interested in pursuing a career in computer science.

Some of the key statistics and achievements of the CSE Department at the University of Michigan include:

* Ranked #5 in the US News & World Report's Best Undergraduate Computer Science Programs (2022)
* Ranked #10 in the QS World University Rankings by Subject: Computer Science (2022)
* 97% of undergraduate graduates find employment or continue their education within six months of graduation
* 98% of graduate students are employed or continue their education within six months of graduation
* 10:1 student-to-faculty ratio, providing students with personalized attention and mentorship

These statistics demonstrate the exceptional quality of education and research provided by the CSE Department at the University of Michigan, and highlight its reputation as one of the world's leading institutions for computer science education and research.
```

Happy coding! If you’d like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/mistral.md
================================================
# Mistral

To use Mistral with `aisuite`, you’ll need a [Mistral account](https://console.mistral.ai/). 

After logging in, go to [Workspace billing](https://console.mistral.ai/billing) and choose a plan
- **Experiment** *(Free, 1 request per second); or*
- **Scale** *(Pay per use).*

Visit the [API Keys](https://console.mistral.ai/api-keys/) section in your account settings and generate a new key. Once you have your key, add it to your environment as follows:

```shell
export MISTRAL_API_KEY="your-mistralai-api-key"
```
## Create a Chat Completion

Install the `mistralai` Python client:

Example with pip:
```shell
pip install mistralai
```

Example with poetry:
```shell
poetry add mistralai
```

In your code:
```python
import aisuite as ai
client = ai.Client()

provider = "mistral"
model_id = "mistral-large-latest"

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "What’s the weather like in Montréal?"},
]

response = client.chat.completions.create(
    model=f"{provider}:{model_id}",
    messages=messages,
)

print(response.choices[0].message.content)
```

Happy coding! If you’d like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/nebius.md
================================================
# Nebius AI Studio

To use Nebius AI Studio with `aisuite`, you need an AI Studio account. Go to [AI Studio](https://studio.nebius.ai/) and press "Log in to AI Studio" in the top-right corner. After logging in, go to the [API Keys](https://studio.nebius.ai/settings/api-keys) section and generate a new key. Once you have a key, add it to your environment as follows:

```shell
export NEBIUS_API_KEY="your-nebius-api-key"
```

## Create a Chat Completion

Install the `openai` Python client:

Example with pip:
```shell
pip install openai
```

Example with poetry:
```shell
poetry add openai
```

In your code:
```python
import aisuite as ai
client = ai.Client()

provider = "nebius"
model_id = "meta-llama/Llama-3.3-70B-Instruct"

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "How many times has Jurgen Klopp won the Champions League?"},
]

response = client.chat.completions.create(
    model=f"{provider}:{model_id}",
    messages=messages,
)

print(response.choices[0].message.content)
```

Happy coding! If you’d like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/ollama.md
================================================
# Ollama

Ollama allows users to locally host open-source models available in [their library](https://ollama.com/library). 
Once an Ollama instance is locally running in your setup (default `http://localhost:11434`), you can use the `aisuite` API for chat completions as shown below.
No API Key is needed for these locally hosted models.

## Create a Chat Completion

Sample code:
```python
import aisuite as ai

def main():
    client = ai.Client(
        provider_configs={
            "ollama": {
                "api_url": "http://10.168.0.177:11434",
                "timeout": 300,
            }
        }
    )
    messages = [
        {
            "role": "system", 
            "content": "Be verbose"
        },
        {
            "role": "user", 
            "content": "Tell me something about University of Michigan's CSE department."
        },
    ]

    ollama_llama3 = "ollama:llama3:latest"
    ollama_gemma = "ollama:gemma:latest"
    ollama_deepseek_32B = "ollama:deepseek-r1:32b"
    ollama_deepseek_70B = "ollama:deepseek-r1:70b"

    response = client.chat.completions.create(
        model=ollama_gemma, 
        messages=messages, 
        temperature=0.75,
    )
    print(response.choices[0].message.content)


if __name__ == "__main__":
    main()
```

Happy coding! If you’d like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/openai.md
================================================
# OpenAI

To use OpenAI with `aisuite`, you’ll need an [OpenAI account](https://platform.openai.com/). After logging in, go to the [API Keys](https://platform.openai.com/account/api-keys) section in your account settings and generate a new key. Once you have your key, add it to your environment as follows:

```shell
export OPENAI_API_KEY="your-openai-api-key"
```

## Create a Chat Completion

Install the `openai` Python client:

Example with pip:
```shell
pip install openai
```

Example with poetry:
```shell
poetry add openai
```

In your code:
```python
import aisuite as ai
client = ai.Client()

provider = "openai"
model_id = "gpt-4-turbo"

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "What’s the weather like in San Francisco?"},
]

response = client.chat.completions.create(
    model=f"{provider}:{model_id}",
    messages=messages,
)

print(response.choices[0].message.content)
```

Happy coding! If you’d like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/sambanova.md
================================================
# Sambanova

To use Sambanova with `aisuite`, you’ll need a [Sambanova Cloud](https://cloud.sambanova.ai/) account. After logging in, go to the [API](https://cloud.sambanova.ai/apis) section and generate a new key. Once you have your key, add it to your environment as follows:

```shell
export SAMBANOVA_API_KEY="your-sambanova-api-key"
```

## Create a Chat Completion

Install the `openai` Python client:

Example with pip:
```shell
pip install openai
```

Example with poetry:
```shell
poetry add openai
```

In your code:
```python
import aisuite as ai
client = ai.Client()

provider = "sambanova"
model_id = "Meta-Llama-3.1-405B-Instruct"

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "What’s the weather like in San Francisco?"},
]

response = client.chat.completions.create(
    model=f"{provider}:{model_id}",
    messages=messages,
)

print(response.choices[0].message.content)
```

Happy coding! If you’d like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: guides/watsonx.md
================================================
# Watsonx with `aisuite`

A step-by-step guide to setting up Watsonx with the `aisuite` library, enabling you to use IBM Watsonx's powerful AI models for various tasks.

## Setup Instructions

### Step 1: Create a Watsonx Account

1. Visit [IBM Watsonx](https://www.ibm.com/watsonx).
2. Sign up for a new account or log in with your existing IBM credentials.
3. Once logged in, navigate to the **Watsonx Dashboard** (<https://dataplatform.cloud.ibm.com>)

---

### Step 2: Obtain API Credentials

1. **Generate an API Key**:
   - Go to IAM > API keys and create a new API key (<https://cloud.ibm.com/iam/overview>)
   - Copy the API key. This is your `WATSONX_API_KEY`.

2. **Locate the Service URL**:
   - Your service URL is based on the region where your service is hosted.
   - Pick one from the list here <https://cloud.ibm.com/apidocs/watsonx-ai#endpoint-url>
   - Copy the service URL. This is your `WATSONX_SERVICE_URL`.

3. **Get the Project ID**:
   - Go to the **Watsonx Dashboard** (<https://dataplatform.cloud.ibm.com>)
   - Under the **Projects** section, if you don't have a sandbox project, create a new project.
   - Navigate to the **Manage** tab and find the **Project ID**.
   - Copy the **Project ID**. This will serve as your `WATSONX_PROJECT_ID`.

---

### Step 3: Set Environment Variables

To simplify authentication, set the following environment variables by running these commands in your terminal:

```bash
export WATSONX_API_KEY="your-watsonx-api-key"
export WATSONX_SERVICE_URL="your-watsonx-service-url"
export WATSONX_PROJECT_ID="your-watsonx-project-id"
```


## Create a Chat Completion

Install the `ibm-watsonx-ai` Python client:

Example with pip:

```shell
pip install ibm-watsonx-ai
```

Example with poetry:

```shell
poetry add ibm-watsonx-ai
```

In your code:

```python
import aisuite as ai
client = ai.Client()

provider = "watsonx"
model_id = "meta-llama/llama-3-70b-instruct"

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "Tell me a joke."},
]

response = client.chat.completions.create(
    model=f"{provider}:{model_id}",
    messages=messages,
)

print(response.choices[0].message.content)
```

================================================
FILE: guides/xai.md
================================================
# xAI

To use xAI with `aisuite`, you’ll need an [API key](https://console.x.ai/). Generate a new key and once you have your key, add it to your environment as follows:

```shell
export XAI_API_KEY="your-xai-api-key"
```

## Create a Chat Completion

Sample code:
```python
import aisuite as ai
client = ai.Client()

models = ["xai:grok-beta"]

messages = [
    {"role": "system", "content": "Respond in Pirate English."},
    {"role": "user", "content": "Tell me a joke."},
]

for model in models:
    response = client.chat.completions.create(
        model=model,
        messages=messages,
        temperature=0.75
    )
    print(response.choices[0].message.content)

```

Happy coding! If you’d like to contribute, please read our [Contributing Guide](../CONTRIBUTING.md).


================================================
FILE: pyproject.toml
================================================
[tool.poetry]
name = "aisuite"
version = "0.1.14"
description = "Uniform access layer for LLMs"
authors = ["Andrew Ng <ng@deeplearning.ai>", "Rohit P <rohit.prasad15@gmail.com>"]
maintainers = ["Andrew Ng <ng@deeplearning.ai>", "Rohit P <rohit.prasad15@gmail.com>"]
readme = "README.md"

[tool.poetry.dependencies]
python = "^3.10"
anthropic = { version = "^0.30.1", optional = true }
boto3 = { version = "^1.34.144", optional = true }
cohere = { version = "^5.12.0", optional = true }
vertexai = { version = "^1.63.0", optional = true }
google-cloud-speech = { version = "^2.33.0", optional = true }
deepgram-sdk = { version = "^5.0.0", optional = true }
soundfile = { version = "^0.12.1", optional = true }
scipy = { version = "^1.11.0", optional = true }
numpy = { version = "^1.24.0", optional = true }
groq = { version = "^0.9.0", optional = true }
mistralai = { version = "^1.0.3", optional = true }
ibm-watsonx-ai = { version = "^1.1.16", optional = true }
docstring-parser = { version = "^0.15.0" }
cerebras_cloud_sdk = { version = "^1.19.0", optional = true }
openai = { version = "^1.107.0", optional = true }
mcp = { version = "^1.1.2", optional = true }
nest-asyncio = { version = "^1.6.0", optional = true }

httpx = "~0.27.0"

# Optional dependencies for different providers
[tool.poetry.extras]
anthropic = ["anthropic"]
aws = ["boto3"]
azure = []
cerebras = ["cerebras_cloud_sdk"]
cohere = ["cohere"]
deepgram = ["deepgram-sdk", "soundfile", "scipy", "numpy"]
deepseek = ["openai"]
google = ["vertexai", "google-cloud-speech"]
groq = ["groq"]
huggingface = []
mistral = ["mistralai"]
ollama = []
openai = ["openai"]
watsonx = ["ibm-watsonx-ai"]
mcp = ["mcp", "nest-asyncio"]
all = ["anthropic", "boto3", "cerebras_cloud_sdk", "vertexai", "google-cloud-speech", "groq", "mistralai", "openai", "cohere", "ibm-watsonx-ai", "deepgram-sdk", "soundfile", "scipy", "numpy", "mcp", "nest-asyncio"]  # To install all providers

[tool.poetry.group.dev.dependencies]
pre-commit = "^3.7.1"
black = "^24.4.2"
python-dotenv = "^1.0.1"
openai = "^1.107.0"
groq = "^0.9.0"
anthropic = "^0.30.1"
notebook = "^7.2.1"
ollama = "^0.2.1"
mistralai = "^1.0.3"
boto3 = "^1.34.144"
fireworks-ai = "^0.14.0"
chromadb = "^0.5.4"
sentence-transformers = "^3.0.1"
datasets = "^2.20.0"
vertexai = "^1.63.0"
google-cloud-speech = "^2.33.0"
deepgram-sdk = "^5.0.0"
ibm-watsonx-ai = "^1.1.16"
cerebras_cloud_sdk = "^1.19.0"

[tool.poetry.group.test]
optional = true

[tool.poetry.group.test.dependencies]
pytest = "^8.2.2"
pytest-cov = "^6.0.0"
pytest-asyncio = "^0.24.0"

[build-system]
requires = ["poetry-core"]
build-backend = "poetry.core.masonry.api"

[tool.pytest.ini_options]
testpaths="tests"
markers = [
    "integration: marks tests as integration tests that interact with external services",
    "llm: marks tests that make real LLM API calls and incur costs (subset of integration)",
    "mcp_server: marks tests that require MCP server functionality (e.g., npx, external MCP servers)",
]


================================================
FILE: tests/__init__.py
================================================


================================================
FILE: tests/client/__init__.py
================================================


================================================
FILE: tests/client/test_client.py
================================================
from unittest.mock import Mock, patch
import io

import pytest

from aisuite import Client
from aisuite.framework.message import TranscriptionResult
from aisuite.provider import ASRError


@pytest.fixture(scope="module")
def provider_configs():
    """Return placeholder settings for each provider configured by these tests.

    All values are dummies; the tests pass the mapping to ``Client.configure``
    and mock the provider calls themselves.
    """
    openai_settings = {"api_key": "test_openai_api_key"}
    aws_settings = {
        "aws_access_key": "test_aws_access_key",
        "aws_secret_key": "test_aws_secret_key",
        "aws_session_token": "test_aws_session_token",
        "aws_region": "us-west-2",
    }
    azure_settings = {
        "api_key": "azure-api-key",
        "base_url": "https://model.ai.azure.com",
    }
    groq_settings = {"api_key": "groq-api-key"}
    mistral_settings = {"api_key": "mistral-api-key"}
    google_settings = {
        "project_id": "test_google_project_id",
        "region": "us-west4",
        "application_credentials": "test_google_application_credentials",
    }
    fireworks_settings = {"api_key": "fireworks-api-key"}
    nebius_settings = {"api_key": "nebius-api-key"}
    inception_settings = {"api_key": "inception-api-key"}
    deepgram_settings = {"api_key": "deepgram-api-key"}

    return {
        "openai": openai_settings,
        "aws": aws_settings,
        "azure": azure_settings,
        "groq": groq_settings,
        "mistral": mistral_settings,
        "google": google_settings,
        "fireworks": fireworks_settings,
        "nebius": nebius_settings,
        "inception": inception_settings,
        "deepgram": deepgram_settings,
    }


@pytest.mark.parametrize(
    argnames=("patch_target", "provider", "model"),
    argvalues=[
        (
            "aisuite.providers.openai_provider.OpenaiProvider.chat_completions_create",
            "openai",
            "gpt-4o",
        ),
        (
            "aisuite.providers.mistral_provider.MistralProvider.chat_completions_create",
            "mistral",
            "mistral-model",
        ),
        (
            "aisuite.providers.groq_provider.GroqProvider.chat_completions_create",
            "groq",
            "groq-model",
        ),
        (
            "aisuite.providers.aws_provider.AwsProvider.chat_completions_create",
            "aws",
            "claude-v3",
        ),
        (
            "aisuite.providers.azure_provider.AzureProvider.chat_completions_create",
            "azure",
            "azure-model",
        ),
        (
            "aisuite.providers.anthropic_provider.AnthropicProvider.chat_completions_create",
            "anthropic",
            "anthropic-model",
        ),
        (
            "aisuite.providers.google_provider.GoogleProvider.chat_completions_create",
            "google",
            "google-model",
        ),
        (
            "aisuite.providers.fireworks_provider.FireworksProvider.chat_completions_create",
            "fireworks",
            "fireworks-model",
        ),
        (
            "aisuite.providers.nebius_provider.NebiusProvider.chat_completions_create",
            "nebius",
            "nebius-model",
        ),
        (
            "aisuite.providers.inception_provider.InceptionProvider.chat_completions_create",
            "inception",
            "mercury",
        ),
    ],
)
def test_client_chat_completions(
    provider_configs: dict, patch_target: str, provider: str, model: str
):
    """Check that ``chat.completions.create`` hands back the provider's response.

    The provider method named by ``patch_target`` is patched to return a
    sentinel string; the client call for ``"<provider>:<model>"`` must return
    that same sentinel.
    """
    sentinel = f"{patch_target}_{provider}_{model}"
    conversation = [
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "Who won the world series in 2020?"},
    ]

    with patch(patch_target) as patched_create:
        patched_create.return_value = sentinel

        client = Client()
        client.configure(provider_configs)
        reply = client.chat.completions.create(
            f"{provider}:{model}", messages=conversation
        )

    assert reply == sentinel


def test_invalid_provider_in_client_config():
    """An unknown provider key passes ``configure`` but fails on first use."""
    client = Client()
    # Providers are loaded lazily, so configuring an unknown key must not raise.
    client.configure({"invalid_provider": {"api_key": "invalid_api_key"}})

    expected_error = r"Invalid provider key 'invalid_provider'. Supported providers: "
    # The ValueError is only expected once the unknown provider is actually used.
    with pytest.raises(ValueError, match=expected_error):
        client.chat.completions.create(
            "invalid_provider:some-model",
            messages=[{"role": "user", "content": "Hello"}],
        )


def test_invalid_model_format_in_create(monkeypatch):
    """A model string without the ``provider:model`` form raises ``ValueError``."""
    from aisuite.providers.openai_provider import OpenaiProvider

    # Replace the provider's completion method with a mock for this test.
    monkeypatch.setattr(OpenaiProvider, "chat_completions_create", Mock())

    # Configure the client with a valid provider.
    client = Client()
    client.configure({"openai": {"api_key": "test_openai_api_key"}})

    conversation = [
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "Tell me a joke."},
    ]
    malformed_model = "invalidmodel"  # no "provider:" prefix

    expected_error = r"Invalid model format. Expected 'provider:model'"
    with pytest.raises(ValueError, match=expected_error):
        client.chat.completions.create(malformed_model, messages=conversation)


class TestClientASR:
    """Essential tests for the ``Client`` audio-transcription (ASR) entry point."""

    @staticmethod
    def _stub_provider(factory_mock, transcription):
        """Make the patched provider factory return a mock provider.

        The mock's ``audio.transcriptions.create`` returns ``transcription``;
        the mock provider is returned so the test can inspect its calls.
        """
        provider = Mock()
        provider.audio.transcriptions.create.return_value = transcription
        factory_mock.return_value = provider
        return provider

    def test_audio_interface_initialization(self):
        """A fresh client exposes ``audio`` and ``audio.transcriptions``."""
        client = Client()
        assert hasattr(client, "audio")
        assert hasattr(client.audio, "transcriptions")

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_transcriptions_create_success(
        self, mock_create_provider, provider_configs
    ):
        """A mocked OpenAI transcription result reaches the caller."""
        expected_text = "Hello, this is a test transcription."
        provider = self._stub_provider(
            mock_create_provider,
            TranscriptionResult(
                text=expected_text,
                language="en",
                confidence=0.95,
                task="transcribe",
            ),
        )

        client = Client()
        client.configure(provider_configs)

        transcription = client.audio.transcriptions.create(
            model="openai:whisper-1",
            file=io.BytesIO(b"fake audio data"),
            language="en",
        )

        assert isinstance(transcription, TranscriptionResult)
        assert transcription.text == expected_text
        provider.audio.transcriptions.create.assert_called_once()

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_transcriptions_create_deepgram(
        self, mock_create_provider, provider_configs
    ):
        """A mocked Deepgram transcription result reaches the caller."""
        expected_text = "Deepgram transcription result."
        provider = self._stub_provider(
            mock_create_provider,
            TranscriptionResult(
                text=expected_text,
                language="en",
                confidence=0.92,
                task="transcribe",
            ),
        )

        client = Client()
        client.configure(provider_configs)

        # The audio is given as a file path string here rather than a stream.
        transcription = client.audio.transcriptions.create(
            model="deepgram:nova-2", file="test_audio.wav", language="en"
        )

        assert isinstance(transcription, TranscriptionResult)
        assert transcription.text == expected_text
        provider.audio.transcriptions.create.assert_called_once()

    def test_transcriptions_invalid_model_format(self, provider_configs):
        """A model string lacking the ``provider:model`` form raises ``ValueError``."""
        client = Client()
        client.configure(provider_configs)

        request = {"model": "invalid-format", "file": "test.wav", "language": "en"}
        with pytest.raises(ValueError, match="Invalid model format"):
            client.audio.transcriptions.create(**request)

    def test_transcriptions_unsupported_provider(self, provider_configs):
        """An unknown provider prefix raises ``ValueError``."""
        client = Client()
        client.configure(provider_configs)

        request = {"model": "unsupported:model", "file": "test.wav", "language": "en"}
        with pytest.raises(ValueError, match="Invalid provider key"):
            client.audio.transcriptions.create(**request)


class TestClientASRParameterValidation:
    """Tests for how ``Client`` validates and maps ASR keyword arguments.

    Provider calls are mocked throughout. ``extra_param_mode`` ("strict",
    "warn" or "permissive") selects how unknown keyword arguments are handled.
    """

    @staticmethod
    def _install_provider(factory_mock, transcription=None):
        """Point the patched provider factory at a fresh ``Mock`` provider.

        When ``transcription`` is given, the mock's
        ``audio.transcriptions.create`` returns it. The mock provider is
        returned so the test can inspect the recorded calls.
        """
        provider = Mock()
        if transcription is not None:
            provider.audio.transcriptions.create.return_value = transcription
        factory_mock.return_value = provider
        return provider

    def test_client_initialization_strict_mode(self):
        """``extra_param_mode="strict"`` is stored on the client and its validator."""
        strict_client = Client(extra_param_mode="strict")
        assert strict_client.extra_param_mode == "strict"
        assert strict_client.param_validator.extra_param_mode == "strict"

    def test_client_initialization_warn_mode(self):
        """With no argument, ``extra_param_mode`` is "warn" on client and validator."""
        default_client = Client()
        assert default_client.extra_param_mode == "warn"
        assert default_client.param_validator.extra_param_mode == "warn"

    def test_client_initialization_permissive_mode(self):
        """``extra_param_mode="permissive"`` is stored on the client and its validator."""
        permissive_client = Client(extra_param_mode="permissive")
        assert permissive_client.extra_param_mode == "permissive"
        assert permissive_client.param_validator.extra_param_mode == "permissive"

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_strict_mode_rejects_unknown_param(self, mock_create_provider):
        """Strict mode raises ``ValueError`` for an unknown keyword argument."""
        client = Client(
            provider_configs={"openai": {"api_key": "test"}}, extra_param_mode="strict"
        )
        provider = self._install_provider(mock_create_provider)

        with pytest.raises(ValueError, match="Unknown parameters for openai"):
            client.audio.transcriptions.create(
                model="openai:whisper-1",
                file=io.BytesIO(b"audio"),
                language="en",
                invalid_param=True,  # not a recognised parameter
            )

        # The transcription call must not have been made.
        provider.audio.transcriptions.create.assert_not_called()

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_strict_mode_typo_detection(self, mock_create_provider):
        """Strict mode reports a misspelled parameter name in the error message."""
        client = Client(
            provider_configs={"openai": {"api_key": "test"}}, extra_param_mode="strict"
        )
        self._install_provider(mock_create_provider)

        expected_error = "Unknown parameters for openai: \\['langauge'\\]"
        with pytest.raises(ValueError, match=expected_error):
            client.audio.transcriptions.create(
                model="openai:whisper-1",
                file=io.BytesIO(b"audio"),
                langauge="en",  # deliberate typo of "language"
            )

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_warn_mode_continues_execution(self, mock_create_provider):
        """Warn mode emits one warning for an unknown keyword and still transcribes."""
        import warnings

        client = Client(
            provider_configs={"openai": {"api_key": "test"}}, extra_param_mode="warn"
        )
        provider = self._install_provider(
            mock_create_provider, TranscriptionResult(text="Test", language="en")
        )

        with warnings.catch_warnings(record=True) as caught:
            # Record every warning, regardless of the ambient filters.
            warnings.simplefilter("always")
            transcription = client.audio.transcriptions.create(
                model="openai:whisper-1",
                file=io.BytesIO(b"audio"),
                language="en",
                invalid_param=True,  # not a recognised parameter
            )

        # Exactly one warning, and it names the problem.
        assert len(caught) == 1
        assert "Unknown parameters" in str(caught[0].message)

        # The call went through despite the warning.
        assert transcription.text == "Test"
        provider.audio.transcriptions.create.assert_called_once()

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_permissive_mode_allows_unknown_params(self, mock_create_provider):
        """Permissive mode forwards an unknown keyword without warning or error."""
        import warnings

        client = Client(
            provider_configs={"openai": {"api_key": "test"}},
            extra_param_mode="permissive",
        )
        provider = self._install_provider(
            mock_create_provider, TranscriptionResult(text="Test", language="en")
        )

        with warnings.catch_warnings(record=True) as caught:
            # Record every warning, regardless of the ambient filters.
            warnings.simplefilter("always")
            transcription = client.audio.transcriptions.create(
                model="openai:whisper-1",
                file=io.BytesIO(b"audio"),
                experimental_feature=True,  # not a recognised parameter
            )

        # No warnings were recorded.
        assert len(caught) == 0

        # The call succeeded.
        assert transcription.text == "Test"
        provider.audio.transcriptions.create.assert_called_once()

        # The unknown keyword was handed to the provider as-is.
        forwarded = provider.audio.transcriptions.create.call_args.kwargs
        assert forwarded.get("experimental_feature") is True

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_common_param_mapping_at_client_level(self, mock_create_provider):
        """For Google, ``language="en"`` is forwarded as ``language_code="en-US"``."""
        client = Client(
            provider_configs={"google": {"project_id": "test", "region": "us"}},
            extra_param_mode="strict",
        )
        provider = self._install_provider(
            mock_create_provider, TranscriptionResult(text="Test", language="en")
        )

        transcription = client.audio.transcriptions.create(
            model="google:latest_long",
            file=io.BytesIO(b"audio"),
            language="en",  # common parameter name
        )

        assert transcription.text == "Test"
        provider.audio.transcriptions.create.assert_called_once()

        # The provider sees the mapped key and expanded value, not the original key.
        forwarded = provider.audio.transcriptions.create.call_args.kwargs
        assert "language_code" in forwarded
        assert forwarded["language_code"] == "en-US"
        assert "language" not in forwarded

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_provider_specific_params_passthrough(self, mock_create_provider):
        """Deepgram-specific keywords reach the provider unchanged in strict mode."""
        client = Client(
            provider_configs={"deepgram": {"api_key": "test"}},
            extra_param_mode="strict",
        )
        provider = self._install_provider(
            mock_create_provider, TranscriptionResult(text="Test", language="en")
        )

        transcription = client.audio.transcriptions.create(
            model="deepgram:nova-2",
            file=io.BytesIO(b"audio"),
            punctuate=True,
            diarize=True,
        )

        assert transcription.text == "Test"

        forwarded = provider.audio.transcriptions.create.call_args.kwargs
        assert forwarded["punctuate"] is True
        assert forwarded["diarize"] is True

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_mixed_common_and_provider_params(self, mock_create_provider):
        """Common and Deepgram-specific keywords can be combined in one call."""
        client = Client(
            provider_configs={"deepgram": {"api_key": "test"}},
            extra_param_mode="strict",
        )
        provider = self._install_provider(
            mock_create_provider, TranscriptionResult(text="Test", language="en")
        )

        transcription = client.audio.transcriptions.create(
            model="deepgram:nova-2",
            file=io.BytesIO(b"audio"),
            language="en",  # common parameter
            prompt="meeting",  # common parameter, expected to arrive as keywords
            punctuate=True,  # Deepgram-specific
            diarize=True,  # Deepgram-specific
        )

        assert transcription.text == "Test"

        forwarded = provider.audio.transcriptions.create.call_args.kwargs
        assert forwarded["language"] == "en"
        assert forwarded["keywords"] == ["meeting"]  # prompt arrived as keywords
        assert forwarded["punctuate"] is True
        assert forwarded["diarize"] is True

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_validation_happens_before_provider_call(self, mock_create_provider):
        """Strict validation fails before the provider's transcription method runs."""
        client = Client(
            provider_configs={"openai": {"api_key": "test"}}, extra_param_mode="strict"
        )
        provider = self._install_provider(mock_create_provider)

        with pytest.raises(ValueError, match="Unknown parameters"):
            client.audio.transcriptions.create(
                model="openai:whisper-1",
                file=io.BytesIO(b"audio"),
                completely_invalid_param=True,
            )

        # Only the transcription call is checked here; whether the provider
        # object itself was created is not asserted.
        provider.audio.transcriptions.create.assert_not_called()

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_unsupported_common_param_ignored(self, mock_create_provider):
        """A common parameter Deepgram does not support is dropped, not rejected."""
        client = Client(
            provider_configs={"deepgram": {"api_key": "test"}},
            extra_param_mode="strict",
        )
        provider = self._install_provider(
            mock_create_provider, TranscriptionResult(text="Test", language="en")
        )

        transcription = client.audio.transcriptions.create(
            model="deepgram:nova-2",
            file=io.BytesIO(b"audio"),
            language="en",
            temperature=0.5,  # expected to be dropped for Deepgram
        )

        assert transcription.text == "Test"

        forwarded = provider.audio.transcriptions.create.call_args.kwargs
        assert "temperature" not in forwarded
        assert forwarded["language"] == "en"

    @patch("aisuite.provider.ProviderFactory.create_provider")
    def test_multiple_providers_with_same_client(self, mock_create_provider):
        """One client applies each provider's own parameter rules per call."""
        client = Client(
            provider_configs={
                "openai": {"api_key": "test1"},
                "deepgram": {"api_key": "test2"},
            },
            extra_param_mode="strict",
        )
        provider = self._install_provider(
            mock_create_provider, TranscriptionResult(text="Test", language="en")
        )

        # OpenAI: temperature is forwarded.
        openai_result = client.audio.transcriptions.create(
            model="openai:whisper-1", file=io.BytesIO(b"audio"), temperature=0.5
        )
        assert openai_result.text == "Test"
        openai_kwargs = provider.audio.transcriptions.create.call_args.kwargs
        assert openai_kwargs.get("temperature") == 0.5

        # Clear the recorded calls before the second provider is exercised.
        provider.reset_mock()

        # Deepgram: temperature is dropped.
        deepgram_result = client.audio.transcriptions.create(
            model="deepgram:nova-2", file=io.BytesIO(b"audio"), temperature=0.5
        )
        assert deepgram_result.text == "Test"
        deepgram_kwargs = provider.audio.transcriptions.create.call_args.kwargs
        assert "temperature" not in deepgram_kwargs


================================================
FILE: tests/client/test_prerelease.py
================================================
# Run this test before releasing a new version.
# It will test all the models in the client.

import pytest
import aisuite as ai
from typing import List, Dict
from dotenv import load_dotenv, find_dotenv


def setup_client() -> ai.Client:
    """Load the dotenv file located by ``find_dotenv`` and return a new client."""
    dotenv_path = find_dotenv()
    load_dotenv(dotenv_path)
    client = ai.Client()
    return client


def get_test_models() -> List[str]:
    """Return the ``provider:model`` identifiers exercised by the chat test."""
    chat_models = (
        "anthropic:claude-3-5-sonnet-20240620",
        "aws:meta.llama3-1-8b-instruct-v1:0",
        "huggingface:mistralai/Mistral-7B-Instruct-v0.3",
        "groq:llama3-8b-8192",
        "mistral:open-mistral-7b",
        "openai:gpt-3.5-turbo",
        "cohere:command-r-plus-08-2024",
        "inception:mercury",
    )
    # Hand back a fresh list on every call, as callers may mutate it
    return list(chat_models)


def get_test_messages() -> List[Dict[str, str]]:
    """Return the system + user message pair sent to every chat model."""
    system_message = {
        "role": "system",
        "content": "Respond in Pirate English. Always try to include the phrase - No rum No fun.",
    }
    user_message = {
        "role": "user",
        "content": "Tell me a joke about Captain Jack Sparrow",
    }
    return [system_message, user_message]


@pytest.mark.integration
@pytest.mark.parametrize("model_id", get_test_models())
def test_model_pirate_response(model_id: str):
    """
    Test that each model responds appropriately to the pirate prompt.

    Only the provider call (and extraction of the message content) is guarded
    by ``try``; errors raised there are reported through ``pytest.fail`` with
    the model id. The assertions run outside the guard so that a failed
    assertion is reported as such instead of being re-wrapped.

    Args:
        model_id: The provider:model identifier to test
    """
    client = setup_client()
    messages = get_test_messages()

    try:
        response = client.chat.completions.create(
            model=model_id, messages=messages, temperature=0.75
        )
        raw_content = response.choices[0].message.content
    except Exception as e:
        pytest.fail(f"Error testing model {model_id}: {e}")

    # Check type and emptiness before calling .lower(); otherwise these
    # checks could never fail (a non-string would already have raised).
    assert isinstance(
        raw_content, str
    ), f"Model {model_id} returned non-string response"
    assert len(raw_content) > 0, f"Model {model_id} returned empty response"

    content = raw_content.lower()

    # Check if either version of the required phrase is present
    assert any(
        phrase in content for phrase in ["no rum no fun", "no rum, no fun"]
    ), f"Model {model_id} did not include required phrase 'No rum No fun'"


def get_test_asr_models() -> List[str]:
    """Return the ``provider:model`` identifiers exercised by the ASR test."""
    asr_models = (
        "openai:whisper-1",
        "deepgram:nova-2",
        "google:latest_long",
        "huggingface:openai/whisper-large-v3",
    )
    # Hand back a fresh list on every call, as callers may mutate it
    return list(asr_models)


@pytest.mark.integration
@pytest.mark.parametrize("model_id", get_test_asr_models())
def test_asr_portable_transcription(model_id: str):
    """
    Test that portable ASR code works across different providers.

    This test verifies:
    1. Common parameter 'language' works for all providers
    2. Same audio file can be transcribed by different providers
    3. All providers return non-empty transcription results

    Only the provider call is guarded by ``try``: a missing audio file skips
    the test and any other error there fails it with the model id. The
    assertions run outside the guard so failures are reported directly.

    Args:
        model_id: The provider:model identifier to test (e.g., "openai:whisper-1")
    """
    client = setup_client()

    # Relative path, so it is resolved against the current working directory;
    # the test is skipped when the file cannot be found.
    audio_file_path = "tests/test-data/test_audio.mp3"

    try:
        # Use common parameter 'language' that should work across all providers
        result = client.audio.transcriptions.create(
            model=model_id,
            file=audio_file_path,
            language="en",  # Common param - should auto-map for each provider
        )
    except FileNotFoundError:
        pytest.skip(f"Test audio file not found for {model_id}. Skipping test.")
    except Exception as e:
        pytest.fail(f"Error testing ASR model {model_id}: {e}")

    # Verify result has text; check the type before taking its length
    assert hasattr(
        result, "text"
    ), f"Model {model_id} result missing 'text' attribute"
    assert isinstance(
        result.text, str
    ), f"Model {model_id} returned non-string transcription"
    assert len(result.text) > 0, f"Model {model_id} returned empty transcription"

    # Verify transcription contains expected content from tests/test-data/test_audio.mp3
    # Audio: "Why did the scarecrow win an award? Because he was outstanding in the field."
    expected_keywords = ["scarecrow", "award", "field"]
    transcript = result.text.lower()  # lower-case once, not per keyword
    found_keywords = [kw for kw in expected_keywords if kw.lower() in transcript]
    assert len(found_keywords) >= 2, (
        f"Model {model_id} transcription missing expected content. "
        f"Found {len(found_keywords)}/{len(expected_keywords)} keywords. "
        f"Text: '{result.text}'"
    )

    # Optional: Check for language if available and returned by provider
    # Note: Some providers (e.g., Deepgram) only return language if detect_language=True
    if hasattr(result, "language") and result.language is not None:
        assert isinstance(
            result.language, str
        ), f"Model {model_id} returned invalid language type"


@pytest.mark.integration
def test_asr_deepgram_provider_specific_feature():
    """
    Test Deepgram provider-specific feature to verify pass-through works.

    This ensures that provider-specific parameters like 'punctuate' are
    correctly passed through the validation layer to the provider SDK.

    Only the provider call is guarded by ``try``: a missing audio file skips
    the test and any other error there fails it. The assertion runs outside
    the guard so a failure is reported directly.
    """
    client = setup_client()
    audio_file_path = "tests/test-data/test_audio.mp3"

    try:
        # Use Deepgram-specific feature
        result = client.audio.transcriptions.create(
            model="deepgram:nova-2",
            file=audio_file_path,
            language="en",  # Common param
            punctuate=True,  # Deepgram-specific param
        )
    except FileNotFoundError:
        pytest.skip("Test audio file not found. Skipping Deepgram feature test.")
    except Exception as e:
        pytest.fail(f"Error testing Deepgram provider-specific feature: {e}")

    # Punctuation itself is not asserted because it depends on audio content;
    # a non-empty transcript shows the call succeeded with the extra param.
    assert len(result.text) > 0, "Deepgram returned empty transcription"


@pytest.mark.integration
def test_asr_google_language_mapping():
    """
    Test Google language mapping to verify auto-transformation.

    This test verifies that the common parameter 'language="en"' is
    automatically transformed to 'language_code="en-US"' for Google.

    Only the provider call is guarded by ``try``: a missing audio file skips
    the test and any other error there fails it. The assertion runs outside
    the guard so a failure is reported directly.
    """
    client = setup_client()
    audio_file_path = "tests/test-data/test_audio.mp3"

    try:
        # Use 2-letter language code that should be expanded for Google
        result = client.audio.transcriptions.create(
            model="google:latest_long",
            file=audio_file_path,
            language="en",  # Should be auto-transformed to "en-US"
        )
    except FileNotFoundError:
        pytest.skip("Test audio file not found. Skipping Google mapping test.")
    except Exception as e:
        pytest.fail(f"Error testing Google language mapping: {e}")

    # Reaching this point means the request with the mapped language succeeded
    assert len(result.text) > 0, "Google returned empty transcription"


@pytest.mark.integration
def test_asr_huggingface_word_timestamps():
    """
    Test Hugging Face word-level timestamps feature.

    This ensures that provider-specific parameters like 'return_timestamps'
    are correctly passed through to the Hugging Face Inference API.

    Only the provider call is guarded by ``try``: a missing audio file skips
    the test and any other error there fails it. The assertions run outside
    the guard so failures are reported directly.
    """
    client = setup_client()
    audio_file_path = "tests/test-data/test_audio.mp3"

    try:
        # Use Hugging Face-specific feature
        result = client.audio.transcriptions.create(
            model="huggingface:openai/whisper-large-v3",
            file=audio_file_path,
            return_timestamps="word",  # HF-specific param for word-level timestamps
        )
    except FileNotFoundError:
        pytest.skip("Test audio file not found. Skipping Hugging Face feature test.")
    except Exception as e:
        pytest.fail(f"Error testing Hugging Face word timestamps feature: {e}")

    assert len(result.text) > 0, "Hugging Face returned empty transcription"

    # Soft check: timestamps are only verified when the result carries words
    if hasattr(result, "words") and result.words:
        # Verify at least some words have timestamps
        words_with_timestamps = [
            w for w in result.words if w.start is not None and w.end is not None
        ]
        assert (
            len(words_with_timestamps) > 0
        ), "No words with timestamps found in result"


if __name__ == "__main__":
    # pytest.main returns the run's exit code; propagate it so a failing run
    # exits non-zero when this file is executed as a script.
    raise SystemExit(pytest.main([__file__, "-v"]))


================================================
FILE: tests/framework/test_asr_models.py
================================================
"""Tests for ASR framework data models."""

import pytest
from pydantic import ValidationError

from aisuite.framework.message import (
    Word,
    Segment,
    Alternative,
    Channel,
    TranscriptionResult,
)


class TestWord:
    """Checks for the Word data model."""

    def test_word_creation_and_validation(self):
        """Build a Word from minimal and full field sets; reject an empty one."""
        # Only the required fields: optional confidence stays unset
        minimal = Word(word="hello", start=0.0, end=0.5)
        assert (minimal.word, minimal.start, minimal.end) == ("hello", 0.0, 0.5)
        assert minimal.confidence is None

        # Every field supplied
        full_fields = {
            "word": "hello",
            "start": 0.0,
            "end": 0.5,
            "confidence": 0.95,
            "speaker": 1,
            "punctuated_word": "Hello,",
        }
        detailed = Word(**full_fields)
        assert detailed.confidence == 0.95
        assert detailed.speaker == 1

        # Omitting the required fields must be rejected
        with pytest.raises(ValidationError):
            Word()


class TestSegment:
    """Checks for the Segment data model."""

    def test_segment_creation_and_validation(self):
        """Build a Segment from its basic fields; reject an empty one."""
        fields = {"id": 0, "seek": 0, "start": 0.0, "end": 5.0, "text": "Hello world"}
        seg = Segment(**fields)
        assert seg.id == 0
        assert seg.text == "Hello world"

        # Omitting the required fields must be rejected
        with pytest.raises(ValidationError):
            Segment()


class TestAlternative:
    """Checks for the Alternative data model."""

    def test_alternative_creation_and_validation(self):
        """Build an Alternative with a transcript; reject an empty one."""
        candidate = Alternative(transcript="Hello world", confidence=0.9)
        assert (candidate.transcript, candidate.confidence) == ("Hello world", 0.9)

        # The transcript is required, so a bare constructor must be rejected
        with pytest.raises(ValidationError):
            Alternative()


class TestChannel:
    """Checks for the Channel data model."""

    def test_channel_creation_and_validation(self):
        """Build a Channel holding one alternative; reject an empty one."""
        only_alternative = Alternative(transcript="Test transcript")
        chan = Channel(alternatives=[only_alternative])
        assert len(chan.alternatives) == 1

        # The alternatives list is required, so a bare constructor must be rejected
        with pytest.raises(ValidationError):
            Channel()


class TestTranscriptionResult:
    """Checks for the TranscriptionResult data model."""

    def test_transcription_result_basic(self):
        """A text-only result is valid; a result without text is rejected."""
        text_only = TranscriptionResult(text="Hello world")
        assert text_only.text == "Hello world"
        assert text_only.language is None

        # text is required, so a bare constructor must be rejected
        with pytest.raises(ValidationError):
            TranscriptionResult()

    def test_transcription_result_openai_style(self):
        """A result may carry OpenAI-style segments and words."""
        one_segment = Segment(id=0, seek=0, start=0.0, end=2.5, text="Hello world")
        one_word = Word(word="hello", start=0.0, end=0.5)

        transcription = TranscriptionResult(
            text="Hello world",
            language="en",
            confidence=0.95,
            task="transcribe",
            segments=[one_segment],
            words=[one_word],
        )

        assert transcription.text == "Hello world"
        assert transcription.language == "en"
        assert transcription.confidence == 0.95
        assert len(transcription.segments) == 1
        assert len(transcription.words) == 1

    def test_transcription_result_deepgram_style(self):
        """A result may carry Deepgram-style channels, alternatives and topics."""
        alts = [Alternative(transcript="Hello world", confidence=0.9)]

        transcription = TranscriptionResult(
            text="Hello world",
            language="en-US",
            channels=[Channel(alternatives=alts)],
            alternatives=alts,
            topics=[{"topic": "greeting"}],
        )

        assert transcription.text == "Hello world"
        assert len(transcription.channels) == 1
        assert len(transcription.alternatives) == 1
        assert transcription.topics is not None


================================================
FILE: tests/framework/test_asr_params.py
================================================
"""Unit tests for ASR parameter validation and mapping."""

import pytest
import warnings
from aisuite.framework.asr_params import (
    ParamValidator,
    COMMON_PARAMS,
    PROVIDER_PARAMS,
    GOOGLE_LANGUAGE_MAP,
)


class TestParamValidatorCommonParams:
    """Mapping of the shared (common) parameters for each provider."""

    @staticmethod
    def _map_strict(provider, params):
        """Run ``params`` through a fresh strict-mode validator for ``provider``."""
        return ParamValidator("strict").validate_and_map(provider, params)

    def test_language_mapping_openai(self):
        """OpenAI receives ``language`` unchanged."""
        mapped = self._map_strict("openai", {"language": "en"})
        assert mapped == {"language": "en"}

    def test_language_mapping_deepgram(self):
        """Deepgram receives ``language`` unchanged."""
        mapped = self._map_strict("deepgram", {"language": "en"})
        assert mapped == {"language": "en"}

    def test_language_mapping_google(self):
        """Google receives ``language`` as an expanded ``language_code``."""
        mapped = self._map_strict("google", {"language": "en"})
        assert mapped == {"language_code": "en-US"}

    def test_prompt_mapping_openai(self):
        """OpenAI receives ``prompt`` unchanged."""
        mapped = self._map_strict("openai", {"prompt": "meeting notes"})
        assert mapped == {"prompt": "meeting notes"}

    def test_prompt_mapping_deepgram(self):
        """Deepgram receives ``prompt`` as a ``keywords`` list."""
        mapped = self._map_strict("deepgram", {"prompt": "meeting notes"})
        assert mapped == {"keywords": ["meeting", "notes"]}

    def test_prompt_mapping_google(self):
        """Google receives ``prompt`` wrapped in ``speech_contexts``."""
        mapped = self._map_strict("google", {"prompt": "technical terms"})
        assert mapped == {"speech_contexts": [{"phrases": ["technical terms"]}]}

    def test_temperature_mapping_openai(self):
        """OpenAI receives ``temperature`` unchanged."""
        mapped = self._map_strict("openai", {"temperature": 0.5})
        assert mapped == {"temperature": 0.5}

    def test_temperature_ignored_deepgram(self):
        """Deepgram does not support ``temperature``; it is dropped."""
        mapped = self._map_strict("deepgram", {"temperature": 0.5})
        assert mapped == {}

    def test_temperature_ignored_google(self):
        """Google does not support ``temperature``; it is dropped."""
        mapped = self._map_strict("google", {"temperature": 0.5})
        assert mapped == {}


class TestParamValidatorTransformations:
    """Value transformations into provider-specific formats."""

    def test_google_language_expansion_common_codes(self):
        """Common 2-letter codes expand to the expected Google locale."""
        validator = ParamValidator("strict")

        expansions = (
            ("en", "en-US"),
            ("es", "es-ES"),
            ("fr", "fr-FR"),
            ("de", "de-DE"),
            ("ja", "ja-JP"),
            ("zh", "zh-CN"),
        )

        for input_lang, expected_output in expansions:
            result = validator.validate_and_map("google", {"language": input_lang})
            expected = {"language_code": expected_output}
            assert (
                result == expected
            ), f"Failed for {input_lang}: expected {expected_output}, got {result}"

    def test_google_language_expansion_unknown_code(self):
        """An unmapped 2-letter code falls back to the ``-US`` suffix."""
        mapped = ParamValidator("strict").validate_and_map(
            "google", {"language": "xx"}
        )
        assert mapped == {"language_code": "xx-US"}

    def test_google_language_no_expansion_for_full_code(self):
        """A full locale given directly as ``language_code`` is left alone."""
        # language_code is passed as a provider param here, not via 'language'
        mapped = ParamValidator("strict").validate_and_map(
            "google", {"language_code": "en-GB"}
        )
        assert mapped == {"language_code": "en-GB"}

    def test_deepgram_prompt_to_keywords_single_word(self):
        """A one-word prompt becomes a one-item keywords list."""
        mapped = ParamValidator("strict").validate_and_map(
            "deepgram", {"prompt": "meeting"}
        )
        assert mapped == {"keywords": ["meeting"]}

    def test_deepgram_prompt_to_keywords_multiple_words(self):
        """A multi-word prompt is split into one keyword per word."""
        prompt_text = "meeting notes action items"
        mapped = ParamValidator("strict").validate_and_map(
            "deepgram", {"prompt": prompt_text}
        )
        assert mapped == {"keywords": ["meeting", "notes", "action", "items"]}

    def test_deepgram_prompt_to_keywords_already_list(self):
        """A prompt that is already a list is used as the keywords."""
        mapped = ParamValidator("strict").validate_and_map(
            "deepgram", {"prompt": ["meeting", "notes"]}
        )
        assert mapped == {"keywords": ["meeting", "notes"]}

    def test_google_prompt_to_speech_contexts(self):
        """A prompt is wrapped in Google's ``speech_contexts`` structure."""
        mapped = ParamValidator("strict").validate_and_map(
            "google", {"prompt": "technical terms"}
        )
        assert mapped == {"speech_contexts": [{"phrases": ["technical terms"]}]}


class TestParamValidatorProviderSpecific:
    """Pass-through of parameters that belong to a single provider."""

    @staticmethod
    def _map_strict(provider, params):
        """Run ``params`` through a fresh strict-mode validator for ``provider``."""
        return ParamValidator("strict").validate_and_map(provider, params)

    def test_openai_response_format(self):
        """OpenAI ``response_format`` is forwarded as given."""
        mapped = self._map_strict("openai", {"response_format": "verbose_json"})
        assert mapped == {"response_format": "verbose_json"}

    def test_openai_timestamp_granularities(self):
        """OpenAI ``timestamp_granularities`` is forwarded as given."""
        mapped = self._map_strict(
            "openai", {"timestamp_granularities": ["word", "segment"]}
        )
        assert mapped == {"timestamp_granularities": ["word", "segment"]}

    def test_deepgram_punctuate(self):
        """Deepgram ``punctuate`` is forwarded as given."""
        mapped = self._map_strict("deepgram", {"punctuate": True})
        assert mapped == {"punctuate": True}

    def test_deepgram_diarize(self):
        """Deepgram ``diarize`` is forwarded as given."""
        mapped = self._map_strict("deepgram", {"diarize": True})
        assert mapped == {"diarize": True}

    def test_deepgram_multiple_features(self):
        """Several Deepgram feature flags are forwarded together."""
        mapped = self._map_strict(
            "deepgram",
            {
                "punctuate": True,
                "diarize": True,
                "sentiment": True,
                "topics": True,
            },
        )
        expected = {
            "punctuate": True,
            "diarize": True,
            "sentiment": True,
            "topics": True,
        }
        assert mapped == expected

    def test_google_enable_automatic_punctuation(self):
        """Google ``enable_automatic_punctuation`` is forwarded as given."""
        mapped = self._map_strict("google", {"enable_automatic_punctuation": True})
        assert mapped == {"enable_automatic_punctuation": True}

    def test_google_enable_speaker_diarization(self):
        """Google ``enable_speaker_diarization`` is forwarded as given."""
        mapped = self._map_strict("google", {"enable_speaker_diarization": True})
        assert mapped == {"enable_speaker_diarization": True}

    def test_google_diarization_speaker_count(self):
        """Google ``diarization_speaker_count`` is forwarded as given."""
        mapped = self._map_strict("google", {"diarization_speaker_count": 3})
        assert mapped == {"diarization_speaker_count": 3}


class TestParamValidatorMixedParams:
    """Common and provider-specific parameters supplied in one call."""

    def test_openai_common_and_specific(self):
        """OpenAI: common and specific params all pass through unchanged."""
        request = {
            "language": "en",
            "temperature": 0.5,
            "response_format": "verbose_json",
        }
        expected = {
            "language": "en",
            "temperature": 0.5,
            "response_format": "verbose_json",
        }
        mapped = ParamValidator("strict").validate_and_map("openai", request)
        assert mapped == expected

    def test_deepgram_common_and_specific(self):
        """Deepgram: prompt becomes keywords; the other params pass through."""
        request = {
            "language": "en",
            "prompt": "meeting",
            "punctuate": True,
            "diarize": True,
        }
        expected = {
            "language": "en",
            "keywords": ["meeting"],
            "punctuate": True,
            "diarize": True,
        }
        mapped = ParamValidator("strict").validate_and_map("deepgram", request)
        assert mapped == expected

    def test_google_common_and_specific(self):
        """Google: language becomes language_code; the other params pass through."""
        request = {
            "language": "en",
            "enable_automatic_punctuation": True,
            "enable_speaker_diarization": True,
        }
        expected = {
            "language_code": "en-US",
            "enable_automatic_punctuation": True,
            "enable_speaker_diarization": True,
        }
        mapped = ParamValidator("strict").validate_and_map("google", request)
        assert mapped == expected


class TestParamValidatorStrictMode:
    """Behavior of the validator in ``strict`` mode."""

    def test_strict_mode_rejects_unknown_param_openai(self):
        """An unknown OpenAI param raises ValueError naming the param."""
        strict = ParamValidator("strict")
        pattern = "Unknown parameters for openai: \\['invalid_param'\\]"
        with pytest.raises(ValueError, match=pattern):
            strict.validate_and_map("openai", {"invalid_param": True})

    def test_strict_mode_rejects_unknown_param_deepgram(self):
        """An unknown Deepgram param raises ValueError naming the param."""
        strict = ParamValidator("strict")
        pattern = "Unknown parameters for deepgram: \\['invalid_param'\\]"
        with pytest.raises(ValueError, match=pattern):
            strict.validate_and_map("deepgram", {"invalid_param": True})

    def test_strict_mode_rejects_multiple_unknown_params(self):
        """Several unknown params together still raise ValueError."""
        strict = ParamValidator("strict")
        unknown = {
            "invalid_param1": True,
            "invalid_param2": False,
        }
        with pytest.raises(ValueError, match="Unknown parameters for openai"):
            strict.validate_and_map("openai", unknown)

    def test_strict_mode_error_message_helpful(self):
        """The error text points the caller at the provider documentation."""
        strict = ParamValidator("strict")
        with pytest.raises(ValueError, match="See openai documentation"):
            strict.validate_and_map("openai", {"typo_param": True})

    def test_strict_mode_allows_valid_params(self):
        """Known params are accepted without raising."""
        strict = ParamValidator("strict")
        known = {
            "language": "en",
            "punctuate": True,
        }
        # No exception is expected here
        mapped = strict.validate_and_map("deepgram", known)
        assert mapped == {"language": "en", "punctuate": True}


class TestParamValidatorWarnMode:
    """Behavior of the validator in ``warn`` mode."""

    def test_warn_mode_issues_warning_unknown_param(self):
        """An unknown param triggers a UserWarning and is filtered out."""
        lenient = ParamValidator("warn")
        pattern = "Unknown parameters for openai: \\['invalid_param'\\]"
        with pytest.warns(UserWarning, match=pattern):
            result = lenient.validate_and_map("openai", {"invalid_param": True})
        # In warn mode the unknown param is not passed through
        assert result == {}

    def test_warn_mode_continues_execution(self):
        """Valid params still come back when an unknown one is present."""
        lenient = ParamValidator("warn")
        mixed = {
            "language": "en",
            "invalid_param": True,
        }
        with warnings.catch_warnings():
            # The warning itself is not under test here, so silence it
            warnings.simplefilter("ignore")
            result = lenient.validate_and_map("openai", mixed)
        # Only the valid param survives
        assert result == {"language": "en"}

    def test_warn_mode_warning_message_helpful(self):
        """The warning text points the caller at the provider documentation."""
        lenient = ParamValidator("warn")
        with pytest.warns(UserWarning, match="See deepgram documentation"):
            lenient.validate_and_map("deepgram", {"typo_param": True})


class TestParamValidatorPermissiveMode:
    """Behavior of the validator in ``permissive`` mode."""

    def test_permissive_mode_allows_unknown_param(self):
        """An unknown param is passed through untouched."""
        mapped = ParamValidator("permissive").validate_and_map(
            "openai", {"experimental_feature": True}
        )
        assert mapped == {"experimental_feature": True}

    def test_permissive_mode_no_warning(self):
        """An unknown param is passed through without emitting a warning."""
        permissive = ParamValidator("permissive")
        with warnings.catch_warnings():
            # Escalate warnings to errors: any warning would make this call raise
            warnings.simplefilter("error")
            mapped = permissive.validate_and_map("openai", {"unknown_param": True})
        assert mapped == {"unknown_param": True}

    def test_permissive_mode_mixed_valid_and_unknown(self):
        """Known and unknown params are all passed through together."""
        request = {
            "language": "en",
            "punctuate": True,
            "experimental_feature": True,
            "beta_param": "value",
        }
        expected = {
            "language": "en",
            "punctuate": True,
            "experimental_feature": True,
            "beta_param": "value",
        }
        mapped = ParamValidator("permissive").validate_and_map("deepgram", request)
        assert mapped == expected


class TestParamValidatorEdgeCases:
    """Edge cases and error conditions for the validator."""

    def test_empty_params(self):
        """An empty params dict maps to an empty dict."""
        mapped = ParamValidator("strict").validate_and_map("openai", {})
        assert mapped == {}

    def test_unknown_provider(self):
        """A non-common param for an unregistered provider is rejected in strict mode."""
        strict = ParamValidator("strict")
        pattern = "Unknown parameters for unknown_provider"
        with pytest.raises(ValueError, match=pattern):
            strict.validate_and_map("unknown_provider", {"custom_param": "value"})

    def test_none_value_param(self):
        """A param whose value is None is kept, with None as its value."""
        mapped = ParamValidator("strict").validate_and_map(
            "openai", {"language": None}
        )
        assert mapped == {"language": None}

    def test_common_param_overrides_provider_param(self):
        """Passing both ``language`` and ``language_code`` to Google yields one code.

        Which of the two wins is not pinned down here: the assertion accepts
        either the explicit ``language_code`` or the expansion of ``language``.
        """
        conflicting = {
            "language": "en",  # common param, maps onto language_code
            "language_code": "fr-FR",  # provider param targeting the same key
        }
        result = ParamValidator("strict").validate_and_map("google", conflicting)
        assert "language_code" in result
        assert result["language_code"] in ("fr-FR", "en-US")

    def test_validator_mode_case_sensitivity(self):
        """Each supported mode string can be used to build a validator."""
        for mode in ("strict", "warn", "permissive"):
            ParamValidator(mode)

        # Note: Python typing will catch invalid modes at type-check time,
        # but runtime won't enforce it unless we add validation
        # This test documents expected behavior


class TestParamValidatorRegistry:
    """Sanity checks on the ASR parameter registries."""

    def test_common_params_has_required_providers(self):
        """The common 'language' entry covers every ASR provider."""
        language_entry = COMMON_PARAMS["language"]
        for provider in ("openai", "deepgram", "google"):
            assert provider in language_entry

    def test_provider_params_has_all_providers(self):
        """PROVIDER_PARAMS has an entry for every ASR provider."""
        for provider in ("openai", "deepgram", "google"):
            assert provider in PROVIDER_PARAMS

    def test_google_language_map_completeness(self):
        """GOOGLE_LANGUAGE_MAP knows the most common short language codes."""
        for lang in ("en", "es", "fr", "de", "ja", "zh"):
            assert lang in GOOGLE_LANGUAGE_MAP, f"Missing {lang} in GOOGLE_LANGUAGE_MAP"

    def test_provider_params_includes_common_params(self):
        """Provider parameter sets contain the common params they support."""
        # OpenAI supports language, prompt and temperature.
        openai_params = PROVIDER_PARAMS["openai"]
        for param_name in ("language", "prompt", "temperature"):
            assert param_name in openai_params

        # Deepgram supports language but has no temperature parameter.
        deepgram_params = PROVIDER_PARAMS["deepgram"]
        assert "language" in deepgram_params
        assert "temperature" not in deepgram_params


================================================
FILE: tests/mcp/README.md
================================================
# MCP Integration Tests

This directory contains integration tests for aisuite's MCP (Model Context Protocol) support.

## Prerequisites

To run these tests, you need:

1. **Node.js and npx** - Required to run the Anthropic filesystem MCP server
   - Install from: https://nodejs.org/
   - Verify with: `npx --version`

2. **Python test dependencies**:
   ```bash
   pip install pytest pytest-asyncio python-dotenv
   ```

3. **MCP package** (should already be installed if you have aisuite[mcp]):
   ```bash
   pip install 'aisuite[mcp]'
   ```

4. **Environment variables** (for e2e tests that mock LLM calls):
   Create a `.env` file in the project root with your API keys:
   ```bash
   OPENAI_API_KEY=your-key-here
   ANTHROPIC_API_KEY=your-key-here
   EXA_API_KEY=your-key-here  # Optional: for Exa MCP tests
   ```
   Note: E2E tests mock LLM responses, so no API usage is billed, but the keys must still be set because providers validate them on initialization.

## Running Tests

### Run all MCP integration tests (mocked LLM, free):
```bash
pytest tests/mcp/ -v -m "integration and not llm"
```

### Run specific test file:
```bash
# MCPClient tests
pytest tests/mcp/test_client.py -v -m integration

# End-to-end tests (mocked LLM)
pytest tests/mcp/test_e2e.py -v -m integration

# Real LLM tests with stdio (⚠️ costs money, requires API keys)
pytest tests/mcp/test_llm_e2e.py -v -m llm

# Real LLM tests with HTTP (⚠️ costs money, requires API keys)
pytest tests/mcp/test_http_llm_e2e.py -v -m llm
```

### Run ONLY real LLM tests (⚠️ costs ~$0.50):
```bash
pytest tests/mcp/ -v -m llm
```

### Run ALL tests including LLM (⚠️ costs money):
```bash
pytest tests/mcp/ -v -m integration
```

### Run a specific test:
```bash
pytest tests/mcp/test_client.py::TestMCPClientConnection::test_connect_to_filesystem_server -v
```

### Skip integration tests (if no Node.js):
```bash
pytest tests/mcp/ -v -m "not integration"
```

## Test Structure

### `test_client.py` - MCPClient Integration Tests
Tests the `MCPClient` class with a real MCP server:
- Connection to Anthropic filesystem server
- Listing tools
- Calling tools
- Tool filtering (`allowed_tools`)
- Tool prefixing (`use_tool_prefix`)
- `from_config()` method
- Context manager support

### `test_e2e.py` - End-to-End Tests (Mocked LLM)
Tests the complete flow with `client.chat.completions.create()`:
- Config dict format
- Mixing MCP configs with Python functions
- Multiple MCP servers with prefixing
- Automatic cleanup
- Error handling
- **Note:** LLM responses are mocked, so no API calls are made

### `test_llm_e2e.py` - Real LLM End-to-End Tests with stdio (⚠️ Costs Money)
Tests with **actual API calls** to verify stdio MCP works with real LLMs:
- OpenAI GPT-4o reading files via stdio MCP
- Anthropic Claude reading files via stdio MCP
- Mixed tools (stdio MCP + Python functions)
- Multiple MCP servers with prefixing
- **Uses:** `@modelcontextprotocol/server-filesystem` (stdio)
- **Note:** These tests make real API calls (~$0.05-0.10 per test)
- **Marked with:** `@pytest.mark.llm`
- **Skipped if:** API keys not present in .env

### `test_http_llm_e2e.py` - Real LLM End-to-End Tests with HTTP (⚠️ Costs Money)
Tests with **actual API calls** to verify HTTP MCP works with real LLMs:
- OpenAI GPT-4o using HTTP MCP tools (Context7 and Exa)
- Anthropic Claude using HTTP MCP tools (Context7 and Exa)
- Mixed tools (HTTP MCP + Python functions)
- Config dict format with HTTP transport
- Custom headers support (including Authorization headers for Exa)
- **Uses:**
  - Context7 HTTP MCP server (`https://mcp.context7.com/mcp`)
    - Tools: `resolve-library-id`, `get-library-docs` (library documentation)
  - Exa HTTP MCP server (`https://mcp.exa.ai/mcp`)
    - Tools: `web_search_exa`, `get_code_context_exa` (web search and code context)
    - Requires: EXA_API_KEY in .env
- **Note:** These tests make real API calls (~$0.05-0.10 per test)
- **Marked with:** `@pytest.mark.llm`
- **Skipped if:** API keys not present in .env

### `conftest.py` - Test Fixtures
- `temp_test_dir` - Creates temp directory with test files
- `skip_if_no_npx` - Skips tests if npx not available

## What Gets Tested

### stdio Transport Tests
Use the **real** `@modelcontextprotocol/server-filesystem` MCP server from Anthropic, which:
- Provides file system access tools (read_file, write_file, list_directory, etc.)
- Is installed automatically via `npx -y @modelcontextprotocol/server-filesystem`
- Runs in a temporary test directory for isolation

### HTTP Transport Tests
Use **real** HTTP MCP servers:

1. **Context7** (`https://mcp.context7.com/mcp`):
   - Provides library documentation tools
   - Tools: `resolve-library-id`, `get-library-docs`
   - No installation required (hosted service)
   - No authentication required (optional API key for higher rate limits)

2. **Exa** (`https://mcp.exa.ai/mcp`):
   - Provides web search and code context tools
   - Tools: `web_search_exa`, `get_code_context_exa`, `deep_researcher`
   - No installation required (hosted service)
   - Requires: EXA_API_KEY (via Authorization header)

The tests verify:
1. ✅ Connection to real MCP servers (stdio and HTTP)
2. ✅ Tool discovery and schema parsing
3. ✅ Tool execution and result handling
4. ✅ Config dict → callable conversion
5. ✅ Tool filtering and prefixing
6. ✅ Integration with aisuite's tool system
7. ✅ Proper resource cleanup
8. ✅ Error handling
9. ✅ HTTP transport with headers and timeout

## CI/CD

### GitHub Actions
If running in CI without Node.js:
```yaml
- name: Run tests
  run: pytest tests/mcp/ -v -m "not integration"
```

With Node.js:
```yaml
- name: Setup Node.js
  uses: actions/setup-node@v3
  with:
    node-version: '18'

- name: Run integration tests
  run: pytest tests/mcp/ -v -m integration
```

## Notes

- Tests are marked with `@pytest.mark.integration` to allow selective running
- Most tests use mocking for LLM API calls to avoid costs
- Real LLM tests are marked with `@pytest.mark.llm` and can be skipped
- Each test creates isolated temp directories for file operations
- MCP servers are started fresh for each test
- Cleanup is automatic via fixtures and context managers

## Test Markers

- `@pytest.mark.integration` - All MCP tests (both the mocked-LLM tests and the real-LLM tests)
- `@pytest.mark.llm` - Real LLM tests only (makes actual API calls, costs money)

To run tests without LLM costs:
```bash
pytest tests/mcp/ -v -m "integration and not llm"
```

## Troubleshooting

**Error: "npx not found"**
- Install Node.js from https://nodejs.org/

**Error: "MCP package not installed"**
- Run: `pip install 'aisuite[mcp]'`

**Tests hang or timeout**
- Check Node.js/npx is working: `npx --version`
- Check MCP server can be installed: `npx -y @modelcontextprotocol/server-filesystem --help`

**Import errors**
- Make sure you're running from the project root
- Install test dependencies: `pip install pytest pytest-asyncio`


================================================
FILE: tests/mcp/__init__.py
================================================
"""Tests for MCP (Model Context Protocol) integration."""


================================================
FILE: tests/mcp/conftest.py
================================================
"""
Pytest fixtures for MCP integration tests.
"""

import pytest
import tempfile
import os
from pathlib import Path

# Load environment variables from .env file.
# python-dotenv is treated as an optional dependency: when it cannot be
# imported, the tests simply run with whatever is already in the environment.
try:
    from dotenv import load_dotenv

    load_dotenv()
except ImportError:
    # dotenv not installed, that's okay
    pass


@pytest.fixture
def temp_test_dir():
    """
    Provide a throwaway directory pre-populated with sample files.

    The directory is meant to be served by the filesystem MCP server in the
    integration tests. It contains ``test.txt``, ``README.md``, ``data.json``
    and a ``subdir`` folder holding ``nested.txt``. The directory is removed
    when the fixture is torn down.

    Yields:
        str: Symlink-resolved path of the temporary directory.

    Example:
        >>> def test_mcp(temp_test_dir):
        ...     mcp = MCPClient(
        ...         command="npx",
        ...         args=["-y", "@modelcontextprotocol/server-filesystem", temp_test_dir]
        ...     )
    """
    sample_files = {
        "test.txt": "Hello from MCP test!",
        "README.md": "# Test Directory\n\nThis is a test README file.",
        "data.json": '{"key": "value", "number": 42}',
    }

    with tempfile.TemporaryDirectory() as raw_dir:
        # Work with the canonical path so symlinked temp locations
        # (e.g., /var -> /private/var on macOS) are already resolved.
        resolved_dir = os.path.realpath(raw_dir)
        root = Path(resolved_dir)

        for filename, text in sample_files.items():
            (root / filename).write_text(text)

        # One nested level so directory traversal can be exercised too.
        nested_dir = root / "subdir"
        nested_dir.mkdir()
        (nested_dir / "nested.txt").write_text("Nested file content")

        yield resolved_dir


@pytest.fixture
def skip_if_no_npx():
    """
    Skip the requesting test when ``npx`` cannot be found on PATH.

    npx (the Node.js package executor) is what launches the filesystem MCP
    server used by the integration tests, so those tests cannot run without it.

    Raises:
        pytest.skip: If npx is not found in PATH
    """
    import shutil

    npx_path = shutil.which("npx")
    if npx_path:
        return

    pytest.skip(
        "npx not found. Install Node.js to run MCP integration tests. "
        "See: https://nodejs.org/"
    )


================================================
FILE: tests/mcp/test_client.py
================================================
"""
Integration tests for MCPClient.

These tests use the real Anthropic filesystem MCP server
(@modelcontextprotocol/server-filesystem) to verify that MCPClient
can connect to, discover tools from, and execute tools on real MCP servers.

Requirements:
    - Node.js and npx must be installed
    - Tests are marked with @pytest.mark.integration
    - Run with: pytest tests/mcp/test_client.py -v -m integration
"""

import pytest
from aisuite.mcp import MCPClient
from aisuite.mcp.config import validate_mcp_config


@pytest.mark.integration
class TestMCPClientConnection:
    """Connection-level checks against the real filesystem MCP server."""

    @staticmethod
    def _start_client(root_dir, **extra):
        """Launch the filesystem MCP server via npx, rooted at ``root_dir``."""
        return MCPClient(
            command="npx",
            args=["-y", "@modelcontextprotocol/server-filesystem", root_dir],
            **extra,
        )

    def test_connect_to_filesystem_server(self, temp_test_dir, skip_if_no_npx):
        """A freshly created client has a session and exposes the expected tools."""
        client = self._start_client(temp_test_dir, name="test_filesystem")

        try:
            # The client should hold a session and keep the name it was given.
            assert client._session is not None
            assert client.name == "test_filesystem"

            available = client.list_tools()
            assert len(available) > 0

            # The filesystem server is expected to offer these two tools.
            names = [entry["name"] for entry in available]
            assert "read_file" in names
            assert "list_directory" in names

            # Every tool must be named and carry a description or a schema.
            for entry in available:
                assert "name" in entry
                assert "description" in entry or "inputSchema" in entry

        finally:
            client.close()

    def test_list_tools_returns_schemas(self, temp_test_dir, skip_if_no_npx):
        """list_tools() entries include an input schema with properties."""
        client = self._start_client(temp_test_dir)

        try:
            available = client.list_tools()

            read_file_entry = next(
                (entry for entry in available if entry["name"] == "read_file"), None
            )
            assert read_file_entry is not None

            assert "inputSchema" in read_file_entry
            assert "properties" in read_file_entry["inputSchema"]

        finally:
            client.close()

    def test_context_manager(self, temp_test_dir, skip_if_no_npx):
        """MCPClient can be used in a ``with`` statement."""
        with self._start_client(temp_test_dir) as client:
            available = client.list_tools()
            assert len(available) > 0

        # Leaving the block should close the session; that is not asserted
        # here because it cannot be checked without inspecting internals.


@pytest.mark.integration
class TestMCPClientToolExecution:
    """Invoke individual filesystem tools through MCPClient.call_tool()."""

    def test_call_read_file_tool(self, temp_test_dir, skip_if_no_npx):
        """read_file returns the contents of a file addressed by absolute path."""
        import os

        server_args = ["-y", "@modelcontextprotocol/server-filesystem", temp_test_dir]
        client = MCPClient(command="npx", args=server_args)

        try:
            target = os.path.join(temp_test_dir, "test.txt")
            output = client.call_tool("read_file", {"path": target})

            # The fixture wrote this exact text into test.txt.
            assert "Hello from MCP test!" in output

        finally:
            client.close()

    def test_call_list_directory_tool(self, temp_test_dir, skip_if_no_npx):
        """list_directory mentions at least one of the fixture's files."""
        server_args = ["-y", "@modelcontextprotocol/server-filesystem", temp_test_dir]
        client = MCPClient(command="npx", args=server_args)

        try:
            listing = client.call_tool("list_directory", {"path": temp_test_dir})

            assert "test.txt" in listing or "README.md" in listing

        finally:
            client.close()


@pytest.mark.integration
class TestMCPClientCallableTools:
    """Obtain MCP tools as plain Python callables."""

    @staticmethod
    def _start_client(root_dir, **extra):
        """Launch the filesystem MCP server via npx, rooted at ``root_dir``."""
        return MCPClient(
            command="npx",
            args=["-y", "@modelcontextprotocol/server-filesystem", root_dir],
            **extra,
        )

    def test_get_callable_tools(self, temp_test_dir, skip_if_no_npx):
        """get_callable_tools() returns introspectable, working callables."""
        client = self._start_client(temp_test_dir)

        try:
            callables = client.get_callable_tools()

            assert len(callables) > 0
            assert all(callable(fn) for fn in callables)

            # Each wrapper should look like a regular function to introspection.
            for fn in callables:
                for attribute in ("__name__", "__doc__", "__annotations__"):
                    assert hasattr(fn, attribute)

            read_file = next(
                (fn for fn in callables if fn.__name__ == "read_file"), None
            )
            assert read_file is not None

            # The callable is invoked with an absolute path.
            import os

            target = os.path.join(temp_test_dir, "test.txt")
            output = read_file(path=target)
            assert "Hello from MCP test!" in output

        finally:
            client.close()

    def test_get_callable_tools_with_filtering(self, temp_test_dir, skip_if_no_npx):
        """allowed_tools restricts the returned callables to the listed names."""
        client = self._start_client(temp_test_dir)

        try:
            callables = client.get_callable_tools(allowed_tools=["read_file"])

            # Exactly the one requested tool should come back.
            assert len(callables) == 1
            only_tool = callables[0]
            assert only_tool.__name__ == "read_file"

            import os

            target = os.path.join(temp_test_dir, "test.txt")
            output = callables[0](path=target)
            assert "Hello from MCP test!" in output

        finally:
            client.close()

    def test_get_callable_tools_with_prefixing(self, temp_test_dir, skip_if_no_npx):
        """use_tool_prefix=True prepends '<client name>__' to tool names."""
        client = self._start_client(temp_test_dir, name="filesystem")

        try:
            callables = client.get_callable_tools(use_tool_prefix=True)

            names = [fn.__name__ for fn in callables]
            assert any(name.startswith("filesystem__") for name in names)
            assert "filesystem__read_file" in names

        finally:
            client.close()

    def test_get_specific_tool(self, temp_test_dir, skip_if_no_npx):
        """get_tool() returns a callable for a known name and None otherwise."""
        client = self._start_client(temp_test_dir)

        try:
            read_file = client.get_tool("read_file")

            assert read_file is not None
            assert callable(read_file)
            assert read_file.__name__ == "read_file"

            import os

            target = os.path.join(temp_test_dir, "README.md")
            output = read_file(path=target)
            assert "Test Directory" in output

            # An unknown tool name yields None instead of raising.
            missing = client.get_tool("nonexistent_tool")
            assert missing is None

        finally:
            client.close()


@pytest.mark.integration
class TestMCPClientFromConfig:
    """Test creating MCPClient from configuration dict."""

    @staticmethod
    def _stdio_config(root_dir, **extra):
        """Return a stdio MCP config for the filesystem server rooted at ``root_dir``.

        Args:
            root_dir: Directory the filesystem server is allowed to serve.
            **extra: Additional config keys (e.g. ``env``, ``allowed_tools``)
                appended after the base keys.

        Returns:
            dict: A config dict suitable for ``MCPClient.from_config``.
        """
        return {
            "type": "mcp",
            "name": "test_filesystem",
            "command": "npx",
            "args": ["-y", "@modelcontextprotocol/server-filesystem", root_dir],
            **extra,
        }

    def test_from_config_stdio(self, temp_test_dir, skip_if_no_npx):
        """Test creating MCPClient from config dict with stdio transport."""
        mcp = MCPClient.from_config(self._stdio_config(temp_test_dir))

        try:
            assert mcp.name == "test_filesystem"
            tools = mcp.list_tools()
            assert len(tools) > 0

        finally:
            mcp.close()

    def test_from_config_with_env(self, temp_test_dir, skip_if_no_npx):
        """Test creating MCPClient with environment variables."""
        # Only checks that a config carrying an "env" entry still produces a
        # working client; the server-side environment is not inspected.
        config = self._stdio_config(temp_test_dir, env={"TEST_VAR": "test_value"})

        mcp = MCPClient.from_config(config)

        try:
            tools = mcp.list_tools()
            assert len(tools) > 0

        finally:
            mcp.close()

    def test_get_tools_from_config(self, temp_test_dir, skip_if_no_npx):
        """Test get_tools_from_config convenience method."""
        import os

        config = self._stdio_config(
            temp_test_dir,
            allowed_tools=["read_file"],
            use_tool_prefix=True,
        )

        # Note: This creates a client internally and doesn't provide a way to close it
        # In production, this would be managed by the Completions class
        tools = MCPClient.get_tools_from_config(config)

        # Filtering leaves a single tool, and prefixing uses the config's name.
        assert len(tools) == 1
        assert tools[0].__name__ == "test_filesystem__read_file"
        assert callable(tools[0])

        # Test the tool works with absolute path
        test_file_path = os.path.join(temp_test_dir, "test.txt")
        result = tools[0](path=test_file_path)
        assert "Hello from MCP test!" in result


@pytest.mark.integration
class TestMCPClientErrorHandling:
    """Test error handling in MCPClient."""

    def test_invalid_command_raises_error(self, temp_test_dir):
        """Test that invalid command raises appropriate error."""
        with pytest.raises(Exception):
            # Constructing the client should fail because the command
            # does not exist.
            MCPClient(
                command="nonexistent_command_12345",
                args=["--test"],
            )

    def test_call_nonexistent_tool_returns_error(self, temp_test_dir, skip_if_no_npx):
        """Test that calling non-existent tool returns error or raises exception."""
        mcp = MCPClient(
            command="npx",
            args=["-y", "@modelcontextprotocol/server-filesystem", temp_test_dir],
        )

        try:
            # Calling a non-existent tool should either raise an error or
            # return an error message.
            try:
                result = mcp.call_tool("nonexistent_tool_xyz_123", {})
            except Exception:
                # It's acceptable for the call itself to raise.
                pass
            else:
                # The assertion lives in the else branch on purpose: inside the
                # try body an AssertionError (a subclass of Exception) would be
                # swallowed by the handler above and the test could never fail.
                assert "error" in result.lower() or "not found" in result.lower()

        finally:
            mcp.close()


================================================
FILE: tests/mcp/test_e2e.py
================================================
"""
End-to-end integration tests for MCP with aisuite.

These tests verify the complete flow of using MCP tools with aisuite's
chat.completions.create() API, including:
- Config dict format
- Mixing MCP tools with Python functions
- Multiple MCP servers with prefixing
- Automatic cleanup

Requirements:
    - Node.js and npx must be installed
    - Tests are marked with @pytest.mark.integration
    - Run with: pytest tests/mcp/test_e2e.py -v -m integration
"""

import pytest
from unittest.mock import patch, MagicMock, Mock
from aisuite import Client


def create_mock_response(content="Test response", tool_calls=None):
    """Build a MagicMock shaped like a chat completion response.

    The result has a single choice whose message carries ``content`` and
    ``tool_calls``; that message is also the only entry in the choice's
    ``intermediate_messages``, and ``intermediate_responses`` is empty.
    """
    message = MagicMock()
    message.content = content
    message.tool_calls = tool_calls

    choice = MagicMock()
    choice.message = message
    choice.intermediate_messages = [message]

    response = MagicMock()
    response.choices = [choice]
    response.intermediate_responses = []
    return response


@pytest.mark.integration
class TestMCPConfigDictFormat:
    """Pass MCP config dicts directly as ``tools`` to chat.completions.create()."""

    @staticmethod
    def _filesystem_tool(root_dir, name="filesystem", **options):
        """Return an MCP config dict for the filesystem server rooted at ``root_dir``."""
        return {
            "type": "mcp",
            "name": name,
            "command": "npx",
            "args": ["-y", "@modelcontextprotocol/server-filesystem", root_dir],
            **options,
        }

    def test_basic_config_dict(self, temp_test_dir, skip_if_no_npx):
        """A bare MCP config dict is expanded into callables for the tool runner."""
        client = Client()
        user_messages = [{"role": "user", "content": "List all files"}]

        # Replace the tool runner with a mock so the request never reaches an LLM.
        with patch.object(client.chat.completions, "_tool_runner") as runner:
            runner.return_value = create_mock_response("Files listed successfully")

            response = client.chat.completions.create(
                model="openai:gpt-4o",
                messages=user_messages,
                tools=[self._filesystem_tool(temp_test_dir)],
                max_turns=2,
            )

            assert response.choices[0].message.content == "Files listed successfully"

            # The runner must have received the processed tools as its
            # 4th positional argument.
            assert runner.called
            positional = runner.call_args[0]
            passed_tools = positional[3]

            assert isinstance(passed_tools, list)
            assert all(callable(tool) for tool in passed_tools)

    def test_config_dict_with_allowed_tools(self, temp_test_dir, skip_if_no_npx):
        """allowed_tools in the config limits which tools reach the runner."""
        client = Client()
        # Only reading is allowed.
        read_only_tool = self._filesystem_tool(temp_test_dir, allowed_tools=["read_file"])

        with patch.object(client.chat.completions, "_tool_runner") as runner:
            runner.return_value = create_mock_response("File read successfully")

            response = client.chat.completions.create(
                model="openai:gpt-4o",
                messages=[{"role": "user", "content": "Read test.txt"}],
                tools=[read_only_tool],
                max_turns=2,
            )

            assert response.choices[0].message.content == "File read successfully"

            passed_tools = runner.call_args[0][3]

            assert len(passed_tools) == 1
            assert passed_tools[0].__name__ == "read_file"

    def test_config_dict_with_prefixing(self, temp_test_dir, skip_if_no_npx):
        """use_tool_prefix in the config prefixes tool names with the server name."""
        client = Client()
        prefixed_tool = self._filesystem_tool(
            temp_test_dir, name="docs", use_tool_prefix=True
        )

        with patch.object(client.chat.completions, "_tool_runner") as runner:
            runner.return_value = create_mock_response("Success")

            client.chat.completions.create(
                model="openai:gpt-4o",
                messages=[{"role": "user", "content": "Test"}],
                tools=[prefixed_tool],
                max_turns=2,
            )

            passed_tools = runner.call_args[0][3]

            names = [tool.__name__ for tool in passed_tools]
            assert any(name.startswith("docs__") for name in names)


@pytest.mark.integration
class TestMCPWithPythonFunctions:
    """Combine MCP config dicts with ordinary Python callables as tools."""

    def test_mix_mcp_and_python_functions(self, temp_test_dir, skip_if_no_npx):
        """A Python function and an MCP config can be passed in the same tools list."""
        client = Client()

        def get_current_time() -> str:
            """Get the current time."""
            return "2025-01-01 12:00:00"

        filesystem_server = {
            "type": "mcp",
            "name": "filesystem",
            "command": "npx",
            "args": ["-y", "@modelcontextprotocol/server-filesystem", temp_test_dir],
        }

        with patch.object(client.chat.completions, "_tool_runner") as runner:
            runner.return_value = create_mock_response("Mixed tools work!")

            response = client.chat.completions.create(
                model="openai:gpt-4o",
                messages=[{"role": "user", "content": "What time is it?"}],
                # Python function first, MCP config second.
                tools=[get_current_time, filesystem_server],
                max_turns=2,
            )

            assert response.choices[0].message.content == "Mixed tools work!"

            passed_tools = runner.call_args[0][3]

            # The Python function plus at least one MCP tool.
            assert len(passed_tools) > 1

            passed_names = [tool.__name__ for tool in passed_tools]
            assert any(name == "get_current_time" for name in passed_names)
            assert any(name == "read_file" for name in passed_names)


@pytest.mark.integration
class TestMultipleMCPServers:
    """Use several MCP servers in a single request."""

    @staticmethod
    def _prefixed_server(name, root_dir):
        """Return a prefixed filesystem MCP config named ``name`` for ``root_dir``."""
        return {
            "type": "mcp",
            "name": name,
            "command": "npx",
            "args": ["-y", "@modelcontextprotocol/server-filesystem", root_dir],
            "use_tool_prefix": True,
        }

    def test_multiple_servers_with_prefixing(self, temp_test_dir, skip_if_no_npx):
        """Two servers exposing the same tools stay distinguishable via prefixes."""
        import tempfile

        client = Client()

        # The second server gets its own temporary directory.
        with tempfile.TemporaryDirectory() as temp_dir_2:
            with patch.object(client.chat.completions, "_tool_runner") as runner:
                runner.return_value = create_mock_response("Multiple servers work!")

                response = client.chat.completions.create(
                    model="openai:gpt-4o",
                    messages=[{"role": "user", "content": "Compare directories"}],
                    tools=[
                        self._prefixed_server("dir1", temp_test_dir),
                        self._prefixed_server("dir2", temp_dir_2),
                    ],
                    max_turns=2,
                )

                assert response.choices[0].message.content == "Multiple servers work!"

                passed_tools = runner.call_args[0][3]
                names = [tool.__name__ for tool in passed_tools]

                # Tools from both servers must be present...
                for prefix in ("dir1__", "dir2__"):
                    assert any(name.startswith(prefix) for name in names)

                # ...including the same tool under each server's prefix.
                assert "dir1__read_file" in names
                assert "dir2__read_file" in names


@pytest.mark.integration
class TestMCPCleanup:
    """Check that an MCP client built from a tool config is entered and exited."""

    def test_cleanup_after_success(self, temp_test_dir, skip_if_no_npx):
        """The MCP client's context manager is entered and exited once on success."""
        client = Client()
        filesystem_tool = {
            "type": "mcp",
            "name": "filesystem",
            "command": "npx",
            "args": [
                "-y",
                "@modelcontextprotocol/server-filesystem",
                temp_test_dir,
            ],
        }

        with patch.object(client.chat.completions, "_tool_runner") as mock_runner:
            mock_runner.return_value = create_mock_response("Success")

            # Swap in a mock MCPClient so context-manager entry/exit can be observed
            with patch("aisuite.client.MCPClient") as mock_mcp_class:
                mock_mcp_instance = MagicMock()
                mock_mcp_instance.get_callable_tools.return_value = []
                mock_mcp_class.from_config.return_value = mock_mcp_instance

                client.chat.completions.create(
                    model="openai:gpt-4o",
                    messages=[{"role": "user", "content": "Test"}],
                    tools=[filesystem_tool],
                    max_turns=2,
                )

                # Entering and exiting exactly once means cleanup ran
                mock_mcp_instance.__enter__.assert_called_once()
                mock_mcp_instance.__exit__.assert_called_once()

    def test_cleanup_after_error(self, temp_test_dir, skip_if_no_npx):
        """The MCP client's context manager is still exited when the request raises."""
        client = Client()
        filesystem_tool = {
            "type": "mcp",
            "name": "filesystem",
            "command": "npx",
            "args": [
                "-y",
                "@modelcontextprotocol/server-filesystem",
                temp_test_dir,
            ],
        }

        with patch.object(client.chat.completions, "_tool_runner") as mock_runner:
            # Force the tool runner to fail so the error path is exercised
            mock_runner.side_effect = ValueError("Test error")

            # Swap in a mock MCPClient so context-manager entry/exit can be observed
            with patch("aisuite.client.MCPClient") as mock_mcp_class:
                mock_mcp_instance = MagicMock()
                mock_mcp_instance.get_callable_tools.return_value = []
                mock_mcp_class.from_config.return_value = mock_mcp_instance

                with pytest.raises(ValueError, match="Test error"):
                    client.chat.completions.create(
                        model="openai:gpt-4o",
                        messages=[{"role": "user", "content": "Test"}],
                        tools=[filesystem_tool],
                        max_turns=2,
                    )

                # The failure must not prevent the context manager from exiting
                mock_mcp_instance.__enter__.assert_called_once()
                mock_mcp_instance.__exit__.assert_called_once()


@pytest.mark.integration
class TestMCPErrorHandling:
    """Check the errors raised for unusable MCP tool configurations."""

    def test_invalid_mcp_config_raises_error(self):
        """An MCP config without 'name' is rejected with a ValueError."""
        client = Client()
        # Deliberately omits the 'name' field
        nameless_tool = {
            "type": "mcp",
            "command": "npx",
            "args": ["server"],
        }

        with pytest.raises(ValueError, match="must have 'name'"):
            client.chat.completions.create(
                model="openai:gpt-4o",
                messages=[{"role": "user", "content": "Test"}],
                tools=[nameless_tool],
                max_turns=2,
            )

    def test_mcp_not_installed_raises_error(self, temp_test_dir, skip_if_no_npx):
        """An ImportError mentioning the mcp package is raised when MCP is unavailable."""
        client = Client()
        filesystem_tool = {
            "type": "mcp",
            "name": "filesystem",
            "command": "npx",
            "args": [
                "-y",
                "@modelcontextprotocol/server-filesystem",
                temp_test_dir,
            ],
        }

        # Flip the availability flag to simulate a missing MCP package
        with patch("aisuite.client.MCP_AVAILABLE", False):
            with pytest.raises(ImportError, match="mcp.*package"):
                client.chat.completions.create(
                    model="openai:gpt-4o",
                    messages=[{"role": "user", "content": "Test"}],
                    tools=[filesystem_tool],
                    max_turns=2,
                )


================================================
FILE: tests/mcp/test_http_llm_e2e.py
================================================
"""
Real LLM End-to-End Tests for HTTP MCP Integration.

These tests make ACTUAL API calls to LLM providers (OpenAI, Anthropic) to verify
that HTTP-based MCP tools work correctly with real models. Unlike test_http_transport.py
which mocks HTTP responses, these tests verify the complete integration stack.

⚠️ WARNING: These tests will make real API calls and incur costs!
   - Each test costs ~$0.01-0.05 depending on the model
   - Tests are marked with @pytest.mark.llm
   - Tests are skipped if API keys are not present

MCP Servers Used:
   - Context7 (https://mcp.context7.com/mcp)
     - Public HTTP MCP server for library documentation
     - No authentication required (optional API key for higher limits)
     - Tools: resolve-library-id, get-library-docs

   - Exa (https://mcp.exa.ai/mcp)
     - Web search and code context search
     - Requires EXA_API_KEY for authentication
     - Tools: web_search_exa, get_code_context_exa

Requirements:
    - API keys in .env file:
        OPENAI_API_KEY=your-key
        ANTHROPIC_API_KEY=your-key
        EXA_API_KEY=your-key (for Exa tests only)
    - pytest-asyncio, python-dotenv

Running:
    # Run ONLY HTTP LLM tests (⚠️ costs money):
    pytest tests/mcp/test_http_llm_e2e.py -v -m llm

    # Skip LLM tests (default, free):
    pytest tests/mcp/ -v -m "integration and not llm"
"""

import pytest
import os
from aisuite import Client


# Helper functions to check if we have API keys
def has_openai_key():
    """Return True when OPENAI_API_KEY is set to a non-empty value."""
    # An unset variable (None) and an empty string both count as "no key".
    return os.getenv("OPENAI_API_KEY") not in (None, "")


def has_anthropic_key():
    """Return True when ANTHROPIC_API_KEY is set to a non-empty value."""
    # An unset variable (None) and an empty string both count as "no key".
    return os.getenv("ANTHROPIC_API_KEY") not in (None, "")


def has_exa_key():
    """Return True when EXA_API_KEY is set to a non-empty value."""
    # An unset variable (None) and an empty string both count as "no key".
    return os.getenv("EXA_API_KEY") not in (None, "")


@pytest.mark.llm
@pytest.mark.integration
class TestOpenAIWithHTTPMCP:
    """Test OpenAI models with HTTP MCP tools (Context7).

    Each test is skipped when OPENAI_API_KEY is not set. Assertions are
    keyword checks on the lower-cased final message content.
    """

    @pytest.mark.skipif(not has_openai_key(), reason="OPENAI_API_KEY not set")
    def test_gpt4o_resolves_library_via_http_mcp(self):
        """Test GPT-4o can resolve library names using HTTP MCP."""
        client = Client()

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[
                {
                    "role": "user",
                    "content": 'Use resolve-library-id to resolve the library name "requests" and tell me the library ID.',
                }
            ],
            tools=[
                {
                    "type": "mcp",
                    "name": "context7",
                    "server_url": "https://mcp.context7.com/mcp",
                    "allowed_tools": ["resolve-library-id"],
                }
            ],
            max_turns=3,
        )

        # Verify the LLM used the HTTP MCP tool
        content = response.choices[0].message.content.lower()
        # Should mention requests or library ID
        assert any(
            keyword in content
            for keyword in ["requests", "library", "id", "pypi", "python"]
        ), f"Expected library resolution info in response, got: {content}"

    @pytest.mark.skipif(not has_openai_key(), reason="OPENAI_API_KEY not set")
    def test_gpt4o_gets_library_docs_via_http_mcp(self):
        """Test GPT-4o can get library documentation using HTTP MCP."""
        client = Client()

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[
                {
                    "role": "user",
                    "content": 'First use resolve-library-id to get the ID for "requests", then use get-library-docs to fetch its documentation.',
                }
            ],
            tools=[
                {
                    "type": "mcp",
                    "name": "context7",
                    "server_url": "https://mcp.context7.com/mcp",
                    "allowed_tools": ["resolve-library-id", "get-library-docs"],
                    "timeout": 90.0,  # Increase timeout - docs fetching can be slow
                }
            ],
            max_turns=5,
        )

        # Verify the LLM got documentation
        content = response.choices[0].message.content.lower()
        # Should mention documentation or requests library
        assert any(
            keyword in content
            for keyword in ["documentation", "requests", "http", "api", "library"]
        ), f"Expected documentation content in response, got: {content}"

    @pytest.mark.skipif(not has_openai_key(), reason="OPENAI_API_KEY not set")
    def test_gpt4o_mixed_tools_http(self):
        """Test GPT-4o with both HTTP MCP tools and regular Python functions."""
        from datetime import datetime

        # Define a Python function
        def get_current_year() -> str:
            """Get the current year."""
            from datetime import datetime

            return str(datetime.now().year)

        client = Client()

        # The tool reports the real current year, so the expected value is
        # derived from the clock rather than a hard-coded list that goes stale.
        # Sampling before and after the request tolerates a run that straddles
        # New Year.
        expected_years = {str(datetime.now().year)}

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[
                {
                    "role": "user",
                    "content": 'First use get_current_year to get the year, then use resolve-library-id to resolve "requests".',
                }
            ],
            tools=[
                get_current_year,  # Python function
                {
                    "type": "mcp",
                    "name": "context7",
                    "server_url": "https://mcp.context7.com/mcp",
                    "allowed_tools": ["resolve-library-id"],
                },  # HTTP MCP
            ],
            max_turns=5,
        )

        expected_years.add(str(datetime.now().year))

        # Verify both tools were used
        content = response.choices[0].message.content.lower()
        # Should mention the year (from Python function)
        assert any(
            year in content for year in expected_years
        ), f"Expected year in response, got: {content}"
        # Should mention requests or library (from HTTP MCP tool)
        assert any(
            keyword in content for keyword in ["requests", "library", "id"]
        ), f"Expected library info in response, got: {content}"


@pytest.mark.llm
@pytest.mark.integration
class TestAnthropicWithHTTPMCP:
    """Exercise Anthropic Claude with the Context7 HTTP MCP tools.

    Each test is skipped when ANTHROPIC_API_KEY is not set.
    """

    @pytest.mark.skipif(not has_anthropic_key(), reason="ANTHROPIC_API_KEY not set")
    def test_claude_resolves_library_via_http_mcp(self):
        """Claude is asked to resolve "flask" with resolve-library-id."""
        client = Client()
        prompt = 'Use resolve-library-id to resolve the library name "flask" and tell me the library ID.'
        context7_tool = {
            "type": "mcp",
            "name": "context7",
            "server_url": "https://mcp.context7.com/mcp",
            "allowed_tools": ["resolve-library-id"],
        }

        response = client.chat.completions.create(
            model="anthropic:claude-sonnet-4-5",
            messages=[{"role": "user", "content": prompt}],
            tools=[context7_tool],
            max_turns=3,
        )

        # The reply should reference the library that was resolved
        expected_keywords = ("flask", "library", "id", "pypi", "python")
        content = response.choices[0].message.content.lower()
        assert any(
            keyword in content for keyword in expected_keywords
        ), f"Expected library resolution info in response, got: {content}"

    @pytest.mark.skipif(not has_anthropic_key(), reason="ANTHROPIC_API_KEY not set")
    def test_claude_gets_library_docs_via_http_mcp(self):
        """Claude is asked to resolve "flask" and then fetch its documentation."""
        client = Client()
        prompt = 'Use resolve-library-id to get the ID for "flask", then use get-library-docs to fetch documentation.'
        context7_tool = {
            "type": "mcp",
            "name": "context7",
            "server_url": "https://mcp.context7.com/mcp",
            "allowed_tools": ["resolve-library-id", "get-library-docs"],
            "timeout": 90.0,  # Docs fetching can be slow, so allow extra time
        }

        response = client.chat.completions.create(
            model="anthropic:claude-sonnet-4-5",
            messages=[{"role": "user", "content": prompt}],
            tools=[context7_tool],
            max_turns=5,
        )

        # The reply should reference the fetched documentation
        expected_keywords = ("documentation", "flask", "web", "library")
        content = response.choices[0].message.content.lower()
        assert any(
            keyword in content for keyword in expected_keywords
        ), f"Expected documentation content in response, got: {content}"

    @pytest.mark.skipif(not has_anthropic_key(), reason="ANTHROPIC_API_KEY not set")
    def test_claude_mixed_tools_http(self):
        """Claude is given a plain Python function alongside an HTTP MCP tool."""

        def get_language() -> str:
            """Get the primary programming language."""
            return "Python"

        client = Client()
        prompt = 'Use get_language to get the language, then use resolve-library-id to resolve "django". Tell me both.'
        context7_tool = {
            "type": "mcp",
            "name": "context7",
            "server_url": "https://mcp.context7.com/mcp",
            "allowed_tools": ["resolve-library-id"],
        }

        response = client.chat.completions.create(
            model="anthropic:claude-sonnet-4-5",
            messages=[{"role": "user", "content": prompt}],
            # Python function first, HTTP MCP config second
            tools=[get_language, context7_tool],
            max_turns=5,
        )

        content = response.choices[0].message.content.lower()
        # Output of the Python function
        assert "python" in content, f"Expected Python in response, got: {content}"
        # Output of the HTTP MCP tool
        expected_keywords = ("django", "library", "id")
        assert any(
            keyword in content for keyword in expected_keywords
        ), f"Expected library info in response, got: {content}"


@pytest.mark.llm
@pytest.mark.integration
class TestHTTPMCPConfigDict:
    """Exercise HTTP MCP when the server is described by a plain config dict."""

    @pytest.mark.skipif(not has_openai_key(), reason="OPENAI_API_KEY not set")
    def test_http_mcp_config_dict_format(self):
        """A config dict (rather than an explicit MCPClient) is passed as the tool."""
        client = Client()
        context7_config = {
            "type": "mcp",
            "name": "context7",
            "server_url": "https://mcp.context7.com/mcp",
            "timeout": 60.0,  # Exercises the timeout parameter
            "allowed_tools": ["resolve-library-id"],
        }
        prompt = 'Use resolve-library-id to resolve the library name "numpy".'

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[{"role": "user", "content": prompt}],
            tools=[context7_config],
            max_turns=3,
        )

        # The reply should reference the library that was resolved
        expected_keywords = ("numpy", "library", "id", "pypi", "python")
        content = response.choices[0].message.content.lower()
        assert any(
            keyword in content for keyword in expected_keywords
        ), f"Expected library resolution info in response, got: {content}"


@pytest.mark.llm
@pytest.mark.integration
class TestHTTPMCPWithHeaders:
    """Exercise HTTP MCP when the config carries custom request headers."""

    @pytest.mark.skipif(not has_openai_key(), reason="OPENAI_API_KEY not set")
    def test_http_mcp_with_headers(self):
        """A config with a "headers" entry is accepted (Context7 supports optional API key)."""
        client = Client()
        # Context7 works without auth; the header here is an optional extra
        custom_headers = {"User-Agent": "aisuite-test"}
        context7_config = {
            "type": "mcp",
            "name": "context7",
            "server_url": "https://mcp.context7.com/mcp",
            "headers": custom_headers,
            "allowed_tools": ["resolve-library-id"],
        }
        prompt = 'Use resolve-library-id to resolve "pandas".'

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[{"role": "user", "content": prompt}],
            tools=[context7_config],
            max_turns=3,
        )

        # The request should still produce a library-related reply
        expected_keywords = ("pandas", "library", "id", "data")
        content = response.choices[0].message.content.lower()
        assert any(
            keyword in content for keyword in expected_keywords
        ), f"Expected library info in response, got: {content}"


@pytest.mark.llm
@pytest.mark.integration
class TestOpenAIWithExaMCP:
    """Test OpenAI models with Exa HTTP MCP tools.

    Each test is skipped unless both OPENAI_API_KEY and EXA_API_KEY are set.
    The Exa key is sent as a Bearer token in the Authorization header.
    """

    @pytest.mark.skipif(
        not has_openai_key() or not has_exa_key(),
        reason="OPENAI_API_KEY or EXA_API_KEY not set",
    )
    def test_gpt4o_web_search_via_exa(self):
        """Test GPT-4o can perform web search using Exa."""
        client = Client()

        exa_api_key = os.getenv("EXA_API_KEY")

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[
                {
                    "role": "user",
                    "content": "Search for recent Python 3.12 features and summarize the top 2.",
                }
            ],
            tools=[
                {
                    "type": "mcp",
                    "name": "exa",
                    "server_url": "https://mcp.exa.ai/mcp",
                    "headers": {"Authorization": f"Bearer {exa_api_key}"},
                    "allowed_tools": ["web_search_exa"],
                    "timeout": 60.0,
                }
            ],
            max_turns=3,
        )

        # Verify search results
        content = response.choices[0].message.content.lower()
        assert any(
            keyword in content for keyword in ["python", "3.12", "feature"]
        ), f"Expected Python 3.12 info in response, got: {content}"

    @pytest.mark.skipif(
        not has_openai_key() or not has_exa_key(),
        reason="OPENAI_API_KEY or EXA_API_KEY not set",
    )
    def test_gpt4o_code_context_via_exa(self):
        """Test GPT-4o can search code context using Exa."""
        client = Client()

        exa_api_key = os.getenv("EXA_API_KEY")

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[
                {
                    "role": "user",
                    "content": "Find an example of using asyncio.gather in Python.",
                }
            ],
            tools=[
                {
                    "type": "mcp",
                    "name": "exa",
                    "server_url": "https://mcp.exa.ai/mcp",
                    "headers": {"Authorization": f"Bearer {exa_api_key}"},
                    "allowed_tools": ["get_code_context_exa"],
                    "timeout": 60.0,
                }
            ],
            max_turns=3,
        )

        # Verify code context results
        content = response.choices[0].message.content.lower()
        assert any(
            keyword in content for keyword in ["asyncio", "gather", "async", "await"]
        ), f"Expected asyncio.gather info in response, got: {content}"

    @pytest.mark.skipif(
        not has_openai_key() or not has_exa_key(),
        reason="OPENAI_API_KEY or EXA_API_KEY not set",
    )
    def test_gpt4o_mixed_tools_with_exa(self):
        """Test GPT-4o with both Exa tools and Python functions."""
        from datetime import datetime

        def get_current_year() -> str:
            """Get the current year."""
            from datetime import datetime

            return str(datetime.now().year)

        client = Client()
        exa_api_key = os.getenv("EXA_API_KEY")

        # The tool reports the real current year, so the expected value is
        # derived from the clock rather than a hard-coded list that goes stale.
        # Sampling before and after the request tolerates a run that straddles
        # New Year.
        expected_years = {str(datetime.now().year)}

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[
                {
                    "role": "user",
                    "content": "Get the current year, then search for major tech events from that year.",
                }
            ],
            tools=[
                get_current_year,  # Python function
                {
                    "type": "mcp",
                    "name": "exa",
                    "server_url": "https://mcp.exa.ai/mcp",
                    "headers": {"Authorization": f"Bearer {exa_api_key}"},
                    "allowed_tools": ["web_search_exa"],
                    "timeout": 60.0,
                },  # Exa HTTP MCP
            ],
            max_turns=4,
        )

        expected_years.add(str(datetime.now().year))

        # Verify both tools were used
        content = response.choices[0].message.content.lower()
        # Should mention the year (from Python function)
        assert any(
            year in content for year in expected_years
        ), f"Expected year in response, got: {content}"
        # Should mention tech or events (from web search)
        assert any(
            keyword in content for keyword in ["tech", "event", "technology"]
        ), f"Expected tech events in response, got: {content}"


@pytest.mark.llm
@pytest.mark.integration
class TestAnthropicWithExaMCP:
    """Exercise Anthropic Claude with the Exa HTTP MCP tools.

    Each test is skipped unless both ANTHROPIC_API_KEY and EXA_API_KEY are set.
    """

    @pytest.mark.skipif(
        not has_anthropic_key() or not has_exa_key(),
        reason="ANTHROPIC_API_KEY or EXA_API_KEY not set",
    )
    def test_claude_web_search_via_exa(self):
        """Claude is asked to run a web search through Exa."""
        client = Client()

        exa_api_key = os.getenv("EXA_API_KEY")
        exa_tool = {
            "type": "mcp",
            "name": "exa",
            "server_url": "https://mcp.exa.ai/mcp",
            "headers": {"Authorization": f"Bearer {exa_api_key}"},
            "allowed_tools": ["web_search_exa"],
            "timeout": 60.0,
        }
        prompt = "Search for information about Rust programming language features."

        response = client.chat.completions.create(
            model="anthropic:claude-sonnet-4-5",
            messages=[{"role": "user", "content": prompt}],
            tools=[exa_tool],
            max_turns=3,
        )

        # The reply should reflect the search topic
        expected_keywords = ("rust", "programming", "language")
        content = response.choices[0].message.content.lower()
        assert any(
            keyword in content for keyword in expected_keywords
        ), f"Expected Rust info in response, got: {content}"

    @pytest.mark.skipif(
        not has_anthropic_key() or not has_exa_key(),
        reason="ANTHROPIC_API_KEY or EXA_API_KEY not set",
    )
    def test_claude_code_context_via_exa(self):
        """Claude is asked to look up code context through Exa."""
        client = Client()

        exa_api_key = os.getenv("EXA_API_KEY")
        exa_tool = {
            "type": "mcp",
            "name": "exa",
            "server_url": "https://mcp.exa.ai/mcp",
            "headers": {"Authorization": f"Bearer {exa_api_key}"},
            "allowed_tools": ["get_code_context_exa"],
            "timeout": 60.0,
        }
        prompt = "Find code examples for FastAPI route decorators."

        response = client.chat.completions.create(
            model="anthropic:claude-sonnet-4-5",
            messages=[{"role": "user", "content": prompt}],
            tools=[exa_tool],
            max_turns=3,
        )

        # The reply should reflect the requested code topic
        expected_keywords = ("fastapi", "route", "decorator", "@")
        content = response.choices[0].message.content.lower()
        assert any(
            keyword in content for keyword in expected_keywords
        ), f"Expected FastAPI route info in response, got: {content}"

    @pytest.mark.skipif(
        not has_anthropic_key() or not has_exa_key(),
        reason="ANTHROPIC_API_KEY or EXA_API_KEY not set",
    )
    def test_claude_mixed_tools_with_exa(self):
        """Claude is given a plain Python function alongside an Exa MCP tool."""

        def get_language() -> str:
            """Get the primary programming language."""
            return "Python"

        client = Client()
        exa_api_key = os.getenv("EXA_API_KEY")
        exa_tool = {
            "type": "mcp",
            "name": "exa",
            "server_url": "https://mcp.exa.ai/mcp",
            "headers": {"Authorization": f"Bearer {exa_api_key}"},
            "allowed_tools": ["web_search_exa"],
            "timeout": 60.0,
        }
        prompt = "Get the language name, then search for its latest version features."

        response = client.chat.completions.create(
            model="anthropic:claude-sonnet-4-5",
            messages=[{"role": "user", "content": prompt}],
            # Python function first, Exa HTTP MCP config second
            tools=[get_language, exa_tool],
            max_turns=4,
        )

        content = response.choices[0].message.content.lower()
        # Output of the Python function
        assert "python" in content, f"Expected Python in response, got: {content}"
        # Output of the web search
        expected_keywords = ("version", "feature", "3.")
        assert any(
            keyword in content for keyword in expected_keywords
        ), f"Expected version info in response, got: {content}"


================================================
FILE: tests/mcp/test_http_transport.py
================================================
"""
Tests for MCP HTTP Transport.

These tests verify that the MCPClient works correctly with HTTP-based MCP servers.
All HTTP requests are mocked to avoid requiring a real HTTP MCP server.
"""

import pytest
from unittest.mock import AsyncMock, MagicMock, patch
import json
import httpx
from aisuite.mcp.client import MCPClient


@pytest.mark.integration
class TestHTTPTransportBasics:
    """Test basic HTTP transport functionality.

    The client-creation tests patch ``aisuite.mcp.client.httpx.AsyncClient``
    and feed canned JSON-RPC responses through its ``post`` method, so no
    real HTTP request is made.
    """

    def test_create_http_client_success(self):
        """Test creating an HTTP MCPClient with valid parameters."""
        with patch("aisuite.mcp.client.httpx.AsyncClient") as mock_async_client:
            # Mock the HTTP client
            mock_client_instance = AsyncMock()
            mock_async_client.return_value = mock_client_instance

            # Mock initialize response
            mock_response_init = MagicMock()
            mock_response_init.headers = {"content-type": "application/json"}
            mock_response_init.json.return_value = {
                "jsonrpc": "2.0",
                "id": 1,
                "result": {
                    "protocolVersion": "2024-11-05",
                    "serverInfo": {"name": "test-server", "version": "1.0.0"},
                },
            }
            mock_response_init.raise_for_status = MagicMock()

            # Mock tools/list response
            mock_response_tools = MagicMock()
            mock_response_tools.headers = {"content-type": "application/json"}
            mock_response_tools.json.return_value = {
                "jsonrpc": "2.0",
                "id": 2,
                "result": {
                    "tools": [
                        {
                            "name": "test_tool",
                            "description": "A test tool",
                            "inputSchema": {
                                "type": "object",
                                "properties": {"param": {"type": "string"}},
                            },
                        }
                    ]
                },
            }
            mock_response_tools.raise_for_status = MagicMock()

            # Set up post responses in order (init + notification + tools)
            mock_client_instance.post = AsyncMock(
                side_effect=[
                    mock_response_init,
                    MagicMock(),  # initialized notification
                    mock_response_tools,
                ]
            )

            # Create client
            mcp = MCPClient(server_url="http://localhost:8000", name="test-server")

            # Close the client even when an assertion fails, so a failing
            # test does not leave it open.
            try:
                # Verify client was created
                assert mcp.server_url == "http://localhost:8000"
                assert mcp.name == "test-server"
                assert len(mcp.list_tools()) == 1
                assert mcp.list_tools()[0]["name"] == "test_tool"
            finally:
                mcp.close()

    def test_create_http_client_with_headers(self):
        """Test creating an HTTP MCPClient with custom headers."""
        with patch("aisuite.mcp.client.httpx.AsyncClient") as mock_async_client:
            mock_client_instance = AsyncMock()
            mock_async_client.return_value = mock_client_instance

            # Mock responses
            mock_response_init = MagicMock()
            mock_response_init.headers = {"content-type": "application/json"}
            mock_response_init.json.return_value = {
                "jsonrpc": "2.0",
                "id": 1,
                "result": {"protocolVersion": "2024-11-05"},
            }
            mock_response_init.raise_for_status = MagicMock()

            mock_response_tools = MagicMock()
            mock_response_tools.headers = {"content-type": "application/json"}
            mock_response_tools.json.return_value = {
                "jsonrpc": "2.0",
                "id": 2,
                "result": {"tools": []},
            }
            mock_response_tools.raise_for_status = MagicMock()

            # Same response order as above: init, notification, tools
            mock_client_instance.post = AsyncMock(
                side_effect=[mock_response_init, MagicMock(), mock_response_tools]
            )

            # Create client with headers
            headers = {"Authorization": "Bearer secret-token"}
            mcp = MCPClient(
                server_url="http://localhost:8000", headers=headers, name="test"
            )

            # Close the client even when the assertion fails
            try:
                # Verify headers were stored
                assert mcp.headers == headers
            finally:
                mcp.close()

    def test_http_client_validation_errors(self):
        """Test that validation errors are raised for invalid parameters."""
        # Test: no command or server_url
        with pytest.raises(ValueError, match="Must provide either"):
            MCPClient()

        # Test: both command and server_url
        with pytest.raises(ValueError, match="Cannot mix stdio parameters"):
            MCPClient(command="npx", server_url="http://localhost:8000")


@pytest.mark.integration
class TestHTTPToolCalling:
    """Tool discovery and invocation over the HTTP transport, with httpx patched."""

    @staticmethod
    def _json_reply(request_id, result):
        """Return a mocked HTTP response carrying a JSON-RPC success payload."""
        reply = MagicMock()
        reply.headers = {"content-type": "application/json"}
        reply.json.return_value = {
            "jsonrpc": "2.0",
            "id": request_id,
            "result": result,
        }
        reply.raise_for_status = MagicMock()
        return reply

    @staticmethod
    def _install_replies(async_client_cls, *replies):
        """Make the patched AsyncClient return *replies*, one per post() call."""
        http_client = AsyncMock()
        async_client_cls.return_value = http_client
        http_client.post = AsyncMock(side_effect=list(replies))
        return http_client

    def test_list_tools_http(self):
        """list_tools() returns the tools advertised by the server."""
        advertised = [
            {"name": "tool1", "description": "First tool", "inputSchema": {}},
            {"name": "tool2", "description": "Second tool", "inputSchema": {}},
        ]

        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            self._install_replies(
                async_client_cls,
                self._json_reply(1, {}),
                MagicMock(),
                self._json_reply(2, {"tools": advertised}),
            )

            mcp = MCPClient(server_url="http://localhost:8000")

            listed = mcp.list_tools()
            assert len(listed) == 2
            first, second = listed
            assert first["name"] == "tool1"
            assert second["name"] == "tool2"

            mcp.close()

    def test_call_tool_http(self):
        """call_tool() returns the text from the server's tool-call reply."""
        echo_tool = {
            "name": "echo",
            "description": "Echo tool",
            "inputSchema": {
                "type": "object",
                "properties": {"message": {"type": "string"}},
            },
        }

        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            self._install_replies(
                async_client_cls,
                self._json_reply(1, {}),
                MagicMock(),
                self._json_reply(2, {"tools": [echo_tool]}),
                # Fourth reply answers the tool call itself
                self._json_reply(3, {"content": [{"text": "Hello, World!"}]}),
            )

            mcp = MCPClient(server_url="http://localhost:8000")

            outcome = mcp.call_tool("echo", {"message": "Hello"})
            assert outcome == "Hello, World!"

            mcp.close()

    def test_get_callable_tools_http(self):
        """get_callable_tools() wraps each advertised tool as a named callable."""
        advertised = [
            {
                "name": "test_tool",
                "description": "A test tool",
                "inputSchema": {"type": "object", "properties": {}},
            }
        ]

        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            self._install_replies(
                async_client_cls,
                self._json_reply(1, {}),
                MagicMock(),
                self._json_reply(2, {"tools": advertised}),
            )

            mcp = MCPClient(server_url="http://localhost:8000")

            wrapped = mcp.get_callable_tools()
            assert len(wrapped) == 1
            only_tool = wrapped[0]
            assert callable(only_tool)
            assert only_tool.__name__ == "test_tool"

            mcp.close()


@pytest.mark.integration
class TestHTTPFromConfig:
    """Building an HTTP MCPClient (and its tools) from a config dict."""

    @staticmethod
    def _json_reply(request_id, result):
        """Return a mocked HTTP response carrying a JSON-RPC success payload."""
        reply = MagicMock()
        reply.headers = {"content-type": "application/json"}
        reply.json.return_value = {
            "jsonrpc": "2.0",
            "id": request_id,
            "result": result,
        }
        reply.raise_for_status = MagicMock()
        return reply

    @staticmethod
    def _install_replies(async_client_cls, *replies):
        """Make the patched AsyncClient return *replies*, one per post() call."""
        http_client = AsyncMock()
        async_client_cls.return_value = http_client
        http_client.post = AsyncMock(side_effect=list(replies))
        return http_client

    def test_from_config_http(self):
        """from_config() copies the HTTP settings from the dict onto the client."""
        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            self._install_replies(
                async_client_cls,
                self._json_reply(1, {}),
                MagicMock(),
                self._json_reply(2, {"tools": []}),
            )

            mcp = MCPClient.from_config(
                {
                    "type": "mcp",
                    "name": "test-server",
                    "server_url": "http://localhost:8000",
                    "headers": {"Authorization": "Bearer token"},
                    "timeout": 60.0,
                }
            )

            assert mcp.server_url == "http://localhost:8000"
            assert mcp.headers == {"Authorization": "Bearer token"}
            assert mcp.timeout == 60.0
            assert mcp.name == "test-server"

            mcp.close()

    def test_get_tools_from_config_http(self):
        """get_tools_from_config() honours the allowed_tools filter."""
        advertised = [
            {"name": "tool1", "description": "Tool 1", "inputSchema": {}},
            {"name": "tool2", "description": "Tool 2", "inputSchema": {}},
        ]

        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            self._install_replies(
                async_client_cls,
                self._json_reply(1, {}),
                MagicMock(),
                self._json_reply(2, {"tools": advertised}),
            )

            config = {
                "type": "mcp",
                "name": "test",
                "server_url": "http://localhost:8000",
                "allowed_tools": ["tool1"],
            }
            selected = MCPClient.get_tools_from_config(config)

            # The server advertises two tools; only tool1 is on the allow-list.
            assert len(selected) == 1
            assert selected[0].__name__ == "tool1"


@pytest.mark.integration
class TestHTTPErrorHandling:
    """Failures on the HTTP transport must surface as RuntimeError."""

    @staticmethod
    def _install_post(async_client_cls, post_mock):
        """Make the patched AsyncClient return an instance using *post_mock*."""
        http_client = AsyncMock()
        async_client_cls.return_value = http_client
        http_client.post = post_mock
        return http_client

    def test_http_connection_error(self):
        """A connection failure raised by post() becomes a RuntimeError."""
        refused = httpx.ConnectError("Connection refused")

        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            self._install_post(async_client_cls, AsyncMock(side_effect=refused))

            with pytest.raises(RuntimeError, match="HTTP request to MCP server failed"):
                MCPClient(server_url="http://localhost:8000")

    def test_http_json_rpc_error(self):
        """A JSON-RPC error payload becomes a RuntimeError with its message."""
        error_reply = MagicMock()
        error_reply.headers = {"content-type": "application/json"}
        error_reply.json.return_value = {
            "jsonrpc": "2.0",
            "id": 1,
            "error": {"code": -32600, "message": "Invalid Request"},
        }
        error_reply.raise_for_status = MagicMock()

        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            # Every post() gets the same error payload back.
            self._install_post(async_client_cls, AsyncMock(return_value=error_reply))

            with pytest.raises(RuntimeError, match="MCP server error: Invalid Request"):
                MCPClient(server_url="http://localhost:8000")

    def test_http_status_error(self):
        """An HTTP status error raised by post() becomes a RuntimeError."""
        not_found = httpx.HTTPStatusError(
            "404 Not Found",
            request=MagicMock(),
            response=MagicMock(),
        )

        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            self._install_post(async_client_cls, AsyncMock(side_effect=not_found))

            with pytest.raises(RuntimeError, match="HTTP request to MCP server failed"):
                MCPClient(server_url="http://localhost:8000")


@pytest.mark.integration
class TestHTTPEndpointHandling:
    """Check which URL the client posts to for a given server_url.

    The path is used as given, except that a trailing slash is removed.
    """

    @staticmethod
    def _json_reply(request_id, result):
        """Return a mocked HTTP response carrying a JSON-RPC success payload."""
        reply = MagicMock()
        reply.headers = {"content-type": "application/json"}
        reply.json.return_value = {
            "jsonrpc": "2.0",
            "id": request_id,
            "result": result,
        }
        reply.raise_for_status = MagicMock()
        return reply

    @staticmethod
    def _install_replies(async_client_cls, *replies):
        """Make the patched AsyncClient return *replies*, one per post() call."""
        http_client = AsyncMock()
        async_client_cls.return_value = http_client
        http_client.post = AsyncMock(side_effect=list(replies))
        return http_client

    def test_endpoint_uses_exact_url(self):
        """Every request made during construction goes to the unmodified URL."""
        endpoint = "http://localhost:8000/mcp/v1"

        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            http_client = self._install_replies(
                async_client_cls,
                self._json_reply(1, {}),
                MagicMock(),
                self._json_reply(2, {"tools": []}),
            )

            mcp = MCPClient(server_url=endpoint)

            recorded = http_client.post.call_args_list
            # Expected calls: initialize, initialized notification, tools/list
            assert len(recorded) == 3
            for call in recorded:
                # The URL is the first positional argument of each post()
                assert call.args[0] == endpoint

            mcp.close()

    def test_endpoint_trailing_slash_handled(self):
        """A trailing slash on server_url is dropped before the first request."""
        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            http_client = self._install_replies(
                async_client_cls,
                self._json_reply(1, {}),
                MagicMock(),
                self._json_reply(2, {"tools": []}),
            )

            mcp = MCPClient(server_url="http://localhost:8000/mcp/v1/")

            first_call = http_client.post.call_args_list[0]
            assert first_call.args[0] == "http://localhost:8000/mcp/v1"

            mcp.close()


@pytest.mark.integration
class TestHTTPSSEResponses:
    """SSE (Server-Sent Events) replies and session-id handling over HTTP."""

    @staticmethod
    def _json_reply(request_id, result, extra_headers=None):
        """Return a mocked JSON-RPC success response, optionally with extra headers."""
        reply = MagicMock()
        reply.headers = {"content-type": "application/json", **(extra_headers or {})}
        reply.json.return_value = {
            "jsonrpc": "2.0",
            "id": request_id,
            "result": result,
        }
        reply.raise_for_status = MagicMock()
        return reply

    @staticmethod
    def _sse_reply(*lines):
        """Return a mocked text/event-stream response whose aiter_lines() yields *lines*."""
        reply = MagicMock()
        reply.headers = {"content-type": "text/event-stream"}
        reply.raise_for_status = MagicMock()

        async def stream_lines():
            for line in lines:
                yield line

        reply.aiter_lines = stream_lines
        return reply

    @staticmethod
    def _install_replies(async_client_cls, *replies):
        """Make the patched AsyncClient return *replies*, one per post() call."""
        http_client = AsyncMock()
        async_client_cls.return_value = http_client
        http_client.post = AsyncMock(side_effect=list(replies))
        return http_client

    def test_sse_response_parsing(self):
        """A tool call answered with a single SSE event yields that event's text."""
        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            self._install_replies(
                async_client_cls,
                self._json_reply(1, {}),  # initialize
                MagicMock(),  # initialized notification (no response checked)
                self._json_reply(2, {"tools": []}),  # tools/list
                # MCP format: result has "content" array with text items
                self._sse_reply(
                    'data: {"jsonrpc": "2.0", "id": 3, "result": {"content": [{"type": "text", "text": "SSE result"}]}}',
                    "",
                ),
            )

            mcp = MCPClient(server_url="http://localhost:8000")

            outcome = mcp.call_tool("test_tool", {})

            # call_tool is expected to hand back the text from the content array
            assert outcome == "SSE result"

            mcp.close()

    def test_session_id_management(self):
        """The Mcp-Session-Id from initialize is stored and sent on later requests."""
        session_id = "test-session-123"

        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            http_client = self._install_replies(
                async_client_cls,
                self._json_reply(1, {}, extra_headers={"Mcp-Session-Id": session_id}),
                MagicMock(),  # initialized notification
                self._json_reply(2, {"tools": []}),
            )

            mcp = MCPClient(server_url="http://localhost:8000")

            # The id from the initialize reply must be captured on the client
            assert mcp._session_id == session_id

            # tools/list is the 3rd post() (index 2); its headers must carry the id
            tools_list_call = http_client.post.call_args_list[2]
            sent_headers = tools_list_call.kwargs["headers"]
            assert "Mcp-Session-Id" in sent_headers
            assert sent_headers["Mcp-Session-Id"] == session_id

            mcp.close()

    def test_sse_with_multiple_events(self):
        """Notification events preceding the result in an SSE stream are ignored."""
        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            self._install_replies(
                async_client_cls,
                self._json_reply(1, {}),
                MagicMock(),  # initialized notification
                self._json_reply(2, {"tools": []}),
                # Two notifications, then the actual result event
                self._sse_reply(
                    'data: {"jsonrpc": "2.0", "method": "notification", "params": {"status": "processing"}}',
                    "",
                    'data: {"jsonrpc": "2.0", "method": "notification", "params": {"status": "almost done"}}',
                    "",
                    'data: {"jsonrpc": "2.0", "id": 3, "result": {"content": [{"type": "text", "text": "final result"}]}}',
                    "",
                ),
            )

            mcp = MCPClient(server_url="http://localhost:8000")
            outcome = mcp.call_tool("test_tool", {})

            assert outcome == "final result"

            mcp.close()

    def test_mixed_json_and_sse_responses(self):
        """One client can consume a JSON reply and then an SSE reply."""
        advertised = [
            {"name": "fast_tool", "description": "Fast", "inputSchema": {}},
            {"name": "slow_tool", "description": "Slow", "inputSchema": {}},
        ]

        with patch("aisuite.mcp.client.httpx.AsyncClient") as async_client_cls:
            self._install_replies(
                async_client_cls,
                self._json_reply(1, {}),
                MagicMock(),  # initialized notification
                self._json_reply(2, {"tools": advertised}),
                # fast_tool is answered with plain JSON
                self._json_reply(3, {"content": [{"type": "text", "text": "fast"}]}),
                # slow_tool is answered with an SSE stream
                self._sse_reply(
                    'data: {"jsonrpc": "2.0", "id": 4, "result": {"content": [{"type": "text", "text": "slow"}]}}',
                    "",
                ),
            )

            mcp = MCPClient(server_url="http://localhost:8000")

            fast_outcome = mcp.call_tool("fast_tool", {})
            assert fast_outcome == "fast"

            slow_outcome = mcp.call_tool("slow_tool", {})
            assert slow_outcome == "slow"

            mcp.close()


================================================
FILE: tests/mcp/test_llm_e2e.py
================================================
"""
Real LLM End-to-End Tests for MCP Integration.

These tests make ACTUAL API calls to LLM providers (OpenAI, Anthropic) to verify
that MCP tools work correctly with real models. Unlike test_e2e.py which mocks
LLM responses, these tests verify the complete integration stack.

⚠️ WARNING: These tests will make real API calls and incur costs!
   - Each test costs ~$0.01-0.05 depending on the model
   - Tests are marked with @pytest.mark.llm
   - Tests are skipped if API keys are not present

Requirements:
    - Node.js and npx (for MCP filesystem server)
    - API keys in .env file:
        OPENAI_API_KEY=your-key
        ANTHROPIC_API_KEY=your-key
    - pytest-asyncio, python-dotenv

Running:
    # Run ONLY LLM tests (⚠️ costs money):
    pytest tests/mcp/test_llm_e2e.py -v -m llm

    # Skip LLM tests (default, free):
    pytest tests/mcp/ -v -m "integration and not llm"
"""

import pytest
import os
from pathlib import Path
from aisuite import Client


# Helper function to check if we have API keys
def has_openai_key():
    """Return True when OPENAI_API_KEY is set to a non-empty value."""
    api_key = os.environ.get("OPENAI_API_KEY", "")
    return api_key != ""


def has_anthropic_key():
    """Return True when ANTHROPIC_API_KEY is set to a non-empty value."""
    api_key = os.environ.get("ANTHROPIC_API_KEY", "")
    return api_key != ""


@pytest.mark.llm
@pytest.mark.integration
class TestOpenAIWithMCP:
    """Test OpenAI models with real MCP tools.

    Each test sends a real ``openai:gpt-4o`` chat completion whose tool list
    includes an MCP filesystem server started through ``npx``. Tests are
    skipped when OPENAI_API_KEY is not set.
    """

    @staticmethod
    def _filesystem_tool(root_dir, allowed_tools):
        """Build the MCP tool config for the npx filesystem server.

        Args:
            root_dir: Directory passed to the server as its last argument.
            allowed_tools: Names of the MCP tools the model may call.

        Returns:
            A tool config dict suitable for the ``tools`` list.
        """
        return {
            "type": "mcp",
            "name": "filesystem",
            "command": "npx",
            "args": [
                "-y",
                "@modelcontextprotocol/server-filesystem",
                root_dir,
            ],
            "allowed_tools": allowed_tools,
        }

    @staticmethod
    def _final_text(response):
        """Return the final message text lower-cased, or "" if there is none.

        Falling back to "" lets the content assertions fail with their own
        message instead of an AttributeError on ``None.lower()``.
        """
        return (response.choices[0].message.content or "").lower()

    @staticmethod
    def _print_intermediate_messages(response):
        """Print the intermediate messages of the first choice, if present.

        Debug aid only: shows which tool calls happened before the final
        answer. Handles both dict and object message formats.
        """
        first_choice = response.choices[0]
        if not hasattr(first_choice, "intermediate_messages"):
            return

        import json

        print("\n=== Intermediate Messages ===")
        for i, msg in enumerate(first_choice.intermediate_messages):
            print(f"\nMessage {i}:")
            if isinstance(msg, dict):
                print(json.dumps(msg, indent=2, default=str))
                continue

            print(f"Role: {msg.role}")
            if hasattr(msg, "content") and msg.content:
                print(f"Content: {msg.content[:200]}")
            if hasattr(msg, "tool_calls") and msg.tool_calls:
                for tc in msg.tool_calls:
                    print(f"Tool Call: {tc.function.name}({tc.function.arguments})")

    @pytest.mark.skipif(not has_openai_key(), reason="OPENAI_API_KEY not set")
    def test_gpt4o_reads_file_via_mcp(self, temp_test_dir, skip_if_no_npx):
        """Test GPT-4o can read a file using MCP filesystem tools."""
        client = Client()

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[
                {
                    "role": "user",
                    "content": f'Use read_file to read the file at path "{temp_test_dir}/test.txt" and tell me what it contains.',
                }
            ],
            # Security: only allow reading
            tools=[self._filesystem_tool(temp_test_dir, ["read_file"])],
            max_turns=3,
        )

        # Debug: print intermediate messages to see what happened
        self._print_intermediate_messages(response)

        # Verify the LLM actually read the file
        content = self._final_text(response)
        assert (
            "hello from mcp" in content
        ), f"Expected file content in response, got: {content}"

    @pytest.mark.skipif(not has_openai_key(), reason="OPENAI_API_KEY not set")
    def test_gpt4o_lists_files_via_mcp(self, temp_test_dir, skip_if_no_npx):
        """Test GPT-4o can list directory contents using MCP tools."""
        client = Client()

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[
                {
                    "role": "user",
                    "content": f'Use list_directory to list all files in the directory at path "{temp_test_dir}" and tell me what you find.',
                }
            ],
            # Security: only allow listing
            tools=[self._filesystem_tool(temp_test_dir, ["list_directory"])],
            max_turns=3,
        )

        # Verify the LLM found the test files
        content = self._final_text(response)
        # Test dir has: test.txt, README.md, data.json, subdir/
        assert (
            "test.txt" in content or "readme" in content
        ), f"Expected file names in response, got: {content}"

    @pytest.mark.skipif(not has_openai_key(), reason="OPENAI_API_KEY not set")
    def test_gpt4o_mixed_tools(self, temp_test_dir, skip_if_no_npx):
        """Test GPT-4o with both MCP tools and regular Python functions."""
        from datetime import datetime

        # Define a Python function
        def get_current_date() -> str:
            """Get the current date in YYYY-MM-DD format."""
            return datetime.now().strftime("%Y-%m-%d")

        client = Client()

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[
                {
                    "role": "user",
                    "content": f'First use get_current_date to get today\'s date, then use read_file to read "{temp_test_dir}/test.txt" and tell me both.',
                }
            ],
            tools=[
                get_current_date,  # Python function
                self._filesystem_tool(temp_test_dir, ["read_file"]),
            ],
            max_turns=5,
        )

        # Verify both tools were used
        content = self._final_text(response)
        # Should mention the date (from Python function). Derive the year from
        # the clock rather than a fixed list so the test does not expire.
        current_year = str(datetime.now().year)
        assert current_year in content, f"Expected date in response, got: {content}"
        # Should mention the file content (from MCP tool)
        assert (
            "hello" in content or "mcp test" in content
        ), f"Expected file content in response, got: {content}"


@pytest.mark.llm
@pytest.mark.integration
class TestAnthropicWithMCP:
    """Test Anthropic Claude models with real MCP tools.

    Each test starts the MCP filesystem server through ``npx`` against the
    directory supplied by ``temp_test_dir`` and is skipped when
    ``has_anthropic_key()`` reports that no key is available.
    """

    # Model identifier shared by every test in this class.
    MODEL = "anthropic:claude-sonnet-4-5"

    @staticmethod
    def _filesystem_server(root, allowed_tools):
        """Return the MCP tool config for a filesystem server rooted at ``root``.

        Args:
            root: Directory the server is given as its last command argument.
            allowed_tools: Names of the MCP tools to expose to the model.
        """
        return {
            "type": "mcp",
            "name": "filesystem",
            "command": "npx",
            "args": [
                "-y",
                "@modelcontextprotocol/server-filesystem",
                root,
            ],
            "allowed_tools": list(allowed_tools),
        }

    @pytest.mark.skipif(not has_anthropic_key(), reason="ANTHROPIC_API_KEY not set")
    def test_claude_reads_file_via_mcp(self, temp_test_dir, skip_if_no_npx):
        """Test Claude can read a file using MCP filesystem tools."""
        client = Client()

        response = client.chat.completions.create(
            model=self.MODEL,
            messages=[
                {
                    "role": "user",
                    "content": f'Use read_file to read the file at path "{temp_test_dir}/test.txt" and tell me what it contains.',
                }
            ],
            tools=[self._filesystem_server(temp_test_dir, ["read_file"])],
            max_turns=3,
        )

        # Verify Claude actually read the file. A single substring check is
        # enough: any text containing "hello from mcp test" also contains
        # "hello from mcp".
        content = response.choices[0].message.content.lower()
        assert (
            "hello from mcp" in content
        ), f"Expected file content in response, got: {content}"

    @pytest.mark.skipif(not has_anthropic_key(), reason="ANTHROPIC_API_KEY not set")
    def test_claude_lists_files_via_mcp(self, temp_test_dir, skip_if_no_npx):
        """Test Claude can list directory contents using MCP tools."""
        client = Client()

        response = client.chat.completions.create(
            model=self.MODEL,
            messages=[
                {
                    "role": "user",
                    "content": f'Use list_directory with path "{temp_test_dir}" to list all files.',
                }
            ],
            tools=[self._filesystem_server(temp_test_dir, ["list_directory"])],
            max_turns=3,
        )

        # Verify Claude found the test files
        content = response.choices[0].message.content.lower()
        assert (
            "test.txt" in content or "readme" in content or "data.json" in content
        ), f"Expected file names in response, got: {content}"

    @pytest.mark.skipif(not has_anthropic_key(), reason="ANTHROPIC_API_KEY not set")
    def test_claude_mixed_tools(self, temp_test_dir, skip_if_no_npx):
        """Test Claude with both MCP tools and regular Python functions."""

        def get_weather(location: str) -> str:
            """Get the weather for a location (mock function).

            Args:
                location: The city name
            """
            # Mock weather function for testing
            return f"The weather in {location} is sunny and 72°F"

        client = Client()

        response = client.chat.completions.create(
            model=self.MODEL,
            messages=[
                {
                    "role": "user",
                    "content": f'Use get_weather for San Francisco, then use read_file to read "{temp_test_dir}/README.md". Tell me both results.',
                }
            ],
            tools=[
                get_weather,  # Python function
                self._filesystem_server(temp_test_dir, ["read_file"]),
            ],
            max_turns=5,
        )

        # Verify both tools were used
        content = response.choices[0].message.content.lower()
        # Require details that only the mock's return value supplies. The bare
        # word "weather" is part of the prompt (via the tool name), so a reply
        # that merely restates the task would satisfy a check for it.
        assert (
            "sunny" in content or "72" in content
        ), f"Expected weather info in response, got: {content}"
        # Should mention the README content (from MCP tool)
        # NOTE(review): "readme" also appears in the prompt, so this check can
        # pass without the file being read; tighten once the fixture's README
        # text is confirmed.
        assert (
            "test directory" in content or "readme" in content
        ), f"Expected README content in response, got: {content}"


@pytest.mark.llm
@pytest.mark.integration
class TestToolPrefixingWithLLM:
    """Test tool prefixing works with real LLMs."""

    @pytest.mark.skipif(not has_openai_key(), reason="OPENAI_API_KEY not set")
    def test_multiple_mcp_servers_with_prefixing(self, temp_test_dir, skip_if_no_npx):
        """Test using multiple MCP servers with prefixing to avoid name collisions.

        Two filesystem servers are started, one per subdirectory, both exposing
        ``list_directory``. With ``use_tool_prefix`` enabled the model is asked
        to call each one by its prefixed name, and the answer must contain the
        file name that only the corresponding listing can reveal.
        """
        # Create two subdirectories
        dir1 = Path(temp_test_dir) / "dir1"
        dir2 = Path(temp_test_dir) / "dir2"
        dir1.mkdir()
        dir2.mkdir()

        (dir1 / "file1.txt").write_text("Content from dir1")
        (dir2 / "file2.txt").write_text("Content from dir2")

        client = Client()

        response = client.chat.completions.create(
            model="openai:gpt-4o",
            messages=[
                {
                    "role": "user",
                    "content": f'Use dir1_fs__list_directory with path "{dir1}" to list dir1, then use dir2_fs__list_directory with path "{dir2}" to list dir2.',
                }
            ],
            tools=[
                {
                    "type": "mcp",
                    "name": "dir1_fs",
                    "command": "npx",
                    "args": [
                        "-y",
                        "@modelcontextprotocol/server-filesystem",
                        str(dir1),
                    ],
                    "use_tool_prefix": True,  # Tools will be "dir1_fs__list_directory", etc.
                    "allowed_tools": ["list_directory"],
                },
                {
                    "type": "mcp",
                    "name": "dir2_fs",
                    "command": "npx",
                    "args": [
                        "-y",
                        "@modelcontextprotocol/server-filesystem",
                        str(dir2),
                    ],
                    "use_tool_prefix": True,  # Tools will be "dir2_fs__list_directory", etc.
                    "allowed_tools": ["list_directory"],
                },
            ],
            max_turns=5,
        )

        # Verify the LLM found files from both directories. Only the file names
        # are accepted as evidence: "dir1"/"dir2" occur in the prompt and in the
        # directory paths, so the model can mention them without either tool
        # having been called.
        content = response.choices[0].message.content.lower()
        assert (
            "file1" in content
        ), f"Expected dir1 listing (file1.txt) in response, got: {content}"
        assert (
            "file2" in content
        ), f"Expected dir2 listing (file2.txt) in response, got: {content}"


================================================
FILE: tests/providers/__init__.py
================================================


================================================
FILE: tests/providers/test_anthropic_converter.py
================================================
"""Tests for the AnthropicMessageConverter."""

import unittest
from unittest.mock import MagicMock
from aisuite.providers.anthropic_provider import AnthropicMessageConverter
from aisuite.framework import ChatCompletionResponse


class TestAnthropicMessageConverter(unittest.TestCase):
    """Exercise AnthropicMessageConverter request, response and tool-spec conversion."""

    def setUp(self):
        """Build a fresh converter before each test."""
        self.converter = AnthropicMessageConverter()

    def test_convert_request_single_user_message(self):
        """A lone user message comes back unchanged with an empty system value."""
        system, converted = self.converter.convert_request(
            [{"role": "user", "content": "Hello, how are you?"}]
        )

        expected = [{"role": "user", "content": "Hello, how are you?"}]
        self.assertEqual(system, [])
        self.assertEqual(converted, expected)

    def test_convert_request_with_system_message(self):
        """The system message is split off and returned separately from the turns."""
        system_turn = {"role": "system", "content": "You are a helpful assistant."}
        user_turn = {"role": "user", "content": "What is the weather?"}

        system, converted = self.converter.convert_request([system_turn, user_turn])

        expected = [{"role": "user", "content": "What is the weather?"}]
        self.assertEqual(system, "You are a helpful assistant.")
        self.assertEqual(converted, expected)

    def test_convert_request_with_tool_use_message(self):
        """A ``tool`` role message becomes a user turn carrying a ``tool_result`` block."""
        tool_turn = {
            "role": "tool",
            "tool_call_id": "tool123",
            "content": "Weather data here.",
        }

        system, converted = self.converter.convert_request([tool_turn])

        expected_block = {
            "type": "tool_result",
            "tool_use_id": "tool123",
            "content": "Weather data here.",
        }
        self.assertEqual(system, [])
        self.assertEqual(converted, [{"role": "user", "content": [expected_block]}])

    def test_convert_response_normal_message(self):
        """A plain text response maps to finish_reason ``stop`` with summed usage."""
        text_block = MagicMock(type="text", text="The weather is sunny.")
        raw = MagicMock(stop_reason="end_turn", content=[text_block])
        raw.usage.input_tokens = 10
        raw.usage.output_tokens = 5

        normalized = self.converter.convert_response(raw)

        self.assertIsInstance(normalized, ChatCompletionResponse)
        first_choice = normalized.choices[0]
        self.assertEqual(first_choice.finish_reason, "stop")
        self.assertEqual(normalized.usage.prompt_tokens, 10)
        self.assertEqual(normalized.usage.completion_tokens, 5)
        self.assertEqual(normalized.usage.total_tokens, 15)
        self.assertEqual(first_choice.message.content, "The weather is sunny.")

    def test_convert_response_with_tool_use(self):
        """A tool-use response yields finish_reason ``tool_calls`` plus the call details."""
        tool_block = MagicMock(
            type="tool_use", id="tool123", input={"location": "Paris"}
        )
        # ``name`` is consumed by the Mock constructor, so it is assigned afterwards.
        tool_block.name = "get_weather"

        thinking_text = "<thinking>I need to call the get_weather function</thinking>"
        text_block = MagicMock(type="text", text=thinking_text)

        raw = MagicMock(
            id="msg_01Aq9w938a90dw8q",
            model="claude-3-5-sonnet-20241022",
            role="assistant",
            stop_reason="tool_use",
            content=[tool_block, text_block],
        )
        raw.usage.input_tokens = 20
        raw.usage.output_tokens = 10

        normalized = self.converter.convert_response(raw)

        self.assertIsInstance(normalized, ChatCompletionResponse)
        first_choice = normalized.choices[0]
        self.assertEqual(first_choice.finish_reason, "tool_calls")
        self.assertEqual(normalized.usage.prompt_tokens, 20)
        self.assertEqual(normalized.usage.completion_tokens, 10)
        self.assertEqual(normalized.usage.total_tokens, 30)
        self.assertEqual(
            first_choice.message.content,
            "<thinking>I need to call the get_weather function</thinking>",
        )
        self.assertEqual(len(first_choice.message.tool_calls), 1)
        self.assertEqual(first_choice.message.tool_calls[0].id, "tool123")
        self.assertEqual(
            first_choice.message.tool_calls[0].function.name, "get_weather"
        )

    def test_convert_tool_spec(self):
        """An OpenAI function spec maps to name, description and ``input_schema``."""
        function_spec = {
            "name": "get_weather",
            "description": "Get the weather.",
            "parameters": {
                "type": "object",
                "properties": {
                    "location": {"type": "string", "description": "City name."}
                },
                "required": ["location"],
            },
        }

        converted = self.converter.convert_tool_spec(
            [{"type": "function", "function": function_spec}]
        )

        # Separate literal so the expectation does not alias the input schema.
        expected_schema = {
            "type": "object",
            "properties": {
                "location": {"type": "string", "description": "City name."}
            },
            "required": ["location"],
        }
        self.assertEqual(len(converted), 1)
        only_tool = converted[0]
        self.assertEqual(only_tool["name"], "get_weather")
        self.assertEqual(only_tool["description"], "Get the weather.")
        self.assertEqual(only_tool["input_schema"], expected_schema)

    def test_convert_request_with_tool_call_and_result(self):
        """An assistant tool call and its result become paired assistant/user turns."""
        assistant_turn = {
            "role": "assistant",
            "content": "Let me check the weather.",
            "tool_calls": [
                {
                    "id": "tool123",
                    "function": {
                        "name": "get_weather",
                        "arguments": '{"location": "Paris"}',
                    },
                    "type": "function",
                }
            ],
        }
        tool_turn = {
            "role": "tool",
            "tool_call_id": "tool123",
            "content": "The weather in Paris is sunny.",
        }

        system, converted = self.converter.convert_request(
            [assistant_turn, tool_turn]
        )

        self.assertEqual(system, [])
        self.assertEqual(len(converted), 2)
        assistant_out, user_out = converted[0], converted[1]
        self.assertEqual(assistant_out["role"], "assistant")
        self.assertEqual(user_out["role"], "user")

        expected_assistant_content = [
            {"type": "text", "text": "Let me check the weather."},
            {
                "type": "tool_use",
                "id": "tool123",
                "name": "get_weather",
                "input": {"location": "Paris"},
            },
        ]
        self.assertEqual(assistant_out["content"], expected_assistant_content)

        expected_user_content = [
            {
                "type": "tool_result",
                "tool_use_id": "tool123",
                "content": "The weather in Paris is sunny.",
            }
        ]
        self.assertEqual(user_out["content"], expected_user_content)


# Run the unittest command-line runner only when this module is executed as a script.
if __name__ == "__main__":
    unittest.main()


================================================
FILE: tests/providers/test_asr_parameter_passthrough.py
================================================
"""Component tests for ASR parameter pass-through to provider SDKs."""

import io
from unittest.mock import MagicMock, mock_open, patch
import pytest

from aisuite.providers.openai_provider import OpenaiProvider
from aisuite.providers.deepgram_provider import DeepgramProvider
from aisuite.providers.google_provider import GoogleProvider
from aisuite.framework.message import TranscriptionResult


@pytest.fixture(autouse=True)
def set_env_vars(monkeypatch):
    """Populate placeholder provider settings in the environment for every test."""
    placeholder_env = {
        "OPENAI_API_KEY": "test-openai-key",
        "DEEPGRAM_API_KEY": "test-deepgram-key",
        "GOOGLE_APPLICATION_CREDENTIALS": "test-creds.json",
        "GOOGLE_PROJECT_ID": "test-project",
        "GOOGLE_REGION": "us-central1",
    }
    for variable, value in placeholder_env.items():
        monkeypatch.setenv(variable, value)


class TestOpenAIParameterPassthrough:
    """Check that transcription keyword arguments are forwarded to the OpenAI SDK call."""

    @staticmethod
    def _sdk_response(text="Test"):
        """Return a mock SDK transcription result with the given text."""
        sdk_response = MagicMock()
        sdk_response.text = text
        sdk_response.language = "en"
        sdk_response.segments = None
        return sdk_response

    def test_language_param_passthrough(self):
        """``language`` is handed to the SDK ``create`` call."""
        provider = OpenaiProvider()
        sdk_response = self._sdk_response("Test transcription")

        with patch("builtins.open", mock_open(read_data=b"audio")), patch.object(
            provider.client.audio.transcriptions, "create", return_value=sdk_response
        ) as sdk_create:
            provider.audio.transcriptions.create(
                model="whisper-1", file="test.mp3", language="en"
            )

        # Verify language was passed to SDK
        sdk_create.assert_called_once()
        forwarded = sdk_create.call_args.kwargs
        assert "language" in forwarded
        assert forwarded["language"] == "en"

    def test_temperature_param_passthrough(self):
        """``temperature`` is handed to the SDK ``create`` call."""
        provider = OpenaiProvider()
        sdk_response = self._sdk_response()

        with patch("builtins.open", mock_open(read_data=b"audio")), patch.object(
            provider.client.audio.transcriptions, "create", return_value=sdk_response
        ) as sdk_create:
            provider.audio.transcriptions.create(
                model="whisper-1", file="test.mp3", temperature=0.7
            )

        forwarded = sdk_create.call_args.kwargs
        assert "temperature" in forwarded
        assert forwarded["temperature"] == 0.7

    def test_response_format_param_passthrough(self):
        """``response_format`` is handed to the SDK ``create`` call."""
        provider = OpenaiProvider()
        sdk_response = self._sdk_response()

        with patch("builtins.open", mock_open(read_data=b"audio")), patch.object(
            provider.client.audio.transcriptions, "create", return_value=sdk_response
        ) as sdk_create:
            provider.audio.transcriptions.create(
                model="whisper-1", file="test.mp3", response_format="verbose_json"
            )

        forwarded = sdk_create.call_args.kwargs
        assert "response_format" in forwarded
        assert forwarded["response_format"] == "verbose_json"

    def test_multiple_params_passthrough(self):
        """Several parameters supplied together all arrive at the SDK call."""
        provider = OpenaiProvider()
        sdk_response = self._sdk_response()

        with patch("builtins.open", mock_open(read_data=b"audio")), patch.object(
            provider.client.audio.transcriptions, "create", return_value=sdk_response
        ) as sdk_create:
            provider.audio.transcriptions.create(
                model="whisper-1",
                file="test.mp3",
                language="en",
                temperature=0.5,
                response_format="json",
            )

        forwarded = sdk_create.call_args.kwargs
        assert forwarded["language"] == "en"
        assert forwarded["temperature"] == 0.5
        assert forwarded["response_format"] == "json"

    def test_file_object_with_params(self):
        """A file-like object is forwarded as ``file`` alongside other parameters."""
        provider = OpenaiProvider()
        sdk_response = self._sdk_response()
        audio_stream = io.BytesIO(b"fake audio data")

        with patch.object(
            provider.client.audio.transcriptions, "create", return_value=sdk_response
        ) as sdk_create:
            provider.audio.transcriptions.create(
                model="whisper-1", file=audio_stream, language="en"
            )

        forwarded = sdk_create.call_args.kwargs
        assert forwarded["file"] == audio_stream
        assert forwarded["language"] == "en"


class TestGoogleParameterPassthrough:
    """Check that transcription parameters end up in the config given to the Google Speech client."""

    @staticmethod
    def _recognize_response(transcript):
        """Return a mock ``recognize`` response holding one result with one alternative."""
        alternative = MagicMock()
        alternative.transcript = transcript
        alternative.confidence = 0.95
        alternative.words = []

        result = MagicMock()
        result.alternatives = [alternative]

        response = MagicMock()
        response.results = [result]
        return response

    @staticmethod
    def _provider_returning(response):
        """Return a GoogleProvider whose speech client is a mock yielding ``response``."""
        provider = GoogleProvider()
        provider._speech_client = MagicMock()
        provider._speech_client.recognize.return_value = response
        return provider

    @patch("aisuite.providers.google_provider.vertexai.init")
    def test_language_code_param_passthrough(self, mock_vertexai_init):
        """``language_code`` is set on the config passed to ``recognize``."""
        provider = self._provider_returning(self._recognize_response("Test"))

        with patch("builtins.open", mock_open(read_data=b"audio")):
            provider.audio.transcriptions.create(
                model="latest_long", file="test.wav", language_code="en-US"
            )

            # Verify language_code was in the config passed to SDK
            recognize = provider._speech_client.recognize
            recognize.assert_called_once()
            sent_kwargs = recognize.call_args.kwargs
            assert "config" in sent_kwargs
            sent_config = sent_kwargs["config"]
            assert sent_config.language_code == "en-US"

    @patch("aisuite.providers.google_provider.vertexai.init")
    def test_enable_automatic_punctuation_passthrough(self, mock_vertexai_init):
        """``enable_automatic_punctuation`` is set on the config passed to ``recognize``."""
        provider = self._provider_returning(self._recognize_response("Test."))

        with patch("builtins.open", mock_open(read_data=b"audio")):
            provider.audio.transcriptions.create(
                model="latest_long",
                file="test.wav",
                language_code="en-US",
                enable_automatic_punctuation=True,
            )

            sent_kwargs = provider._speech_client.recognize.call_args.kwargs
            sent_config = sent_kwargs["config"]
            assert sent_config.enable_automatic_punctuation is True

    @patch("aisuite.providers.google_provider.vertexai.init")
    def test_speech_contexts_passthrough(self, mock_vertexai_init):
        """``speech_contexts`` (from prompt mapping) is set on the config passed to ``recognize``."""
        provider = self._provider_returning(
            self._recognize_response("Technical terms")
        )

        with patch("builtins.open", mock_open(read_data=b"audio")):
            # Note: This would come in as speech_contexts after validation layer transforms prompt
            provider.audio.transcriptions.create(
                model="latest_long",
                file="test.wav",
                language_code="en-US",
                speech_contexts=[{"phrases": ["technical terms"]}],
            )

            sent_kwargs = provider._speech_client.recognize.call_args.kwargs
            sent_config = sent_kwargs["config"]
            assert len(sent_config.speech_contexts) == 1
            assert sent_config.speech_contexts[0].phrases == ["technical terms"]


================================================
FILE: tests/providers/test_aws_converter.py
================================================
import unittest
from unittest.mock import MagicMock
from aisuite.providers.aws_provider import BedrockMessageConverter
from aisuite.framework.message import Message, ChatCompletionMessageToolCall
from aisuite.framework import ChatCompletionResponse


class TestBedrockMessageConverter(unittest.TestCase):
    """Exercise BedrockMessageConverter request and response conversion."""

    def setUp(self):
        """Build a fresh converter before each test."""
        self.converter = BedrockMessageConverter()

    def test_convert_request_user_message(self):
        """A user message's text is wrapped in a single ``{"text": ...}`` content item."""
        user_turn = {
            "role": "user",
            "content": "What is the most popular song on WZPZ?",
        }

        system, formatted = self.converter.convert_request([user_turn])

        self.assertEqual(system, [])
        self.assertEqual(len(formatted), 1)
        only_message = formatted[0]
        self.assertEqual(only_message["role"], "user")
        self.assertEqual(
            only_message["content"],
            [{"text": "What is the most popular song on WZPZ?"}],
        )

    def test_convert_request_tool_result(self):
        """A ``tool`` message becomes a user turn with a ``toolResult`` holding parsed JSON."""
        tool_turn = {
            "role": "tool",
            "tool_call_id": "tool123",
            "content": '{"song": "Elemental Hotel", "artist": "8 Storey Hike"}',
        }

        system, formatted = self.converter.convert_request([tool_turn])

        expected_tool_result = {
            "toolUseId": "tool123",
            "content": [
                {
                    "json": {
                        "song": "Elemental Hotel",
                        "artist": "8 Storey Hike",
                    }
                }
            ],
        }
        self.assertEqual(system, [])
        self.assertEqual(len(formatted), 1)
        only_message = formatted[0]
        self.assertEqual(only_message["role"], "user")
        self.assertEqual(
            only_message["content"], [{"toolResult": expected_tool_result}]
        )

    def test_convert_response_tool_call(self):
        """A ``toolUse`` response maps to finish_reason ``tool_calls`` with JSON-string arguments."""
        tool_use = {
            "toolUseId": "tool123",
            "name": "top_song",
            "input": {"sign": "WZPZ"},
        }
        raw = {
            "output": {
                "message": {"role": "assistant", "content": [{"toolUse": tool_use}]}
            },
            "stopReason": "tool_use",
        }

        normalized = self.converter.convert_response(raw)

        self.assertIsInstance(normalized, ChatCompletionResponse)
        first_choice = normalized.choices[0]
        self.assertEqual(first_choice.finish_reason, "tool_calls")
        first_call = first_choice.message.tool_calls[0]
        self.assertEqual(first_call.function.name, "top_song")
        self.assertEqual(first_call.function.arguments, '{"sign": "WZPZ"}')

    def test_convert_response_text(self):
        """A text response maps to finish_reason ``stop`` with the text as content."""
        answer = "The most popular song on WZPZ is Elemental Hotel by 8 Storey Hike."
        raw = {
            "output": {
                "message": {"role": "assistant", "content": [{"text": answer}]}
            },
            "stopReason": "complete",
        }

        normalized = self.converter.convert_response(raw)

        self.assertIsInstance(normalized, ChatCompletionResponse)
        first_choice = normalized.choices[0]
        self.assertEqual(first_choice.finish_reason, "stop")
        self.assertEqual(
            first_choice.message.content,
            "The most popular song on WZPZ is Elemental Hotel by 8 Storey Hike.",
        )


# Run the unittest command-line runner only when this module is executed as a script.
if __name__ == "__main__":
    unittest.main()


================================================
FILE: tests/providers/test_azure_provider.py
================================================
import unittest
from aisuite.providers.azure_provider import AzureMessageConverter
from aisuite.framework.message import Message, ChatCompletionMessageToolCall
from aisuite.framework import ChatCompletionResponse


class TestAzureMessageConverter(unittest.TestCase):
    """Exercise AzureMessageConverter request and response conversion."""

    def setUp(self):
        """Build a fresh converter before each test."""
        self.converter = AzureMessageConverter()

    def test_convert_request_dict_message(self):
        """A dict message is returned unchanged."""
        converted = self.converter.convert_request(
            [{"role": "user", "content": "Hello, how are you?"}]
        )

        expected = [{"role": "user", "content": "Hello, how are you?"}]
        self.assertEqual(converted, expected)

    def test_convert_request_message_object(self):
        """A ``Message`` object is converted to a dict that includes its ``None`` fields."""
        user_message = Message(
            role="user", content="Hello", tool_calls=None, refusal=None
        )

        converted = self.converter.convert_request([user_message])

        expected = [
            {
                "role": "user",
                "content": "Hello",
                "reasoning_content": None,
                "tool_calls": None,
                "refusal": None,
            }
        ]
        self.assertEqual(converted, expected)

    def test_convert_response_basic(self):
        """A response without tool calls yields content, role and ``tool_calls`` of None."""
        assistant_message = {
            "role": "assistant",
            "content": "Hello! How can I help you?",
        }
        raw = {"choices": [{"message": assistant_message}]}

        normalized = self.converter.convert_response(raw)

        self.assertIsInstance(normalized, ChatCompletionResponse)
        reply = normalized.choices[0].message
        self.assertEqual(reply.content, "Hello! How can I help you?")
        self.assertEqual(reply.role, "assistant")
        self.assertIsNone(reply.tool_calls)

    def test_convert_response_with_tool_calls(self):
        """A response with a tool call exposes its id, type, function name and arguments."""
        raw_tool_call = {
            "id": "tool123",
            "type": "function",
            "function": {
                "name": "get_weather",
                "arguments": '{"location": "London"}',
            },
        }
        assistant_message = {
            "role": "assistant",
            "content": "Let me check the weather.",
            "tool_calls": [raw_tool_call],
        }
        raw = {"choices": [{"message": assistant_message}]}

        normalized = self.converter.convert_response(raw)

        self.assertIsInstance(normalized, ChatCompletionResponse)
        reply = normalized.choices[0].message
        self.assertEqual(reply.content, "Let me check the weather.")
        self.assertEqual(len(reply.tool_calls), 1)

        first_call = reply.tool_calls[0]
        self.assertEqual(first_call.id, "tool123")
        self.assertEqual(first_call.type, "function")
        self.assertEqual(first_call.function.name, "get_weather")
        self.assertEqual(first_call.function.arguments, '{"location": "London"}')


# Run the unittest command-line runner only when this module is executed as a script.
if __name__ == "__main__":
    unittest.main()


================================================
FILE: tests/providers/test_cerebras_provider.py
================================================
"""Tests for the Cerebras provider."""

from unittest.mock import MagicMock, patch

import pytest

from aisuite.providers.cerebras_provider import CerebrasProvider


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Autouse fixture: set a dummy CEREBRAS_API_KEY through monkeypatch."""
    env_name, env_value = "CEREBRAS_API_KEY", "test-api-key"
    monkeypatch.setenv(env_name, env_value)


def test_cerebras_provider():
    """Check the request reaches the client's ``create`` and the reply text is returned."""

    expected_text = "mocked-text-response-from-model"
    request_kwargs = {
        "messages": [{"role": "user", "content": "Hello!"}],
        "model": "our-favorite-model",
        "temperature": 0.75,
    }

    provider = CerebrasProvider()
    fake_completion = MagicMock()
    fake_completion.model_dump.return_value = {
        "choices": [{"message": {"content": expected_text}}]
    }

    with patch.object(
        provider.client.chat.completions, "create", return_value=fake_completion
    ) as create_mock:
        result = provider.chat_completions_create(**request_kwargs)

        # The provider must forward exactly the keyword arguments it received.
        create_mock.assert_called_with(**request_kwargs)

        assert result.choices[0].message.content == expected_text


def test_cerebras_provider_with_usage():
    """Check that a ``usage`` section in the dumped response is exposed on the result."""

    expected_text = "mocked-text-response-from-model"
    request_kwargs = {
        "messages": [{"role": "user", "content": "Hello!"}],
        "model": "our-favorite-model",
        "temperature": 0.75,
    }

    provider = CerebrasProvider()
    fake_completion = MagicMock()
    fake_completion.model_dump.return_value = {
        "choices": [{"message": {"content": expected_text}}],
        "usage": {
            "prompt_tokens": 10,
            "completion_tokens": 20,
            "total_tokens": 30,
        },
    }

    with patch.object(
        provider.client.chat.completions, "create", return_value=fake_completion
    ):
        result = provider.chat_completions_create(**request_kwargs)

        usage = result.usage
        assert usage is not None
        assert usage.prompt_tokens == 10
        assert usage.completion_tokens == 20
        assert usage.total_tokens == 30


================================================
FILE: tests/providers/test_cohere_provider.py
================================================
from unittest.mock import MagicMock, patch

import pytest

from aisuite.providers.cohere_provider import CohereProvider


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Autouse fixture: set a dummy CO_API_KEY through monkeypatch."""
    env_name, env_value = "CO_API_KEY", "test-api-key"
    monkeypatch.setenv(env_name, env_value)


def test_cohere_provider():
    """Check the request reaches ``client.chat`` and the first content part's text is returned."""

    expected_text = "mocked-text-response-from-model"
    request_kwargs = {
        "messages": [{"role": "user", "content": "Hello!"}],
        "model": "our-favorite-model",
        "temperature": 0.75,
    }

    provider = CohereProvider()

    # Fake reply: a message whose content is a one-element list with a .text.
    text_part = MagicMock()
    text_part.text = expected_text
    fake_reply = MagicMock()
    fake_reply.message = MagicMock()
    fake_reply.message.content = [text_part]

    with patch.object(provider.client, "chat", return_value=fake_reply) as chat_mock:
        result = provider.chat_completions_create(**request_kwargs)

        chat_mock.assert_called_with(**request_kwargs)

        assert result.choices[0].message.content == expected_text


================================================
FILE: tests/providers/test_deepgram_provider.py
================================================
"""Tests for Deepgram provider functionality."""

import io
from unittest.mock import MagicMock, mock_open, patch

import pytest

from aisuite.providers.deepgram_provider import DeepgramProvider
from aisuite.provider import ASRError
from aisuite.framework.message import (
    TranscriptionResult,
    TranscriptionOptions,
    StreamingTranscriptionChunk,
)


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Autouse fixture: set a dummy DEEPGRAM_API_KEY through monkeypatch."""
    env_name, env_value = "DEEPGRAM_API_KEY", "test-api-key"
    monkeypatch.setenv(env_name, env_value)


@pytest.fixture
def deepgram_provider():
    """Return a freshly constructed DeepgramProvider for a test to use."""
    provider = DeepgramProvider()
    return provider


@pytest.fixture
def mock_deepgram_response():
    """Return a dict payload with one channel, one alternative and one word."""
    word = {
        "word": "hello",
        "start": 0.0,
        "end": 0.5,
        "confidence": 0.98,
        "speaker": 0,
    }
    alternative = {
        "transcript": "Hello, this is a test transcription from Deepgram.",
        "confidence": 0.95,
        "words": [word],
    }
    metadata = {
        "request_id": "test-request-id",
        "duration": 10.5,
        "channels": 1,
    }
    results = {
        "channels": [{"alternatives": [alternative]}],
        "language": "en-US",
    }
    return {"metadata": metadata, "results": results}


class TestDeepgramProvider:
    """Tests for DeepgramProvider: construction, transcription calls and response parsing."""

    def test_provider_initialization(self, deepgram_provider):
        """The provider holds the API key from the environment and exposes ``audio.transcriptions``."""
        provider = deepgram_provider
        assert provider is not None
        assert hasattr(provider, "api_key")
        assert provider.api_key == "test-api-key"
        assert hasattr(provider, "audio")
        audio = provider.audio
        assert hasattr(audio, "transcriptions")

    def test_chat_completions_create_not_implemented(self, deepgram_provider):
        """Calling chat completions raises NotImplementedError with the expected message."""
        expected_message = "Deepgram provider only supports audio transcription"
        with pytest.raises(NotImplementedError, match=expected_message):
            deepgram_provider.chat_completions_create("model", [])

    def test_audio_transcriptions_create_success(
        self, deepgram_provider, mock_deepgram_response
    ):
        """A file path input yields a TranscriptionResult with text, language and confidence."""
        sdk_reply = MagicMock()
        sdk_reply.to_dict.return_value = mock_deepgram_response
        sdk_reply.model_dump.return_value = mock_deepgram_response

        with patch("builtins.open", mock_open(read_data=b"fake audio data")):
            with patch.object(
                deepgram_provider.client.listen.v1.media,
                "transcribe_file",
                return_value=sdk_reply,
            ):
                transcription = deepgram_provider.audio.transcriptions.create(
                    model="deepgram:nova-2", file="test_audio.mp3"
                )

                assert isinstance(transcription, TranscriptionResult)
                assert (
                    transcription.text
                    == "Hello, this is a test transcription from Deepgram."
                )
                assert transcription.language == "en-US"
                assert transcription.confidence == 0.95

    def test_audio_transcriptions_create_with_file_object(
        self, deepgram_provider, mock_deepgram_response
    ):
        """An in-memory BytesIO input is accepted in place of a file path."""
        audio_stream = io.BytesIO(b"fake audio data")

        sdk_reply = MagicMock()
        sdk_reply.to_dict.return_value = mock_deepgram_response
        sdk_reply.model_dump.return_value = mock_deepgram_response

        media_client = deepgram_provider.client.listen.v1.media
        with patch.object(media_client, "transcribe_file", return_value=sdk_reply):
            transcription = deepgram_provider.audio.transcriptions.create(
                model="deepgram:nova-2", file=audio_stream
            )

            assert isinstance(transcription, TranscriptionResult)
            assert (
                transcription.text
                == "Hello, this is a test transcription from Deepgram."
            )

    def test_audio_transcriptions_create_with_options(
        self, deepgram_provider, mock_deepgram_response
    ):
        """Passing TranscriptionOptions still results in exactly one transcribe call."""
        transcription_options = TranscriptionOptions(
            language="en",
            enable_speaker_diarization=True,
            enable_automatic_punctuation=True,
        )

        sdk_reply = MagicMock()
        sdk_reply.to_dict.return_value = mock_deepgram_response
        sdk_reply.model_dump.return_value = mock_deepgram_response

        with patch("builtins.open", mock_open(read_data=b"fake audio data")):
            with patch.object(
                deepgram_provider.client.listen.v1.media,
                "transcribe_file",
                return_value=sdk_reply,
            ) as transcribe_mock:
                transcription = deepgram_provider.audio.transcriptions.create(
                    model="deepgram:nova-2",
                    file="test_audio.mp3",
                    options=transcription_options,
                )

                transcribe_mock.assert_called_once()
                assert isinstance(transcription, TranscriptionResult)
                assert (
                    transcription.text
                    == "Hello, this is a test transcription from Deepgram."
                )

    def test_audio_transcriptions_create_error_handling(self, deepgram_provider):
        """An exception from the SDK call surfaces as ASRError with a prefixed message."""
        expected_error = "Deepgram transcription error: API Error"

        with patch("builtins.open", mock_open(read_data=b"fake audio data")):
            with patch.object(
                deepgram_provider.client.listen.v1.media,
                "transcribe_file",
                side_effect=Exception("API Error"),
            ):
                with pytest.raises(ASRError, match=expected_error):
                    deepgram_provider.audio.transcriptions.create(
                        model="deepgram:nova-2", file="test_audio.mp3"
                    )

    @pytest.mark.asyncio
    async def test_audio_transcriptions_create_stream_output(self, deepgram_provider):
        """create_stream_output returns an object exposing ``__aiter__``; the stream is not consumed."""
        import numpy as np

        # 48000 silent samples; soundfile.read is patched to report 16000 Hz,
        # which makes this three seconds of audio.
        sample_count = 48000
        silent_audio = np.zeros(sample_count, dtype=np.float32)

        # Stand-in connection object handed out by the async context manager
        # (the original note describes this as the v5 API shape).
        fake_connection = MagicMock()
        fake_connection.send = MagicMock()
        fake_connection.on = MagicMock()

        class FakeConnectionContext:
            """Async context manager that yields the fake connection."""

            async def __aenter__(self):
                return fake_connection

            async def __aexit__(self, *args):
                pass

        async def fake_connect(*args, **kwargs):
            return FakeConnectionContext()

        with patch("soundfile.read", return_value=(silent_audio, 16000)):
            with patch.object(
                deepgram_provider.client.listen.v1,
                "connect",
                side_effect=fake_connect,
            ):
                stream = deepgram_provider.audio.transcriptions.create_stream_output(
                    model="deepgram:nova-2",
                    file="test_audio.mp3",
                    chunk_size_minutes=1.0,  # smaller chunk size for the test
                )

                # Only the async-iterable protocol is checked here.
                assert hasattr(stream, "__aiter__")

    def test_parse_deepgram_response_complete(
        self, deepgram_provider, mock_deepgram_response
    ):
        """Parsing the full payload yields text, language, confidence and one word entry."""
        parse = deepgram_provider.audio.transcriptions._parse_deepgram_response
        parsed = parse(mock_deepgram_response)

        assert parsed.text == "Hello, this is a test transcription from Deepgram."
        assert parsed.language == "en-US"
        assert parsed.confidence == 0.95

        assert len(parsed.words) == 1
        first_word = parsed.words[0]
        assert first_word.word == "hello"
        assert first_word.start == 0.0
        assert first_word.end == 0.5
        assert first_word.confidence == 0.98

    def test_parse_deepgram_response_empty_channels(self, deepgram_provider):
        """A payload with no channels parses to empty text and no language."""
        payload_without_channels = {"results": {"channels": []}}

        parse = deepgram_provider.audio.transcriptions._parse_deepgram_response
        parsed = parse(payload_without_channels)

        assert parsed.text == ""
        assert parsed.language is None


================================================
FILE: tests/providers/test_deepseek_provider.py
================================================
"""Tests for the Deepseek provider."""

from unittest.mock import MagicMock, patch
import pytest

from aisuite.providers.deepseek_provider import DeepseekProvider
from aisuite.framework.chat_completion_response import ChatCompletionResponse


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Autouse fixture: set a dummy DEEPSEEK_API_KEY through monkeypatch."""
    env_name, env_value = "DEEPSEEK_API_KEY", "test-api-key"
    monkeypatch.setenv(env_name, env_value)


def test_deepseek_provider():
    """Check the request is forwarded once and a response without usage converts cleanly."""

    model_name = "deepseek-chat"
    expected_text = "mocked-text-response-from-model"
    request_kwargs = {
        "messages": [{"role": "user", "content": "Hello!"}],
        "model": model_name,
        "temperature": 0.75,
    }

    provider = DeepseekProvider()
    fake_completion = MagicMock()
    # The client hands back an object, so stub its .model_dump(); this payload
    # deliberately carries no "usage" entry.
    fake_completion.model_dump.return_value = {
        "choices": [{"message": {"content": expected_text, "role": "assistant"}}],
        "model": model_name,
        "created": 12345,
        "id": "chatcmpl-mockid",
    }

    with patch.object(
        provider.client.chat.completions, "create", return_value=fake_completion
    ) as create_mock:
        result = provider.chat_completions_create(**request_kwargs)

        create_mock.assert_called_once_with(**request_kwargs)

        assert isinstance(result, ChatCompletionResponse)
        assert result.choices[0].message.content == expected_text
        assert result.usage is None


def test_deepseek_provider_with_usage():
    """Check that a ``usage`` section in the dumped response is exposed on the result."""

    model_name = "deepseek-chat"
    expected_text = "mocked-text-response-from-model"
    request_kwargs = {
        "messages": [{"role": "user", "content": "Hello!"}],
        "model": model_name,
        "temperature": 0.75,
    }

    provider = DeepseekProvider()
    fake_completion = MagicMock()
    fake_completion.model_dump.return_value = {
        "choices": [{"message": {"content": expected_text, "role": "assistant"}}],
        "model": model_name,
        "created": 12345,
        "id": "chatcmpl-mockid",
        "usage": {
            "prompt_tokens": 10,
            "completion_tokens": 20,
            "total_tokens": 30,
        },
    }

    with patch.object(
        provider.client.chat.completions, "create", return_value=fake_completion
    ) as create_mock:
        result = provider.chat_completions_create(**request_kwargs)

        create_mock.assert_called_once_with(**request_kwargs)

        assert isinstance(result, ChatCompletionResponse)
        assert result.choices[0].message.content == expected_text

        usage = result.usage
        assert usage is not None
        assert usage.prompt_tokens == 10
        assert usage.completion_tokens == 20
        assert usage.total_tokens == 30


================================================
FILE: tests/providers/test_google_converter.py
================================================
import unittest
from unittest.mock import MagicMock
from aisuite.providers.google_provider import GoogleMessageConverter
from aisuite.framework.message import Message, ChatCompletionMessageToolCall, Function
from aisuite.framework import ChatCompletionResponse


class TestGoogleMessageConverter(unittest.TestCase):
    """Request and response conversion tests for GoogleMessageConverter."""

    def setUp(self):
        """Create a fresh converter before each test."""
        self.converter = GoogleMessageConverter()

    def test_convert_request_user_message(self):
        """A user message converts to one entry with role "user" and the same text."""
        question = "What is the weather today?"
        converted = self.converter.convert_request(
            [{"role": "user", "content": question}]
        )

        self.assertEqual(len(converted), 1)
        first = converted[0]
        self.assertEqual(first.role, "user")
        self.assertEqual(first.parts[0].text, question)

    def test_convert_request_tool_result_message(self):
        """A tool message converts to a function response with the JSON content decoded."""
        tool_message = {
            "role": "tool",
            "name": "get_weather",
            "content": '{"temperature": "15", "unit": "Celsius"}',
        }
        converted = self.converter.convert_request([tool_message])

        self.assertEqual(len(converted), 1)
        function_response = converted[0].function_response
        self.assertEqual(function_response.name, "get_weather")
        self.assertEqual(
            function_response.response,
            {"temperature": "15", "unit": "Celsius"},
        )

    def test_convert_request_assistant_message(self):
        """An assistant message converts to one entry with role "model"."""
        reply_text = "The weather is sunny with a temperature of 25 degrees Celsius."
        converted = self.converter.convert_request(
            [{"role": "assistant", "content": reply_text}]
        )

        self.assertEqual(len(converted), 1)
        first = converted[0]
        self.assertEqual(first.role, "model")
        self.assertEqual(first.parts[0].text, reply_text)

    def test_convert_response_with_function_call(self):
        """A function-call part becomes a tool call with JSON-encoded arguments."""
        function_call = MagicMock()
        # ``name`` has to be assigned after construction: MagicMock(name=...)
        # would name the mock itself instead of setting the attribute.
        function_call.name = "get_exchange_rate"
        function_call.args = {
            "currency_from": "AUD",
            "currency_to": "SEK",
            "currency_date": "latest",
        }

        part = MagicMock(function_call=function_call)
        candidate = MagicMock(
            content=MagicMock(parts=[part]),
            finish_reason="function_call",
        )
        raw_response = MagicMock()
        raw_response.candidates = [candidate]

        normalized = self.converter.convert_response(raw_response)

        self.assertIsInstance(normalized, ChatCompletionResponse)
        choice = normalized.choices[0]
        self.assertEqual(choice.finish_reason, "tool_calls")

        converted_function = choice.message.tool_calls[0].function
        self.assertEqual(converted_function.name, "get_exchange_rate")
        self.assertEqual(
            converted_function.arguments,
            '{"currency_from": "AUD", "currency_to": "SEK", "currency_date": "latest"}',
        )

    def test_convert_response_with_text(self):
        """A text-only part becomes the message content with finish reason "stop"."""
        expected_text = "The current exchange rate is 7.50 SEK per AUD."

        part = MagicMock(text=expected_text, function_call=None)
        candidate = MagicMock(content=MagicMock(parts=[part]), finish_reason="stop")
        raw_response = MagicMock()
        raw_response.candidates = [candidate]

        normalized = self.converter.convert_response(raw_response)

        self.assertIsInstance(normalized, ChatCompletionResponse)
        choice = normalized.choices[0]
        self.assertEqual(choice.finish_reason, "stop")
        self.assertEqual(choice.message.content, expected_text)


# Run the unittest runner when this module is executed directly as a script.
if __name__ == "__main__":
    unittest.main()


================================================
FILE: tests/providers/test_google_provider.py
================================================
"""Tests for Google provider functionality (both chat and ASR)."""

import io
import json
from unittest.mock import MagicMock, mock_open, patch

import pytest

from aisuite.providers.google_provider import GoogleProvider
from aisuite.provider import ASRError
from aisuite.framework.message import (
    TranscriptionResult,
    TranscriptionOptions,
    StreamingTranscriptionChunk,
)
from vertexai.generative_models import Content, Part


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Autouse fixture: set the three Google environment variables through monkeypatch."""
    google_env = {
        "GOOGLE_APPLICATION_CREDENTIALS": "path-to-service-account-json",
        "GOOGLE_PROJECT_ID": "vertex-project-id",
        "GOOGLE_REGION": "us-central1",
    }
    for env_name, env_value in google_env.items():
        monkeypatch.setenv(env_name, env_value)


@pytest.fixture
def mock_google_speech_response():
    """Build a MagicMock response holding one result, one alternative and one word."""
    # Innermost piece first: a single timed word.
    word = MagicMock()
    word.word = "Hello"
    word.confidence = 0.98
    word.start_time.total_seconds.return_value = 0.0
    word.end_time.total_seconds.return_value = 0.5

    alternative = MagicMock()
    alternative.transcript = "Hello, this is a test transcription."
    alternative.confidence = 0.95
    alternative.words = [word]

    result = MagicMock()
    result.alternatives = [alternative]

    response = MagicMock()
    response.results = [result]
    return response


def test_missing_env_vars():
    """Constructing the provider with an empty environment raises EnvironmentError."""
    expected_fragment = "Missing one or more required Google environment variables"

    with patch.dict("os.environ", {}, clear=True):
        with pytest.raises(EnvironmentError) as raised:
            GoogleProvider()
        error_text = str(raised.value)
        assert expected_fragment in error_text


def test_vertex_interface():
    """Run a text-reply scenario and a function-call scenario through chat_completions_create."""

    def check_text_response():
        """Scenario 1: the model replies with plain text."""
        expected_text = "mocked-text-response-from-model"
        request_kwargs = {
            "messages": [{"role": "user", "content": "Hello!"}],
            "model": "our-favorite-model",
            "temperature": 0.7,
        }

        interface = GoogleProvider()

        part = MagicMock()
        part.text = expected_text
        # Remove function_call so that reading it raises AttributeError
        # instead of returning an auto-created child mock.
        del part.function_call
        candidate = MagicMock()
        candidate.content.parts = [part]
        fake_response = MagicMock()
        fake_response.candidates = [candidate]

        with patch(
            "aisuite.providers.google_provider.GenerativeModel"
        ) as generative_model_cls:
            chat_session = MagicMock()
            chat_session.send_message.return_value = fake_response
            model_instance = MagicMock()
            model_instance.start_chat.return_value = chat_session
            generative_model_cls.return_value = model_instance

            result = interface.chat_completions_create(**request_kwargs)

            # The reply must come back in the normalized response format.
            choice = result.choices[0]
            assert choice.message.content == expected_text
            assert choice.finish_reason == "stop"

    def check_function_call():
        """Scenario 2: the model replies with a function call and no text."""
        request_kwargs = {
            "messages": [{"role": "user", "content": "What's the weather?"}],
            "model": "our-favorite-model",
            "temperature": 0.7,
        }

        interface = GoogleProvider()

        function_call = MagicMock()
        function_call.name = "get_weather"
        function_call.args = {"location": "San Francisco"}

        part = MagicMock()
        part.function_call = function_call
        part.text = None
        candidate = MagicMock()
        candidate.content.parts = [part]
        fake_response = MagicMock()
        fake_response.candidates = [candidate]

        with patch(
            "aisuite.providers.google_provider.GenerativeModel"
        ) as generative_model_cls:
            chat_session = MagicMock()
            chat_session.send_message.return_value = fake_response
            model_instance = MagicMock()
            model_instance.start_chat.return_value = chat_session
            generative_model_cls.return_value = model_instance

            result = interface.chat_completions_create(**request_kwargs)

            # The function call must surface as a single tool call.
            choice = result.choices[0]
            assert choice.message.content is None
            tool_call = choice.message.tool_calls[0]
            assert tool_call.type == "function"
            assert tool_call.function.name == "get_weather"
            assert json.loads(tool_call.function.arguments) == {
                "location": "San Francisco"
            }
            assert choice.finish_reason == "tool_calls"

    # Execute both scenarios, text reply first.
    check_text_response()
    check_function_call()


def test_convert_openai_to_vertex_ai():
    """A single user message converts to one Content holding one text Part."""
    provider = GoogleProvider()

    # The provider's transformer performs the conversion.
    converted = provider.transformer.convert_request(
        [{"role": "user", "content": "Hello!"}]
    )

    assert len(converted) == 1
    content = converted[0]
    assert isinstance(content, Content)
    assert content.role == "user"
    assert len(content.parts) == 1
    first_part = content.parts[0]
    assert isinstance(first_part, Part)
    assert first_part.text == "Hello!"


def test_role_conversions():
    """System and user messages convert to role "user"; assistant converts to "model"."""
    provider = GoogleProvider()

    conversation = [
        {"role": "system", "content": "System message"},
        {"role": "user", "content": "User message"},
        {"role": "assistant", "content": "Assistant message"},
    ]
    # Expected (role, text) of each converted entry, in input order.
    expected = [
        ("user", "System message"),
        ("user", "User message"),
        ("model", "Assistant message"),
    ]

    converted = provider.transformer.convert_request(conversation)

    assert len(converted) == 3
    for content, (expected_role, expected_text) in zip(converted, expected):
        assert content.role == expected_role
        assert content.parts[0].text == expected_text


class TestGoogleProvider:
    """Basic construction checks for GoogleProvider."""

    def test_provider_initialization(self):
        """A new provider exists and exposes ``audio.transcriptions``."""
        google_provider = GoogleProvider()
        assert google_provider is not None
        assert hasattr(google_provider, "audio")
        audio = google_provider.audio
        assert hasattr(audio, "transcriptions")


class TestGoogleASR:
    """Speech-to-text tests for GoogleProvider, run against a mocked speech client."""

    @staticmethod
    def _provider_with_speech_client(speech_client):
        """Build a GoogleProvider whose ``_speech_client`` is the given mock."""
        provider = GoogleProvider()
        provider._speech_client = speech_client
        return provider

    def test_audio_transcriptions_create_success(self, mock_google_speech_response):
        """A file path input yields a TranscriptionResult with text, confidence and task."""
        speech_client = MagicMock()
        speech_client.recognize.return_value = mock_google_speech_response
        google_provider = self._provider_with_speech_client(speech_client)

        with patch("builtins.open", mock_open(read_data=b"fake audio data")):
            transcription = google_provider.audio.transcriptions.create(
                model="google:latest_long", file="test_audio.wav"
            )

            assert isinstance(transcription, TranscriptionResult)
            assert transcription.text == "Hello, this is a test transcription."
            assert transcription.confidence == 0.95
            assert transcription.task == "transcribe"

    def test_audio_transcriptions_create_with_file_object(
        self, mock_google_speech_response
    ):
        """An in-memory BytesIO input is accepted in place of a file path."""
        speech_client = MagicMock()
        speech_client.recognize.return_value = mock_google_speech_response
        google_provider = self._provider_with_speech_client(speech_client)

        audio_stream = io.BytesIO(b"fake audio data")

        transcription = google_provider.audio.transcriptions.create(
            model="google:latest_long", file=audio_stream
        )

        assert isinstance(transcription, TranscriptionResult)
        assert transcription.text == "Hello, this is a test transcription."

    def test_audio_transcriptions_create_with_options(
        self, mock_google_speech_response
    ):
        """Passing TranscriptionOptions still results in exactly one recognize call."""
        speech_client = MagicMock()
        speech_client.recognize.return_value = mock_google_speech_response
        google_provider = self._provider_with_speech_client(speech_client)

        transcription_options = TranscriptionOptions(
            language="en",
            enable_automatic_punctuation=True,
            include_word_timestamps=True,
        )

        with patch("builtins.open", mock_open(read_data=b"fake audio data")):
            transcription = google_provider.audio.transcriptions.create(
                model="google:latest_long",
                file="test_audio.wav",
                options=transcription_options,
            )

            speech_client.recognize.assert_called_once()
            assert isinstance(transcription, TranscriptionResult)
            assert transcription.text == "Hello, this is a test transcription."

    def test_audio_transcriptions_create_error_handling(self):
        """An exception from ``recognize`` surfaces as ASRError with a prefixed message."""
        speech_client = MagicMock()
        speech_client.recognize.side_effect = Exception("API Error")
        google_provider = self._provider_with_speech_client(speech_client)

        expected_error = "Google Speech-to-Text error: API Error"
        with patch(
            "builtins.open", mock_open(read_data=b"fake audio data")
        ), pytest.raises(ASRError, match=expected_error):
            google_provider.audio.transcriptions.create(
                model="google:latest_long", file="test_audio.wav"
            )

    @pytest.mark.asyncio
    async def test_audio_transcriptions_create_stream_output(
        self, mock_google_speech_response
    ):
        """Streaming calls ``streaming_recognize`` once with ``config`` and ``requests`` keywords."""
        # One final streaming result carrying a single alternative.
        alternative = MagicMock()
        alternative.transcript = "Hello streaming"
        streaming_result = MagicMock()
        streaming_result.alternatives = [alternative]
        streaming_result.is_final = True
        streaming_response = MagicMock()
        streaming_response.results = [streaming_result]

        speech_client = MagicMock()
        speech_client.streaming_recognize.return_value = [streaming_response]
        google_provider = self._provider_with_speech_client(speech_client)

        with patch("builtins.open", mock_open(read_data=b"fake audio data")):
            stream = google_provider.audio.transcriptions.create_stream_output(
                model="google:latest_long", file="test_audio.wav"
            )

            assert hasattr(stream, "__aiter__")

            # Pull at most one chunk; that is enough to drive the call under test.
            received = []
            async for piece in stream:
                received.append(piece)
                break

            # Both keyword arguments must be present on the recorded call.
            speech_client.streaming_recognize.assert_called_once()
            recorded_kwargs = speech_client.streaming_recognize.call_args.kwargs
            assert "config" in recorded_kwargs
            assert "requests" in recorded_kwargs

    def test_parse_google_response_complete(self, mock_google_speech_response):
        """Parsing the full mock response yields text, confidence, task, one word and one alternative."""
        google_provider = GoogleProvider()
        parse = google_provider.audio.transcriptions._parse_google_response
        parsed = parse(mock_google_speech_response)

        assert parsed.text == "Hello, this is a test transcription."
        assert parsed.confidence == 0.95
        assert parsed.task == "transcribe"

        assert len(parsed.words) == 1
        first_word = parsed.words[0]
        assert first_word.word == "Hello"
        assert first_word.start == 0.0
        assert first_word.end == 0.5
        assert first_word.confidence == 0.98

        assert len(parsed.alternatives) == 1

    def test_parse_google_response_empty_results(self):
        """A response with no results parses to empty text and no language."""
        google_provider = GoogleProvider()
        empty_response = MagicMock()
        empty_response.results = []

        parse = google_provider.audio.transcriptions._parse_google_response
        parsed = parse(empty_response)

        assert parsed.text == ""
        assert parsed.language is None


================================================
FILE: tests/providers/test_groq_provider.py
================================================
"""Tests for the Groq provider."""

from unittest.mock import MagicMock, patch

import pytest

from aisuite.providers.groq_provider import GroqProvider


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Export a placeholder ``GROQ_API_KEY`` for every test in this module."""
    placeholder_key = "test-api-key"
    monkeypatch.setenv("GROQ_API_KEY", placeholder_key)


def test_groq_provider():
    """Check that chat completion arguments reach the Groq client unchanged.

    The client's ``create`` method is replaced by a mock for the duration of
    the call; the mock's ``model_dump()`` supplies the response payload.
    """
    expected_reply = "mocked-text-response-from-model"
    request_kwargs = {
        "messages": [{"role": "user", "content": "Hello!"}],
        "model": "our-favorite-model",
        "temperature": 0.75,
    }

    groq = GroqProvider()
    fake_completion = MagicMock()
    fake_completion.model_dump.return_value = {
        "choices": [{"message": {"content": expected_reply}}]
    }

    with patch.object(
        groq.client.chat.completions, "create", return_value=fake_completion
    ) as create_mock:
        reply = groq.chat_completions_create(**request_kwargs)

    # The mock keeps its call record after the patch is undone.
    create_mock.assert_called_with(**request_kwargs)
    assert reply.choices[0].message.content == expected_reply


def test_groq_provider_with_usage():
    """Check that a ``usage`` section in the payload is exposed on the response."""
    conversation = [{"role": "user", "content": "Hello!"}]
    expected_usage = {
        "prompt_tokens": 10,
        "completion_tokens": 20,
        "total_tokens": 30,
    }

    groq = GroqProvider()
    fake_completion = MagicMock()
    fake_completion.model_dump.return_value = {
        "choices": [
            {
                "message": {
                    "content": "mocked-text-response-from-model",
                    "role": "assistant",
                }
            }
        ],
        # Hand the provider its own copy so the expectations stay untouched.
        "usage": dict(expected_usage),
    }

    with patch.object(
        groq.client.chat.completions, "create", return_value=fake_completion
    ):
        reply = groq.chat_completions_create(
            messages=conversation,
            model="our-favorite-model",
            temperature=0.75,
        )

    assert reply.usage is not None
    for field_name, expected_count in expected_usage.items():
        assert getattr(reply.usage, field_name) == expected_count


================================================
FILE: tests/providers/test_huggingface_provider.py
================================================
"""Tests for Hugging Face provider ASR functionality."""

import io
from unittest.mock import MagicMock, mock_open, patch

import pytest

from aisuite.providers.huggingface_provider import HuggingfaceProvider
from aisuite.provider import ASRError
from aisuite.framework.message import TranscriptionResult


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Export a placeholder ``HF_TOKEN`` for every test in this module."""
    placeholder_token = "test-hf-token"
    monkeypatch.setenv("HF_TOKEN", placeholder_token)


@pytest.fixture
def huggingface_provider():
    """Return a freshly constructed ``HuggingfaceProvider`` for a test."""
    provider = HuggingfaceProvider()
    return provider


@pytest.fixture
def mock_huggingface_response():
    """Return an ASR payload dict with full text plus six timestamped chunks."""
    # (chunk text, start, end) triples expanded into chunk dicts below.
    timed_chunks = [
        (" Hello", 0.0, 0.5),
        (",", 0.5, 0.6),
        (" this", 0.6, 0.9),
        (" is", 0.9, 1.1),
        (" a", 1.1, 1.2),
        (" test", 1.2, 1.5),
    ]
    payload = {
        "text": "Hello, this is a test transcription from Hugging Face.",
        "chunks": [
            {"text": chunk_text, "timestamp": [start, end]}
            for chunk_text, start, end in timed_chunks
        ],
    }
    return payload


@pytest.fixture
def mock_huggingface_response_text_only():
    """Return an ASR payload dict that has a ``text`` key and no ``chunks``."""
    payload = {}
    payload["text"] = "Simple transcription without timestamps."
    return payload


class TestHuggingFaceProvider:
    """Test suite for Hugging Face provider functionality.

    HTTP traffic is simulated by patching ``requests.post``; tests that pass a
    file path also patch ``builtins.open`` with ``mock_open``.
    """

    def test_provider_initialization(self, huggingface_provider):
        """Test that Hugging Face provider initializes correctly."""
        assert huggingface_provider is not None
        assert hasattr(huggingface_provider, "token")
        # The token value matches what the autouse fixture puts in HF_TOKEN.
        assert huggingface_provider.token == "test-hf-token"
        assert hasattr(huggingface_provider, "audio")
        assert hasattr(huggingface_provider.audio, "transcriptions")

    def test_audio_transcriptions_create_success(
        self, huggingface_provider, mock_huggingface_response
    ):
        """Test successful audio transcription from a file path."""
        mock_response = MagicMock()
        mock_response.status_code = 200
        mock_response.json.return_value = mock_huggingface_response

        with patch("builtins.open", mock_open(read_data=b"fake audio data")), patch(
            "requests.post", return_value=mock_response
        ) as mock_post:
            result = huggingface_provider.audio.transcriptions.create(
                model="huggingface:openai/whisper-large-v3", file="test_audio.wav"
            )

            # Verify the request
            mock_post.assert_called_once()
            call_args = mock_post.call_args
            # URL is first positional argument
            assert "api-inference.huggingface.co" in call_args.args[0]
            assert "openai/whisper-large-v3" in call_args.args[0]
            assert (
                call_args.kwargs["headers"]["Authorization"] == "Bearer test-hf-token"
            )
            assert call_args.kwargs["headers"]["Content-Type"] == "audio/wav"

            # Verify the result
            assert isinstance(result, TranscriptionResult)
            assert (
                result.text == "Hello, this is a test transcription from Hugging Face."
            )
            assert len(result.words) == 6
            assert result.words[0].word == " Hello"
            assert result.words[0].start == 0.0
            assert result.words[0].end == 0.5

    def test_audio_transcriptions_with_file_object(
        self, huggingface_provider, mock_huggingface_response
    ):
        """Test audio transcription with file-like object."""
        # An in-memory stream is passed, so ``builtins.open`` is not patched.
        audio_data = io.BytesIO(b"fake audio data")

        mock_response = MagicMock()
        mock_response.status_code = 200
        mock_response.json.return_value = mock_huggingface_response

        with patch("requests.post", return_value=mock_response):
            result = huggingface_provider.audio.transcriptions.create(
                model="huggingface:openai/whisper-large-v3", file=audio_data
            )

            assert isinstance(result, TranscriptionResult)
            assert (
                result.text == "Hello, this is a test transcription from Hugging Face."
            )

    @pytest.mark.parametrize(
        "filename, expected_content_type",
        [
            ("audio.wav", "audio/wav"),
            ("audio.mp3", "audio/mpeg"),  # HF API requires audio/mpeg for MP3
            ("audio.flac", "audio/flac"),
            ("audio.unknown", "audio/wav"),  # Default to wav
        ],
    )
    def test_audio_transcriptions_content_type_detection(
        self, huggingface_provider, filename, expected_content_type
    ):
        """Test content type detection for different audio formats.

        Each filename runs as its own parametrized case, so one failing format
        is reported individually and does not stop the remaining cases.
        """
        mock_response = MagicMock()
        mock_response.status_code = 200
        mock_response.json.return_value = {"text": "test"}

        with patch("builtins.open", mock_open(read_data=b"audio")), patch(
            "requests.post", return_value=mock_response
        ) as mock_post:
            huggingface_provider.audio.transcriptions.create(
                model="huggingface:test-model", file=filename
            )

            call_args = mock_post.call_args
            assert call_args.kwargs["headers"]["Content-Type"] == expected_content_type

    def test_audio_transcriptions_retry_503(self, huggingface_provider):
        """Test retry logic for 503 model loading error."""
        import requests

        # First response: 503 error
        mock_response_503 = MagicMock()
        mock_response_503.status_code = 503

        # Create HTTP error with response attribute
        http_error = requests.exceptions.HTTPError("Model loading")
        http_error.response = mock_response_503
        mock_response_503.raise_for_status.side_effect = http_error

        # Second response: Success
        mock_response_success = MagicMock()
        mock_response_success.status_code = 200
        mock_response_success.json.return_value = {"text": "Success after retry"}

        # ``side_effect`` with a list hands out one response per call, in order.
        responses = [mock_response_503, mock_response_success]

        with patch("builtins.open", mock_open(read_data=b"audio")), patch(
            "requests.post", side_effect=responses
        ) as mock_post:
            result = huggingface_provider.audio.transcriptions.create(
                model="huggingface:test-model", file="test.wav"
            )

            # Verify retry happened
            assert mock_post.call_count == 2

            # Verify second call had x-wait-for-model header
            second_call_headers = mock_post.call_args_list[1].kwargs["headers"]
            assert second_call_headers.get("x-wait-for-model") == "true"

            assert result.text == "Success after retry"

    def test_audio_transcriptions_error_handling(self, huggingface_provider):
        """Test that an API failure surfaces as ``ASRError``."""
        mock_response = MagicMock()
        mock_response.status_code = 400
        mock_response.raise_for_status.side_effect = Exception("Bad Request")

        with patch("builtins.open", mock_open(read_data=b"audio")), patch(
            "requests.post", return_value=mock_response
        ):
            with pytest.raises(ASRError, match="Hugging Face transcription error"):
                huggingface_provider.audio.transcriptions.create(
                    model="huggingface:test-model", file="test.wav"
                )

    def test_parse_response_standard_format(
        self, huggingface_provider, mock_huggingface_response
    ):
        """Test parsing response with text and chunks."""
        result = huggingface_provider.audio.transcriptions._parse_huggingface_response(
            mock_huggingface_response, "test-model"
        )

        assert isinstance(result, TranscriptionResult)
        assert result.text == "Hello, this is a test transcription from Hugging Face."
        assert len(result.words) == 6
        assert result.words[0].word == " Hello"
        assert result.words[0].start == 0.0
        assert result.words[0].end == 0.5

    def test_parse_response_text_only(
        self, huggingface_provider, mock_huggingface_response_text_only
    ):
        """Test parsing response with text only (no chunks)."""
        result = huggingface_provider.audio.transcriptions._parse_huggingface_response(
            mock_huggingface_response_text_only, "test-model"
        )

        assert isinstance(result, TranscriptionResult)
        assert result.text == "Simple transcription without timestamps."
        assert result.words is None

    def test_parse_response_string_format(self, huggingface_provider):
        """Test parsing response that is a plain string."""
        result = huggingface_provider.audio.transcriptions._parse_huggingface_response(
            "Plain string transcription", "test-model"
        )

        assert isinstance(result, TranscriptionResult)
        assert result.text == "Plain string transcription"
        assert result.words is None

    def test_model_id_extraction(self, huggingface_provider):
        """Test that model ID is correctly extracted from model string."""
        mock_response = MagicMock()
        mock_response.status_code = 200
        mock_response.json.return_value = {"text": "test"}

        with patch("builtins.open", mock_open(read_data=b"audio")), patch(
            "requests.post", return_value=mock_response
        ) as mock_post:
            huggingface_provider.audio.transcriptions.create(
                model="huggingface:openai/whisper-large-v3", file="test.wav"
            )

            # Verify URL contains correct model ID (URL is first positional arg)
            call_args = mock_post.call_args
            assert "openai/whisper-large-v3" in call_args.args[0]


================================================
FILE: tests/providers/test_inception_provider.py
================================================
from unittest.mock import MagicMock, patch

import pytest

from aisuite.providers.inception_provider import InceptionProvider


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Export a placeholder ``INCEPTION_API_KEY`` for every test in this module."""
    placeholder_key = "test-api-key"
    monkeypatch.setenv("INCEPTION_API_KEY", placeholder_key)


def test_inception_provider():
    """Check that chat completion arguments reach the Inception client unchanged.

    The client's ``create`` method is patched to return a mock that exposes
    ``choices[0].message.content``.
    """
    conversation = [{"role": "user", "content": "Hello!"}]
    model_name = "mercury"
    temperature = 0
    expected_reply = "mocked-text-response-from-model"

    inception = InceptionProvider()

    # Build the mocked completion top-down: response -> choice -> message.
    fake_completion = MagicMock()
    fake_completion.choices = [MagicMock()]
    first_choice = fake_completion.choices[0]
    first_choice.message = MagicMock()
    first_choice.message.content = expected_reply

    with patch.object(
        inception.client.chat.completions, "create", return_value=fake_completion
    ) as create_mock:
        reply = inception.chat_completions_create(
            messages=conversation,
            model=model_name,
            temperature=temperature,
        )

    create_mock.assert_called_with(
        messages=conversation,
        model=model_name,
        temperature=temperature,
    )
    assert reply.choices[0].message.content == expected_reply


================================================
FILE: tests/providers/test_lmstudio_provider.py
================================================
import pytest
from unittest.mock import patch, MagicMock
from aisuite.providers.lmstudio_provider import LmstudioProvider


@pytest.fixture(autouse=True)
def set_api_url_var(monkeypatch):
    """Point ``LMSTUDIO_API_URL`` at a local address for every test in this module."""
    local_url = "http://localhost:1234"
    monkeypatch.setenv("LMSTUDIO_API_URL", local_url)


def test_completion():
    """Verify the LM Studio request payload and the parsed reply content.

    ``httpx.post`` is patched, and the expected URL, JSON body and timeout are
    checked against the single recorded call.
    """
    conversation = [{"role": "user", "content": "Howdy!"}]
    model_name = "best-model-ever"
    temperature = 0.77
    # NOTE(review): the text mentions "ollama" although this is the LM Studio
    # test, presumably copied from the Ollama test; it is only compared with
    # itself below.
    expected_reply = "mocked-text-response-from-ollama-model"

    lmstudio = LmstudioProvider()
    api_payload = {"choices": [{"message": {"content": expected_reply}}]}
    fake_http_response = MagicMock(status_code=200, json=lambda: api_payload)

    with patch("httpx.post", return_value=fake_http_response) as post_mock:
        reply = lmstudio.chat_completions_create(
            messages=conversation,
            model=model_name,
            temperature=temperature,
        )

    expected_body = {
        "model": model_name,
        "messages": conversation,
        "stream": False,
        "temperature": temperature,
    }
    post_mock.assert_called_once_with(
        "http://localhost:1234/v1/chat/completions",
        json=expected_body,
        timeout=300,
    )
    assert reply.choices[0].message.content == expected_reply


================================================
FILE: tests/providers/test_mistral_provider.py
================================================
import pytest
from unittest.mock import patch, MagicMock

from aisuite.providers.mistral_provider import MistralProvider


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Export a placeholder ``MISTRAL_API_KEY`` for every test in this module."""
    placeholder_key = "test-api-key"
    monkeypatch.setenv("MISTRAL_API_KEY", placeholder_key)


def test_mistral_provider():
    """Check that chat completion arguments reach ``client.chat.complete`` unchanged."""
    expected_reply = "mocked-text-response-from-model"
    request_kwargs = {
        "messages": [{"role": "user", "content": "Hello!"}],
        "model": "our-favorite-model",
        "temperature": 0.75,
    }

    mistral = MistralProvider()
    fake_completion = MagicMock()
    fake_completion.model_dump.return_value = {
        "choices": [{"message": {"content": expected_reply}}]
    }

    with patch.object(
        mistral.client.chat, "complete", return_value=fake_completion
    ) as complete_mock:
        reply = mistral.chat_completions_create(**request_kwargs)

    # The mock keeps its call record after the patch is undone.
    complete_mock.assert_called_with(**request_kwargs)
    assert reply.choices[0].message.content == expected_reply


def test_mistral_provider_with_usage():
    """Tests that usage data is correctly parsed when present in the response.

    ``client.chat.complete`` is patched to return a mock whose ``model_dump()``
    payload carries a ``usage`` section; each token count is then checked on
    the returned response.
    """

    user_greeting = "Hello!"
    message_history = [{"role": "user", "content": user_greeting}]
    selected_model = "our-favorite-model"
    chosen_temperature = 0.75
    response_text_content = "mocked-text-response-from-model"

    provider = MistralProvider()
    mock_response = MagicMock()
    mock_response.model_dump.return_value = {
        "choices": [{"message": {"content": response_text_content}}],
        "usage": {
            "prompt_tokens": 10,
            "completion_tokens": 20,
            "total_tokens": 30,
        },
    }

    # The patch handle is not bound: this test only inspects the response.
    with patch.object(provider.client.chat, "complete", return_value=mock_response):
        response = provider.chat_completions_create(
            messages=message_history,
            model=selected_model,
            temperature=chosen_temperature,
        )

        assert response.usage is not None
        assert response.usage.prompt_tokens == 10
        assert response.usage.completion_tokens == 20
        assert response.usage.total_tokens == 30


================================================
FILE: tests/providers/test_nebius_provider.py
================================================
import pytest
from unittest.mock import patch, MagicMock

from aisuite.providers.nebius_provider import NebiusProvider


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Export a placeholder ``NEBIUS_API_KEY`` for every test in this module."""
    placeholder_key = "test-api-key"
    monkeypatch.setenv("NEBIUS_API_KEY", placeholder_key)


def test_nebius_provider():
    """Check that chat completion arguments reach the Nebius client unchanged.

    The client's ``create`` method is patched to return a mock that exposes
    ``choices[0].message.content``.
    """
    conversation = [{"role": "user", "content": "Hello!"}]
    model_name = "our-favorite-model"
    temperature = 0.75
    expected_reply = "mocked-text-response-from-model"

    nebius = NebiusProvider()

    # Build the mocked completion top-down: response -> choice -> message.
    fake_completion = MagicMock()
    fake_completion.choices = [MagicMock()]
    first_choice = fake_completion.choices[0]
    first_choice.message = MagicMock()
    first_choice.message.content = expected_reply

    with patch.object(
        nebius.client.chat.completions, "create", return_value=fake_completion
    ) as create_mock:
        reply = nebius.chat_completions_create(
            messages=conversation,
            model=model_name,
            temperature=temperature,
        )

    create_mock.assert_called_with(
        messages=conversation,
        model=model_name,
        temperature=temperature,
    )
    assert reply.choices[0].message.content == expected_reply


================================================
FILE: tests/providers/test_ollama_provider.py
================================================
import pytest
from unittest.mock import patch, MagicMock
from aisuite.providers.ollama_provider import OllamaProvider


@pytest.fixture(autouse=True)
def set_api_url_var(monkeypatch):
    """Point ``OLLAMA_API_URL`` at a local address for every test in this module."""
    local_url = "http://localhost:11434"
    monkeypatch.setenv("OLLAMA_API_URL", local_url)


def test_completion():
    """Verify the Ollama request payload and the parsed reply content.

    ``httpx.post`` is patched, and the expected URL, JSON body and timeout are
    checked against the single recorded call.
    """
    conversation = [{"role": "user", "content": "Howdy!"}]
    model_name = "best-model-ever"
    temperature = 0.77
    expected_reply = "mocked-text-response-from-ollama-model"

    ollama = OllamaProvider()
    api_payload = {"message": {"content": expected_reply}}
    fake_http_response = MagicMock(status_code=200, json=lambda: api_payload)

    with patch("httpx.post", return_value=fake_http_response) as post_mock:
        reply = ollama.chat_completions_create(
            messages=conversation,
            model=model_name,
            temperature=temperature,
        )

    expected_body = {
        "model": model_name,
        "messages": conversation,
        "stream": False,
        "temperature": temperature,
    }
    post_mock.assert_called_once_with(
        "http://localhost:11434/api/chat",
        json=expected_body,
        timeout=30,
    )
    assert reply.choices[0].message.content == expected_reply


================================================
FILE: tests/providers/test_openai_provider.py
================================================
"""Tests for OpenAI provider functionality."""

import io
from unittest.mock import MagicMock, mock_open, patch

import pytest

from aisuite.providers.openai_provider import OpenaiProvider
from aisuite.provider import ASRError
from aisuite.framework.message import (
    TranscriptionResult,
    TranscriptionOptions,
    StreamingTranscriptionChunk,
    Segment,
    Word,
)


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Export a placeholder ``OPENAI_API_KEY`` for every test in this module."""
    placeholder_key = "test-api-key"
    monkeypatch.setenv("OPENAI_API_KEY", placeholder_key)


@pytest.fixture
def openai_provider():
    """Return a freshly constructed ``OpenaiProvider`` for a test."""
    provider = OpenaiProvider()
    return provider


@pytest.fixture
def mock_openai_response():
    """Return a mock ASR response with text, language and no segments."""
    # Keyword arguments to MagicMock are set as attributes on the new mock.
    return MagicMock(
        text="Hello, this is a test transcription.",
        language="en",
        segments=None,
    )


class TestOpenAIProvider:
    """Construction-level checks for the OpenAI provider."""

    def test_provider_initialization(self, openai_provider):
        """The provider exposes ``client``, ``audio`` and ``audio.transcriptions``."""
        assert openai_provider is not None
        for attribute in ("client", "audio"):
            assert hasattr(openai_provider, attribute)
        assert hasattr(openai_provider.audio, "transcriptions")


class TestOpenAIASR:
    """Test suite for OpenAI ASR functionality.

    The OpenAI client's ``audio.transcriptions.create`` is patched in every
    test that reaches the API layer; tests that pass a file path also patch
    ``builtins.open`` with ``mock_open``.
    """

    def test_audio_transcriptions_create_success(
        self, openai_provider, mock_openai_response
    ):
        """Test successful audio transcription from a file path."""
        with patch(
            "builtins.open", mock_open(read_data=b"fake audio data")
        ), patch.object(
            openai_provider.client.audio.transcriptions,
            "create",
            return_value=mock_openai_response,
        ):
            result = openai_provider.audio.transcriptions.create(
                model="openai:whisper-1", file="test_audio.mp3"
            )

            assert isinstance(result, TranscriptionResult)
            assert result.text == "Hello, this is a test transcription."
            assert result.language == "en"

    def test_audio_transcriptions_create_with_file_object(
        self, openai_provider, mock_openai_response
    ):
        """Test audio transcription with file-like object."""
        # An in-memory stream is passed, so ``builtins.open`` is not patched.
        audio_data = io.BytesIO(b"fake audio data")

        with patch.object(
            openai_provider.client.audio.transcriptions,
            "create",
            return_value=mock_openai_response,
        ):
            result = openai_provider.audio.transcriptions.create(
                model="openai:whisper-1", file=audio_data
            )

            assert isinstance(result, TranscriptionResult)
            assert result.text == "Hello, this is a test transcription."

    def test_audio_transcriptions_create_with_kwargs(
        self, openai_provider, mock_openai_response
    ):
        """Test audio transcription with additional parameters.

        Extra keyword arguments (``language``, ``temperature``) are expected to
        appear in the keyword arguments of the patched client call.
        """
        with patch(
            "builtins.open", mock_open(read_data=b"fake audio data")
        ), patch.object(
            openai_provider.client.audio.transcriptions,
            "create",
            return_value=mock_openai_response,
        ) as mock_create:
            result = openai_provider.audio.transcriptions.create(
                model="openai:whisper-1",
                file="test_audio.mp3",
                language="en",
                temperature=0.5,
            )

            mock_create.assert_called_once()
            call_kwargs = mock_create.call_args.kwargs
            assert call_kwargs["language"] == "en"
            assert call_kwargs["temperature"] == 0.5
            assert isinstance(result, TranscriptionResult)
            assert result.text == "Hello, this is a test transcription."

    def test_audio_transcriptions_create_with_options(
        self, openai_provider, mock_openai_response
    ):
        """Test audio transcription with TranscriptionOptions."""
        options = TranscriptionOptions(
            language="en",
            include_word_timestamps=True,
            enable_automatic_punctuation=True,
        )

        with patch(
            "builtins.open", mock_open(read_data=b"fake audio data")
        ), patch.object(
            openai_provider.client.audio.transcriptions,
            "create",
            return_value=mock_openai_response,
        ) as mock_create:
            result = openai_provider.audio.transcriptions.create(
                model="openai:whisper-1", file="test_audio.mp3", options=options
            )

            mock_create.assert_called_once()
            call_kwargs = mock_create.call_args.kwargs
            # Check that options parameters were extracted and passed as flat kwargs
            assert call_kwargs["language"] == "en"
            assert call_kwargs["include_word_timestamps"] is True
            assert call_kwargs["enable_automatic_punctuation"] is True
            assert isinstance(result, TranscriptionResult)
            assert result.text == "Hello, this is a test transcription."

    def test_audio_transcriptions_create_error_handling(self, openai_provider):
        """Test that a client exception surfaces as ``ASRError`` with its message."""
        with patch(
            "builtins.open", mock_open(read_data=b"fake audio data")
        ), patch.object(
            openai_provider.client.audio.transcriptions,
            "create",
            side_effect=Exception("API Error"),
        ):
            with pytest.raises(ASRError, match="OpenAI transcription error: API Error"):
                openai_provider.audio.transcriptions.create(
                    model="openai:whisper-1", file="test_audio.mp3"
                )

    @pytest.mark.asyncio
    async def test_audio_transcriptions_create_stream_output(self, openai_provider):
        """Test streaming audio transcription.

        The patched client returns a plain list of two events (a delta and a
        done event); the test expects one chunk per event, with ``is_final``
        set only on the done event's chunk.
        """
        # Mock streaming events
        mock_delta_event = MagicMock()
        mock_delta_event.type = "transcript.text.delta"
        mock_delta_event.delta = "Hello"

        mock_done_event = MagicMock()
        mock_done_event.type = "transcript.text.done"
        mock_done_event.text = "Hello world"

        with patch(
            "builtins.open", mock_open(read_data=b"fake audio data")
        ), patch.object(
            openai_provider.client.audio.transcriptions,
            "create",
            return_value=[mock_delta_event, mock_done_event],
        ):
            result = openai_provider.audio.transcriptions.create_stream_output(
                model="openai:gpt-4o-mini-transcribe", file="test_audio.mp3"
            )

            # Drain the async iterator while the patches are still active.
            chunks = []
            async for chunk in result:
                chunks.append(chunk)

            assert len(chunks) == 2
            assert isinstance(chunks[0], StreamingTranscriptionChunk)
            assert chunks[0].text == "Hello"
            assert chunks[0].is_final is False  # Delta event

            assert isinstance(chunks[1], StreamingTranscriptionChunk)
            assert chunks[1].text == "Hello world"
            assert chunks[1].is_final is True  # Done event

    @pytest.mark.asyncio
    async def test_timestamp_granularities_error_handling(self, openai_provider):
        """Test error handling for timestamp_granularities with incompatible response_format."""
        # ``response_format="json"`` combined with ``timestamp_granularities``
        # is the combination expected to be rejected.
        options = TranscriptionOptions(
            response_format="json",
            stream=True,
            timestamp_granularities=["word"],  # Now part of TranscriptionOptions
        )

        # The client call itself is not patched here; only ``open`` is.
        with patch("builtins.open", mock_open(read_data=b"fake audio data")):
            with pytest.raises(
                ASRError,
                match="timestamp_granularities requires response_format='verbose_json'",
            ):
                # The error should be raised before making the API call
                result = openai_provider.audio.transcriptions.create_stream_output(
                    model="openai:gpt-4o-mini-transcribe",
                    file="test_audio.mp3",
                    options=options,
                )
                # Consume the async generator to trigger the validation
                async for _ in result:
                    pass

    def test_parse_openai_response_with_segments_and_words(self, openai_provider):
        """Test parsing OpenAI response with segments and words."""
        mock_response = MagicMock()
        mock_response.text = "Hello world"
        mock_response.language = "en"

        # One segment with an empty ``words`` list.
        mock_segment = MagicMock()
        mock_segment.id = 0
        mock_segment.seek = 0
        mock_segment.start = 0.0
        mock_segment.end = 2.5
        mock_segment.text = "Hello world"
        mock_segment.words = []
        mock_response.segments = [mock_segment]

        result = openai_provider.audio.transcriptions._parse_openai_response(
            mock_response
        )

        assert result.text == "Hello world"
        assert len(result.segments) == 1
        assert isinstance(result.segments[0], Segment)

    def test_parse_openai_response_empty(self, openai_provider):
        """Test parsing response with minimal data (text and language, no segments)."""
        mock_response = MagicMock()
        mock_response.text = "Test"
        mock_response.language = "en"
        mock_response.segments = None

        result = openai_provider.audio.transcriptions._parse_openai_response(
            mock_response
        )

        assert result.text == "Test"
        assert result.language == "en"


================================================
FILE: tests/providers/test_sambanova_provider.py
================================================
from unittest.mock import MagicMock, patch

import pytest

from aisuite.providers.sambanova_provider import SambanovaProvider


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Export a placeholder ``SAMBANOVA_API_KEY`` for every test in this module."""
    placeholder_key = "test-api-key"
    monkeypatch.setenv("SAMBANOVA_API_KEY", placeholder_key)


def test_sambanova_provider():
    """Smoke test: the request reaches the client's ``create`` and the reply text is exposed.

    The client call is patched, so no network traffic happens; the test checks
    both the arguments forwarded to ``create`` and the content read back from
    ``response.choices[0].message.content``.
    """

    expected_reply = "mocked-text-response-from-model"
    request_kwargs = {
        "messages": [{"role": "user", "content": "Hello!"}],
        "model": "our-favorite-model",
        "temperature": 0.75,
    }

    provider = SambanovaProvider()

    # Stand-in for the SDK response object; only model_dump() is configured.
    sdk_response = MagicMock()
    sdk_response.model_dump.return_value = {
        "choices": [{"message": {"content": expected_reply, "role": "assistant"}}]
    }

    with patch.object(
        provider.client.chat.completions, "create", return_value=sdk_response
    ) as create_spy:
        response = provider.chat_completions_create(**request_kwargs)

        # The provider must pass the request through unchanged.
        create_spy.assert_called_with(**request_kwargs)

        assert response.choices[0].message.content == expected_reply


def test_sambanova_provider_with_usage():
    """Token usage included in the mocked response must surface on ``response.usage``."""

    expected_usage = {
        "prompt_tokens": 10,
        "completion_tokens": 20,
        "total_tokens": 30,
    }

    provider = SambanovaProvider()

    # Stand-in for the SDK response object; only model_dump() is configured.
    sdk_response = MagicMock()
    sdk_response.model_dump.return_value = {
        "choices": [
            {
                "message": {
                    "content": "mocked-text-response-from-model",
                    "role": "assistant",
                }
            }
        ],
        "usage": dict(expected_usage),
    }

    with patch.object(
        provider.client.chat.completions, "create", return_value=sdk_response
    ):
        response = provider.chat_completions_create(
            messages=[{"role": "user", "content": "Hello!"}],
            model="our-favorite-model",
            temperature=0.75,
        )

        usage = response.usage
        assert usage is not None
        assert usage.prompt_tokens == 10
        assert usage.completion_tokens == 20
        assert usage.total_tokens == 30


================================================
FILE: tests/providers/test_watsonx_provider.py
================================================
from unittest.mock import MagicMock, patch

import pytest

try:
    from ibm_watsonx_ai.metanames import GenChatParamsMetaNames as GenChatParams
except Exception as e:
    pytest.skip(f"Skipping test due to import error: {e}", allow_module_level=True)

from aisuite.providers.watsonx_provider import WatsonxProvider


@pytest.fixture(autouse=True)
def set_api_key_env_var(monkeypatch):
    """Autouse fixture: populate the three ``WATSONX_*`` variables with dummy values."""
    dummy_environment = {
        "WATSONX_SERVICE_URL": "https://watsonx-service-url.com",
        "WATSONX_API_KEY": "test-api-key",
        "WATSONX_PROJECT_ID": "test-project-id",
    }
    for variable, value in dummy_environment.items():
        monkeypatch.setenv(variable, value)


@pytest.mark.skip(reason="Skipping due to version compatibility issue on python 3.11")
def test_watsonx_provider():
    """Smoke test for WatsonxProvider with ``ModelInference`` patched out.

    Checks how ``ModelInference`` is constructed (model id, project id,
    credentials), how ``chat`` is invoked, and that the reply text is exposed
    on ``response.choices[0].message.content``.
    """

    conversation = [{"role": "user", "content": "Hello!"}]
    model_name = "our-favorite-model"
    temperature = 0.7
    expected_reply = "mocked-text-response-from-model"

    provider = WatsonxProvider()
    canned_reply = {"choices": [{"message": {"content": expected_reply}}]}

    with patch(
        "aisuite.providers.watsonx_provider.ModelInference"
    ) as inference_cls:
        # The object the provider gets back when it instantiates ModelInference.
        inference = MagicMock()
        inference.chat.return_value = canned_reply
        inference_cls.return_value = inference

        response = provider.chat_completions_create(
            messages=conversation,
            model=model_name,
            temperature=temperature,
        )

        # ModelInference must be built exactly once, for the requested model/project.
        inference_cls.assert_called_once()
        _, ctor_kwargs = inference_cls.call_args
        assert ctor_kwargs["model_id"] == model_name
        assert ctor_kwargs["project_id"] == provider.project_id

        # The credentials object must carry the provider's API key and service URL.
        creds = ctor_kwargs["credentials"]
        assert creds.api_key == provider.api_key
        assert creds.url == provider.service_url

        # chat() receives the untouched history plus the temperature parameter.
        inference.chat.assert_called_once_with(
            messages=conversation,
            params={GenChatParams.TEMPERATURE: temperature},
        )

        assert response.choices[0].message.content == expected_reply


================================================
FILE: tests/test_provider.py
================================================
"""Tests for base Provider class and ASRError."""

import pytest
from unittest.mock import MagicMock
from typing import Union, BinaryIO, Optional, AsyncGenerator

from aisuite.provider import Provider, ASRError, Audio
from aisuite.framework.message import (
    TranscriptionResult,
    TranscriptionOptions,
    StreamingTranscriptionChunk,
)


class MockProvider(Provider):
    """Smallest concrete Provider: chat only, nothing audio-related is set up."""

    def chat_completions_create(self, model, messages):
        """Ignore both arguments and return a fresh ``MagicMock`` as the response."""
        placeholder_response = MagicMock()
        return placeholder_response


class MockTranscription(Audio.Transcription):
    """Transcription stub that always produces the same canned result."""

    def create(
        self,
        model: str,
        file: Union[str, BinaryIO],
        options: Optional[TranscriptionOptions] = None,
        **kwargs,
    ) -> TranscriptionResult:
        """Return a fixed ``TranscriptionResult``; every argument is ignored."""
        canned_fields = {
            "text": "Mock transcription result",
            "language": "en",
            "confidence": 0.9,
        }
        return TranscriptionResult(**canned_fields)


class MockAudio(Audio):
    """Audio namespace whose ``transcriptions`` attribute is a ``MockTranscription``."""

    def __init__(self):
        # Run the base initializer first, then install the stub transcription.
        super().__init__()
        stub_transcription = MockTranscription()
        self.transcriptions = stub_transcription


class MockASRProvider(Provider):
    """Concrete Provider that exposes a ``MockAudio`` on its ``audio`` attribute."""

    def __init__(self):
        # Base initializer first; ``audio`` is assigned afterwards so the
        # MockAudio instance is what callers see.
        super().__init__()
        self.audio = MockAudio()

    def chat_completions_create(self, model, messages):
        """Ignore both arguments and return a fresh ``MagicMock`` as the response."""
        placeholder_response = MagicMock()
        return placeholder_response


class TestProvider:
    """Behavioral checks for the ``Provider`` base class and its ``Audio`` helpers."""

    def test_provider_is_abstract(self):
        """Instantiating ``Provider`` directly must raise ``TypeError``."""
        with pytest.raises(TypeError):
            Provider()

    def test_provider_without_audio_support(self):
        """A provider that never assigns ``audio`` reports it as ``None``."""
        chat_only = MockProvider()
        assert chat_only.audio is None

    def test_provider_asr_implementation_works(self):
        """A provider wiring in an Audio implementation can transcribe through it."""
        asr_provider = MockASRProvider()

        assert asr_provider.audio is not None
        assert hasattr(asr_provider.audio, "transcriptions")

        transcript = asr_provider.audio.transcriptions.create("model", "file.mp3")

        assert isinstance(transcript, TranscriptionResult)
        # The values below are the ones MockTranscription.create hard-codes.
        assert transcript.text == "Mock transcription result"
        assert transcript.language == "en"
        assert transcript.confidence == 0.9

    def test_transcription_base_class_not_implemented(self):
        """The un-overridden ``Audio.Transcription.create`` raises ``NotImplementedError``."""
        base_transcription = Audio.Transcription()

        with pytest.raises(NotImplementedError, match="Transcription not supported"):
            base_transcription.create("model", "file.mp3")

    def test_audio_base_class_initialization(self):
        """A bare ``Audio`` starts with ``transcriptions`` set to ``None``."""
        base_audio = Audio()
        assert base_audio.transcriptions is None


class TestASRError:
    """Checks that ``ASRError`` behaves like an ordinary exception type."""

    def test_asr_error_creation_and_inheritance(self):
        """The message round-trips through ``str`` and the type derives from ``Exception``."""
        message = "Test error message"
        err = ASRError(message)

        assert str(err) == "Test error message"
        assert isinstance(err, ASRError)
        assert isinstance(err, Exception)

    def test_asr_error_raising_and_catching(self):
        """``ASRError`` can be caught by its own type and by plain ``Exception``."""
        with pytest.raises(ASRError, match="Specific ASR error"):
            raise ASRError("Specific ASR error")

        # Catching via the generic base class must work as well.
        with pytest.raises(Exception):
            raise ASRError("Generic catch test")

    def test_asr_error_chaining(self):
        """``raise ... from`` records the original exception as ``__cause__``."""
        root_cause = ValueError("Original error")

        with pytest.raises(ASRError) as caught:
            try:
                raise root_cause
            except ValueError as exc:
                raise ASRError("Wrapped error") from exc

        assert caught.value.__cause__ == root_cause


================================================
FILE: tests/utils/test_mcp_memory_integration.py
================================================
"""
Integration test simulating the memory MCP server schema that was causing BadRequestError.

This test verifies that the fix for List[dict] schema conversion works correctly.
"""

import unittest
from aisuite.utils.tools import Tools


class MockMemoryMCPTool:
    """Callable stand-in for the memory server's ``create_entities`` MCP tool.

    Instances expose ``__name__``, ``__doc__`` and ``__mcp_input_schema__``;
    calling one reports how many entities were passed in.
    """

    def __init__(self):
        self.__name__ = "create_entities"
        self.__doc__ = "Create multiple entities in the knowledge graph"

        # Schema of a single entity: two strings plus a list of strings.
        entity_schema = {
            "type": "object",
            "properties": {
                "name": {
                    "type": "string",
                    "description": "The name of the entity",
                },
                "entityType": {
                    "type": "string",
                    "description": "The type of the entity",
                },
                "observations": {
                    "type": "array",
                    "description": "An array of observation contents",
                    "items": {"type": "string"},
                },
            },
            "required": ["name", "entityType", "observations"],
        }

        # Exact schema from the memory MCP server that used to trigger:
        # "Invalid schema for function 'create_entities': 'typing.List[dict]' is not valid"
        self.__mcp_input_schema__ = {
            "type": "object",
            "properties": {
                "entities": {
                    "type": "array",
                    "description": "List of entities to create",
                    "items": entity_schema,
                }
            },
            "required": ["entities"],
        }

    def __call__(self, **kwargs):
        """Pretend to create the entities and report how many were given."""
        entities = kwargs.get("entities", [])
        return {"created": len(entities), "status": "success"}


class TestMCPMemoryIntegration(unittest.TestCase):
    """Checks that the memory server's ``create_entities`` schema passes through ``Tools`` intact."""

    @staticmethod
    def _manager_with_memory_tool():
        """Return a fresh ``Tools`` instance with one ``MockMemoryMCPTool`` registered."""
        manager = Tools()
        # Registration itself used to raise for this schema; it must succeed now.
        manager._add_tool(MockMemoryMCPTool())
        return manager

    def test_memory_create_entities_schema(self):
        """The OpenAI-format spec keeps the array/object structure of the MCP schema."""
        specs = self._manager_with_memory_tool().tools()

        self.assertEqual(len(specs), 1)
        function_spec = specs[0]["function"]

        # Top-level shape expected by OpenAI.
        self.assertEqual(function_spec["name"], "create_entities")
        self.assertEqual(function_spec["parameters"]["type"], "object")
        self.assertIn("entities", function_spec["parameters"]["properties"])

        # The array type must survive as JSON Schema (not 'typing.List[dict]').
        entities = function_spec["parameters"]["properties"]["entities"]
        self.assertEqual(entities["type"], "array")
        self.assertIn("items", entities)
        self.assertEqual(entities["items"]["type"], "object")

        # The nested array (observations) must survive as well.
        nested = entities["items"]["properties"]["observations"]
        self.assertEqual(nested["type"], "array")
        self.assertEqual(nested["items"]["type"], "string")

    def test_memory_tool_openai_format_validation(self):
        """The serialized parameters contain JSON Schema types and no Python type strings."""
        import json

        specs = self._manager_with_memory_tool().tools()
        serialized = json.dumps(specs[0]["function"]["parameters"])

        # Fragments of Python type reprs must NOT leak into the schema.
        for python_type_marker in ("typing.", "List[", "Dict["):
            self.assertNotIn(python_type_marker, serialized)

        # The valid JSON Schema type declarations must be present.
        for json_schema_type in ("array", "object", "string"):
            self.assertIn(f'"type": "{json_schema_type}"', serialized)

    def test_memory_tool_execution(self):
        """A tool call carrying two entities executes and reports both as created."""
        manager = self._manager_with_memory_tool()

        # Arguments the LLM would supply for create_entities.
        arguments = {
            "entities": [
                {
                    "name": "MCP",
                    "entityType": "Protocol",
                    "observations": [
                        "Enables LLM tool calling",
                        "Uses JSON Schema",
                    ],
                },
                {
                    "name": "aisuite",
                    "entityType": "Library",
                    "observations": ["Unified API", "Multi-provider support"],
                },
            ]
        }
        simulated_call = {
            "id": "call_123",
            "function": {"name": "create_entities", "arguments": arguments},
        }

        # Execution must complete without raising.
        outcomes, _messages = manager.execute_tool(simulated_call)

        self.assertEqual(len(outcomes), 1)
        first = outcomes[0]
        self.assertEqual(first["created"], 2)
        self.assertEqual(first["status"], "success")


# Allow running this test module directly as a script via unittest's runner.
if __name__ == "__main__":
    unittest.main()


================================================
FILE: tests/utils/test_tool_manager.py
================================================
import unittest
from pydantic import BaseModel
from typing import Dict
from aisuite.utils.tools import Tools  # Import your ToolManager class
from enum import Enum


# Define a sample tool function and Pydantic model for testing
class TemperatureUnit(str, Enum):
    # Closed set of unit names; the str mixin makes every member a string too.
    # Documented with comments rather than a docstring so the class __doc__
    # stays exactly as it was.
    CELSIUS = "Celsius"
    FAHRENHEIT = "Fahrenheit"


class TemperatureParamsV2(BaseModel):
    # Parameter model registered together with get_current_temperature_v2:
    # same two fields as TemperatureParams, but `unit` is a TemperatureUnit.
    # Documented with comments (not a docstring) to leave __doc__ untouched.
    location: str  # no default, so it is required
    unit: TemperatureUnit = TemperatureUnit.CELSIUS  # defaults to Celsius


class TemperatureParams(BaseModel):
    # Parameter model registered together with get_current_temperature.
    # Documented with comments (not a docstring) to leave __doc__ untouched.
    location: str  # no default, so it is required
    unit: str = "Celsius"  # free-form unit name, defaults to "Celsius"


def get_current_temperature(location: str, unit: str = "Celsius") -> Dict[str, str]:
    """Gets the current temperature for a specific location and unit."""
    # The docstring above is asserted verbatim as the tool description by the
    # tests in this module, so it must not be reworded.
    # The temperature is a fixed sample value; location and unit echo the inputs.
    reading = dict(location=location, unit=unit, temperature="72")
    return reading


def missing_annotation_tool(location, unit="Celsius"):
    """Tool function without type annotations."""
    # Deliberately left unannotated: the tests in this module use it to check
    # that registering such a function is rejected.
    reading = dict(location=location, unit=unit, temperature="72")
    return reading


def get_current_temperature_v2(
    location: str, unit: TemperatureUnit = TemperatureUnit.CELSIUS
) -> Dict[str, str]:
    """Gets the current temperature for a specific location and unit (with enum support)."""
    # The docstring above is asserted verbatim as the tool description by the
    # tests in this module, so it must not be reworded.
    # The temperature is a fixed sample value; location and unit echo the inputs.
    reading = dict(location=location, unit=unit, temperature="72")
    return reading


class TestToolManager(unittest.TestCase):
    """Tests for registering tools with ``Tools`` and executing tool calls.

    Covers three registration paths (explicit Pydantic model, signature
    inference, enum-typed parameter), rejection of unannotated functions, and
    execution with valid and invalid arguments.
    """

    # Expected tool specs are large nested structures; show the complete diff
    # when one does not match instead of a truncated one.
    maxDiff = None

    def setUp(self):
        """Give every test its own empty ``Tools`` registry."""
        self.tool_manager = Tools()

    def test_add_tool_with_pydantic_model(self):
        """Test adding a tool with an explicit Pydantic model."""
        self.tool_manager._add_tool(get_current_temperature, TemperatureParams)

        expected_tool_spec = [
            {
                "type": "function",
                "function": {
                    "name": "get_current_temperature",
                    "description": "Gets the current temperature for a specific location and unit.",
                    "parameters": {
                        "type": "object",
                        "properties": {
                            "location": {
                                "type": "string",
                                "description": "",
                            },
                            "unit": {
                                "type": "string",
                                "description": "",
                                "default": "Celsius",
                            },
                        },
                        "required": ["location"],
                    },
                },
            }
        ]

        tools = self.tool_manager.tools()
        self.assertIn(
            "get_current_temperature", [tool["function"]["name"] for tool in tools]
        )
        # assertEqual (rather than a bare assert) still runs under `python -O`
        # and reports a structured diff on mismatch.
        self.assertEqual(tools, expected_tool_spec)

    def test_add_tool_with_signature_inference(self):
        """Test adding a tool and inferring parameters from the function signature."""
        self.tool_manager._add_tool(get_current_temperature)
        # Expected output from tool_manager.tools() when called with OpenAI format
        expected_tool_spec = [
            {
                "type": "function",
                "function": {
                    "name": "get_current_temperature",
                    "description": "Gets the current temperature for a specific location and unit.",
                    "parameters": {
                        "type": "object",
                        "properties": {
                            "location": {
                                "type": "string",
                                "description": "",  # No description provided in function signature
                            },
                            "unit": {
                                "type": "string",
                                "description": "",
                                "default": "Celsius",
                            },
                        },
                        "required": ["location"],
                    },
                },
            }
        ]
        tools = self.tool_manager.tools()
        self.assertIn(
            "get_current_temperature", [tool["function"]["name"] for tool in tools]
        )
        self.assertEqual(tools, expected_tool_spec)

    def test_add_tool_missing_annotation_raises_exception(self):
        """Test that adding a tool with missing type annotations raises a TypeError."""
        with self.assertRaises(TypeError):
            self.tool_manager._add_tool(missing_annotation_tool)

    def test_execute_tool_valid_parameters(self):
        """Test executing a registered tool with valid parameters."""
        self.tool_manager._add_tool(get_current_temperature, TemperatureParams)
        tool_call = {
            "id": "call_1",
            "function": {
                "name": "get_current_temperature",
                "arguments": {"location": "San Francisco", "unit": "Celsius"},
            },
        }
        # The second element of the returned pair is not inspected here.
        result, _ = self.tool_manager.execute_tool(tool_call)

        # Assuming result is returned as a list with a single dictionary
        result_dict = result[0] if isinstance(result, list) else result

        # Check that the result matches expected output
        self.assertEqual(result_dict["location"], "San Francisco")
        self.assertEqual(result_dict["unit"], "Celsius")
        self.assertEqual(result_dict["temperature"], "72")

    def test_execute_tool_invalid_parameters(self):
        """Test that executing a tool with invalid parameters raises a ValueError."""
        self.tool_manager._add_tool(get_current_temperature, TemperatureParams)
        tool_call = {
            "id": "call_1",
            "function": {
                "name": "get_current_temperature",
                "arguments": {"location": 123},  # Invalid type for location
            },
        }

        with self.assertRaises(ValueError) as context:
            self.tool_manager.execute_tool(tool_call)

        # Verify the error message contains information about the validation error
        self.assertIn(
            "Error in tool 'get_current_temperature' parameters", str(context.exception)
        )

    def test_add_tool_with_enum(self):
        """Test adding a tool with an enum parameter."""
        self.tool_manager._add_tool(get_current_temperature_v2, TemperatureParamsV2)

        expected_tool_spec = [
            {
                "type": "function",
                "function": {
                    "name": "get_current_temperature_v2",
                    "description": "Gets the current temperature for a specific location and unit (with enum support).",
                    "parameters": {
                        "type": "object",
                        "properties": {
                            "location": {
                                "type": "string",
                                "description": "",
                            },
                            "unit": {
                                "type": "string",
                                "enum": ["Celsius", "Fahrenheit"],
                                "description": "",
                                "default": "Celsius",
                            },
                        },
                        "required": ["location"],
                    },
                },
            }
        ]

        tools = self.tool_manager.tools()
        self.assertEqual(tools, expected_tool_spec)


# Allow running this test module directly as a script via unittest's runner.
if __name__ == "__main__":
    unittest.main()


================================================
FILE: tests/utils/test_tools_mcp_schema.py
================================================
import unittest
from typing import Dict, Any, List
from aisuite.utils.tools import Tools


class MockMCPToolWrapper:
    """Configurable callable that mimics an MCP tool wrapper.

    The name, description and input schema given to the constructor are stored
    on the instance as ``__name__``, ``__doc__`` and ``__mcp_input_schema__``.
    """

    def __init__(self, name: str, description: str, input_schema: Dict[str, Any]):
        # The schema object is stored as-is (no copy is made).
        metadata = (
            ("__name__", name),
            ("__doc__", description),
            ("__mcp_input_schema__", input_schema),
        )
        for attribute, value in metadata:
            setattr(self, attribute, value)

    def __call__(self, **kwargs):
        """Pretend to run the tool: echo the keyword arguments back with a success marker."""
        return dict(result="success", args=kwargs)


class TestToolsMCPSchema(unittest.TestCase):
    """Test suite for MCP schema handling in Tools class."""

    def setUp(self):
        """Create a fresh, empty ``Tools`` registry on ``self.tool_manager`` before each test."""
        self.tool_manager = Tools()

    def test_mcp_tool_with_simple_types(self):
        """A flat schema of string/integer/boolean properties must come back unchanged."""
        schema = {
            "type": "object",
            "properties": {
                "name": {"type": "string", "description": "User name"},
                "age": {"type": "integer", "description": "User age"},
                "active": {"type": "boolean", "description": "Is active"},
            },
            "required": ["name"],
        }

        wrapper = MockMCPToolWrapper("test_simple", "A simple test tool", schema)
        self.tool_manager._add_tool(wrapper)

        registered = self.tool_manager.tools()
        self.assertEqual(len(registered), 1)

        # Name, description and parameters must mirror what the wrapper carried.
        function_spec = registered[0]["function"]
        expected_fields = (
            ("name", "test_simple"),
            ("description", "A simple test tool"),
            ("parameters", schema),
        )
        for field, expected in expected_fields:
            self.assertEqual(function_spec[field], expected)

    def test_mcp_tool_with_array_of_objects(self):
        """An array-of-objects property keeps its ``array`` type and ``object`` items."""
        entity_item = {
            "type": "object",
            "properties": {
                "name": {"type": "string"},
                "type": {"type": "string"},
            },
            "required": ["name", "type"],
        }
        schema = {
            "type": "object",
            "properties": {
                "entities": {
                    "type": "array",
                    "items": entity_item,
                    "description": "List of entities to create",
                }
            },
            "required": ["entities"],
        }

        wrapper = MockMCPToolWrapper(
            "create_entities", "Create multiple entities", schema
        )
        self.tool_manager._add_tool(wrapper)

        function_spec = self.tool_manager.tools()[0]["function"]

        # The complex array schema must be preserved.
        entities = function_spec["parameters"]["properties"]["entities"]
        self.assertEqual(entities["type"], "array")
        self.assertIn("items", entities)
        self.assertEqual(entities["items"]["type"], "object")

    def test_mcp_tool_with_nested_objects(self):
        """An object nested inside another object must come back unchanged."""
        address_schema = {
            "type": "object",
            "properties": {
                "street": {"type": "string"},
                "city": {"type": "string"},
            },
        }
        schema = {
            "type": "object",
            "properties": {
                "user": {
                    "type": "object",
                    "properties": {
                        "name": {"type": "string"},
                        "address": address_schema,
                    },
                }
            },
            "required": ["user"],
        }

        wrapper = MockMCPToolWrapper("create_user", "Create user with address", schema)
        self.tool_manager._add_tool(wrapper)

        function_spec = self.tool_manager.tools()[0]["function"]

        # The whole structure is compared, then the innermost level is spot-checked.
        self.assertEqual(function_spec["parameters"], schema)
        user_properties = function_spec["parameters"]["properties"]["user"]["properties"]
        self.assertIn("address", user_properties)

    def test_mcp_tool_with_array_of_strings(self):
        """An array-of-strings property keeps its ``array`` type and ``string`` items."""
        schema = {
            "type": "object",
            "properties": {
                "tags": {
                    "type": "array",
                    "items": {"type": "string"},
                    "description": "List of tags",
                }
            },
            "required": ["tags"],
        }

        wrapper = MockMCPToolWrapper("add_tags", "Add tags to item", schema)
        self.tool_manager._add_tool(wrapper)

        function_spec = self.tool_manager.tools()[0]["function"]

        # The array of strings must be preserved.
        tags = function_spec["parameters"]["properties"]["tags"]
        self.assertEqual(tags["type"], "array")
        self.assertEqual(tags["items"]["type"], "string")

    def test_mcp_tool_detection(self):
        """The wrapper exposes ``__mcp_input_schema__``, the marker MCP tools are detected by."""
        schema = {
            "type": "object",
            "properties": {"param": {"type": "string"}},
            "required": ["param"],
        }

        wrapper = MockMCPToolWrapper("mcp_tool", "An MCP tool", schema)

        # The attribute must exist and hold the schema that was passed in.
        has_marker = hasattr(wrapper, "__mcp_input_schema__")
        self.assertTrue(has_marker)
        self.assertEqual(wrapper.__mcp_input_schema__, schema)

    def test_mcp_tool_with_optional_parameters(self):
        """Required and optional properties both survive; ``required`` lists only the former."""
        schema = {
            "type": "object",
            "properties": {
                "required_param": {
                    "type": "string",
                    "description": "Required parameter",
                },
                "optional_param": {
                    "type": "integer",
                    "description": "Optional parameter",
                },
            },
            "required": ["required_param"],
        }

        wrapper = MockMCPToolWrapper("mixed_params", "Tool with mixed params", schema)
        self.tool_manager._add_tool(wrapper)

        function_spec = self.tool_manager.tools()[0]["function"]

        # Only the required parameter is listed, but both are declared.
        self.assertEqual(function_spec["parameters"]["required"], ["required_param"])
        for property_name in ("required_param", "optional_param"):
            self.assertIn(property_name, function_spec["parameters"]["properties"])

    def test_mcp_schema_preserves_additional_fields(self):
        """Extra JSON Schema keywords (``enum``, ``format``, ``minimum``/``maximum``) are kept."""
        schema = {
            "type": "object",
            "properties": {
                "status": {
                    "type": "string",
                    "enum": ["active", "inactive", "pending"],
                    "description": "Status value",
                },
                "email": {
                    "type": "string",
                    "format": "email",
                    "description": "Email address",
                },
                "count": {
                    "type": "integer",
                    "minimum": 0,
                    "maximum": 100,
                    "description": "Count value",
                },
            },
            "required": ["status"],
        }

        wrapper = MockMCPToolWrapper(
            "advanced_schema", "Tool with advanced schema", schema
        )
        self.tool_manager._add_tool(wrapper)

        function_spec = self.tool_manager.tools()[0]["function"]

        # enum must be present with its original values
        status = function_spec["parameters"]["properties"]["status"]
        self.assertIn("enum", status)
        self.assertEqual(status["enum"], ["active", "inactive", "pending"])

        # format must be present with its original value
        email = function_spec["parameters"]["properties"]["email"]
        self.assertIn("format", email)
        self.assertEqual(email["format"], "email")

        # both numeric bounds must be present
        count = function_spec["parameters"]["properties"]["count"]
        for bound in ("minimum", "maximum"):
            self.assertIn(bound, count)

    def test_mcp_tool_execution_with_validation(self):
        """A registered MCP tool can be executed with arguments matching its schema."""
        schema = {
            "type": "object",
            "properties": {
                "name": {"type": "string", "description": "Name"},
                "count": {"type": "integer", "description": "Count"},
            },
            "required": ["name"],
        }

        wrapper = MockMCPToolWrapper(
            "validate_tool", "Tool for validation test", schema
        )
        self.tool_manager._add_tool(wrapper)

        # A well-formed call: both arguments match the declared types.
        valid_call = {
            "id": "call_1",
            "function": {
                "name": "validate_tool",
                "arguments": {"name": "test", "count": 5},
            },
        }

        outcomes, _messages = self.tool_manager.execute_tool(valid_call)
        self.assertEqual(len(outcomes), 1)
        self.assertIn("result", outcomes[0])

    def test_mcp_tool_with_empty_schema(self):
        """An MCP tool declaring no parameters exposes empty properties/required."""
        empty_schema = {"type": "object", "properties": {}, "required": []}
        self.tool_manager._add_tool(
            MockMCPToolWrapper("no_params", "Tool with no params", empty_schema)
        )

        # The tool registered above is read back as the first listed entry.
        listed = self.tool_manager.tools()
        parameters = listed[0]["function"]["parameters"]

        self.assertEqual(parameters["properties"], {})
        self.assertEqual(parameters["required"], [])

    def test_multiple_mcp_tools(self):
        """Register two MCP tools and check that both show up in tools()."""
        definitions = [
            (
                "tool1",
                "First tool",
                {
                    "type": "object",
                    "properties": {"param1": {"type": "string"}},
                    "required": ["param1"],
                },
            ),
            (
                "tool2",
                "Second tool",
                {
                    "type": "object",
                    "properties": {"param2": {"type": "integer"}},
                    "required": ["param2"],
                },
            ),
        ]

        # Build every wrapper first, then register them in declaration order.
        wrappers = [
            MockMCPToolWrapper(name, description, schema)
            for name, description, schema in definitions
        ]
        for wrapper in wrappers:
            self.tool_manager._add_tool(wrapper)

        listed = self.tool_manager.tools()
        self.assertEqual(len(listed), 2)

        listed_names = [entry["function"]["name"] for entry in listed]
        for expected_name in ("tool1", "tool2"):
            self.assertIn(expected_name, listed_names)

    def test_mcp_tool_schema_not_modified(self):
        """Registering an MCP tool must leave the supplied schema dict unchanged."""
        import copy

        item_schema = {
            "type": "object",
            "properties": {"key": {"type": "string"}},
        }
        original_schema = {
            "type": "object",
            "properties": {"data": {"type": "array", "items": item_schema}},
            "required": ["data"],
        }

        # Deep snapshot taken before registration, so nested edits would be
        # detected as well as top-level ones.
        snapshot = copy.deepcopy(original_schema)

        self.tool_manager._add_tool(
            MockMCPToolWrapper("immutable_tool", "Test immutability", original_schema)
        )

        self.assertEqual(original_schema, snapshot)

    def test_backward_compatibility_non_mcp_tools(self):
        """A plain Python callable (no MCP schema attribute) can still be registered."""

        def regular_function(name: str, age: int = 25) -> Dict[str, Any]:
            """A regular Python function."""
            return {"name": name, "age": age}

        # Sanity check: the callable carries no MCP schema marker.
        carries_mcp_schema = hasattr(regular_function, "__mcp_input_schema__")
        self.assertFalse(carries_mcp_schema)

        # Registration goes through the same entry point used for MCP tools.
        self.tool_manager._add_tool(regular_function)

        listed = self.tool_manager.tools()
        self.assertEqual(len(listed), 1)
        listed_name = listed[0]["function"]["name"]
        self.assertEqual(listed_name, "regular_function")


# Run the tests in this module when the file is executed directly as a script.
if __name__ == "__main__":
    unittest.main()