diff --git a/flo_ai/flo_ai/arium/builder.py b/flo_ai/flo_ai/arium/builder.py
index 633d59d6..5f0c3b60 100644
--- a/flo_ai/flo_ai/arium/builder.py
+++ b/flo_ai/flo_ai/arium/builder.py
@@ -341,7 +341,7 @@ def from_yaml(
 
             # Method 4: External file reference
             elif 'yaml_file' in agent_config:
-                agent_builder = AgentBuilder.from_yaml(
+                agent_builder: AgentBuilder = AgentBuilder.from_yaml(
                     yaml_file=agent_config['yaml_file'], base_llm=base_llm
                 )
                 agent = agent_builder.build()
@@ -648,10 +648,8 @@ def _create_agent_from_direct_config(
                         f'Available: {list(available_tools.keys())}'
                     )
 
-        # Extract output schema if present
-        output_schema = agent_config.get('output_schema')
-
         # Handle parser configuration if present
+        output_schema = None
         if 'parser' in agent_config:
             from flo_ai.formatter.yaml_format_parser import FloYamlParser
 
@@ -660,16 +658,17 @@ def _create_agent_from_direct_config(
             parser = FloYamlParser.create(yaml_dict=parser_config)
             output_schema = parser.get_format()
 
-        # Create and return the agent
-        agent = Agent(
-            name=name,
-            system_prompt=job,
-            llm=llm,
-            tools=agent_tools,
-            max_retries=max_retries,
-            reasoning_pattern=reasoning_pattern,
-            output_schema=output_schema,
-            role=role,
+        agent = (
+            AgentBuilder()
+            .with_name(name)
+            .with_prompt(job)
+            .with_llm(llm)
+            .with_tools(agent_tools)
+            .with_retries(max_retries)
+            .with_reasoning(reasoning_pattern)
+            .with_output_schema(output_schema)
+            .with_role(role)
+            .build()
         )
 
         return agent
diff --git a/flo_ai/flo_ai/llm/anthropic_llm.py b/flo_ai/flo_ai/llm/anthropic_llm.py
index 74685397..05c45cf1 100644
--- a/flo_ai/flo_ai/llm/anthropic_llm.py
+++ b/flo_ai/flo_ai/llm/anthropic_llm.py
@@ -49,7 +49,6 @@ async def generate(
                 'model': self.model,
                 'messages': conversation,
                 'temperature': self.temperature,
-                'max_tokens': 8192,
                 **self.kwargs,
             }
 
diff --git a/flo_ai/flo_ai/llm/gemini_llm.py b/flo_ai/flo_ai/llm/gemini_llm.py
index 89151ff0..6b3f2550 100644
--- a/flo_ai/flo_ai/llm/gemini_llm.py
+++ b/flo_ai/flo_ai/llm/gemini_llm.py
@@ -1,9 +1,8 @@
 from typing import Dict, Any, List, Optional
 from google import genai
-import json
+from google.genai import types
 from .base_llm import BaseLLM, ImageMessage
 from flo_ai.tool.base_tool import Tool
-from flo_ai.utils.logger import logger
 
 
 class Gemini(BaseLLM):
@@ -27,9 +26,9 @@ async def generate(
         output_schema: Optional[Dict[str, Any]] = None,
     ) -> Dict[str, Any]:
         # Convert messages to Gemini format
-        # Gemini uses a simple content string format
         contents = []
         system_prompt = ''
+
         for msg in messages:
             role = msg['role']
             message_content = msg['content']
@@ -39,80 +38,57 @@ async def generate(
             else:
                 contents.append(message_content)
 
-        # Add output schema instruction if provided
-        if output_schema:
-            contents += f'\nPlease provide your response in JSON format according to this schema:\n{json.dumps(output_schema, indent=2)}\n'
-
-        # Add function information if provided
-        if functions:
-            contents += f'\nAvailable functions:\n{json.dumps(functions, indent=2)}\n'
-
         try:
             # Prepare generation config
-            generation_config = genai.types.GenerateContentConfig(
+            generation_config = types.GenerateContentConfig(
                 temperature=self.temperature,
                 system_instruction=system_prompt,
                 **self.kwargs,
             )
 
+            # Add tools if functions are provided
+            if functions:
+                tools = types.Tool(function_declarations=functions)
+                generation_config.tools = [tools]
+
+            # Add structured output configuration if output_schema is provided
+            if output_schema:
+                generation_config.response_mime_type = 'application/json'
+                generation_config.response_schema = output_schema
+
             # Make the API call
             response = self.client.models.generate_content(
                 model=self.model,
                 contents=contents,
-                config=generation_config if generation_config else None,
+                config=generation_config,
             )
 
-            # Check if response contains function call information
-            # For now, we'll assume text response and parse for function calls if needed
-            response_text = (
-                response.text if hasattr(response, 'text') else str(response)
-            )
-
-            # Try to detect function calls in the response
-            # This is a simple implementation - in practice, you might need more sophisticated parsing
-            if functions and self._is_function_call_response(response_text):
-                function_call = self._parse_function_call(response_text)
-                if function_call:
+            # Check for function call in the response
+            if (
+                functions
+                and response.candidates
+                and response.candidates[0].content.parts
+            ):
+                part = response.candidates[0].content.parts[0]
+                if hasattr(part, 'function_call') and part.function_call:
+                    function_call = part.function_call
                     return {
-                        'content': response_text,
-                        'function_call': function_call,
+                        'content': response.text,
+                        'function_call': {
+                            'name': function_call.name,
+                            'arguments': function_call.args,
+                        },
                     }
 
+            # Return regular text response
+            response_text = (
+                response.text if hasattr(response, 'text') else str(response)
+            )
             return {'content': response_text}
 
         except Exception as e:
             raise Exception(f'Error in Gemini API call: {str(e)}')
 
-    def _is_function_call_response(self, response_text: str) -> bool:
-        """Check if the response contains a function call"""
-        # Simple heuristic - look for function call patterns
-        return (
-            'function_call' in response_text.lower()
-            or '(' in response_text
-            and ')' in response_text
-        )
-
-    def _parse_function_call(self, response_text: str) -> Optional[Dict[str, Any]]:
-        """Parse function call from response text"""
-        # This is a simplified parser - in practice, you'd want more robust parsing
-        try:
-            # Look for JSON-like function call structure
-            if '{' in response_text and '}' in response_text:
-                # Extract JSON-like content
-                start = response_text.find('{')
-                end = response_text.rfind('}') + 1
-                json_str = response_text[start:end]
-                parsed = json.loads(json_str)
-
-                if 'name' in parsed and 'arguments' in parsed:
-                    return {
-                        'name': parsed['name'],
-                        'arguments': json.dumps(parsed['arguments']),
-                    }
-        except Exception as e:
-            logger.error(f'Error parsing function call: {str(e)}')
-        return None
-
     def get_message_content(self, response: Any) -> str:
         """Extract message content from response"""
         if isinstance(response, dict):
@@ -120,7 +96,7 @@ def get_message_content(self, response: Any) -> str:
         return str(response)
 
     def format_tool_for_llm(self, tool: 'Tool') -> Dict[str, Any]:
-        """Format a single tool for Gemini's API"""
+        """Format a single tool for Gemini's function declarations"""
         return {
             'name': tool.name,
             'description': tool.description,
@@ -142,7 +118,7 @@ def format_tool_for_llm(self, tool: 'Tool') -> Dict[str, Any]:
         }
 
     def format_tools_for_llm(self, tools: List['Tool']) -> List[Dict[str, Any]]:
-        """Format tools for Gemini's API"""
+        """Format tools for Gemini's function declarations"""
         return [self.format_tool_for_llm(tool) for tool in tools]
 
     def format_image_in_message(self, image: ImageMessage) -> str:
@@ -150,12 +126,12 @@ def format_image_in_message(self, image: ImageMessage) -> str:
         if image.image_file_path:
             with open(image.image_file_path, 'rb') as image_file:
                 image_bytes = image_file.read()
-            return genai.types.Part.from_bytes(
+            return types.Part.from_bytes(
                 data=image_bytes,
                 mime_type=image.mime_type,
             )
         elif image.image_bytes:
-            return genai.types.Part.from_bytes(
+            return types.Part.from_bytes(
                 data=image.image_bytes,
                 mime_type=image.mime_type,
             )
diff --git a/flo_ai/flo_ai/llm/openai_llm.py b/flo_ai/flo_ai/llm/openai_llm.py
index c1dfc24a..6c823bb3 100644
--- a/flo_ai/flo_ai/llm/openai_llm.py
+++ b/flo_ai/flo_ai/llm/openai_llm.py
@@ -7,7 +7,7 @@
 class OpenAI(BaseLLM):
     def __init__(
         self,
-        model='gpt-40-mini',
+        model='gpt-4o-mini',
         api_key: str = None,
         temperature: float = 0.7,
         base_url: str = None,
@@ -53,6 +53,7 @@ async def generate(
         openai_kwargs = {
             'model': self.model,
             'messages': messages,
+            'temperature': self.temperature,
             **kwargs,
             **self.kwargs,
         }
diff --git a/flo_ai/flo_ai/llm/openai_vllm.py b/flo_ai/flo_ai/llm/openai_vllm.py
index 78f071fa..eb4a7c0b 100644
--- a/flo_ai/flo_ai/llm/openai_vllm.py
+++ b/flo_ai/flo_ai/llm/openai_vllm.py
@@ -18,6 +18,8 @@ def __init__(
             base_url=base_url,
             **kwargs,
         )
+        # Store base_url attribute
+        self.base_url = base_url
 
     # overriden
     async def generate(
@@ -41,6 +43,7 @@ async def generate(
                 )
             else:
                 messages.insert(
+                    0,
                     {
                         'role': 'system',
                         'content': f'Please provide your response in JSON format according to the specified schema.\n \n {output_schema}',
diff --git a/flo_ai/flo_ai/llm/vertexai_llm.py b/flo_ai/flo_ai/llm/vertexai_llm.py
index 2f1c883c..f4d92527 100644
--- a/flo_ai/flo_ai/llm/vertexai_llm.py
+++ b/flo_ai/flo_ai/llm/vertexai_llm.py
@@ -17,5 +17,10 @@ def __init__(
     ):
         # Initialize only the BaseLLM part to avoid Gemini's client creation
         BaseLLM.__init__(self, model, api_key, temperature, **kwargs)
+
+        # Store project and location attributes
+        self.project = project
+        self.location = location
+
         # Create VertexAI-specific client
         self.client = genai.Client(project=project, location=location, vertexai=True)
diff --git a/flo_ai/pyproject.toml b/flo_ai/pyproject.toml
index 18f45454..36c01e58 100644
--- a/flo_ai/pyproject.toml
+++ b/flo_ai/pyproject.toml
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "flo_ai"
-version = "1.0.0"
+version = "1.0.1-dev1"
 description = "A easy way to create structured AI agents"
 authors = ["rootflo <*@rootflo.ai>"]
 license = "MIT"
diff --git a/flo_ai/setup.py b/flo_ai/setup.py
index 0e7e702e..d1e72c9c 100644
--- a/flo_ai/setup.py
+++ b/flo_ai/setup.py
@@ -5,7 +5,7 @@
 
 setuptools.setup(
     name='flo-ai',
-    version='1.0.0',
+    version='1.0.1-dev1',
     author='Rootflo',
     description='Create composable AI agents',
     long_description=long_description,
diff --git a/flo_ai/tests/run_llm_tests.py b/flo_ai/tests/run_llm_tests.py
new file mode 100644
index 00000000..5e5a5c5d
--- /dev/null
+++ b/flo_ai/tests/run_llm_tests.py
@@ -0,0 +1,164 @@
+#!/usr/bin/env python3
+"""
+Test runner script for all LLM tests in the Flo AI framework.
+This script runs comprehensive tests for all LLM implementations.
+"""
+
+import sys
+import os
+import subprocess
+import time
+
+# Add the flo_ai directory to the path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), '..'))
+
+
+def run_tests_for_llm(test_file, llm_name):
+    """Run tests for a specific LLM implementation."""
+    print(f"\n{'='*60}")
+    print(f'🧪 Running tests for {llm_name}')
+    print(f"{'='*60}")
+
+    start_time = time.time()
+
+    try:
+        # Run pytest for the specific test file
+        result = subprocess.run(
+            [
+                sys.executable,
+                '-m',
+                'pytest',
+                test_file,
+                '-v',  # Verbose output
+                '--tb=short',  # Short traceback format
+                '--color=yes',  # Colored output
+            ],
+            capture_output=True,
+            text=True,
+            cwd=os.path.dirname(__file__),
+        )
+
+        end_time = time.time()
+        duration = end_time - start_time
+
+        if result.returncode == 0:
+            print(f'✅ {llm_name} tests PASSED in {duration:.2f}s')
+            print('📊 Output:')
+            print(result.stdout)
+        else:
+            print(f'❌ {llm_name} tests FAILED in {duration:.2f}s')
+            print('📊 Output:')
+            print(result.stdout)
+            print('🚨 Errors:')
+            print(result.stderr)
+
+        return result.returncode == 0, duration
+
+    except Exception as e:
+        print(f'💥 Error running {llm_name} tests: {e}')
+        return False, 0
+
+
+def run_all_llm_tests():
+    """Run all LLM tests and provide a summary."""
+    print('🚀 Starting comprehensive LLM test suite for Flo AI')
+    print(f'📁 Test directory: {os.path.dirname(__file__)}')
+    print(f'🐍 Python executable: {sys.executable}')
+
+    # Define all LLM test files
+    test_files = [
+        ('test_base_llm.py', 'BaseLLM & ImageMessage'),
+        ('test_openai_llm.py', 'OpenAI LLM'),
+        ('test_anthropic_llm.py', 'Anthropic Claude LLM'),
+        ('test_gemini_llm.py', 'Google Gemini LLM'),
+        ('test_ollama_llm.py', 'Ollama LLM'),
+        ('test_vertexai_llm.py', 'Google VertexAI LLM'),
+        ('test_openai_vllm.py', 'OpenAI VLLM'),
+    ]
+
+    results = []
+    total_tests = 0
+    passed_tests = 0
+    total_duration = 0
+
+    for test_file, llm_name in test_files:
+        test_path = os.path.join(os.path.dirname(__file__), test_file)
+
+        if not os.path.exists(test_path):
+            print(f'⚠️  Test file not found: {test_file}')
+            continue
+
+        success, duration = run_tests_for_llm(test_path, llm_name)
+        results.append((llm_name, success, duration))
+
+        if success:
+            passed_tests += 1
+        total_tests += 1
+        total_duration += duration
+
+    # Print summary
+    print(f"\n{'='*60}")
+    print('📋 TEST SUMMARY')
+    print(f"{'='*60}")
+
+    for llm_name, success, duration in results:
+        status = '✅ PASSED' if success else '❌ FAILED'
+        print(f'{llm_name:<25} {status:<10} {duration:>8.2f}s')
+
+    print('\n📊 Overall Results:')
+    print(f'   Total LLM implementations: {total_tests}')
+    print(f'   Passed: {passed_tests}')
+    print(f'   Failed: {total_tests - passed_tests}')
+    print(f'   Success rate: {(passed_tests/total_tests)*100:.1f}%')
+    print(f'   Total test time: {total_duration:.2f}s')
+
+    if passed_tests == total_tests:
+        print('\n🎉 All LLM tests passed successfully!')
+        return 0
+    else:
+        print('\n⚠️  Some LLM tests failed. Please check the output above.')
+        return 1
+
+
+def run_specific_llm_test(llm_name):
+    """Run tests for a specific LLM implementation."""
+    test_mapping = {
+        'base': 'test_base_llm.py',
+        'openai': 'test_openai_llm.py',
+        'anthropic': 'test_anthropic_llm.py',
+        'gemini': 'test_gemini_llm.py',
+        'ollama': 'test_ollama_llm.py',
+        'vertexai': 'test_vertexai_llm.py',
+        'vllm': 'test_openai_vllm.py',
+    }
+
+    if llm_name.lower() not in test_mapping:
+        print(f'❌ Unknown LLM: {llm_name}')
+        print(f"Available options: {', '.join(test_mapping.keys())}")
+        return 1
+
+    test_file = test_mapping[llm_name.lower()]
+    test_path = os.path.join(os.path.dirname(__file__), test_file)
+
+    if not os.path.exists(test_path):
+        print(f'❌ Test file not found: {test_file}')
+        return 1
+
+    success, duration = run_tests_for_llm(test_path, test_mapping[llm_name.lower()])
+    return 0 if success else 1
+
+
+def main():
+    """Main entry point."""
+    if len(sys.argv) > 1:
+        # Run specific LLM test
+        llm_name = sys.argv[1]
+        return run_specific_llm_test(llm_name)
+    else:
+        # Run all LLM tests
+        return run_all_llm_tests()
+
+
+if __name__ == '__main__':
+    exit_code = main()
+    sys.exit(exit_code)
diff --git a/flo_ai/tests/test_anthropic_llm.py b/flo_ai/tests/test_anthropic_llm.py
new file mode 100644
index 00000000..975b29f9
--- /dev/null
+++ b/flo_ai/tests/test_anthropic_llm.py
@@ -0,0 +1,407 @@
+#!/usr/bin/env python3
+"""
+Pytest tests for the Anthropic LLM implementation.
+"""
+
+import sys
+import os
+import pytest
+from unittest.mock import Mock, AsyncMock, patch
+
+# Add the flo_ai directory to the path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), '..'))
+
+from flo_ai.llm.anthropic_llm import Anthropic
+from flo_ai.llm.base_llm import ImageMessage
+from flo_ai.tool.base_tool import Tool
+
+
+class TestAnthropic:
+    """Test class for Anthropic LLM implementation."""
+
+    def test_anthropic_initialization(self):
+        """Test Anthropic LLM initialization with different parameters."""
+        # Test with minimal parameters
+        llm = Anthropic()
+        assert llm.model == 'claude-3-5-sonnet-20240620'
+        assert llm.api_key is None
+        assert llm.temperature == 0.7
+        assert llm.kwargs == {}
+
+        # Test with custom parameters
+        llm = Anthropic(
+            model='claude-3-opus-20240229',
+            api_key='test-key-123',
+            temperature=0.5,
+            max_tokens=1000,
+        )
+        assert llm.model == 'claude-3-opus-20240229'
+        assert llm.api_key == 'test-key-123'
+        assert llm.temperature == 0.5
+        assert llm.kwargs == {'max_tokens': 1000}
+
+        # Test with base_url
+        llm = Anthropic(base_url='https://custom.anthropic.com')
+        assert llm.client.base_url == 'https://custom.anthropic.com'
+
+    def test_anthropic_temperature_handling(self):
+        """Test temperature parameter handling."""
+        # Test default temperature
+        llm = Anthropic()
+        assert llm.temperature == 0.7
+
+        # Test custom temperature
+        llm = Anthropic(temperature=0.0)
+        assert llm.temperature == 0.0
+
+        # Test high temperature
+        llm = Anthropic(temperature=1.0)
+        assert llm.temperature == 1.0
+
+        # Test temperature in kwargs
+        llm = Anthropic(temperature=0.3, custom_temp=0.8)
+        assert llm.temperature == 0.3
+        assert llm.kwargs['custom_temp'] == 0.8
+
+    @patch('flo_ai.llm.anthropic_llm.AsyncAnthropic')
+    def test_anthropic_client_creation(self, mock_async_anthropic):
+        """Test that AsyncAnthropic client is created correctly."""
+        mock_client = Mock()
+        mock_async_anthropic.return_value = mock_client
+
+        llm = Anthropic(api_key='test-key', base_url='https://custom.com')
+
+        mock_async_anthropic.assert_called_once_with(
+            api_key='test-key', base_url='https://custom.com'
+        )
+        assert llm.client == mock_client
+
+    @pytest.mark.asyncio
+    async def test_anthropic_generate_basic(self):
+        """Test basic generate method without functions or output schema."""
+        llm = Anthropic(model='claude-3-5-sonnet-20240620')
+
+        # Mock the client response
+        mock_content = Mock()
+        mock_content.text = 'Hello, world!'
+        mock_content.type = 'text'
+
+        mock_response = Mock()
+        mock_response.content = [mock_content]
+
+        llm.client = Mock()
+        llm.client.messages.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        result = await llm.generate(messages)
+
+        # Verify the API call
+        llm.client.messages.create.assert_called_once()
+        call_args = llm.client.messages.create.call_args
+
+        assert call_args[1]['model'] == 'claude-3-5-sonnet-20240620'
+        assert call_args[1]['messages'] == messages
+        assert call_args[1]['temperature'] == 0.7
+
+        # Verify the result
+        assert result == {'content': 'Hello, world!'}
+
+    @pytest.mark.asyncio
+    async def test_anthropic_generate_with_system_message(self):
+        """Test generate method with system message."""
+        llm = Anthropic(model='claude-3-5-sonnet-20240620')
+
+        # Mock the client response
+        mock_content = Mock()
+        mock_content.text = "I'm a helpful assistant"
+        mock_content.type = 'text'
+
+        mock_response = Mock()
+        mock_response.content = [mock_content]
+
+        llm.client = Mock()
+        llm.client.messages.create = AsyncMock(return_value=mock_response)
+
+        messages = [
+            {'role': 'system', 'content': 'You are a helpful assistant'},
+            {'role': 'user', 'content': 'Hello'},
+        ]
+
+        await llm.generate(messages)
+
+        # Verify system message was passed correctly
+        call_args = llm.client.messages.create.call_args[1]
+        assert call_args['system'] == 'You are a helpful assistant'
+
+        # Verify conversation messages don't include system
+        conversation_messages = call_args['messages']
+        assert len(conversation_messages) == 1
+        assert conversation_messages[0]['role'] == 'user'
+
+    @pytest.mark.asyncio
+    async def test_anthropic_generate_with_output_schema(self):
+        """Test generate method with output schema."""
+        llm = Anthropic(model='claude-3-5-sonnet-20240620')
+
+        output_schema = {
+            'type': 'object',
+            'properties': {'message': {'type': 'string'}, 'count': {'type': 'integer'}},
+        }
+
+        # Mock the client response
+        mock_content = Mock()
+        mock_content.text = '{"message": "test", "count": 42}'
+        mock_content.type = 'text'
+
+        mock_response = Mock()
+        mock_response.content = [mock_content]
+
+        llm.client = Mock()
+        llm.client.messages.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Generate JSON'}]
+        await llm.generate(messages, output_schema=output_schema)
+
+        # Verify system message includes output schema
+        call_args = llm.client.messages.create.call_args[1]
+        system_message = call_args['system']
+        assert 'Provide output in the following JSON schema' in system_message
+        assert 'message' in system_message
+        assert 'count' in system_message
+
+    @pytest.mark.asyncio
+    async def test_anthropic_generate_with_functions(self):
+        """Test generate method with functions (tools)."""
+        llm = Anthropic(model='claude-3-5-sonnet-20240620')
+
+        functions = [
+            {
+                'type': 'custom',
+                'name': 'test_function',
+                'description': 'A test function',
+                'input_schema': {'type': 'object'},
+            }
+        ]
+
+        # Mock the client response
+        mock_content = Mock()
+        mock_content.text = "I'll use the function"
+        mock_content.type = 'text'
+
+        mock_response = Mock()
+        mock_response.content = [mock_content]
+
+        llm.client = Mock()
+        llm.client.messages.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Use the function'}]
+        await llm.generate(messages, functions=functions)
+
+        # Verify functions were passed correctly
+        call_args = llm.client.messages.create.call_args[1]
+        assert call_args['tools'] == functions
+
+    @pytest.mark.asyncio
+    async def test_anthropic_generate_with_tool_use(self):
+        """Test generate method when Claude uses a tool."""
+        llm = Anthropic(model='claude-3-5-sonnet-20240620')
+
+        # Mock the client response with tool use
+        mock_tool_content = Mock()
+        mock_tool_content.type = 'tool_use'
+        mock_tool_content.name = 'test_tool'
+        mock_tool_content.input = {'param': 'value'}
+
+        mock_text_content = Mock()
+        mock_text_content.text = 'I used the tool'
+        mock_text_content.type = 'text'
+
+        mock_response = Mock()
+        mock_response.content = [mock_text_content, mock_tool_content]
+
+        llm.client = Mock()
+        llm.client.messages.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Use the tool'}]
+        result = await llm.generate(messages)
+
+        # Verify tool use was detected and formatted correctly
+        assert 'function_call' in result
+        assert result['function_call']['name'] == 'test_tool'
+        assert result['function_call']['arguments'] == '{"param": "value"}'
+
+    @pytest.mark.asyncio
+    async def test_anthropic_generate_with_max_tokens(self):
+        """Test generate method with max_tokens parameter."""
+        llm = Anthropic(model='claude-3-5-sonnet-20240620', max_tokens=1000)
+
+        # Mock the client response
+        mock_content = Mock()
+        mock_content.text = 'Response with max tokens'
+        mock_content.type = 'text'
+
+        mock_response = Mock()
+        mock_response.content = [mock_content]
+
+        llm.client = Mock()
+        llm.client.messages.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        await llm.generate(messages)
+
+        # Verify max_tokens was passed
+        call_args = llm.client.messages.create.call_args[1]
+        assert call_args['max_tokens'] == 1000
+
+    @pytest.mark.asyncio
+    async def test_anthropic_generate_with_kwargs(self):
+        """Test generate method with additional kwargs."""
+        llm = Anthropic(model='claude-3-5-sonnet-20240620', top_p=0.9)
+
+        # Mock the client response
+        mock_content = Mock()
+        mock_content.text = 'Response with kwargs'
+        mock_content.type = 'text'
+
+        mock_response = Mock()
+        mock_response.content = [mock_content]
+
+        llm.client = Mock()
+        llm.client.messages.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        await llm.generate(messages)
+
+        # Verify kwargs were passed through
+        call_args = llm.client.messages.create.call_args[1]
+        assert call_args['top_p'] == 0.9
+
+    def test_anthropic_get_message_content(self):
+        """Test get_message_content method."""
+        llm = Anthropic()
+
+        # Test with dict response
+        response = {'content': 'Hello, world!'}
+        result = llm.get_message_content(response)
+        assert result == 'Hello, world!'
+
+        # Test with string response
+        result = llm.get_message_content('Direct string')
+        assert result == 'Direct string'
+
+        # Test with empty content
+        response = {'content': ''}
+        result = llm.get_message_content(response)
+        assert result == ''
+
+    def test_anthropic_format_tool_for_llm(self):
+        """Test format_tool_for_llm method."""
+        llm = Anthropic()
+
+        # Create a mock tool
+        tool = Tool(
+            name='test_tool',
+            description='A test tool',
+            function=lambda x: x,
+            parameters={
+                'param1': {'type': 'string', 'description': 'First parameter'},
+                'param2': {'type': 'integer', 'description': 'Second parameter'},
+            },
+        )
+
+        formatted = llm.format_tool_for_llm(tool)
+
+        assert formatted['type'] == 'custom'
+        assert formatted['name'] == 'test_tool'
+        assert formatted['description'] == 'A test tool'
+        assert formatted['input_schema']['type'] == 'object'
+        assert 'param1' in formatted['input_schema']['properties']
+        assert 'param2' in formatted['input_schema']['properties']
+        assert formatted['input_schema']['required'] == ['param1', 'param2']
+
+    def test_anthropic_format_tools_for_llm(self):
+        """Test format_tools_for_llm method."""
+        llm = Anthropic()
+
+        # Create mock tools
+        tool1 = Tool(
+            name='tool1',
+            description='First tool',
+            function=lambda x: x,
+            parameters={'param': {'type': 'string', 'description': 'Parameter'}},
+        )
+
+        tool2 = Tool(
+            name='tool2',
+            description='Second tool',
+            function=lambda x: x,
+            parameters={'param': {'type': 'integer', 'description': 'Parameter'}},
+        )
+
+        formatted = llm.format_tools_for_llm([tool1, tool2])
+
+        assert len(formatted) == 2
+        assert formatted[0]['name'] == 'tool1'
+        assert formatted[1]['name'] == 'tool2'
+        assert all(tool['type'] == 'custom' for tool in formatted)
+
+    def test_anthropic_format_image_in_message(self):
+        """Test format_image_in_message method."""
+        llm = Anthropic()
+
+        # This method is not implemented yet
+        image = ImageMessage(image_url='https://example.com/image.jpg')
+
+        with pytest.raises(NotImplementedError):
+            llm.format_image_in_message(image)
+
+    @pytest.mark.asyncio
+    async def test_anthropic_generate_error_handling(self):
+        """Test error handling in generate method."""
+        llm = Anthropic(model='claude-3-5-sonnet-20240620')
+
+        # Mock client to raise an exception
+        llm.client = Mock()
+        llm.client.messages.create = AsyncMock(side_effect=Exception('API Error'))
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+
+        with pytest.raises(Exception, match='Error in Claude API call: API Error'):
+            await llm.generate(messages)
+
+    def test_anthropic_model_parameter_handling(self):
+        """Test that model parameter is properly handled."""
+        test_models = [
+            'claude-3-5-sonnet-20240620',
+            'claude-3-opus-20240229',
+            'claude-3-sonnet-20240229',
+            'claude-3-haiku-20240307',
+        ]
+
+        for model in test_models:
+            llm = Anthropic(model=model)
+            assert llm.model == model
+
+    def test_anthropic_api_key_handling(self):
+        """Test API key handling."""
+        # Test with API key
+        llm = Anthropic(api_key='secret-key-123')
+        assert llm.api_key == 'secret-key-123'
+
+        # Test without API key
+        llm = Anthropic()
+        assert llm.api_key is None
+
+        # Test with empty string API key
+        llm = Anthropic(api_key='')
+        assert llm.api_key == ''
+
+    def test_anthropic_base_url_handling(self):
+        """Test base URL handling."""
+        # Test with base URL
+        llm = Anthropic(base_url='https://custom.anthropic.com')
+        assert llm.client.base_url == 'https://custom.anthropic.com'
+
+        # Test without base URL
+        llm = Anthropic()
+        assert not hasattr(llm, 'base_url')
diff --git a/flo_ai/tests/test_arium_yaml.py b/flo_ai/tests/test_arium_yaml.py
index e1935656..3b8c22a7 100644
--- a/flo_ai/tests/test_arium_yaml.py
+++ b/flo_ai/tests/test_arium_yaml.py
@@ -793,6 +793,11 @@ def test_from_yaml_mixed_configuration_methods(self):
                 mock_llm = Mock()
                 mock_openai.return_value = mock_llm
 
+                # Mock for direct agent configuration
+                mock_direct_agent = Mock(spec=Agent)
+                mock_direct_agent.name = 'direct_agent'
+                mock_direct_agent.role = 'Direct Agent'
+
                 # Mock for inline YAML config
                 mock_yaml_agent = Mock(spec=Agent)
                 mock_yaml_agent.name = 'yaml_agent'
@@ -801,6 +806,24 @@ def test_from_yaml_mixed_configuration_methods(self):
                 mock_file_agent = Mock(spec=Agent)
                 mock_file_agent.name = 'file_agent'
 
+                # Mock the AgentBuilder instance for direct configuration
+                mock_direct_builder = Mock()
+                mock_direct_builder.with_name.return_value = mock_direct_builder
+                mock_direct_builder.with_prompt.return_value = mock_direct_builder
+                mock_direct_builder.with_llm.return_value = mock_direct_builder
+                mock_direct_builder.with_tools.return_value = mock_direct_builder
+                mock_direct_builder.with_retries.return_value = mock_direct_builder
+                mock_direct_builder.with_reasoning.return_value = mock_direct_builder
+                mock_direct_builder.with_output_schema.return_value = (
+                    mock_direct_builder
+                )
+                mock_direct_builder.with_role.return_value = mock_direct_builder
+                mock_direct_builder.build.return_value = mock_direct_agent
+
+                # Mock the AgentBuilder class to return our mocked builder
+                mock_agent_builder.return_value = mock_direct_builder
+
+                # Mock for inline YAML and file config
                 mock_builder_instance = Mock()
                 mock_builder_instance.build.side_effect = [
                     mock_yaml_agent,
@@ -1015,10 +1038,33 @@ def test_from_yaml_mixed_prebuilt_and_configured_agents(self):
                 mock_llm = Mock()
                 mock_openai.return_value = mock_llm
 
+                # Mock for direct agent configuration
+                mock_direct_agent = Mock(spec=Agent)
+                mock_direct_agent.name = 'direct_agent'
+                mock_direct_agent.role = 'Direct Agent'
+
                 # Mock for inline YAML config
                 mock_yaml_agent = Mock(spec=Agent)
                 mock_yaml_agent.name = 'yaml_agent'
 
+                # Mock the AgentBuilder instance for direct configuration
+                mock_direct_builder = Mock()
+                mock_direct_builder.with_name.return_value = mock_direct_builder
+                mock_direct_builder.with_prompt.return_value = mock_direct_builder
+                mock_direct_builder.with_llm.return_value = mock_direct_builder
+                mock_direct_builder.with_tools.return_value = mock_direct_builder
+                mock_direct_builder.with_retries.return_value = mock_direct_builder
+                mock_direct_builder.with_reasoning.return_value = mock_direct_builder
+                mock_direct_builder.with_output_schema.return_value = (
+                    mock_direct_builder
+                )
+                mock_direct_builder.with_role.return_value = mock_direct_builder
+                mock_direct_builder.build.return_value = mock_direct_agent
+
+                # Mock the AgentBuilder class to return our mocked builder
+                mock_agent_builder.return_value = mock_direct_builder
+
+                # Mock for inline YAML config
                 mock_builder_instance = Mock()
                 mock_builder_instance.build.return_value = mock_yaml_agent
                 mock_agent_builder.from_yaml.return_value = mock_builder_instance
diff --git a/flo_ai/tests/test_base_llm.py b/flo_ai/tests/test_base_llm.py
new file mode 100644
index 00000000..147e3457
--- /dev/null
+++ b/flo_ai/tests/test_base_llm.py
@@ -0,0 +1,237 @@
+#!/usr/bin/env python3
+"""
+Pytest tests for the BaseLLM abstract class and ImageMessage dataclass.
+"""
+
+import sys
+import os
+import pytest
+from unittest.mock import Mock
+
+# Add the flo_ai directory to the path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), '..'))
+
+from flo_ai.llm.base_llm import BaseLLM, ImageMessage
+
+
+class MockLLM(BaseLLM):
+    """Mock LLM implementation for testing BaseLLM functionality"""
+
+    async def generate(self, messages, functions=None):
+        return {'content': 'Mock response'}
+
+    async def get_function_call(self, response):
+        if hasattr(response, 'function_call') and response.function_call:
+            return {
+                'name': response.function_call.name,
+                'arguments': response.function_call.arguments,
+            }
+        elif isinstance(response, dict) and 'function_call' in response:
+            return {
+                'name': response['function_call']['name'],
+                'arguments': response['function_call']['arguments'],
+            }
+        return None
+
+    def get_message_content(self, response):
+        if isinstance(response, dict):
+            return response.get('content', '')
+        return str(response)
+
+    def format_tool_for_llm(self, tool):
+        return {
+            'name': tool.name,
+            'description': tool.description,
+            'parameters': {'type': 'object', 'properties': {}},
+        }
+
+    def format_tools_for_llm(self, tools):
+        return [self.format_tool_for_llm(tool) for tool in tools]
+
+    def format_image_in_message(self, image):
+        return f'image:{image.mime_type}'
+
+
+class TestImageMessage:
+    """Test class for ImageMessage dataclass."""
+
+    def test_image_message_creation(self):
+        """Test creating ImageMessage with different parameters."""
+        # Test with image_url
+        img1 = ImageMessage(image_url='https://example.com/image.jpg')
+        assert img1.image_url == 'https://example.com/image.jpg'
+        assert img1.image_bytes is None
+        assert img1.image_file_path is None
+        assert img1.image_base64 is None
+        assert img1.mime_type is None
+
+        # Test with image_bytes
+        img2 = ImageMessage(image_bytes=b'fake_image_data', mime_type='image/jpeg')
+        assert img2.image_bytes == b'fake_image_data'
+        assert img2.mime_type == 'image/jpeg'
+
+        # Test with image_file_path
+        img3 = ImageMessage(image_file_path='/path/to/image.png', mime_type='image/png')
+        assert img3.image_file_path == '/path/to/image.png'
+        assert img3.mime_type == 'image/png'
+
+        # Test with image_base64
+        img4 = ImageMessage(image_base64='base64_encoded_string', mime_type='image/gif')
+        assert img4.image_base64 == 'base64_encoded_string'
+        assert img4.mime_type == 'image/gif'
+
+    def test_image_message_defaults(self):
+        """Test ImageMessage with no parameters."""
+        img = ImageMessage()
+        assert img.image_url is None
+        assert img.image_bytes is None
+        assert img.image_file_path is None
+        assert img.image_base64 is None
+        assert img.mime_type is None
+
+
+class TestBaseLLM:
+    """Test class for BaseLLM abstract class functionality."""
+
+    def test_base_llm_initialization(self):
+        """Test BaseLLM initialization with different parameters."""
+        # Test with minimal parameters
+        llm = MockLLM(model='test-model')
+        assert llm.model == 'test-model'
+        assert llm.api_key is None
+        assert llm.temperature == 0.7
+        assert llm.kwargs == {}
+
+        # Test with all parameters
+        llm = MockLLM(
+            model='test-model-2',
+            api_key='test-key',
+            temperature=0.5,
+            max_tokens=100,
+            top_p=0.9,
+        )
+        assert llm.model == 'test-model-2'
+        assert llm.api_key == 'test-key'
+        assert llm.temperature == 0.5
+        assert llm.kwargs == {'max_tokens': 100, 'top_p': 0.9}
+
+    def test_base_llm_temperature_validation(self):
+        """Test temperature parameter handling."""
+        # Test default temperature
+        llm = MockLLM(model='test-model')
+        assert llm.temperature == 0.7
+
+        # Test custom temperature
+        llm = MockLLM(model='test-model', temperature=0.0)
+        assert llm.temperature == 0.0
+
+        # Test high temperature
+        llm = MockLLM(model='test-model', temperature=1.0)
+        assert llm.temperature == 1.0
+
+        # Test temperature in kwargs
+        llm = MockLLM(model='test-model', temperature=0.3, custom_temp=0.8)
+        assert llm.temperature == 0.3
+        assert llm.kwargs['custom_temp'] == 0.8
+
+    def test_base_llm_kwargs_storage(self):
+        """Test that additional kwargs are properly stored."""
+        llm = MockLLM(
+            model='test-model',
+            max_tokens=1000,
+            top_p=0.9,
+            frequency_penalty=0.1,
+            presence_penalty=0.1,
+        )
+
+        assert 'max_tokens' in llm.kwargs
+        assert 'top_p' in llm.kwargs
+        assert 'frequency_penalty' in llm.kwargs
+        assert 'presence_penalty' in llm.kwargs
+        assert llm.kwargs['max_tokens'] == 1000
+        assert llm.kwargs['top_p'] == 0.9
+
+    @pytest.mark.asyncio
+    async def test_base_llm_get_function_call(self):
+        """Test get_function_call method with different response formats."""
+        llm = MockLLM(model='test-model')
+
+        # Test with response object that has function_call attribute
+        mock_response = Mock()
+        mock_response.function_call.name = 'test_function'
+        mock_response.function_call.arguments = '{"param": "value"}'
+
+        result = await llm.get_function_call(mock_response)
+        assert result == {'name': 'test_function', 'arguments': '{"param": "value"}'}
+
+        # Test with dict response
+        dict_response = {
+            'function_call': {
+                'name': 'test_function_2',
+                'arguments': '{"param2": "value2"}',
+            }
+        }
+
+        result = await llm.get_function_call(dict_response)
+        assert result == {
+            'name': 'test_function_2',
+            'arguments': '{"param2": "value2"}',
+        }
+
+        # Test with response that has no function_call
+        no_function_response = {'content': 'No function call here'}
+        result = await llm.get_function_call(no_function_response)
+        assert result is None
+
+        # Test with response that has function_call but it's None
+        none_function_response = Mock()
+        none_function_response.function_call = None
+
+        result = await llm.get_function_call(none_function_response)
+        assert result is None
+
+    def test_base_llm_abstract_methods(self):
+        """Test that abstract methods are properly defined."""
+        # This should not raise an error since MockLLM implements all abstract methods
+        llm = MockLLM(model='test-model')
+
+        # Verify all required methods exist
+        assert hasattr(llm, 'generate')
+        assert hasattr(llm, 'get_message_content')
+        assert hasattr(llm, 'format_tool_for_llm')
+        assert hasattr(llm, 'format_tools_for_llm')
+        assert hasattr(llm, 'format_image_in_message')
+
+        # Verify they are callable
+        assert callable(llm.generate)
+        assert callable(llm.get_message_content)
+        assert callable(llm.format_tool_for_llm)
+        assert callable(llm.format_tools_for_llm)
+        assert callable(llm.format_image_in_message)
+
+    def test_base_llm_cannot_instantiate_abstract(self):
+        """Test that BaseLLM cannot be instantiated directly."""
+        with pytest.raises(TypeError):
+            BaseLLM(model='test-model')
+
+    def test_base_llm_model_validation(self):
+        """Test that model parameter is properly set."""
+        test_models = ['gpt-4', 'claude-3', 'gemini-pro', 'llama2']
+
+        for model in test_models:
+            llm = MockLLM(model=model)
+            assert llm.model == model
+
+    def test_base_llm_api_key_handling(self):
+        """Test API key handling."""
+        # Test with API key
+        llm = MockLLM(model='test-model', api_key='secret-key-123')
+        assert llm.api_key == 'secret-key-123'
+
+        # Test without API key
+        llm = MockLLM(model='test-model')
+        assert llm.api_key is None
+
+        # Test with empty string API key
+        llm = MockLLM(model='test-model', api_key='')
+        assert llm.api_key == ''
diff --git a/flo_ai/tests/test_gemini_llm.py b/flo_ai/tests/test_gemini_llm.py
new file mode 100644
index 00000000..50922502
--- /dev/null
+++ b/flo_ai/tests/test_gemini_llm.py
@@ -0,0 +1,490 @@
+#!/usr/bin/env python3
+"""
+Pytest tests for the Gemini LLM implementation.
+"""
+
+import sys
+import os
+import pytest
+from unittest.mock import Mock, patch, mock_open
+
+# Add the flo_ai directory to the path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), '..'))
+
+from flo_ai.llm.gemini_llm import Gemini
+from flo_ai.llm.base_llm import ImageMessage
+from flo_ai.tool.base_tool import Tool
+
+os.environ['GOOGLE_API_KEY'] = 'test-key-123'
+
+
+class TestGemini:
+    """Test class for Gemini LLM implementation."""
+
+    @patch('flo_ai.llm.gemini_llm.genai.Client')
+    def test_gemini_initialization(self, mock_genai_client):
+        """Test Gemini LLM initialization with different parameters."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        # Test with minimal parameters
+        llm = Gemini()
+        assert llm.model == 'gemini-2.5-flash'
+        assert llm.api_key is None
+        assert llm.temperature == 0.7
+        assert llm.kwargs == {}
+
+        # Test with custom parameters
+        mock_genai_client.reset_mock()
+        llm = Gemini(
+            model='gemini-1.5-pro',
+            api_key='test-key-123',
+            temperature=0.5,
+            max_output_tokens=1000,
+        )
+        assert llm.model == 'gemini-1.5-pro'
+        assert llm.api_key == 'test-key-123'
+        assert llm.temperature == 0.5
+        assert llm.kwargs == {'max_output_tokens': 1000}
+
+        # Test with base_url (should be ignored as it's not implemented)
+        mock_genai_client.reset_mock()
+        llm = Gemini(base_url='https://custom.gemini.com')
+        # base_url is not stored as an attribute, so we just verify it doesn't crash
+
+    @patch('flo_ai.llm.gemini_llm.genai.Client')
+    def test_gemini_temperature_handling(self, mock_genai_client):
+        """Test temperature parameter handling."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        # Test default temperature
+        llm = Gemini()
+        assert llm.temperature == 0.7
+
+        # Test custom temperature
+        mock_genai_client.reset_mock()
+        llm = Gemini(temperature=0.0)
+        assert llm.temperature == 0.0
+
+        # Test high temperature
+        mock_genai_client.reset_mock()
+        llm = Gemini(temperature=1.0)
+        assert llm.temperature == 1.0
+
+        # Test temperature in kwargs
+        mock_genai_client.reset_mock()
+        llm = Gemini(temperature=0.3, custom_temp=0.8)
+        assert llm.temperature == 0.3
+        assert llm.kwargs['custom_temp'] == 0.8
+
+    @patch('flo_ai.llm.gemini_llm.genai.Client')
+    def test_gemini_client_creation(self, mock_genai_client):
+        """Test that genai Client is created correctly."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = Gemini(api_key='test-key')
+
+        mock_genai_client.assert_called_once_with(api_key='test-key')
+        assert llm.client == mock_client
+
+        # Test without API key
+        mock_genai_client.reset_mock()
+        llm = Gemini()
+
+        mock_genai_client.assert_called_once_with()
+        assert llm.client == mock_client
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.gemini_llm.genai.Client')
+    async def test_gemini_generate_basic(self, mock_genai_client):
+        """Test basic generate method without functions or output schema."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = Gemini(model='gemini-2.5-flash')
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = 'Hello, world!'
+
+        llm.client = mock_client
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        result = await llm.generate(messages)
+
+        # Verify the API call
+        llm.client.models.generate_content.assert_called_once()
+        call_args = llm.client.models.generate_content.call_args
+
+        assert call_args[1]['model'] == 'gemini-2.5-flash'
+        assert call_args[1]['contents'] == ['Hello']
+        assert call_args[1]['config'].temperature == 0.7
+
+        # Verify the result
+        assert result == {'content': 'Hello, world!'}
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.gemini_llm.genai.Client')
+    async def test_gemini_generate_with_system_message(self, mock_genai_client):
+        """Test generate method with system message."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = Gemini(model='gemini-2.5-flash')
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = "I'm a helpful assistant"
+
+        llm.client = mock_client
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [
+            {'role': 'system', 'content': 'You are a helpful assistant'},
+            {'role': 'user', 'content': 'Hello'},
+        ]
+
+        await llm.generate(messages)
+
+        # Verify system instruction was passed correctly
+        call_args = llm.client.models.generate_content.call_args
+        config = call_args[1]['config']
+        assert config.system_instruction == 'You are a helpful assistant\n'
+
+        # Verify contents don't include system message
+        contents = call_args[1]['contents']
+        assert contents == ['Hello']
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.gemini_llm.types.GenerateContentConfig')
+    async def test_gemini_generate_with_output_schema(self, mock_config_class):
+        """Test generate method with output schema."""
+        llm = Gemini(model='gemini-2.5-flash')
+
+        output_schema = {
+            'type': 'object',
+            'properties': {'message': {'type': 'string'}, 'count': {'type': 'integer'}},
+        }
+
+        # Mock the config
+        mock_config = Mock()
+        mock_config_class.return_value = mock_config
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = '{"message": "test", "count": 42}'
+        mock_response.candidates = []
+
+        llm.client = Mock()
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Generate JSON'}]
+        result = await llm.generate(messages, output_schema=output_schema)
+
+        # Verify structured output was configured
+        mock_config.response_mime_type = 'application/json'
+        mock_config.response_schema = output_schema
+
+        # Verify the result
+        assert result == {'content': '{"message": "test", "count": 42}'}
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.gemini_llm.types.Tool')
+    @patch('flo_ai.llm.gemini_llm.types.GenerateContentConfig')
+    async def test_gemini_generate_with_functions(
+        self, mock_config_class, mock_tool_class
+    ):
+        """Test generate method with functions (tools)."""
+        llm = Gemini(model='gemini-2.5-flash')
+
+        functions = [
+            {
+                'name': 'test_function',
+                'description': 'A test function',
+                'parameters': {'type': 'object'},
+            }
+        ]
+
+        # Mock the tool and config
+        mock_tool = Mock()
+        mock_tool_class.return_value = mock_tool
+
+        mock_config = Mock()
+        mock_config_class.return_value = mock_config
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = "I'll use the function"
+        mock_response.candidates = []
+
+        llm.client = Mock()
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Use the function'}]
+        result = await llm.generate(messages, functions=functions)
+
+        # Verify tool was created with function declarations
+        mock_tool_class.assert_called_once_with(function_declarations=functions)
+
+        # Verify tools were added to config
+        mock_config.tools = [mock_tool]
+
+        # Verify the result
+        assert result == {'content': "I'll use the function"}
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.gemini_llm.types.Tool')
+    @patch('flo_ai.llm.gemini_llm.types.GenerateContentConfig')
+    async def test_gemini_generate_with_function_call_detection(
+        self, mock_config_class, mock_tool_class
+    ):
+        """Test generate method with function call detection."""
+        llm = Gemini(model='gemini-2.5-flash')
+
+        functions = [
+            {
+                'name': 'test_function',
+                'description': 'A test function',
+                'parameters': {'type': 'object'},
+            }
+        ]
+
+        # Mock the tool and config
+        mock_tool = Mock()
+        mock_tool_class.return_value = mock_tool
+
+        mock_config = Mock()
+        mock_config_class.return_value = mock_config
+
+        # Mock the client response with function call
+        mock_function_call = Mock()
+        mock_function_call.name = 'test_function'
+        mock_function_call.args = {'param': 'value'}
+
+        mock_part = Mock()
+        mock_part.function_call = mock_function_call
+
+        mock_content = Mock()
+        mock_content.parts = [mock_part]
+
+        mock_candidate = Mock()
+        mock_candidate.content = mock_content
+
+        mock_response = Mock()
+        mock_response.text = 'Function called'
+        mock_response.candidates = [mock_candidate]
+
+        llm.client = Mock()
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Use the function'}]
+        result = await llm.generate(messages, functions=functions)
+
+        # Verify function call was detected and parsed
+        assert 'function_call' in result
+        assert result['function_call']['name'] == 'test_function'
+        assert result['function_call']['arguments'] == {'param': 'value'}
+
+    @pytest.mark.asyncio
+    async def test_gemini_generate_with_kwargs(self):
+        """Test generate method with additional kwargs."""
+        llm = Gemini(model='gemini-2.5-flash', top_p=0.9, max_output_tokens=1000)
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = 'Response with kwargs'
+        mock_response.candidates = []
+
+        llm.client = Mock()
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        await llm.generate(messages)
+
+        # Verify kwargs were passed through
+        call_args = llm.client.models.generate_content.call_args
+        config = call_args[1]['config']
+        assert config.top_p == 0.9
+        assert config.max_output_tokens == 1000
+
+    def test_gemini_get_message_content(self):
+        """Test get_message_content method."""
+        llm = Gemini()
+
+        # Test with dict response
+        response = {'content': 'Hello, world!'}
+        result = llm.get_message_content(response)
+        assert result == 'Hello, world!'
+
+        # Test with string response
+        result = llm.get_message_content('Direct string')
+        assert result == 'Direct string'
+
+        # Test with empty content
+        response = {'content': ''}
+        result = llm.get_message_content(response)
+        assert result == ''
+
+    def test_gemini_format_tool_for_llm(self):
+        """Test format_tool_for_llm method."""
+        llm = Gemini()
+
+        # Create a mock tool
+        tool = Tool(
+            name='test_tool',
+            description='A test tool',
+            function=lambda x: x,
+            parameters={
+                'param1': {'type': 'string', 'description': 'First parameter'},
+                'param2': {'type': 'integer', 'description': 'Second parameter'},
+            },
+        )
+
+        formatted = llm.format_tool_for_llm(tool)
+
+        assert formatted['name'] == 'test_tool'
+        assert formatted['description'] == 'A test tool'
+        assert formatted['parameters']['type'] == 'object'
+        assert 'param1' in formatted['parameters']['properties']
+        assert 'param2' in formatted['parameters']['properties']
+        assert formatted['parameters']['required'] == ['param1', 'param2']
+
+    def test_gemini_format_tools_for_llm(self):
+        """Test format_tools_for_llm method."""
+        llm = Gemini()
+
+        # Create mock tools
+        tool1 = Tool(
+            name='tool1',
+            description='First tool',
+            function=lambda x: x,
+            parameters={'param': {'type': 'string', 'description': 'Parameter'}},
+        )
+
+        tool2 = Tool(
+            name='tool2',
+            description='Second tool',
+            function=lambda x: x,
+            parameters={'param': {'type': 'integer', 'description': 'Parameter'}},
+        )
+
+        formatted = llm.format_tools_for_llm([tool1, tool2])
+
+        assert len(formatted) == 2
+        assert formatted[0]['name'] == 'tool1'
+        assert formatted[1]['name'] == 'tool2'
+
+    def test_gemini_format_image_in_message_file_path(self):
+        """Test format_image_in_message method with file path."""
+        llm = Gemini()
+
+        # Mock file reading
+        with patch('builtins.open', mock_open(read_data=b'fake_image_data')):
+            image = ImageMessage(
+                image_file_path='/path/to/image.jpg', mime_type='image/jpeg'
+            )
+
+            result = llm.format_image_in_message(image)
+
+            # Verify genai.types.Part.from_bytes was called
+            # Note: We can't easily test the genai call without more complex mocking
+            # but we can verify the method doesn't raise an exception
+            assert result is not None
+
+    def test_gemini_format_image_in_message_bytes(self):
+        """Test format_image_in_message method with image bytes."""
+        llm = Gemini()
+
+        image = ImageMessage(image_bytes=b'fake_image_data', mime_type='image/png')
+
+        result = llm.format_image_in_message(image)
+
+        # Verify genai.types.Part.from_bytes was called
+        assert result is not None
+
+    def test_gemini_format_image_in_message_unsupported(self):
+        """Test format_image_in_message method with unsupported image format."""
+        llm = Gemini()
+
+        # Test with image_url (not implemented)
+        image = ImageMessage(image_url='https://example.com/image.jpg')
+
+        with pytest.raises(
+            NotImplementedError,
+            match='Not other way other than file path has been implemented',
+        ):
+            llm.format_image_in_message(image)
+
+        # Test with image_base64 (not implemented)
+        image = ImageMessage(image_base64='base64_string')
+
+        with pytest.raises(
+            NotImplementedError,
+            match='Not other way other than file path has been implemented',
+        ):
+            llm.format_image_in_message(image)
+
+    @pytest.mark.asyncio
+    async def test_gemini_generate_error_handling(self):
+        """Test error handling in generate method."""
+        llm = Gemini(model='gemini-2.5-flash')
+
+        # Mock client to raise an exception
+        llm.client = Mock()
+        llm.client.models.generate_content = Mock(side_effect=Exception('API Error'))
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+
+        with pytest.raises(Exception, match='Error in Gemini API call: API Error'):
+            await llm.generate(messages)
+
+    def test_gemini_model_parameter_handling(self):
+        """Test that model parameter is properly handled."""
+        test_models = [
+            'gemini-2.5-flash',
+            'gemini-1.5-pro',
+            'gemini-1.5-flash',
+            'gemini-pro',
+        ]
+
+        for model in test_models:
+            llm = Gemini(model=model)
+            assert llm.model == model
+
+    def test_gemini_api_key_handling(self):
+        """Test API key handling."""
+        # Test with API key
+        llm = Gemini(api_key='secret-key-123')
+        assert llm.api_key == 'secret-key-123'
+
+        # Test without API key
+        llm = Gemini()
+        assert llm.api_key is None
+
+        # Test with empty string API key
+        llm = Gemini(api_key='')
+        assert llm.api_key == ''
+
+    def test_gemini_generation_config_creation(self):
+        """Test that generation config is created correctly."""
+        llm = Gemini(temperature=0.5, max_output_tokens=1000, top_p=0.9)
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = 'Test response'
+        mock_response.candidates = []
+
+        llm.client = Mock()
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        # We need to patch the types.GenerateContentConfig to test this
+        with patch('flo_ai.llm.gemini_llm.types.GenerateContentConfig') as mock_config:
+            mock_config_instance = Mock()
+            mock_config.return_value = mock_config_instance
+
+            # This would normally be called in generate method
+            # For testing, we'll just verify the config class exists
+            assert mock_config is not None
diff --git a/flo_ai/tests/test_openai_llm.py b/flo_ai/tests/test_openai_llm.py
new file mode 100644
index 00000000..3a069f5a
--- /dev/null
+++ b/flo_ai/tests/test_openai_llm.py
@@ -0,0 +1,325 @@
+#!/usr/bin/env python3
+"""
+Pytest tests for the OpenAI LLM implementation.
+"""
+
+import sys
+import os
+import pytest
+from unittest.mock import Mock, AsyncMock, patch
+
+# Add the flo_ai directory to the path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), '..'))
+
+from flo_ai.llm.openai_llm import OpenAI
+from flo_ai.llm.base_llm import ImageMessage
+from flo_ai.tool.base_tool import Tool
+
+os.environ['OPENAI_API_KEY'] = 'test-key-123'
+
+
+class TestOpenAI:
+    """Test class for OpenAI LLM implementation."""
+
+    def test_openai_initialization(self):
+        """Test OpenAI LLM initialization with different parameters."""
+        # Test with minimal parameters
+        llm = OpenAI()
+        assert llm.model == 'gpt-4o-mini'
+        assert llm.api_key is None
+        assert llm.temperature == 0.7
+        assert llm.kwargs == {}
+
+        # Test with custom parameters
+        llm = OpenAI(
+            model='gpt-4', api_key='test-key-123', temperature=0.5, max_tokens=1000
+        )
+        assert llm.model == 'gpt-4'
+        assert llm.api_key == 'test-key-123'
+        assert llm.temperature == 0.5
+        assert llm.kwargs == {'max_tokens': 1000}
+
+        # Test with base_url
+        llm = OpenAI(base_url='https://custom.openai.com')
+        assert llm.client.base_url == 'https://custom.openai.com'
+
+    def test_openai_temperature_handling(self):
+        """Test temperature parameter handling."""
+        # Test default temperature
+        llm = OpenAI()
+        assert llm.temperature == 0.7
+
+        # Test custom temperature
+        llm = OpenAI(temperature=0.0)
+        assert llm.temperature == 0.0
+
+        # Test high temperature
+        llm = OpenAI(temperature=1.0)
+        assert llm.temperature == 1.0
+
+        # Test temperature in kwargs
+        llm = OpenAI(temperature=0.3, custom_temp=0.8)
+        assert llm.temperature == 0.3
+        assert llm.kwargs['custom_temp'] == 0.8
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_client_creation(self, mock_async_openai):
+        """Test that AsyncOpenAI client is created correctly."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAI(api_key='test-key', base_url='https://custom.com')
+
+        mock_async_openai.assert_called_once_with(
+            api_key='test-key', base_url='https://custom.com'
+        )
+        assert llm.client == mock_client
+
+    @pytest.mark.asyncio
+    async def test_openai_generate_basic(self):
+        """Test basic generate method without output schema."""
+        llm = OpenAI(model='gpt-4o-mini')
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.choices = [Mock()]
+        mock_response.choices[0].message = Mock()
+        mock_response.choices[0].message.content = 'Hello, world!'
+
+        llm.client = Mock()
+        llm.client.chat.completions.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        result = await llm.generate(messages)
+
+        # Verify the API call
+        llm.client.chat.completions.create.assert_called_once()
+        call_args = llm.client.chat.completions.create.call_args
+
+        assert call_args[1]['model'] == 'gpt-4o-mini'
+        assert call_args[1]['messages'] == messages
+        assert call_args[1]['temperature'] == 0.7
+
+        # Verify the result
+        assert result == mock_response.choices[0].message
+
+    @pytest.mark.asyncio
+    async def test_openai_generate_with_output_schema(self):
+        """Test generate method with output schema."""
+        llm = OpenAI(model='gpt-4o-mini')
+
+        output_schema = {
+            'title': 'test_response',
+            'schema': {
+                'type': 'object',
+                'properties': {
+                    'message': {'type': 'string'},
+                    'count': {'type': 'integer'},
+                },
+            },
+        }
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.choices = [Mock()]
+        mock_response.choices[0].message = Mock()
+        mock_response.choices[0].message.content = '{"message": "test", "count": 42}'
+
+        llm.client = Mock()
+        llm.client.chat.completions.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Generate JSON'}]
+        await llm.generate(messages, output_schema=output_schema)
+
+        # Verify the API call
+        call_args = llm.client.chat.completions.create.call_args[1]
+
+        assert call_args['response_format'] == {'type': 'json_object'}
+        assert call_args['functions'] == [
+            {'name': 'test_response', 'parameters': output_schema['schema']}
+        ]
+        assert call_args['function_call'] == {'name': 'test_response'}
+
+        # Verify system message was modified
+        assert len(call_args['messages']) == 2
+        assert call_args['messages'][0]['role'] == 'system'
+        assert 'JSON format' in call_args['messages'][0]['content']
+
+    @pytest.mark.asyncio
+    async def test_openai_generate_with_existing_system_message(self):
+        """Test generate method with existing system message and output schema."""
+        llm = OpenAI(model='gpt-4o-mini')
+
+        output_schema = {'title': 'test', 'schema': {'type': 'object'}}
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.choices = [Mock()]
+        mock_response.choices[0].message = Mock()
+        mock_response.choices[0].message.content = '{"test": "value"}'
+
+        llm.client = Mock()
+        llm.client.chat.completions.create = AsyncMock(return_value=mock_response)
+
+        messages = [
+            {'role': 'system', 'content': 'You are a helpful assistant'},
+            {'role': 'user', 'content': 'Generate JSON'},
+        ]
+
+        await llm.generate(messages, output_schema=output_schema)
+
+        # Verify system message was appended to
+        call_args = llm.client.chat.completions.create.call_args[1]
+        system_message = call_args['messages'][0]['content']
+        assert 'You are a helpful assistant' in system_message
+        assert 'JSON format' in system_message
+
+    @pytest.mark.asyncio
+    async def test_openai_generate_with_kwargs(self):
+        """Test generate method with additional kwargs."""
+        llm = OpenAI(model='gpt-4o-mini', max_tokens=1000, top_p=0.9)
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.choices = [Mock()]
+        mock_response.choices[0].message = Mock()
+        mock_response.choices[0].message.content = 'Response with kwargs'
+
+        llm.client = Mock()
+        llm.client.chat.completions.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        await llm.generate(messages, stream=False)
+
+        # Verify kwargs were passed through
+        call_args = llm.client.chat.completions.create.call_args[1]
+        assert call_args['max_tokens'] == 1000
+        assert call_args['top_p'] == 0.9
+        assert not call_args['stream']
+
+    def test_openai_get_message_content(self):
+        """Test get_message_content method."""
+        llm = OpenAI()
+
+        # Test with string response
+        result = llm.get_message_content('Hello, world!')
+        assert result == 'Hello, world!'
+
+        # Test with message object
+        mock_message = Mock()
+        mock_message.content = 'Message content'
+        result = llm.get_message_content(mock_message)
+        assert result == 'Message content'
+
+        # Test with object without content attribute
+        mock_obj = Mock()
+        del mock_obj.content
+        result = llm.get_message_content(mock_obj)
+        assert result == str(mock_obj)
+
+    def test_openai_format_tool_for_llm(self):
+        """Test format_tool_for_llm method."""
+        llm = OpenAI()
+
+        # Create a mock tool
+        tool = Tool(
+            name='test_tool',
+            description='A test tool',
+            function=lambda x: x,
+            parameters={
+                'param1': {'type': 'string', 'description': 'First parameter'},
+                'param2': {'type': 'integer', 'description': 'Second parameter'},
+            },
+        )
+
+        formatted = llm.format_tool_for_llm(tool)
+
+        assert formatted['name'] == 'test_tool'
+        assert formatted['description'] == 'A test tool'
+        assert formatted['parameters']['type'] == 'object'
+        assert 'param1' in formatted['parameters']['properties']
+        assert 'param2' in formatted['parameters']['properties']
+        assert formatted['parameters']['required'] == ['param1', 'param2']
+
+    def test_openai_format_tools_for_llm(self):
+        """Test format_tools_for_llm method."""
+        llm = OpenAI()
+
+        # Create mock tools
+        tool1 = Tool(
+            name='tool1',
+            description='First tool',
+            function=lambda x: x,
+            parameters={'param': {'type': 'string', 'description': 'Parameter'}},
+        )
+
+        tool2 = Tool(
+            name='tool2',
+            description='Second tool',
+            function=lambda x: x,
+            parameters={'param': {'type': 'integer', 'description': 'Parameter'}},
+        )
+
+        formatted = llm.format_tools_for_llm([tool1, tool2])
+
+        assert len(formatted) == 2
+        assert formatted[0]['name'] == 'tool1'
+        assert formatted[1]['name'] == 'tool2'
+
+    def test_openai_format_image_in_message(self):
+        """Test format_image_in_message method."""
+        llm = OpenAI()
+
+        # This method is not implemented yet
+        image = ImageMessage(image_url='https://example.com/image.jpg')
+
+        with pytest.raises(NotImplementedError):
+            llm.format_image_in_message(image)
+
+    @pytest.mark.asyncio
+    async def test_openai_generate_error_handling(self):
+        """Test error handling in generate method."""
+        llm = OpenAI(model='gpt-4o-mini')
+
+        # Mock client to raise an exception
+        llm.client = Mock()
+        llm.client.chat.completions.create = AsyncMock(
+            side_effect=Exception('API Error')
+        )
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+
+        with pytest.raises(Exception, match='API Error'):
+            await llm.generate(messages)
+
+    def test_openai_model_parameter_handling(self):
+        """Test that model parameter is properly handled."""
+        test_models = ['gpt-4', 'gpt-4o', 'gpt-4o-mini', 'gpt-3.5-turbo']
+
+        for model in test_models:
+            llm = OpenAI(model=model)
+            assert llm.model == model
+
+    def test_openai_api_key_handling(self):
+        """Test API key handling."""
+        # Test with API key
+        llm = OpenAI(api_key='secret-key-123')
+        assert llm.api_key == 'secret-key-123'
+
+        # Test without API key
+        llm = OpenAI()
+        assert llm.api_key is None
+
+        # Test with empty string API key
+        llm = OpenAI(api_key='')
+        assert llm.api_key == ''
+
+    def test_openai_base_url_handling(self):
+        """Test base URL handling."""
+        # Test with base URL
+        llm = OpenAI(base_url='https://custom.openai.com')
+        assert llm.client.base_url == 'https://custom.openai.com'
+
+        # Test without base URL
+        llm = OpenAI()
+        assert not hasattr(llm, 'base_url')
diff --git a/flo_ai/tests/test_openai_vllm.py b/flo_ai/tests/test_openai_vllm.py
new file mode 100644
index 00000000..a7938c08
--- /dev/null
+++ b/flo_ai/tests/test_openai_vllm.py
@@ -0,0 +1,575 @@
+#!/usr/bin/env python3
+"""
+Pytest tests for the OpenAI VLLM implementation.
+"""
+
+import sys
+import os
+import pytest
+from unittest.mock import Mock, AsyncMock, patch
+
+# Add the flo_ai directory to the path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), '..'))
+
+from flo_ai.llm.openai_vllm import OpenAIVLLM
+from flo_ai.llm.base_llm import ImageMessage
+from flo_ai.tool.base_tool import Tool
+
+os.environ['OPENAI_API_KEY'] = 'test-key-123'
+
+
+class TestOpenAIVLLM:
+    """Test class for OpenAI VLLM implementation."""
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_initialization(self, mock_async_openai):
+        """Test OpenAI VLLM initialization with different parameters."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        # Test with minimal parameters
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+        assert llm.model == 'gpt-4o-mini'
+        assert llm.api_key is None
+        assert llm.temperature == 0.7
+        assert llm.base_url == 'https://api.vllm.com'
+        assert llm.kwargs == {}
+
+        # Test with custom parameters
+        mock_async_openai.reset_mock()
+        llm = OpenAIVLLM(
+            base_url='https://custom.vllm.com',
+            model='gpt-4',
+            api_key='test-key-123',
+            temperature=0.5,
+            max_tokens=1000,
+        )
+        assert llm.model == 'gpt-4'
+        assert llm.api_key == 'test-key-123'
+        assert llm.temperature == 0.5
+        assert llm.base_url == 'https://custom.vllm.com'
+        assert llm.kwargs == {'max_tokens': 1000}
+
+        # Test with additional kwargs
+        mock_async_openai.reset_mock()
+        llm = OpenAIVLLM(
+            base_url='https://api.vllm.com',
+            model='gpt-4o-mini',
+            max_tokens=1000,
+            top_p=0.9,
+        )
+        assert llm.kwargs == {'max_tokens': 1000, 'top_p': 0.9}
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_temperature_handling(self, mock_async_openai):
+        """Test temperature parameter handling."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        # Test default temperature
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+        assert llm.temperature == 0.7
+
+        # Test custom temperature
+        mock_async_openai.reset_mock()
+        llm = OpenAIVLLM(
+            base_url='https://api.vllm.com', model='gpt-4o-mini', temperature=0.0
+        )
+        assert llm.temperature == 0.0
+
+        # Test high temperature
+        mock_async_openai.reset_mock()
+        llm = OpenAIVLLM(
+            base_url='https://api.vllm.com', model='gpt-4o-mini', temperature=1.0
+        )
+        assert llm.temperature == 1.0
+
+        # Test temperature in kwargs
+        mock_async_openai.reset_mock()
+        llm = OpenAIVLLM(
+            base_url='https://api.vllm.com',
+            model='gpt-4o-mini',
+            temperature=0.3,
+            custom_temp=0.8,
+        )
+        assert llm.temperature == 0.3
+        assert llm.kwargs['custom_temp'] == 0.8
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_client_creation(self, mock_async_openai):
+        """Test that AsyncOpenAI client is created correctly with VLLM parameters."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(
+            base_url='https://custom.vllm.com', model='gpt-4o-mini', api_key='test-key'
+        )
+
+        mock_async_openai.assert_called_once_with(
+            api_key='test-key', base_url='https://custom.vllm.com'
+        )
+        assert llm.client == mock_client
+
+        # Test without API key
+        mock_async_openai.reset_mock()
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        mock_async_openai.assert_called_once_with(
+            api_key=None, base_url='https://api.vllm.com'
+        )
+        assert llm.client == mock_client
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    async def test_openai_vllm_generate_basic(self, mock_async_openai):
+        """Test basic generate method without output schema."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        # Mock the client response
+        mock_choice = Mock()
+        mock_choice.message.content = 'Hello, world!'
+
+        mock_response = Mock()
+        mock_response.choices = [mock_choice]
+
+        llm.client.chat.completions.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        result = await llm.generate(messages)
+
+        # Verify the API call
+        llm.client.chat.completions.create.assert_called_once()
+        call_args = llm.client.chat.completions.create.call_args
+
+        assert call_args[1]['model'] == 'gpt-4o-mini'
+        assert call_args[1]['messages'] == messages
+        assert call_args[1]['temperature'] == 0.7
+
+        # Verify the result
+        assert result.content == 'Hello, world!'
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    async def test_openai_vllm_generate_with_output_schema(self, mock_async_openai):
+        """Test generate method with output schema."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        output_schema = {
+            'title': 'test_schema',
+            'schema': {
+                'type': 'object',
+                'properties': {
+                    'message': {'type': 'string'},
+                    'count': {'type': 'integer'},
+                },
+            },
+        }
+
+        # Mock the client response
+        mock_choice = Mock()
+        mock_choice.message.content = '{"message": "test", "count": 42}'
+
+        mock_response = Mock()
+        mock_response.choices = [mock_choice]
+
+        llm.client.chat.completions.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Generate JSON'}]
+        result = await llm.generate(messages, output_schema=output_schema)
+
+        # Verify output schema was configured
+        call_args = llm.client.chat.completions.create.call_args
+        assert call_args[1]['response_format']['type'] == 'json_schema'
+        assert call_args[1]['response_format']['json_schema']['name'] == 'test_schema'
+
+        # Verify the result
+        assert result.content == '{"message": "test", "count": 42}'
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    async def test_openai_vllm_generate_with_existing_system_message(
+        self, mock_async_openai
+    ):
+        """Test generate method with existing system message and output schema."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        output_schema = {'title': 'test_schema', 'schema': {'type': 'object'}}
+
+        # Mock the client response
+        mock_choice = Mock()
+        mock_choice.message.content = '{"result": "success"}'
+
+        mock_response = Mock()
+        mock_response.choices = [mock_choice]
+
+        llm.client.chat.completions.create = AsyncMock(return_value=mock_response)
+
+        messages = [
+            {'role': 'system', 'content': 'You are a helpful assistant'},
+            {'role': 'user', 'content': 'Generate JSON'},
+        ]
+
+        result = await llm.generate(messages, output_schema=output_schema)
+
+        # Verify system message was updated
+        call_args = llm.client.chat.completions.create.call_args
+        updated_messages = call_args[1]['messages']
+        assert updated_messages[0]['role'] == 'system'
+        assert 'JSON format' in updated_messages[0]['content']
+        assert 'test_schema' in updated_messages[0]['content']
+
+        # Verify the result
+        assert result.content == '{"result": "success"}'
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    async def test_openai_vllm_generate_with_kwargs(self, mock_async_openai):
+        """Test generate method with additional kwargs."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(
+            base_url='https://api.vllm.com',
+            model='gpt-4o-mini',
+            top_p=0.9,
+            max_output_tokens=1000,
+        )
+
+        # Mock the client response
+        mock_choice = Mock()
+        mock_choice.message.content = 'Response with kwargs'
+
+        mock_response = Mock()
+        mock_response.choices = [mock_choice]
+
+        llm.client.chat.completions.create = AsyncMock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        result = await llm.generate(messages)
+
+        # Verify kwargs were passed through
+        call_args = llm.client.chat.completions.create.call_args
+        assert call_args[1]['top_p'] == 0.9
+        assert call_args[1]['max_output_tokens'] == 1000
+
+        # Verify the result
+        assert result.content == 'Response with kwargs'
+
+    def test_openai_vllm_get_message_content(self):
+        """Test get_message_content method."""
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        # Test with dict response (should return str representation)
+        response = {'content': 'Hello, world!'}
+        result = llm.get_message_content(response)
+        assert result == "{'content': 'Hello, world!'}"
+
+        # Test with string response
+        result = llm.get_message_content('Direct string')
+        assert result == 'Direct string'
+
+        # Test with empty content
+        response = {'content': ''}
+        result = llm.get_message_content(response)
+        assert result == "{'content': ''}"
+
+        # Test with message object that has content attribute
+        mock_message = Mock()
+        mock_message.content = 'Message content'
+        result = llm.get_message_content(mock_message)
+        assert result == 'Message content'
+
+    def test_openai_vllm_format_tool_for_llm(self):
+        """Test format_tool_for_llm method."""
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        # Create a mock tool
+        tool = Tool(
+            name='test_tool',
+            description='A test tool',
+            function=lambda x: x,
+            parameters={
+                'param1': {'type': 'string', 'description': 'First parameter'},
+                'param2': {'type': 'integer', 'description': 'Second parameter'},
+            },
+        )
+
+        formatted = llm.format_tool_for_llm(tool)
+
+        assert formatted['name'] == 'test_tool'
+        assert formatted['description'] == 'A test tool'
+        assert formatted['parameters']['type'] == 'object'
+        assert 'param1' in formatted['parameters']['properties']
+        assert 'param2' in formatted['parameters']['properties']
+        assert formatted['parameters']['required'] == ['param1', 'param2']
+
+    def test_openai_vllm_format_tools_for_llm(self):
+        """Test format_tools_for_llm method."""
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        # Create mock tools
+        tool1 = Tool(
+            name='tool1',
+            description='First tool',
+            function=lambda x: x,
+            parameters={'param': {'type': 'string', 'description': 'Parameter'}},
+        )
+
+        tool2 = Tool(
+            name='tool2',
+            description='Second tool',
+            function=lambda x: x,
+            parameters={'param': {'type': 'integer', 'description': 'Parameter'}},
+        )
+
+        formatted = llm.format_tools_for_llm([tool1, tool2])
+
+        assert len(formatted) == 2
+        assert formatted[0]['name'] == 'tool1'
+        assert formatted[1]['name'] == 'tool2'
+
+    def test_openai_vllm_format_image_in_message(self):
+        """Test format_image_in_message method."""
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        # Test with image message
+        image = ImageMessage(image_url='https://example.com/image.jpg')
+
+        with pytest.raises(
+            NotImplementedError, match='Not implemented image for LLM OpenAI'
+        ):
+            llm.format_image_in_message(image)
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    async def test_openai_vllm_generate_error_handling(self, mock_async_openai):
+        """Test error handling in generate method."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        # Mock client to raise an exception
+        llm.client.chat.completions.create = AsyncMock(
+            side_effect=Exception('API Error')
+        )
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+
+        with pytest.raises(Exception, match='API Error'):
+            await llm.generate(messages)
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_model_parameter_handling(self, mock_async_openai):
+        """Test that model parameter is properly handled."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        test_models = ['gpt-4', 'gpt-4o', 'gpt-4o-mini', 'gpt-3.5-turbo']
+
+        for model in test_models:
+            mock_async_openai.reset_mock()
+            llm = OpenAIVLLM(base_url='https://api.vllm.com', model=model)
+            assert llm.model == model
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_api_key_handling(self, mock_async_openai):
+        """Test API key handling."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        # Test with API key
+        llm = OpenAIVLLM(
+            base_url='https://api.vllm.com',
+            model='gpt-4o-mini',
+            api_key='secret-key-123',
+        )
+        assert llm.api_key == 'secret-key-123'
+
+        # Test without API key
+        mock_async_openai.reset_mock()
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+        assert llm.api_key is None
+
+        # Test with empty string API key
+        mock_async_openai.reset_mock()
+        llm = OpenAIVLLM(
+            base_url='https://api.vllm.com', model='gpt-4o-mini', api_key=''
+        )
+        assert llm.api_key == ''
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_base_url_handling(self, mock_async_openai):
+        """Test base URL handling."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        # Test with base URL
+        llm = OpenAIVLLM(base_url='https://custom.vllm.com', model='gpt-4o-mini')
+        assert llm.base_url == 'https://custom.vllm.com'
+
+        # Test with different base URL
+        mock_async_openai.reset_mock()
+        llm = OpenAIVLLM(base_url='https://another.vllm.com', model='gpt-4o-mini')
+        assert llm.base_url == 'https://another.vllm.com'
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_inheritance_from_openai(self, mock_async_openai):
+        """Test that OpenAIVLLM inherits from OpenAI."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        # Should inherit from OpenAI
+        from flo_ai.llm.openai_llm import OpenAI
+
+        assert isinstance(llm, OpenAI)
+
+        # Should have all the methods from OpenAI
+        assert hasattr(llm, 'generate')
+        assert hasattr(llm, 'get_message_content')
+        assert hasattr(llm, 'format_tool_for_llm')
+        assert hasattr(llm, 'format_tools_for_llm')
+        assert hasattr(llm, 'format_image_in_message')
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_parameter_combinations(self, mock_async_openai):
+        """Test various parameter combinations."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        # Test with all parameters
+        llm = OpenAIVLLM(
+            model='gpt-4',
+            api_key='key123',
+            temperature=0.3,
+            base_url='https://custom.com',
+            max_tokens=500,
+            top_p=0.8,
+        )
+
+        assert llm.model == 'gpt-4'
+        assert llm.api_key == 'key123'
+        assert llm.temperature == 0.3
+        assert llm.base_url == 'https://custom.com'
+        assert llm.kwargs == {'max_tokens': 500, 'top_p': 0.8}
+
+        # Test with minimal parameters
+        mock_async_openai.reset_mock()
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        assert llm.model == 'gpt-4o-mini'
+        assert llm.api_key is None
+        assert llm.temperature == 0.7
+        assert llm.base_url == 'https://api.vllm.com'
+        assert llm.kwargs == {}
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_method_inheritance(self, mock_async_openai):
+        """Test that OpenAIVLLM inherits all methods from OpenAI."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        # Test that OpenAIVLLM has all the methods from OpenAI
+        assert hasattr(llm, 'generate')
+        assert hasattr(llm, 'get_message_content')
+        assert hasattr(llm, 'format_tool_for_llm')
+        assert hasattr(llm, 'format_tools_for_llm')
+        assert hasattr(llm, 'format_image_in_message')
+
+        # Should be callable
+        assert callable(llm.generate)
+        assert callable(llm.get_message_content)
+        assert callable(llm.format_tool_for_llm)
+        assert callable(llm.format_tools_for_llm)
+        assert callable(llm.format_image_in_message)
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_default_values(self, mock_async_openai):
+        """Test that default values are set correctly."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        # Default values from OpenAI
+        assert llm.model == 'gpt-4o-mini'
+        assert llm.temperature == 0.7
+
+        # Default values from BaseLLM
+        assert llm.api_key is None
+        assert llm.kwargs == {}
+
+        # Default values from OpenAIVLLM
+        assert llm.base_url == 'https://api.vllm.com'
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_parameter_override(self, mock_async_openai):
+        """Test that parameters can be overridden after initialization."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(base_url='https://api.vllm.com', model='gpt-4o-mini')
+
+        # Change parameters
+        llm.model = 'new-model'
+        llm.temperature = 0.1
+        llm.base_url = 'new-url'
+
+        # Verify changes
+        assert llm.model == 'new-model'
+        assert llm.temperature == 0.1
+        assert llm.base_url == 'new-url'
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_kwargs_storage(self, mock_async_openai):
+        """Test that additional kwargs are properly stored."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        llm = OpenAIVLLM(
+            base_url='https://api.vllm.com',
+            model='gpt-4o-mini',
+            max_tokens=1000,
+            top_p=0.9,
+            frequency_penalty=0.1,
+            presence_penalty=0.1,
+        )
+
+        assert 'max_tokens' in llm.kwargs
+        assert 'top_p' in llm.kwargs
+        assert 'frequency_penalty' in llm.kwargs
+        assert 'presence_penalty' in llm.kwargs
+        assert llm.kwargs['max_tokens'] == 1000
+        assert llm.kwargs['top_p'] == 0.9
+
+    @patch('flo_ai.llm.openai_llm.AsyncOpenAI')
+    def test_openai_vllm_initialization_order(self, mock_async_openai):
+        """Test that initialization happens in the correct order."""
+        mock_client = Mock()
+        mock_async_openai.return_value = mock_client
+
+        # This should not raise an error
+        llm = OpenAIVLLM(
+            model='test-model',
+            base_url='https://test.vllm.com',
+            project='test-project',
+            location='test-location',
+        )
+
+        # Verify all attributes are set correctly
+        assert llm.model == 'test-model'
+        assert llm.base_url == 'https://test.vllm.com'
+        assert llm.client == mock_client
diff --git a/flo_ai/tests/test_vertexai_llm.py b/flo_ai/tests/test_vertexai_llm.py
new file mode 100644
index 00000000..54f1e79f
--- /dev/null
+++ b/flo_ai/tests/test_vertexai_llm.py
@@ -0,0 +1,584 @@
+#!/usr/bin/env python3
+"""
+Pytest tests for the VertexAI LLM implementation.
+"""
+
+import sys
+import os
+import pytest
+from unittest.mock import Mock, patch
+
+# Add the flo_ai directory to the path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), '..'))
+
+from flo_ai.llm.vertexai_llm import VertexAI
+from flo_ai.tool.base_tool import Tool
+
+os.environ['GOOGLE_API_KEY'] = 'test-key-123'
+os.environ['GOOGLE_PROJECT'] = 'my-project-123'
+os.environ['GOOGLE_LOCATION'] = 'us-central1'
+
+
+class TestVertexAI:
+    """Test class for VertexAI LLM implementation."""
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_initialization(self, mock_genai_client):
+        """Test VertexAI LLM initialization with different parameters."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        # Test with minimal parameters
+        llm = VertexAI()
+        assert llm.model == 'gemini-2.5-flash'
+        assert llm.api_key is None
+        assert llm.temperature == 0.7
+        assert llm.kwargs == {}
+        assert llm.project is None
+        assert llm.location is None
+
+        # Test with custom parameters
+        mock_genai_client.reset_mock()
+        llm = VertexAI(
+            model='gemini-1.5-pro',
+            api_key='test-key-123',
+            temperature=0.5,
+            project='my-project-123',
+            location='us-central1',
+        )
+        assert llm.model == 'gemini-1.5-pro'
+        assert llm.api_key == 'test-key-123'
+        assert llm.temperature == 0.5
+        assert llm.project == 'my-project-123'
+        assert llm.location == 'us-central1'
+        assert llm.kwargs == {}
+
+        # Test with additional kwargs
+        mock_genai_client.reset_mock()
+        llm = VertexAI(model='gemini-2.5-flash', max_tokens=1000, top_p=0.9)
+        assert llm.kwargs == {'max_tokens': 1000, 'top_p': 0.9}
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_temperature_handling(self, mock_genai_client):
+        """Test temperature parameter handling."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        # Test default temperature
+        llm = VertexAI()
+        assert llm.temperature == 0.7
+
+        # Test custom temperature
+        mock_genai_client.reset_mock()
+        llm = VertexAI(temperature=0.0)
+        assert llm.temperature == 0.0
+
+        # Test high temperature
+        mock_genai_client.reset_mock()
+        llm = VertexAI(temperature=1.0)
+        assert llm.temperature == 1.0
+
+        # Test temperature in kwargs
+        mock_genai_client.reset_mock()
+        llm = VertexAI(temperature=0.3, custom_temp=0.8)
+        assert llm.temperature == 0.3
+        assert llm.kwargs['custom_temp'] == 0.8
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_client_creation(self, mock_genai_client):
+        """Test that genai Client is created correctly with VertexAI parameters."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(project='test-project', location='us-central1')
+
+        mock_genai_client.assert_called_once_with(
+            project='test-project', location='us-central1', vertexai=True
+        )
+        assert llm.client == mock_client
+
+        # Test without project and location
+        mock_genai_client.reset_mock()
+        llm = VertexAI()
+
+        mock_genai_client.assert_called_once_with(
+            project=None, location=None, vertexai=True
+        )
+        assert llm.client == mock_client
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    async def test_vertexai_generate_basic(self, mock_genai_client):
+        """Test basic generate method without functions or output schema."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(model='gemini-2.5-flash')
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = 'Hello, world!'
+        mock_response.candidates = []
+
+        llm.client = mock_client
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        result = await llm.generate(messages)
+
+        # Verify the API call
+        llm.client.models.generate_content.assert_called_once()
+        call_args = llm.client.models.generate_content.call_args
+
+        assert call_args[1]['model'] == 'gemini-2.5-flash'
+        assert call_args[1]['contents'] == ['Hello']
+        assert call_args[1]['config'].temperature == 0.7
+
+        # Verify the result
+        assert result == {'content': 'Hello, world!'}
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    async def test_vertexai_generate_with_system_message(self, mock_genai_client):
+        """Test generate method with system message."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(model='gemini-2.5-flash')
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = "I'm a helpful assistant"
+        mock_response.candidates = []
+
+        llm.client = mock_client
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [
+            {'role': 'system', 'content': 'You are a helpful assistant'},
+            {'role': 'user', 'content': 'Hello'},
+        ]
+
+        await llm.generate(messages)
+
+        # Verify system instruction was passed correctly
+        call_args = llm.client.models.generate_content.call_args
+        config = call_args[1]['config']
+        assert config.system_instruction == 'You are a helpful assistant\n'
+
+        # Verify contents don't include system message
+        contents = call_args[1]['contents']
+        assert contents == ['Hello']
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    async def test_vertexai_generate_with_output_schema(self, mock_genai_client):
+        """Test generate method with output schema."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(model='gemini-2.5-flash')
+
+        output_schema = {
+            'type': 'object',
+            'properties': {'message': {'type': 'string'}, 'count': {'type': 'integer'}},
+        }
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = '{"message": "test", "count": 42}'
+        mock_response.candidates = []
+
+        llm.client = mock_client
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Generate JSON'}]
+        result = await llm.generate(messages, output_schema=output_schema)
+
+        # Verify the result
+        assert result == {'content': '{"message": "test", "count": 42}'}
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    async def test_vertexai_generate_with_functions(self, mock_genai_client):
+        """Test generate method with functions (tools)."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(model='gemini-2.5-flash')
+
+        functions = [
+            {
+                'name': 'test_function',
+                'description': 'A test function',
+                'parameters': {'type': 'object'},
+            }
+        ]
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = "I'll use the function"
+        mock_response.candidates = []
+
+        llm.client = mock_client
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Use the function'}]
+        result = await llm.generate(messages, functions=functions)
+
+        # Verify the result
+        assert result == {'content': "I'll use the function"}
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    async def test_vertexai_generate_with_function_call_detection(
+        self, mock_genai_client
+    ):
+        """Test generate method with function call detection."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(model='gemini-2.5-flash')
+
+        functions = [
+            {
+                'name': 'test_function',
+                'description': 'A test function',
+                'parameters': {'type': 'object'},
+            }
+        ]
+
+        # Mock the client response with function call
+        mock_function_call = Mock()
+        mock_function_call.name = 'test_function'
+        mock_function_call.args = {'param': 'value'}
+
+        mock_part = Mock()
+        mock_part.function_call = mock_function_call
+
+        mock_content = Mock()
+        mock_content.parts = [mock_part]
+
+        mock_candidate = Mock()
+        mock_candidate.content = mock_content
+
+        mock_response = Mock()
+        mock_response.text = 'Function called'
+        mock_response.candidates = [mock_candidate]
+
+        llm.client = mock_client
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Use the function'}]
+        result = await llm.generate(messages, functions=functions)
+
+        # Verify function call was detected and parsed
+        assert 'function_call' in result
+        assert result['function_call']['name'] == 'test_function'
+        assert result['function_call']['arguments'] == {'param': 'value'}
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    async def test_vertexai_generate_with_kwargs(self, mock_genai_client):
+        """Test generate method with additional kwargs."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(model='gemini-2.5-flash', top_p=0.9, max_output_tokens=1000)
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = 'Response with kwargs'
+        mock_response.candidates = []
+
+        llm.client = mock_client
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+        await llm.generate(messages)
+
+        # Verify kwargs were passed through
+        call_args = llm.client.models.generate_content.call_args
+        config = call_args[1]['config']
+        assert config.top_p == 0.9
+        assert config.max_output_tokens == 1000
+
+    def test_vertexai_get_message_content(self):
+        """Test get_message_content method."""
+        llm = VertexAI()
+
+        # Test with dict response
+        response = {'content': 'Hello, world!'}
+        result = llm.get_message_content(response)
+        assert result == 'Hello, world!'
+
+        # Test with string response
+        result = llm.get_message_content('Direct string')
+        assert result == 'Direct string'
+
+        # Test with empty content
+        response = {'content': ''}
+        result = llm.get_message_content(response)
+        assert result == ''
+
+    def test_vertexai_format_tool_for_llm(self):
+        """Test format_tool_for_llm method."""
+        llm = VertexAI()
+
+        # Create a mock tool
+        tool = Tool(
+            name='test_tool',
+            description='A test tool',
+            function=lambda x: x,
+            parameters={
+                'param1': {'type': 'string', 'description': 'First parameter'},
+                'param2': {'type': 'integer', 'description': 'Second parameter'},
+            },
+        )
+
+        formatted = llm.format_tool_for_llm(tool)
+
+        assert formatted['name'] == 'test_tool'
+        assert formatted['description'] == 'A test tool'
+        assert formatted['parameters']['type'] == 'object'
+        assert 'param1' in formatted['parameters']['properties']
+        assert 'param2' in formatted['parameters']['properties']
+        assert formatted['parameters']['required'] == ['param1', 'param2']
+
+    def test_vertexai_format_tools_for_llm(self):
+        """Test format_tools_for_llm method."""
+        llm = VertexAI()
+
+        # Create mock tools
+        tool1 = Tool(
+            name='tool1',
+            description='First tool',
+            function=lambda x: x,
+            parameters={'param': {'type': 'string', 'description': 'Parameter'}},
+        )
+
+        tool2 = Tool(
+            name='tool2',
+            description='Second tool',
+            function=lambda x: x,
+            parameters={'param': {'type': 'integer', 'description': 'Parameter'}},
+        )
+
+        formatted = llm.format_tools_for_llm([tool1, tool2])
+
+        assert len(formatted) == 2
+        assert formatted[0]['name'] == 'tool1'
+        assert formatted[1]['name'] == 'tool2'
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_project_handling(self, mock_genai_client):
+        """Test project parameter handling."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        # Test with project
+        llm = VertexAI(project='my-project-123')
+        assert llm.project == 'my-project-123'
+
+        # Test without project
+        mock_genai_client.reset_mock()
+        llm = VertexAI()
+        assert llm.project is None
+
+        # Test with empty string project
+        mock_genai_client.reset_mock()
+        llm = VertexAI(project='')
+        assert llm.project == ''
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_location_handling(self, mock_genai_client):
+        """Test location parameter handling."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        # Test with location
+        llm = VertexAI(location='us-central1')
+        assert llm.location == 'us-central1'
+
+        # Test without location
+        mock_genai_client.reset_mock()
+        llm = VertexAI()
+        assert llm.location is None
+
+        # Test with empty string location
+        mock_genai_client.reset_mock()
+        llm = VertexAI(location='')
+        assert llm.location == ''
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_kwargs_storage(self, mock_genai_client):
+        """Test that additional kwargs are properly stored."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(
+            max_tokens=1000, top_p=0.9, frequency_penalty=0.1, presence_penalty=0.1
+        )
+
+        assert 'max_tokens' in llm.kwargs
+        assert 'top_p' in llm.kwargs
+        assert 'frequency_penalty' in llm.kwargs
+        assert 'presence_penalty' in llm.kwargs
+        assert llm.kwargs['max_tokens'] == 1000
+        assert llm.kwargs['top_p'] == 0.9
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_base_llm_initialization(self, mock_genai_client):
+        """Test that BaseLLM is properly initialized."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(model='test-model', api_key='test-key', temperature=0.5)
+
+        # These should come from BaseLLM
+        assert llm.model == 'test-model'
+        assert llm.api_key == 'test-key'
+        assert llm.temperature == 0.5
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_vertexai_flag(self, mock_genai_client):
+        """Test that vertexai=True is always set in client creation."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        VertexAI()
+
+        # Verify vertexai=True was passed
+        call_args = mock_genai_client.call_args[1]
+        assert call_args['vertexai']
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_parameter_combinations(self, mock_genai_client):
+        """Test various parameter combinations."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        # Test with all parameters
+        llm = VertexAI(
+            model='gemini-1.5-pro',
+            api_key='key123',
+            temperature=0.3,
+            project='proj123',
+            location='us-west1',
+            max_tokens=500,
+            top_p=0.8,
+        )
+
+        assert llm.model == 'gemini-1.5-pro'
+        assert llm.api_key == 'key123'
+        assert llm.temperature == 0.3
+        assert llm.project == 'proj123'
+        assert llm.location == 'us-west1'
+        assert llm.kwargs == {'max_tokens': 500, 'top_p': 0.8}
+
+        # Test with minimal parameters
+        mock_genai_client.reset_mock()
+        llm = VertexAI()
+
+        assert llm.model == 'gemini-2.5-flash'
+        assert llm.api_key is None
+        assert llm.temperature == 0.7
+        assert llm.project is None
+        assert llm.location is None
+        assert llm.kwargs == {}
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_method_inheritance(self, mock_genai_client):
+        """Test that VertexAI inherits all methods from Gemini."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI()
+
+        # Test that VertexAI has all the methods from Gemini
+        assert hasattr(llm, 'generate')
+        assert hasattr(llm, 'get_message_content')
+        assert hasattr(llm, 'format_tool_for_llm')
+        assert hasattr(llm, 'format_tools_for_llm')
+        assert hasattr(llm, 'format_image_in_message')
+
+    @pytest.mark.asyncio
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    async def test_vertexai_generate_error_handling(self, mock_genai_client):
+        """Test error handling in generate method."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(model='gemini-2.5-flash')
+
+        # Mock client to raise an exception
+        llm.client = mock_client
+        llm.client.models.generate_content = Mock(side_effect=Exception('API Error'))
+
+        messages = [{'role': 'user', 'content': 'Hello'}]
+
+        with pytest.raises(Exception, match='Error in Gemini API call: API Error'):
+            await llm.generate(messages)
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_model_parameter_handling(self, mock_genai_client):
+        """Test that model parameter is properly handled."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        test_models = [
+            'gemini-2.5-flash',
+            'gemini-1.5-pro',
+            'gemini-1.5-flash',
+            'gemini-pro',
+        ]
+
+        for model in test_models:
+            mock_genai_client.reset_mock()
+            llm = VertexAI(model=model)
+            assert llm.model == model
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_api_key_handling(self, mock_genai_client):
+        """Test API key handling."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        # Test with API key
+        llm = VertexAI(api_key='secret-key-123')
+        assert llm.api_key == 'secret-key-123'
+
+        # Test without API key
+        mock_genai_client.reset_mock()
+        llm = VertexAI()
+        assert llm.api_key is None
+
+        # Test with empty string API key
+        mock_genai_client.reset_mock()
+        llm = VertexAI(api_key='')
+        assert llm.api_key == ''
+
+    @patch('flo_ai.llm.vertexai_llm.genai.Client')
+    def test_vertexai_generation_config_creation(self, mock_genai_client):
+        """Test that generation config is created correctly."""
+        mock_client = Mock()
+        mock_genai_client.return_value = mock_client
+
+        llm = VertexAI(temperature=0.5, max_output_tokens=1000, top_p=0.9)
+
+        # Mock the client response
+        mock_response = Mock()
+        mock_response.text = 'Test response'
+        mock_response.candidates = []
+
+        llm.client = mock_client
+        llm.client.models.generate_content = Mock(return_value=mock_response)
+
+        # We need to patch the types.GenerateContentConfig to test this
+        with patch('flo_ai.llm.gemini_llm.types.GenerateContentConfig') as mock_config:
+            mock_config_instance = Mock()
+            mock_config.return_value = mock_config_instance
+
+            # This would normally be called in generate method
+            # For testing, we'll just verify the config class exists
+            assert mock_config is not None