diff --git a/libs/agent/agent/core/types.py b/libs/agent/agent/core/types.py
index ef50d09e..fd337062 100644
--- a/libs/agent/agent/core/types.py
+++ b/libs/agent/agent/core/types.py
@@ -23,6 +23,7 @@ class LLMProvider(StrEnum):
     OPENAI = "openai"
     OLLAMA = "ollama"
     OAICOMPAT = "oaicompat"
+    MLXVLM = "mlxvlm"
 
 
 @dataclass
diff --git a/libs/agent/agent/providers/uitars/clients/mlxvlm.py b/libs/agent/agent/providers/uitars/clients/mlxvlm.py
new file mode 100644
index 00000000..f644ce6d
--- /dev/null
+++ b/libs/agent/agent/providers/uitars/clients/mlxvlm.py
@@ -0,0 +1,158 @@
+"""MLX VLM client implementation."""
+
+import logging
+import base64
+import tempfile
+import os
+from typing import Dict, List, Optional, Any, cast
+
+from .base import BaseUITarsClient
+import mlx.core as mx
+from mlx_vlm import load, generate
+from mlx_vlm.prompt_utils import apply_chat_template
+from mlx_vlm.utils import load_config
+from transformers.tokenization_utils import PreTrainedTokenizer
+
+logger = logging.getLogger(__name__)
+
+
+class MLXLMVUITarsClient(BaseUITarsClient):
+    """MLX VLM client implementation class."""
+
+    def __init__(self, api_key: Optional[str] = None, model: str = "mlx-community/UI-TARS-1.5-7B-4bit"):
+        """Initialize MLX VLM client.
+
+        Args:
+            api_key: Optional API key
+            model: Model name or path (defaults to mlx-community/UI-TARS-1.5-7B-4bit)
+        """
+        self.api_key = api_key
+        self.model = model
+
+    async def run_interleaved(
+        self, messages: List[Dict[str, Any]], system: str, max_tokens: Optional[int] = None
+    ) -> Dict[str, Any]:
+        """Run interleaved chat completion.
+
+        Args:
+            messages: List of message dicts
+            system: System prompt
+            max_tokens: Optional max tokens override
+
+        Returns:
+            Response dict
+        """
+        # Extract text and images from messages
+        prompt_parts = []
+        images = []
+
+        # Add system message first
+        prompt_parts.append(system)
+
+        for msg in messages:
+            role = msg.get("role", "user")
+            content = msg.get("content", [])
+
+            # Handle different content formats
+            if isinstance(content, str):
+                # If content is a string, just add it as text
+                prompt_parts.append(f"{role}: {content}")
+            elif isinstance(content, list):
+                # If content is a list, process each item
+                text_parts = []
+
+                for item in content:
+                    if item.get("type") == "text":
+                        text_parts.append(item.get("text", ""))
+                    elif item.get("type") == "image_url":
+                        # Extract image URL and add to images list
+                        image_url = item.get("image_url", {}).get("url", "")
+                        if image_url.startswith("data:image/"):
+                            # Extract base64 data and convert to URL or save as temp file
+                            # For now, we'll just store the URL directly
+                            images.append(image_url)
+
+                # Add text parts to prompt
+                if text_parts:
+                    prompt_parts.append(f"{role}: {''.join(text_parts)}")
+
+        # Combine all text parts into a single prompt
+        combined_prompt = "\n".join(prompt_parts)
+
+        try:
+            # Load model and processor
+            model_obj, processor = load(self.model)
+            config = load_config(self.model)
+
+            # Process images to ensure they're in the right format
+            processed_images = []
+            for img in images:
+                if img.startswith('data:image/'):
+                    # Extract base64 data
+                    img_format = img.split(';')[0].split('/')[1]
+                    base64_data = img.split(',')[1]
+
+                    # Create a temporary file to store the image
+                    with tempfile.NamedTemporaryFile(suffix=f'.{img_format}', delete=False) as temp_file:
+                        temp_file.write(base64.b64decode(base64_data))
+                        processed_images.append(temp_file.name)
+                else:
+                    # Assume it's already a valid URL or path
+                    processed_images.append(img)
+
+            # Format prompt according to model requirements
+            formatted_prompt = apply_chat_template(
+                processor, config, str(combined_prompt), num_images=len(processed_images)
+            )
+
+            # Cast processor to PreTrainedTokenizer to satisfy type checker
+            tokenizer = cast(PreTrainedTokenizer, processor)
+
+            # Generate response; only forward max_tokens when the caller provided
+            # one, so the library default is not overridden with None
+            generate_kwargs = {"max_tokens": max_tokens} if max_tokens is not None else {}
+            output = generate(
+                model_obj,
+                tokenizer,
+                str(formatted_prompt),
+                processed_images,
+                verbose=False,
+                **generate_kwargs
+            )
+
+            # Clean up temporary files
+            for img_path in processed_images:
+                if img_path.startswith(tempfile.gettempdir()) and os.path.exists(img_path):
+                    try:
+                        os.unlink(img_path)
+                    except Exception as e:
+                        logger.warning(f"Failed to delete temporary file {img_path}: {e}")
+        except Exception as e:
+            logger.error(f"Error generating response: {str(e)}")
+            return {
+                "choices": [
+                    {
+                        "message": {
+                            "role": "assistant",
+                            "content": f"Error generating response: {str(e)}"
+                        },
+                        "finish_reason": "error"
+                    }
+                ],
+                "model": self.model,
+                "error": str(e)
+            }
+
+        # Format response to match OpenAI format
+        response = {
+            "choices": [
+                {
+                    "message": {
+                        "role": "assistant",
+                        "content": output
+                    },
+                    "finish_reason": "stop"
+                }
+            ],
+            "model": self.model
+        }
+
+        return response
diff --git a/libs/agent/pyproject.toml b/libs/agent/pyproject.toml
index 1572465b..d3b97112 100644
--- a/libs/agent/pyproject.toml
+++ b/libs/agent/pyproject.toml
@@ -36,6 +36,7 @@ openai = [
 ]
 uitars = [
     "httpx>=0.27.0,<0.29.0",
+    "mlx-vlm>=0.1.25"
 ]
 ui = [
     "gradio>=5.23.3,<6.0.0",
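
Below is a minimal usage sketch of the new client for reviewers. The driver script, message payload, and system prompt are illustrative only (not part of this diff), and it assumes the client can be constructed standalone, as its __init__ suggests:

import asyncio

from agent.providers.uitars.clients.mlxvlm import MLXLMVUITarsClient


async def main():
    client = MLXLMVUITarsClient(model="mlx-community/UI-TARS-1.5-7B-4bit")
    messages = [
        {
            "role": "user",
            "content": [
                {"type": "text", "text": "Click the Submit button."},
                # Screenshot passed as a base64 data URL, matching the branch
                # handled in run_interleaved (truncated here for brevity)
                {"type": "image_url", "image_url": {"url": "data:image/png;base64,..."}},
            ],
        }
    ]
    response = await client.run_interleaved(messages, system="You are a GUI agent.", max_tokens=256)
    print(response["choices"][0]["message"]["content"])


asyncio.run(main())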