Mervin Praison

DevOps

Replit Mintlify Config

Post author By praison
Post date June 3, 2025

# Replit project configuration for serving the Mintlify docs in PraisonAI/docs.
entrypoint = "index.js"
modules = ["nodejs-20"]
hidden = [".config", "package-lock.json"]

[gitHubImport]
requiredFiles = [".replit", "replit.nix", "package.json", "package-lock.json"]

[nix]
channel = "stable-24_05"

[unitTest]
language = "nodejs"

[deployment]
# Start command: change into the docs folder and run the Mintlify dev server,
# bound to all interfaces on port 3000.
# NOTE(review): the build step below installs mintlify with a local `npm install`;
# confirm the `mintlify` binary is on PATH at run time (otherwise `npx mintlify` is needed).
run = [
  "sh",
  "-c",
  "cd PraisonAI/docs && mintlify dev --host 0.0.0.0 --port 3000",
]
deploymentTarget = "gce"
ignorePorts = false
# Build command: install the mintlify package inside the docs folder.
build = ["sh", "-c", "cd PraisonAI/docs && npm install mintlify"]

# Map the dev server's local port 3000 to external port 80.
[[ports]]
localPort = 3000
externalPort = 80

Voice

Chatterbox TTS Gradio for Mac

Post author By praison
Post date June 3, 2025

import random
import numpy as np
import torch
import gradio as gr
from chatterbox.tts import ChatterboxTTS

# Choose the compute backend: "mps" when PyTorch reports the Metal backend as
# available (Apple-silicon Macs), plain "cpu" otherwise.
if torch.backends.mps.is_available():
    device = "mps"
else:
    device = "cpu"
map_location = torch.device(device)

# Keep a handle on the real loader before it is swapped out below.
torch_load_original = torch.load


def patched_torch_load(*args, **kwargs):
    """Delegate to the original ``torch.load`` with a default ``map_location``.

    When the caller does not pass a ``map_location`` keyword, the detected
    device is used; an explicit keyword is forwarded unchanged.
    """
    kwargs.setdefault('map_location', map_location)
    return torch_load_original(*args, **kwargs)


# From here on every torch.load call goes through the wrapper above.
torch.load = patched_torch_load

DEVICE = device


def set_seed(seed: int):
    """Seed every random number generator this script touches with ``seed``.

    The seeders are called in this order: PyTorch's default generator, the
    current CUDA generator, all CUDA generators, Python's ``random`` module,
    and NumPy's global generator.
    """
    seeders = (
        torch.manual_seed,
        torch.cuda.manual_seed,
        torch.cuda.manual_seed_all,
        random.seed,
        np.random.seed,
    )
    for apply_seed in seeders:
        apply_seed(seed)


def load_model():
    # Build the pretrained Chatterbox TTS model on DEVICE and hand it straight back.
    return ChatterboxTTS.from_pretrained(DEVICE)


def generate(model, text, audio_prompt_path, exaggeration, temperature, seed_num, cfgw):
    """Synthesize speech for ``text`` and return it as ``(sample_rate, samples)``.

    Args:
        model: A loaded ``ChatterboxTTS`` instance, or ``None`` to load one on demand.
        text: The text to synthesize.
        audio_prompt_path: Path of a reference audio file, or ``None``.
        exaggeration: Forwarded to ``model.generate`` as ``exaggeration``.
        temperature: Forwarded to ``model.generate`` as ``temperature``.
        seed_num: Random seed. ``0`` or ``None`` (an emptied number field)
            leaves the random generators unseeded.
        cfgw: Forwarded to ``model.generate`` as ``cfg_weight``.

    Returns:
        A tuple of the model's sample rate (``model.sr``) and the generated
        waveform as a NumPy array with the leading dimension squeezed out.
    """
    if model is None:
        model = ChatterboxTTS.from_pretrained(DEVICE)

    # A cleared Gradio number field is delivered as None; treat it like 0
    # ("random") instead of crashing on int(None).
    if seed_num:
        set_seed(int(seed_num))

    wav = model.generate(
        text,
        audio_prompt_path=audio_prompt_path,
        exaggeration=exaggeration,
        temperature=temperature,
        cfg_weight=cfgw,
    )
    # Tensor.numpy() only works for CPU tensors that do not track gradients,
    # so detach and move to CPU first (both are no-ops when already satisfied).
    return (model.sr, wav.squeeze(0).detach().cpu().numpy())


# Gradio UI: inputs on the left, generated audio on the right.
with gr.Blocks() as demo:
    model_state = gr.State(None)  # Loaded once per session/user

    with gr.Row():
        with gr.Column():
            # NOTE(review): the label mentions a 300-character limit, but nothing
            # in this block enforces it — confirm whether a limit is intended.
            text = gr.Textbox(
                value="Now let's make my mum's favourite. So three mars bars into the pan. Then we add the tuna and just stir for a bit, just let the chocolate and fish infuse. A sprinkle of olive oil and some tomato ketchup. Now smell that. Oh boy this is going to be incredible.",
                label="Text to synthesize (max chars 300)",
                max_lines=5
            )
            ref_wav = gr.Audio(sources=["upload", "microphone"], type="filepath", label="Reference Audio File", value=None)
            exaggeration = gr.Slider(0.25, 2, step=.05, label="Exaggeration (Neutral = 0.5, extreme values can be unstable)", value=.5)
            cfg_weight = gr.Slider(0.0, 1, step=.05, label="CFG/Pace", value=0.5)

            with gr.Accordion("More options", open=False):
                seed_num = gr.Number(value=0, label="Random seed (0 for random)")
                temp = gr.Slider(0.05, 5, step=.05, label="temperature", value=.8)

            run_btn = gr.Button("Generate", variant="primary")

        with gr.Column():
            audio_output = gr.Audio(label="Output Audio")

    # On page load, call load_model and store its result in model_state.
    demo.load(fn=load_model, inputs=[], outputs=model_state)

    # The inputs list is positional: it must follow generate()'s parameter order
    # (model, text, audio_prompt_path, exaggeration, temperature, seed_num, cfgw).
    run_btn.click(
        fn=generate,
        inputs=[
            model_state,
            text,
            ref_wav,
            exaggeration,
            temp,
            seed_num,
            cfg_weight,
        ],
        outputs=audio_output,
    )

if __name__ == "__main__":
    # Queue requests (at most 50 waiting, default concurrency limit of 1) and
    # launch with share=True.
    demo.queue(
        max_size=50,
        default_concurrency_limit=1,
    ).launch(share=True)

AI Agents

Microsoft Magentic UI Install

Post author By praison
Post date May 26, 2025

ollama pull qwen3
pip install "magentic-ui[ollama]"
magentic ui --port 8081

YAML Config

# Shared model-client definition; the &client anchor lets the agent entries
# further down reuse it through *client aliases.
model_config: &client
  provider: autogen_ext.models.ollama.OllamaChatCompletionClient
  config:
    model: "qwen3" # change to your desired Ollama model
    host: "http://localhost:11434" # change to your Ollama host
    model_info: # change per model you use
      vision: true
      function_calling: true # will work if false, but not fully
      json_output: false # preferably true
      family: unknown
      structured_output: false
  max_retries: 5

# Note you can define multiple model clients and use them for different agents
# You can also use the OpenAI client instead and access Ollama models
#model_config: &client
#  provider: OpenAIChatCompletionClient
#  config:
#    model: "qwen2.5vl:32b"
#    base_url: "http://localhost:11434/v1" # change to your ollama host
#    model_info: # change per model
#       vision: true 
#       function_calling: true # required true for file_surfer, but will still work if file_surfer is not needed
#       json_output: false
#       family: unknown
#       structured_output: false
#  max_retries: 5

orchestrator_client: *client
coder_client: *client
web_surfer_client: *client
file_surfer_client: *client
action_guard_client: *client

Requirements

https://ollama.com

https://docker.com

AI Agents

Google ADK Agents

Post author By praison
Post date May 20, 2025

└── app
    ├── __init__.py
    ├── .env
    └── agent.py

agent.py

# 1. Basic Agent
from google.adk.agents import Agent

basic_agent = Agent(
    name="basic_agent",
    model="gemini-2.0-flash",
    description="A simple agent that answers questions",
    instruction="""
    You are a helpful stock market assistant. Be concise.
    If you don't know something, just say so.
    """,
)


# 2. Basic Agent with Tool
from google.adk.agents import Agent
import yfinance as yf

def get_stock_price(ticker: str):
    """Look up the current market price of a stock.

    Args:
        ticker: Stock ticker symbol, for example "AAPL".

    Returns:
        A dict with the keys "price" (the current price, or the string
        "Price not available" when no price is reported) and "ticker"
        (the symbol that was requested).
    """
    # The docstring above doubles as the tool description the agent framework
    # shows to the model, so it describes the inputs and the result shape.
    stock = yf.Ticker(ticker)
    price = stock.info.get("currentPrice", "Price not available")
    return {"price": price, "ticker": ticker}

tool_agent = Agent(
    name="tool_agent",
    model="gemini-2.0-flash",
    description="A simple agent that gets stock prices",
    instruction="""
    You are a stock price assistant. Always use the get_stock_price tool.
    Include the ticker symbol in your response.
    """,
    tools=[get_stock_price],
)


# 3. Agent with State
from google.adk.agents import Agent
from google.adk.tools.tool_context import ToolContext
import yfinance as yf

def get_stock_price(ticker: str, tool_context: ToolContext):
    """Look up the current market price of a stock and remember the search.

    Args:
        ticker: Stock ticker symbol, for example "AAPL".

    Returns:
        A dict with the keys "price" (the current price, or the string
        "Price not available" when no price is reported) and "ticker"
        (the symbol that was requested).
    """
    # tool_context is supplied by the framework rather than by the model, so it
    # is deliberately left out of the docstring that serves as the tool description.
    stock = yf.Ticker(ticker)
    price = stock.info.get("currentPrice", "Price not available")

    # Start with an empty history the first time the tool runs in this session.
    if "recent_searches" not in tool_context.state:
        tool_context.state["recent_searches"] = []

    # Record each ticker once, then write the list back so the update is
    # stored through an explicit state assignment.
    recent_searches = tool_context.state["recent_searches"]
    if ticker not in recent_searches:
        recent_searches.append(ticker)
        tool_context.state["recent_searches"] = recent_searches

    return {"price": price, "ticker": ticker}

stateful_agent = Agent(
    name="stateful_agent",
    model="gemini-2.0-flash",
    description="An agent that remembers recent searches",
    instruction="""
    You are a stock price assistant. Use the get_stock_price tool.
    I'll remember your previous searches and can tell you about them if you ask.
    """,
    tools=[get_stock_price],
)


# 4. Multi-Tool Agent
from google.adk.agents import Agent
from google.adk.tools.tool_context import ToolContext
import yfinance as yf

def get_stock_price(ticker: str, tool_context: ToolContext):
    """Look up the current market price of a stock and remember the search.

    Args:
        ticker: Stock ticker symbol, for example "AAPL".

    Returns:
        A dict with the keys "price" (the current price, or the string
        "Price not available" when no price is reported) and "ticker"
        (the symbol that was requested).
    """
    # tool_context is supplied by the framework rather than by the model, so it
    # is deliberately left out of the docstring that serves as the tool description.
    stock = yf.Ticker(ticker)
    price = stock.info.get("currentPrice", "Price not available")

    # Start with an empty history the first time the tool runs in this session.
    if "recent_searches" not in tool_context.state:
        tool_context.state["recent_searches"] = []

    # Record each ticker once, then write the list back so the update is
    # stored through an explicit state assignment.
    recent_searches = tool_context.state["recent_searches"]
    if ticker not in recent_searches:
        recent_searches.append(ticker)
        tool_context.state["recent_searches"] = recent_searches

    return {"price": price, "ticker": ticker}

def get_stock_info(ticker: str):
    """Look up the company name and sector for a stock.

    Args:
        ticker: Stock ticker symbol, for example "AAPL".

    Returns:
        A dict with the keys "ticker" (the symbol that was requested),
        "company_name" (or "Name not available") and "sector"
        (or "Sector not available").
    """
    # The docstring above doubles as the tool description the agent framework
    # shows to the model, so it describes the inputs and the result shape.
    stock = yf.Ticker(ticker)
    company_name = stock.info.get("shortName", "Name not available")
    sector = stock.info.get("sector", "Sector not available")
    return {
        "ticker": ticker,
        "company_name": company_name,
        "sector": sector,
    }

multi_tool_agent = Agent(
    name="multi_tool_agent",
    model="gemini-2.0-flash",
    description="An agent with multiple stock information tools",
    instruction="""
    You are a stock information assistant. You have two tools:
    - get_stock_price: For prices
    - get_stock_info: For company name and sector
    """,
    tools=[get_stock_price, get_stock_info],
)


# 5. Structured Output Agent
from google.adk.agents import LlmAgent
from pydantic import BaseModel, Field
import yfinance as yf

# Response schema for the structured agent; it is passed as output_schema to the
# LlmAgent defined later in this section. Documented with comments rather than a
# class docstring so the generated schema is left exactly as it was.
class StockAnalysis(BaseModel):
    # Ticker symbol the recommendation applies to.
    ticker: str = Field(description="Stock symbol")
    # The advice itself; the field description asks for "Buy" or "Sell".
    recommendation: str = Field(description="Buy or Sell recommendation")

# Define a function to get stock data for our prompt
def get_stock_data_for_prompt(ticker):
    """Return ``(current_price, target_mean_price)`` for ``ticker``.

    Each value falls back to ``0`` when the corresponding entry
    ("currentPrice" / "targetMeanPrice") is missing from the ticker info.
    """
    quote = yf.Ticker(ticker)
    current = quote.info.get("currentPrice", 0)
    target = quote.info.get("targetMeanPrice", 0)
    return (current, target)

# Agent that must answer in the StockAnalysis shape; the parsed result is stored
# under the "stock_analysis" output key.
# NOTE(review): no tools are attached here and get_stock_data_for_prompt is not
# called anywhere in the visible code, so the prices the instruction refers to
# are not actually supplied to the model — confirm how they are meant to arrive.
structured_agent = LlmAgent(
    name="structured_agent",
    model="gemini-2.0-flash",
    description="An agent with structured output",
    instruction="""
    You are a stock advisor. Analyze the stock ticker provided by the user.
    Return Buy or Sell recommendation in JSON format.
    
    For each ticker, look at the price and target price to make a decision.
    If target price > current price: recommend Buy
    Otherwise: recommend Sell
    """,
    output_schema=StockAnalysis,
    output_key="stock_analysis"
)


# 6. Callback Agent
from google.adk.agents import Agent
from google.adk.tools.tool_context import ToolContext
from google.adk.tools.base_tool import BaseTool
import yfinance as yf
from typing import Dict, Any, Optional

def get_stock_data(ticker: str, tool_context: ToolContext):
    """Look up the current market price of a stock.

    Args:
        ticker: Stock ticker symbol, for example "AAPL".

    Returns:
        A dict with the keys "ticker" (the symbol that was requested) and
        "price" (the current price, or 0 when no price is reported).
    """
    # tool_context is supplied by the framework rather than by the model, so it
    # is deliberately left out of the docstring that serves as the tool description.
    stock = yf.Ticker(ticker)
    price = stock.info.get("currentPrice", 0)

    # Make sure the usage counter exists in state even if no callback created it.
    if "tool_usage" not in tool_context.state:
        tool_context.state["tool_usage"] = {}

    return {
        "ticker": ticker,
        "price": price,
    }

def before_tool_callback(tool: BaseTool, args: Dict[str, Any], tool_context: ToolContext) -> Optional[Dict]:
    """Count and log a tool invocation before the tool runs.

    Increments the per-tool counter kept under ``state["tool_usage"]`` (creating
    the mapping if needed), prints a log line, and returns ``None``.
    """
    state = tool_context.state
    if "tool_usage" not in state:
        state["tool_usage"] = {}

    # Bump this tool's counter and write the mapping back into state.
    counts = state["tool_usage"]
    name = tool.name
    previous = counts.get(name, 0)
    counts[name] = previous + 1
    state["tool_usage"] = counts

    print(f"[LOG] Running tool: {name}")
    return None

def after_tool_callback(tool: BaseTool, args: Dict[str, Any], tool_context: ToolContext, tool_response: Dict) -> Optional[Dict]:
    """Print a log line once a tool has finished and return ``None``."""
    finished_tool = tool.name
    print(f"[LOG] Tool {finished_tool} completed")
    return None

# Initialize state before creating the agent
# NOTE(review): initial_state is not passed to the Agent(...) call below or used
# anywhere else in the visible code — confirm whether it is still needed.
initial_state = {"tool_usage": {}}

# Agent whose single tool is wrapped by the before/after tool callbacks.
callback_agent = Agent(
    name="callback_agent",
    model="gemini-2.0-flash",
    description="An agent with callbacks",
    instruction="""
    You are a stock assistant. Use get_stock_data tool to check stock prices.
    This agent keeps track of how many times tools have been used.
    """,
    tools=[get_stock_data],
    before_tool_callback=before_tool_callback,
    after_tool_callback=after_tool_callback,
)

# Choose which agent to run
# Rebind root_agent to any of the agents defined in this file to try it out;
# presumably this is the name the `adk` commands look up — confirm against the ADK docs.
root_agent = multi_tool_agent

.env

GOOGLE_API_KEY=xxxxxx
GOOGLE_GENAI_USE_VERTEXAI=FALSE

__init__.py

# Expose the agent module (agent.py, which defines root_agent) from the package.
# The package directory itself is named "app", so there is no "app" submodule to import.
from . import agent

Commands

adk run app
adk web

MCP

Cursor + Playwright MCP

Post author By praison
Post date May 7, 2025

{
  "mcpServers": {
    "playwright": {
      "command": "npx",
      "args": [
        "-y",
        "@playwright/mcp@0.0.22",
        "--vision"
      ]
    }
  }
}

Python

FastAPI Time Function

Post author By praison
Post date April 7, 2025

from fastapi import FastAPI
from pydantic import BaseModel
from datetime import datetime
import pytz
import uvicorn
import threading

class TimeRequest(BaseModel):
    location: str

class MyTime:
    """Report the current time for a timezone and optionally serve it over HTTP.

    On construction the current time for ``location`` is computed, stored in
    ``time_str`` and printed. When both ``host`` and ``port`` are given, a
    FastAPI server exposing the lookup is started in a daemon thread.
    """

    def __init__(self, location: str, host: str = None, port: int = None, route: str = "/time"):
        """Compute and print the time for ``location``; optionally start the server.

        Args:
            location: Timezone name passed to ``pytz.timezone`` (e.g. "Asia/Kolkata").
            host: Interface for the HTTP server; no server is started if falsy.
            port: Port for the HTTP server; no server is started if falsy.
            route: URL path of the POST endpoint.
        """
        self.location = location
        self.route = route
        self.time_str = self._get_time_by_location()
        print(f"[MyTime] {self.location}: {self.time_str}")

        if host and port:
            # daemon=True: the server thread does not keep the process alive on
            # its own, so the caller has to keep the main thread running.
            threading.Thread(
                target=self._start_fastapi_server,
                args=(host, port, route),
                daemon=True
            ).start()

    def _get_time_by_location(self, loc: str = None) -> str:
        """Return the current time in ``loc`` formatted as ``YYYY-MM-DD HH:MM:SS``.

        Falls back to ``self.location`` when ``loc`` is falsy. An unknown
        timezone name yields the string ``"Unknown timezone: <loc>"`` instead
        of raising.
        """
        loc = loc or self.location
        try:
            timezone = pytz.timezone(loc)
            local_time = datetime.now(timezone)
            return local_time.strftime('%Y-%m-%d %H:%M:%S')
        except pytz.UnknownTimeZoneError:
            return f"Unknown timezone: {loc}"

    def _start_fastapi_server(self, host, port, route):
        """Build a FastAPI app with one POST endpoint at ``route`` and run it with uvicorn."""
        app = FastAPI()

        # Endpoint: takes a TimeRequest body and answers {"time": <formatted time>}
        # for the requested location.
        @app.post(route)
        async def get_time(req: TimeRequest):
            return {"time": self._get_time_by_location(req.location)}

        uvicorn.run(app, host=host, port=port, log_level="info")

# Example usage
if __name__ == "__main__":
    MyTime("Asia/Kolkata", host="0.0.0.0", port=7860, route="/time")

    # The API server runs in a daemon thread, which is killed as soon as the
    # main thread returns. Block here so the endpoint stays reachable until
    # the user presses Ctrl+C.
    try:
        threading.Event().wait()
    except KeyboardInterrupt:
        pass

curl -X POST http://localhost:7860/time \
     -H "Content-Type: application/json" \
     -d '{"location": "Europe/London"}'

Praison AI

Llama 4 Agents

Post author By praison
Post date April 6, 2025

export GROQ_API_KEY=xxxxxxx
export BRAVE_API_KEY=xxxxxxx

pip install -U "praisonaiagents[llm,mcp]" gradio

from praisonaiagents import Agent, Agents, MCP
import os

# Read the Brave Search key from the environment (None when the variable is unset).
brave_api_key = os.getenv("BRAVE_API_KEY")

# The four agents below differ only in their instructions: each uses the same
# Groq-hosted Llama 4 Scout model and the same Brave Search MCP server as its tool.

# Travel Research Agent
research_agent = Agent(
    instructions="Research about travel destinations, attractions, local customs, and travel requirements",
    llm="groq/meta-llama/llama-4-scout-17b-16e-instruct",
    tools=MCP("npx -y @modelcontextprotocol/server-brave-search", env={"BRAVE_API_KEY": brave_api_key})
)

# Flight Booking Agent
flight_agent = Agent(
    instructions="Search for available flights, compare prices, and recommend optimal flight choices",
    llm="groq/meta-llama/llama-4-scout-17b-16e-instruct",
    tools=MCP("npx -y @modelcontextprotocol/server-brave-search", env={"BRAVE_API_KEY": brave_api_key})
)

# Accommodation Agent
hotel_agent = Agent(
    instructions="Research hotels and accommodation based on budget and preferences",
    llm="groq/meta-llama/llama-4-scout-17b-16e-instruct",
    tools=MCP("npx -y @modelcontextprotocol/server-brave-search", env={"BRAVE_API_KEY": brave_api_key})
)

# Itinerary Planning Agent
planning_agent = Agent(
    instructions="Design detailed day-by-day travel plans incorporating activities, transport, and rest time",
    llm="groq/meta-llama/llama-4-scout-17b-16e-instruct",
    tools=MCP("npx -y @modelcontextprotocol/server-brave-search", env={"BRAVE_API_KEY": brave_api_key})
)

# Example usage - research travel destinations
destination = "London, UK"
dates = "August 15-22, 2025"
budget = "Mid-range (£1000-£1500)"
preferences = "Historical sites, local cuisine, avoiding crowded tourist traps"
travel_query = f"What are the best attractions to visit in {destination} during {dates} on a budget of {budget} with preferences of {preferences}?"
# Group the four agents into one team and hand the query to it.
agents = Agents(agents=[research_agent, flight_agent, hotel_agent, planning_agent])

result = agents.start(travel_query)
print(f"\n=== DESTINATION RESEARCH: {destination} ===\n")
print(result)

from praisonaiagents import Agent, Agents, MCP
import os
from rich import print
import gradio as gr

brave_api_key = os.getenv("BRAVE_API_KEY")

# Travel Research Agent
research_agent = Agent(
    instructions="Research about travel destinations, attractions, local customs, and travel requirements",
    llm="groq/meta-llama/llama-4-scout-17b-16e-instruct",
    tools=MCP("npx -y @modelcontextprotocol/server-brave-search", env={"BRAVE_API_KEY": brave_api_key})
)

# Flight Booking Agent
flight_agent = Agent(
    instructions="Search for available flights, compare prices, and recommend optimal flight choices",
    llm="groq/meta-llama/llama-4-scout-17b-16e-instruct",
    tools=MCP("npx -y @modelcontextprotocol/server-brave-search", env={"BRAVE_API_KEY": brave_api_key})
)

# Accommodation Agent
hotel_agent = Agent(
    instructions="Research hotels and accommodation based on budget and preferences",
    llm="groq/meta-llama/llama-4-scout-17b-16e-instruct",
    tools=MCP("npx -y @modelcontextprotocol/server-brave-search", env={"BRAVE_API_KEY": brave_api_key})
)

# Itinerary Planning Agent
itinerary_agent = Agent(
    instructions="Design detailed day-by-day travel plans incorporating activities, transport, and rest time",
    llm="groq/meta-llama/llama-4-scout-17b-16e-instruct",
    tools=MCP("npx -y @modelcontextprotocol/server-brave-search", env={"BRAVE_API_KEY": brave_api_key})
)

def generate_travel_plan(destination, dates, budget, preferences):
    """Generate a travel plan using the AI agents"""

    # Prompt for the agent team, spelled out line by line so the exact
    # whitespace that is sent is visible.
    travel_query = (
        f"Create a comprehensive travel plan for {destination} during {dates}.\n"
        f"    Budget: {budget}\n"
        f"    Preferences: {preferences}\n"
        "    \n"
        "    Include:\n"
        "    1. Information about the destination\n"
        "    2. Flight recommendations\n"
        "    3. Hotel options\n"
        "    4. A day-by-day itinerary\n"
        "    "
    )

    # Team of the four module-level agents.
    team = Agents(agents=[research_agent, flight_agent, hotel_agent, itinerary_agent])

    try:
        result = team.start(travel_query)

        # Header with the request details, followed by the agents' answer.
        return (
            f"\n=== TRAVEL PLAN: {destination} ===\n"
            "\n"
            f"Dates: {dates}\n"
            f"Budget: {budget}\n"
            f"Preferences: {preferences}\n"
            "\n"
            f"{result}\n"
        )
    except Exception as e:
        # Surface the failure in the UI as text instead of raising.
        return f"Error generating travel plan: {str(e)}"

# Create the Gradio interface
with gr.Blocks(title="AI Travel Agency", theme="soft") as demo:
    gr.Markdown("# 🌍 AI Travel Agency")
    gr.Markdown("Plan your perfect trip with our AI agents")
    
    with gr.Row():
        with gr.Column(scale=1):
            destination = gr.Textbox(label="Destination", placeholder="London, UK", value="London, UK")
            dates = gr.Textbox(label="Travel Dates", placeholder="August 15-22, 2024", value="August 15-22, 2024")
            budget = gr.Textbox(label="Budget", placeholder="Mid-range (£1000-£1500)", value="Mid-range (£1000-£1500)")
            preferences = gr.Textbox(
                label="Travel Preferences", 
                placeholder="Historical sites, local cuisine, avoiding crowded tourist traps",
                value="Historical sites, local cuisine, avoiding crowded tourist traps"
            )
            submit_btn = gr.Button("Generate Travel Plan 🚀", variant="primary")
        
        with gr.Column(scale=2):
            output = gr.Markdown(label="Your Travel Plan")
    
    submit_btn.click(
        generate_travel_plan,
        inputs=[destination, dates, budget, preferences],
        outputs=output
    )
    
    gr.Markdown("### How to use")
    gr.Markdown("""
    1. Enter your destination
    2. Specify your travel dates
    3. Indicate your budget range
    4. Share your travel preferences
    5. Click 'Generate Travel Plan'
    
    *Note: Generation may take a minute or two as our AI agents research your perfect trip.*
    """)

# Launch the Gradio web interface when the script is run directly
if __name__ == "__main__":
    demo.launch()

    # Example CLI usage: to run the agents once from the terminal, replace the
    # demo.launch() call above with the lines below.
    #
    # destination = "London, UK"
    # dates = "August 15-22, 2025"
    # budget = "Mid-range (£1000-£1500)"
    # preferences = "Historical sites, local cuisine, avoiding crowded tourist traps"
    #
    # travel_query = f"What are the best attractions to visit in {destination} during {dates} on a budget of {budget} with preferences of {preferences}?"
    # agents = Agents(agents=[research_agent, flight_agent, hotel_agent, itinerary_agent])
    # result = agents.start(travel_query)
    # print(f"\n=== DESTINATION RESEARCH: {destination} ===\n")
    # print(result)

Tools

MCP Server SSE URL

Post author By praison
Post date April 4, 2025

Model Context Protocol (MCP) server SSE URL

from mcp.server.fastmcp import FastMCP
import yfinance as yf
from starlette.applications import Starlette
from starlette.routing import Mount
import uvicorn
import logging

# Set up logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# Create FastMCP server
mcp = FastMCP("Stock Price Server")

@mcp.tool()
def get_stock_price(ticker: str) -> str:
    """Get the current stock price for a given ticker symbol"""
    # The docstring is left untouched on purpose: the MCP server publishes it
    # as the tool's description. Returns the latest closing price as a string,
    # or a message starting with "Error getting stock price:" on failure.
    try:
        logger.info("Fetching stock price for ticker: %s", ticker)
        closes = yf.Ticker(ticker).history(period="1d")["Close"]
        if closes.empty:
            # No rows came back for the ticker; say so explicitly instead of
            # letting iloc[-1] fail with an opaque out-of-bounds error.
            logger.error("No price data returned for %s", ticker)
            return f"Error getting stock price: no price data found for {ticker}"
        price = str(closes.iloc[-1])
        logger.info("Price for %s: %s", ticker, price)
        return price
    except Exception as e:
        # Tool boundary: report the failure to the client as text and keep the
        # traceback in the server log.
        logger.exception("Error getting stock price for %s: %s", ticker, e)
        return f"Error getting stock price: {str(e)}"

# Create a Starlette application with the SSE endpoint
app = Starlette(routes=[
    # Mount the SSE app directly at the root
    Mount("/", app=mcp.sse_app()),
])

if __name__ == "__main__":
    logger.info("Starting Uvicorn server...")
    uvicorn.run(app, host="127.0.0.1", port=8000)

Config

{
  "mcpServers": {
    "stock-price": {
      "serverUrl": "http://127.0.0.1:8000/sse"
    }
  }
}

Tools

MCP Beginners Guide

Post author By praison
Post date March 18, 2025

pip install "mcp[cli]" yfinance

import yfinance as yf
from mcp.server.fastmcp import FastMCP

mcp = FastMCP("stock_prices")

@mcp.tool()
async def get_stock_price(ticker: str) -> str:
    """Get the current stock price for a given ticker symbol.
    
    Args:
        ticker: Stock ticker symbol (e.g., AAPL, MSFT, GOOG)
        
    Returns:
        Current stock price as a string
    """
    # The docstring above is kept verbatim because it is part of what the tool exposes.
    try:
        details = yf.Ticker(ticker).info
        # Prefer "currentPrice"; fall back to "regularMarketPrice" when it is missing or falsy.
        current_price = details.get('currentPrice')
        if not current_price:
            current_price = details.get('regularMarketPrice')
        if current_price:
            return f"${current_price:.2f}"
        return f"Could not retrieve price for {ticker}"
    except Exception as e:
        return f"Error: {str(e)}"

if __name__ == "__main__":
    mcp.run(transport='stdio')

{
  "mcpServers": {
    "stock_prices": {
      "command": "/Users/praison/miniconda3/envs/mcp/bin/python",
      "args": [
        "/Users/praison/stockprice/app.py"
      ]
    }
  }
}

With Other Providers

{
  "mcpServers": {
    "stock_prices": {
      "command": "/Users/praison/miniconda3/envs/mcp/bin/python",
      "args": [
        "/Users/praison/stockprice/app.py"
      ]
    },
    "neon": {
      "command": "npx",
      "args": [
        "-y",
        "@smithery/cli@latest",
        "run",
        "neon",
        "--config",
        "\"{\\\"apiKey\\\":\\\"YOUR_NEON_API_KEY\\\"}\""
      ]
    }
  }
}

OpenAI

OpenAI Response API Basics

Post author By praison
Post date March 15, 2025

pip install -U openai geopy gradio rich
export OPENAI_API_KEY=xxxxxxxx

Basic

from openai import OpenAI
client = OpenAI()

response = client.responses.create(
    model="gpt-4o",
    input="Write a one-sentence bedtime story about a unicorn."
)

print(response.output_text)

UI

import gradio as gr
from openai import OpenAI

client = OpenAI()

def ask_ai(question):
    # Send the question to the Responses API and return only the reply's text.
    reply = client.responses.create(model="gpt-4o", input=question)
    return reply.output_text

demo = gr.Interface(
    fn=ask_ai,
    inputs="text",
    outputs="text",
    title="AI Assistant"
)

if __name__ == "__main__":
    demo.launch()

Tools

from openai import OpenAI
client = OpenAI()

response = client.responses.create(
    model="gpt-4o",
    tools=[{"type": "web_search_preview"}],
    input="Give me two AI news story from today in 2 sentence."
)

print(response.output_text)

RAG

from openai import OpenAI
from rich import print
client = OpenAI()

response = client.responses.create(
    model="gpt-4o-mini",
    input="Tell me about GraphRAG",
    tools=[{
        "type": "file_search",
        "vector_store_ids": ["vs_67d08c2b03asdf"]
    }]
)
print(response)

Custom Tools

from openai import OpenAI
import requests
import json
from rich import print
from geopy.geocoders import Nominatim

client = OpenAI()

# 1. Create Custom Tool
def get_weather(location):
    """Return the current ``temperature_2m`` reading for ``location``.

    The location name is geocoded with Nominatim and the resulting coordinates
    are sent to the Open-Meteo forecast API.

    Args:
        location: Free-text place name, e.g. "Paris, France".

    Returns:
        The value of ``current.temperature_2m`` from the Open-Meteo response.
        When the place cannot be geocoded, coordinates (0, 0) are used.
    """
    geolocator = Nominatim(user_agent="weather_app")
    location_data = geolocator.geocode(location)
    # The conditional has to wrap the whole coordinate pair. Without the
    # parentheses it applied only to the longitude, so a failed geocode
    # (location_data is None) crashed on location_data.latitude.
    latitude, longitude = (
        (location_data.latitude, location_data.longitude) if location_data else (0, 0)
    )
    # A timeout keeps a stalled connection from hanging the script forever.
    response = requests.get(
        f"https://api.open-meteo.com/v1/forecast?latitude={latitude}&longitude={longitude}&current=temperature_2m,wind_speed_10m&hourly=temperature_2m,relative_humidity_2m,wind_speed_10m",
        timeout=30,
    )
    data = response.json()
    return data['current']['temperature_2m']

# 2. Create Custom Tool Definition
tools = [{
    "type": "function",
    "name": "get_weather",
    "description": "Get current temperature for a given location.",
    "parameters": {
        "type": "object",
        "properties": {
            "location": {
                "type": "string",
                "description": "City and country e.g. Bogotá, Colombia"
            }
        },
        "required": [
            "location"
        ],
        "additionalProperties": False
    }
}]

# 3. Ask Question to the model
input_messages = [{"role": "user", "content": "What is the weather like in Paris today?"}]
response = client.responses.create(
    model="gpt-4o",
    input=input_messages,
    tools=tools
)
print(f"Response: {response.output}")

# 4. Parse the model's response & Run the Tool
# Select the function-call item by type rather than by position, so any other
# output item that precedes it does not break the argument parsing.
tool_call = next(item for item in response.output if item.type == "function_call")
args = json.loads(tool_call.arguments)
result = get_weather(args["location"])
print(f"Result: {result}")

# 5. Append the result to the input messages
input_messages.append(tool_call)  
input_messages.append({           
    "type": "function_call_output",
    "call_id": tool_call.call_id,
    "output": str(result)
})

# 6. Ask the model again with original question and the response from the tool
response_2 = client.responses.create(
    model="gpt-4o",
    input=input_messages,
    tools=tools,
)
print(f"Response 2: {response_2.output_text}")

Stream

from openai import OpenAI
client = OpenAI()

# Request a streamed response: the call returns an iterable of events instead
# of one finished response object.
stream = client.responses.create(
    model="gpt-4o-mini",
    input=[
        {
            "role": "user",
            "content": "Write a 1000 words bedtime story about a unicorn.",
        },
    ],
    stream=True,
)

# Print only the text chunks. Matching on the event type (instead of "has a
# delta attribute") keeps other delta-carrying event kinds out of the output.
# flush=True makes each chunk appear immediately even though no newline is written.
for event in stream:
    if event.type == "response.output_text.delta":
        print(event.delta, end="", flush=True)

# Finish the streamed text with a newline.
print()

LM Studio Upcoming update

from openai import OpenAI
client = OpenAI(base_url="http://localhost:1234/v1", api_key="fake-key")

response = client.responses.create(
    model="gemma3",
    input="Write a one-sentence bedtime story about a unicorn."
)

print(response)