LangChain Agents - Build Production AI Agents with LangChain & LangGraph

Introduction to LangChain

LangChain is a powerful framework for building applications with large language models. It provides abstractions for chains, agents, tools, and memory, making it easier to create sophisticated AI systems.

Chains

Compose LLMs with other components in sequences

Agents

LLMs that can use tools and make decisions

Memory

Persist state between chain/agent calls

Tools

Functions agents can use to interact with the world

Retrievers

Interface with vector stores and databases

Callbacks

Hook into various stages of execution

Building Your First LangChain Agent

Installation & Setup

# Install LangChain and dependencies
pip install langchain langchain-openai langchain-community
pip install langchain-experimental langchainhub
pip install chromadb tiktoken

# For LangGraph (advanced agents)
pip install langgraph

# Environment setup
import os
os.environ["OPENAI_API_KEY"] = "your-api-key"
os.environ["LANGCHAIN_TRACING_V2"] = "true"  # Enable tracing
os.environ["LANGCHAIN_API_KEY"] = "your-langsmith-key"

Basic Agent with Tools

from langchain.agents import create_openai_functions_agent, AgentExecutor
from langchain_openai import ChatOpenAI
from langchain.tools import Tool, tool
from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
from langchain_community.tools import DuckDuckGoSearchRun
from langchain.tools.retriever import create_retriever_tool
import requests

# Initialize LLM
llm = ChatOpenAI(model="gpt-4", temperature=0)

# Define custom tools
@tool
def calculate(expression: str) -> str:
    """Evaluate a mathematical expression."""
    try:
        result = eval(expression)
        return f"The result is: {result}"
    except:
        return "Invalid expression"

@tool
def get_weather(city: str) -> str:
    """Get current weather for a city."""
    # In production, use a real weather API
    return f"The weather in {city} is sunny, 22°C"

# Web search tool
search = DuckDuckGoSearchRun()
search_tool = Tool(
    name="web_search",
    func=search.run,
    description="Search the web for current information"
)

# Create agent
tools = [calculate, get_weather, search_tool]

# Agent prompt
prompt = ChatPromptTemplate.from_messages([
    ("system", """You are a helpful AI assistant with access to various tools.
    Use them to answer questions accurately. Think step-by-step."""),
    ("user", "{input}"),
    MessagesPlaceholder(variable_name="agent_scratchpad"),
])

# Create the agent
agent = create_openai_functions_agent(llm, tools, prompt)

# Create executor
agent_executor = AgentExecutor(
    agent=agent,
    tools=tools,
    verbose=True,
    return_intermediate_steps=True,
    max_iterations=5,
    early_stopping_method="generate"
)

# Use the agent
result = agent_executor.invoke({
    "input": "What's the weather in Tokyo and calculate 25% of 480"
})

print(result["output"])

Advanced Agent Types

1. ReAct Agent

from langchain.agents import create_react_agent
from langchain import hub

# Pull ReAct prompt from hub
react_prompt = hub.pull("hwchase17/react")

# Create ReAct agent
react_agent = create_react_agent(
    llm=llm,
    tools=tools,
    prompt=react_prompt
)

react_executor = AgentExecutor(
    agent=react_agent,
    tools=tools,
    verbose=True,
    handle_parsing_errors=True
)

# ReAct pattern: Thought → Action → Observation → loop
result = react_executor.invoke({
    "input": "Find the latest AI news and summarize the top 3 stories"
})

2. Self-Ask with Search

from langchain.agents import create_self_ask_with_search_agent

# This agent decomposes questions into sub-questions
self_ask_agent = create_self_ask_with_search_agent(
    llm=llm,
    search_tool=search_tool,
    prompt=hub.pull("hwchase17/self-ask-with-search")
)

# Example: Complex multi-hop question
result = AgentExecutor(
    agent=self_ask_agent,
    tools=[search_tool],
    verbose=True
).invoke({
    "input": "What is the population of the capital of the country where Tesla's largest factory outside the US is located?"
})

3. Plan-and-Execute Agent

from langchain_experimental.plan_and_execute import (
    PlanAndExecute,
    load_agent_executor,
    load_chat_planner
)

# Create planner and executor
planner = load_chat_planner(llm)
executor = load_agent_executor(llm, tools, verbose=True)

# Create plan-and-execute agent
plan_agent = PlanAndExecute(
    planner=planner,
    executor=executor,
    verbose=True
)

# Complex task requiring planning
result = plan_agent.run(
    "Create a comprehensive market analysis report for electric vehicles: "
    "1) Current market size, 2) Top 5 manufacturers, 3) Growth projections, "
    "4) Key challenges, 5) Investment opportunities"
)

LangChain Agent Architecture

Agent Execution Flow

User Input

→

Agent Brain
(LLM)

→

Tool Selection

→

Tool Execution

→

Observation

→

Decision
(Continue/Stop)

Complete Agent System

from langchain.memory import ConversationBufferWindowMemory
from langchain.callbacks import StdOutCallbackHandler
from langchain_community.vectorstores import Chroma
from langchain_openai import OpenAIEmbeddings
from langchain.text_splitter import RecursiveCharacterTextSplitter

class AdvancedAgent:
    def __init__(self):
        self.llm = ChatOpenAI(model="gpt-4", temperature=0)
        self.memory = ConversationBufferWindowMemory(
            k=10,
            return_messages=True,
            memory_key="chat_history"
        )
        self.tools = self._setup_tools()
        self.agent = self._create_agent()
        
    def _setup_tools(self):
        tools = []
        
        # 1. Vector store tool for RAG
        embeddings = OpenAIEmbeddings()
        vectorstore = Chroma(
            persist_directory="./chroma_db",
            embedding_function=embeddings
        )
        
        retriever_tool = create_retriever_tool(
            vectorstore.as_retriever(),
            "knowledge_base",
            "Search internal knowledge base for information"
        )
        tools.append(retriever_tool)
        
        # 2. Code execution tool
        @tool
        def execute_python(code: str) -> str:
            """Execute Python code and return the result."""
            try:
                # Use exec with restricted globals for safety
                exec_globals = {"__builtins__": {}}
                exec(code, exec_globals)
                return str(exec_globals)
            except Exception as e:
                return f"Error: {e}"
        
        tools.append(execute_python)
        
        # 3. File operations
        @tool
        def read_file(filepath: str) -> str:
            """Read contents of a file."""
            try:
                with open(filepath, 'r') as f:
                    return f.read()
            except Exception as e:
                return f"Error reading file: {e}"
        
        @tool
        def write_file(filepath: str, content: str) -> str:
            """Write content to a file."""
            try:
                with open(filepath, 'w') as f:
                    f.write(content)
                return f"Successfully wrote to {filepath}"
            except Exception as e:
                return f"Error writing file: {e}"
        
        tools.extend([read_file, write_file])
        
        return tools
    
    def _create_agent(self):
        prompt = ChatPromptTemplate.from_messages([
            ("system", """You are an advanced AI assistant with access to:
            - Knowledge base search
            - Python code execution
            - File operations
            - Web search
            
            Always think step-by-step and use tools when needed.
            Maintain context from previous conversations."""),
            MessagesPlaceholder(variable_name="chat_history"),
            ("user", "{input}"),
            MessagesPlaceholder(variable_name="agent_scratchpad"),
        ])
        
        agent = create_openai_functions_agent(
            self.llm,
            self.tools,
            prompt
        )
        
        return AgentExecutor(
            agent=agent,
            tools=self.tools,
            memory=self.memory,
            verbose=True,
            return_intermediate_steps=True,
            max_iterations=10,
            callbacks=[StdOutCallbackHandler()]
        )
    
    def run(self, query: str):
        """Execute agent with query."""
        return self.agent.invoke({"input": query})
    
    def add_to_knowledge_base(self, documents):
        """Add documents to vector store."""
        text_splitter = RecursiveCharacterTextSplitter(
            chunk_size=1000,
            chunk_overlap=200
        )
        texts = text_splitter.split_documents(documents)
        
        embeddings = OpenAIEmbeddings()
        vectorstore = Chroma.from_documents(
            texts,
            embeddings,
            persist_directory="./chroma_db"
        )
        vectorstore.persist()

# Usage
agent_system = AdvancedAgent()
result = agent_system.run(
    "Search the knowledge base for information about LangChain, "
    "then write a Python script that demonstrates its key features"
)

LangGraph: Next-Generation Agents

LangGraph enables building stateful, multi-agent applications with cycles, controllability, and persistence.

Basic LangGraph Agent

from langgraph.graph import StateGraph, END
from typing import TypedDict, Annotated, Sequence
import operator
from langchain_core.messages import BaseMessage, HumanMessage, AIMessage

# Define state
class AgentState(TypedDict):
    messages: Annotated[Sequence[BaseMessage], operator.add]
    next_step: str

# Create graph
workflow = StateGraph(AgentState)

# Define nodes
def researcher(state):
    """Research node that gathers information."""
    messages = state["messages"]
    last_message = messages[-1].content
    
    # Simulate research
    research_result = f"Research on: {last_message}\nFound: [relevant information]"
    
    return {
        "messages": [AIMessage(content=research_result)],
        "next_step": "analyzer"
    }

def analyzer(state):
    """Analyze research results."""
    messages = state["messages"]
    research = messages[-1].content
    
    analysis = f"Analysis: The research shows... [detailed analysis]"
    
    return {
        "messages": [AIMessage(content=analysis)],
        "next_step": "writer"
    }

def writer(state):
    """Generate final output."""
    messages = state["messages"]
    analysis = messages[-1].content
    
    final_output = f"Final Report:\n{analysis}\n[Formatted output]"
    
    return {
        "messages": [AIMessage(content=final_output)],
        "next_step": "end"
    }

# Add nodes to graph
workflow.add_node("researcher", researcher)
workflow.add_node("analyzer", analyzer)
workflow.add_node("writer", writer)

# Define edges
workflow.set_entry_point("researcher")
workflow.add_edge("researcher", "analyzer")
workflow.add_edge("analyzer", "writer")
workflow.add_edge("writer", END)

# Compile graph
app = workflow.compile()

# Run the graph
initial_state = {
    "messages": [HumanMessage(content="Analyze the AI agent market")],
    "next_step": "researcher"
}

result = app.invoke(initial_state)
print(result["messages"][-1].content)

Advanced LangGraph: Multi-Agent Collaboration

from langgraph.graph import StateGraph, END
from langgraph.checkpoint import MemorySaver
from langchain_openai import ChatOpenAI

class MultiAgentState(TypedDict):
    messages: Annotated[Sequence[BaseMessage], operator.add]
    current_agent: str
    task_completed: bool
    results: dict

class MultiAgentSystem:
    def __init__(self):
        self.llm = ChatOpenAI(model="gpt-4")
        self.workflow = StateGraph(MultiAgentState)
        self._setup_agents()
        self._setup_edges()
        
    def _setup_agents(self):
        # Coordinator Agent
        def coordinator(state):
            """Decides which agent should act next."""
            prompt = f"""
            Current state: {state['results']}
            Messages: {state['messages'][-1].content if state['messages'] else 'Start'}
            
            Decide next agent: researcher, coder, reviewer, or end
            """
            
            response = self.llm.invoke(prompt)
            next_agent = self._parse_next_agent(response.content)
            
            return {
                "current_agent": next_agent,
                "messages": [AIMessage(content=f"Routing to {next_agent}")]
            }
        
        # Researcher Agent
        def researcher(state):
            """Researches information."""
            task = state['messages'][-2].content if len(state['messages']) > 1 else ""
            
            research = self.llm.invoke(
                f"Research this topic and provide findings: {task}"
            )
            
            state['results']['research'] = research.content
            
            return {
                "messages": [AIMessage(content=research.content)],
                "current_agent": "coordinator"
            }
        
        # Coder Agent
        def coder(state):
            """Writes code based on requirements."""
            context = state['results'].get('research', '')
            
            code = self.llm.invoke(
                f"Write code based on: {context}"
            )
            
            state['results']['code'] = code.content
            
            return {
                "messages": [AIMessage(content=code.content)],
                "current_agent": "coordinator"
            }
        
        # Reviewer Agent
        def reviewer(state):
            """Reviews and provides feedback."""
            code = state['results'].get('code', '')
            
            review = self.llm.invoke(
                f"Review this code and suggest improvements: {code}"
            )
            
            state['results']['review'] = review.content
            
            return {
                "messages": [AIMessage(content=review.content)],
                "current_agent": "coordinator",
                "task_completed": True
            }
        
        # Add all nodes
        self.workflow.add_node("coordinator", coordinator)
        self.workflow.add_node("researcher", researcher)
        self.workflow.add_node("coder", coder)
        self.workflow.add_node("reviewer", reviewer)
    
    def _setup_edges(self):
        # Conditional routing
        def route_next(state):
            if state.get('task_completed', False):
                return END
            return state['current_agent']
        
        self.workflow.set_entry_point("coordinator")
        
        # Add conditional edges from coordinator
        self.workflow.add_conditional_edges(
            "coordinator",
            route_next,
            {
                "researcher": "researcher",
                "coder": "coder",
                "reviewer": "reviewer",
                END: END
            }
        )
        
        # All agents return to coordinator
        self.workflow.add_edge("researcher", "coordinator")
        self.workflow.add_edge("coder", "coordinator")
        self.workflow.add_edge("reviewer", "coordinator")
    
    def compile(self):
        # Add memory for persistence
        memory = MemorySaver()
        return self.workflow.compile(checkpointer=memory)

# Usage
system = MultiAgentSystem()
app = system.compile()

# Run with streaming
config = {"configurable": {"thread_id": "main-thread"}}

for output in app.stream({
    "messages": [HumanMessage(content="Create a web scraping tool")],
    "current_agent": "coordinator",
    "results": {}
}, config):
    print(output)

Production Best Practices

Performance Optimization:

Use streaming for long-running agents
Implement caching with Redis or in-memory stores
Batch tool calls when possible
Use async operations for I/O-bound tasks
Implement proper error handling and retries
Monitor token usage and costs

Error Handling & Fallbacks

from langchain.agents import AgentExecutor
from tenacity import retry, stop_after_attempt, wait_exponential

class RobustAgent:
    def __init__(self):
        self.primary_llm = ChatOpenAI(model="gpt-4")
        self.fallback_llm = ChatOpenAI(model="gpt-3.5-turbo")
        
    @retry(
        stop=stop_after_attempt(3),
        wait=wait_exponential(multiplier=1, min=4, max=10)
    )
    def execute_with_retry(self, query):
        try:
            # Try with primary LLM
            return self.run_agent(self.primary_llm, query)
        except Exception as e:
            print(f"Primary failed: {e}, using fallback")
            return self.run_agent(self.fallback_llm, query)
    
    def run_agent(self, llm, query):
        agent_executor = AgentExecutor(
            agent=create_openai_functions_agent(llm, tools, prompt),
            tools=tools,
            handle_parsing_errors=True,
            max_iterations=3,
            early_stopping_method="generate"
        )
        
        return agent_executor.invoke({"input": query})

Monitoring & Observability

# LangSmith Integration
import langsmith

client = langsmith.Client()

# Custom callbacks for monitoring
from langchain.callbacks.base import BaseCallbackHandler

class MonitoringCallback(BaseCallbackHandler):
    def __init__(self):
        self.token_count = 0
        self.tool_calls = []
        
    def on_llm_start(self, serialized, prompts, **kwargs):
        print(f"LLM Start: {prompts}")
        
    def on_llm_end(self, response, **kwargs):
        # Track token usage
        if hasattr(response, 'llm_output'):
            tokens = response.llm_output.get('token_usage', {})
            self.token_count += tokens.get('total_tokens', 0)
    
    def on_tool_start(self, serialized, input_str, **kwargs):
        self.tool_calls.append({
            'tool': serialized.get('name'),
            'input': input_str,
            'timestamp': datetime.now()
        })
    
    def get_metrics(self):
        return {
            'total_tokens': self.token_count,
            'tool_calls': len(self.tool_calls),
            'tools_used': list(set(t['tool'] for t in self.tool_calls))
        }

# Use in agent
monitor = MonitoringCallback()
agent_executor = AgentExecutor(
    agent=agent,
    tools=tools,
    callbacks=[monitor],
    verbose=True
)

result = agent_executor.invoke({"input": "Complex task"})
print(monitor.get_metrics())

Comparison: LangChain vs Others

Feature	LangChain	CrewAI	AutoGen
Learning Curve	Moderate-High	Low-Moderate	High
Flexibility	Very High	Moderate	High
Multi-Agent	Via LangGraph	Native	Native
Tool Ecosystem	Extensive	Growing	Moderate
Production Ready	Yes	Yes	Yes
Best For	Complex chains, RAG	Multi-agent teams	Research, Complex reasoning

← CrewAI Tutorial Next: AutoGen →