diff --git a/content/blog/2026-05-18-agent-guide/agent-loop.mmd b/content/blog/2026-05-18-agent-guide/agent-loop.mmd
new file mode 100644
index 0000000..f3a8af0
--- /dev/null
+++ b/content/blog/2026-05-18-agent-guide/agent-loop.mmd
@@ -0,0 +1,5 @@
+graph LR
+    User["User<br/>(role: user)"] -->|"prompt"| LLM["LLM<br/>(role: assistant)"]
+    LLM -->|"result"| User
+    LLM -->|"tool_calls: [...]"| Agent["Agent Tools<br/>(role: tool)"]
+    Agent -->|"tool result"| LLM
diff --git a/content/blog/2026-05-18-agent-guide/agent-loop.svg b/content/blog/2026-05-18-agent-guide/agent-loop.svg
new file mode 100644
index 0000000..f8d68a9
--- /dev/null
+++ b/content/blog/2026-05-18-agent-guide/agent-loop.svg
@@ -0,0 +1 @@
+<svg id="my-svg" width="100%" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" class="flowchart" style="max-width: 771.578px; background-color: transparent;" viewBox="0 0 771.578125 94" role="graphics-document document" aria-roledescription="flowchart-v2"><style>#my-svg{font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:16px;fill:#333;}@keyframes edge-animation-frame{from{stroke-dashoffset:0;}}@keyframes dash{to{stroke-dashoffset:0;}}#my-svg .edge-animation-slow{stroke-dasharray:9,5!important;stroke-dashoffset:900;animation:dash 50s linear infinite;stroke-linecap:round;}#my-svg .edge-animation-fast{stroke-dasharray:9,5!important;stroke-dashoffset:900;animation:dash 20s linear infinite;stroke-linecap:round;}#my-svg .error-icon{fill:#552222;}#my-svg .error-text{fill:#552222;stroke:#552222;}#my-svg .edge-thickness-normal{stroke-width:1px;}#my-svg .edge-thickness-thick{stroke-width:3.5px;}#my-svg .edge-pattern-solid{stroke-dasharray:0;}#my-svg .edge-thickness-invisible{stroke-width:0;fill:none;}#my-svg .edge-pattern-dashed{stroke-dasharray:3;}#my-svg .edge-pattern-dotted{stroke-dasharray:2;}#my-svg .marker{fill:#333333;stroke:#333333;}#my-svg .marker.cross{stroke:#333333;}#my-svg svg{font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:16px;}#my-svg p{margin:0;}#my-svg .label{font-family:"trebuchet ms",verdana,arial,sans-serif;color:#333;}#my-svg .cluster-label text{fill:#333;}#my-svg .cluster-label span{color:#333;}#my-svg .cluster-label span p{background-color:transparent;}#my-svg .label text,#my-svg span{fill:#333;color:#333;}#my-svg .node rect,#my-svg .node circle,#my-svg .node ellipse,#my-svg .node polygon,#my-svg .node path{fill:#ECECFF;stroke:#9370DB;stroke-width:1px;}#my-svg .rough-node .label text,#my-svg .node .label text,#my-svg .image-shape .label,#my-svg .icon-shape .label{text-anchor:middle;}#my-svg .node .katex path{fill:#000;stroke:#000;stroke-width:1px;}#my-svg .rough-node .label,#my-svg .node 
.label,#my-svg .image-shape .label,#my-svg .icon-shape .label{text-align:center;}#my-svg .node.clickable{cursor:pointer;}#my-svg .root .anchor path{fill:#333333!important;stroke-width:0;stroke:#333333;}#my-svg .arrowheadPath{fill:#333333;}#my-svg .edgePath .path{stroke:#333333;stroke-width:1px;}#my-svg .flowchart-link{stroke:#333333;fill:none;}#my-svg .edgeLabel{background-color:rgba(232,232,232, 0.8);text-align:center;}#my-svg .edgeLabel p{background-color:rgba(232,232,232, 0.8);}#my-svg .edgeLabel rect{opacity:0.5;background-color:rgba(232,232,232, 0.8);fill:rgba(232,232,232, 0.8);}#my-svg .labelBkg{background-color:rgba(232, 232, 232, 0.5);}#my-svg .cluster rect{fill:#ffffde;stroke:#aaaa33;stroke-width:1px;}#my-svg .cluster text{fill:#333;}#my-svg .cluster span{color:#333;}#my-svg div.mermaidTooltip{position:absolute;text-align:center;max-width:200px;padding:2px;font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:12px;background:hsl(80, 100%, 96.2745098039%);border:1px solid #aaaa33;border-radius:2px;pointer-events:none;z-index:100;}#my-svg .flowchartTitleText{text-anchor:middle;font-size:18px;fill:#333;}#my-svg rect.text{fill:none;stroke-width:0;}#my-svg .icon-shape,#my-svg .image-shape{background-color:rgba(232,232,232, 0.8);text-align:center;}#my-svg .icon-shape p,#my-svg .image-shape p{background-color:rgba(232,232,232, 0.8);padding:2px;}#my-svg .icon-shape .label rect,#my-svg .image-shape .label rect{opacity:0.5;background-color:rgba(232,232,232, 0.8);fill:rgba(232,232,232, 0.8);}#my-svg .label-icon{display:inline-block;height:1em;overflow:visible;vertical-align:-0.125em;}#my-svg .node .label-icon path{fill:currentColor;stroke:revert;stroke-width:revert;}#my-svg .node .neo-node{stroke:#9370DB;}#my-svg [data-look="neo"].node rect,#my-svg [data-look="neo"].cluster rect,#my-svg [data-look="neo"].node polygon{stroke:#9370DB;filter:drop-shadow(1px 2px 2px rgba(185, 185, 185, 1));}#my-svg [data-look="neo"].node 
path{stroke:#9370DB;stroke-width:1px;}#my-svg [data-look="neo"].node .outer-path{filter:drop-shadow(1px 2px 2px rgba(185, 185, 185, 1));}#my-svg [data-look="neo"].node .neo-line path{stroke:#9370DB;filter:none;}#my-svg [data-look="neo"].node circle{stroke:#9370DB;filter:drop-shadow(1px 2px 2px rgba(185, 185, 185, 1));}#my-svg [data-look="neo"].node circle .state-start{fill:#000000;}#my-svg [data-look="neo"].icon-shape .icon{fill:#9370DB;filter:drop-shadow(1px 2px 2px rgba(185, 185, 185, 1));}#my-svg [data-look="neo"].icon-shape .icon-neo path{stroke:#9370DB;filter:drop-shadow(1px 2px 2px rgba(185, 185, 185, 1));}#my-svg :root{--mermaid-font-family:"trebuchet ms",verdana,arial,sans-serif;}</style><g><marker id="my-svg_flowchart-v2-pointEnd" class="marker flowchart-v2" viewBox="0 0 10 10" refX="5" refY="5" markerUnits="userSpaceOnUse" markerWidth="8" markerHeight="8" orient="auto"><path d="M 0 0 L 10 5 L 0 10 z" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"/></marker><marker id="my-svg_flowchart-v2-pointStart" class="marker flowchart-v2" viewBox="0 0 10 10" refX="4.5" refY="5" markerUnits="userSpaceOnUse" markerWidth="8" markerHeight="8" orient="auto"><path d="M 0 5 L 10 10 L 10 0 z" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"/></marker><marker id="my-svg_flowchart-v2-pointEnd-margin" class="marker flowchart-v2" viewBox="0 0 11.5 14" refX="11.5" refY="7" markerUnits="userSpaceOnUse" markerWidth="10.5" markerHeight="14" orient="auto"><path d="M 0 0 L 11.5 7 L 0 14 z" class="arrowMarkerPath" style="stroke-width: 0; stroke-dasharray: 1, 0;"/></marker><marker id="my-svg_flowchart-v2-pointStart-margin" class="marker flowchart-v2" viewBox="0 0 11.5 14" refX="1" refY="7" markerUnits="userSpaceOnUse" markerWidth="11.5" markerHeight="14" orient="auto"><polygon points="0,7 11.5,14 11.5,0" class="arrowMarkerPath" style="stroke-width: 0; stroke-dasharray: 1, 0;"/></marker><marker id="my-svg_flowchart-v2-circleEnd" 
class="marker flowchart-v2" viewBox="0 0 10 10" refX="11" refY="5" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><circle cx="5" cy="5" r="5" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"/></marker><marker id="my-svg_flowchart-v2-circleStart" class="marker flowchart-v2" viewBox="0 0 10 10" refX="-1" refY="5" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><circle cx="5" cy="5" r="5" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"/></marker><marker id="my-svg_flowchart-v2-circleEnd-margin" class="marker flowchart-v2" viewBox="0 0 10 10" refY="5" refX="12.25" markerUnits="userSpaceOnUse" markerWidth="14" markerHeight="14" orient="auto"><circle cx="5" cy="5" r="5" class="arrowMarkerPath" style="stroke-width: 0; stroke-dasharray: 1, 0;"/></marker><marker id="my-svg_flowchart-v2-circleStart-margin" class="marker flowchart-v2" viewBox="0 0 10 10" refX="-2" refY="5" markerUnits="userSpaceOnUse" markerWidth="14" markerHeight="14" orient="auto"><circle cx="5" cy="5" r="5" class="arrowMarkerPath" style="stroke-width: 0; stroke-dasharray: 1, 0;"/></marker><marker id="my-svg_flowchart-v2-crossEnd" class="marker cross flowchart-v2" viewBox="0 0 11 11" refX="12" refY="5.2" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><path d="M 1,1 l 9,9 M 10,1 l -9,9" class="arrowMarkerPath" style="stroke-width: 2; stroke-dasharray: 1, 0;"/></marker><marker id="my-svg_flowchart-v2-crossStart" class="marker cross flowchart-v2" viewBox="0 0 11 11" refX="-1" refY="5.2" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><path d="M 1,1 l 9,9 M 10,1 l -9,9" class="arrowMarkerPath" style="stroke-width: 2; stroke-dasharray: 1, 0;"/></marker><marker id="my-svg_flowchart-v2-crossEnd-margin" class="marker cross flowchart-v2" viewBox="0 0 15 15" refX="17.7" refY="7.5" markerUnits="userSpaceOnUse" markerWidth="12" markerHeight="12" 
orient="auto"><path d="M 1,1 L 14,14 M 1,14 L 14,1" class="arrowMarkerPath" style="stroke-width: 2.5;"/></marker><marker id="my-svg_flowchart-v2-crossStart-margin" class="marker cross flowchart-v2" viewBox="0 0 15 15" refX="-3.5" refY="7.5" markerUnits="userSpaceOnUse" markerWidth="12" markerHeight="12" orient="auto"><path d="M 1,1 L 14,14 M 1,14 L 14,1" class="arrowMarkerPath" style="stroke-width: 2.5; stroke-dasharray: 1, 0;"/></marker><g class="root"><g class="clusters"/><g class="edgePaths"><path d="M156.172,34.284L165.188,32.737C174.203,31.19,192.234,28.095,209.606,27.801C226.978,27.508,243.691,30.016,252.047,31.27L260.404,32.524" id="my-svg-L_User_LLM_0" class="edge-thickness-normal edge-pattern-solid edge-thickness-normal edge-pattern-solid flowchart-link" style=";" data-edge="true" data-et="edge" data-id="L_User_LLM_0" data-points="W3sieCI6MTU2LjE3MTg3NSwieSI6MzQuMjg0MzI5ODU5MjA2NDR9LHsieCI6MjEwLjI2NTYyNSwieSI6MjV9LHsieCI6MjY0LjM1OTM3NSwieSI6MzMuMTE3NjY1ODY3MzA2MTZ9XQ==" data-look="classic" marker-end="url(#my-svg_flowchart-v2-pointEnd)"/><path d="M264.359,60.882L255.344,62.235C246.328,63.588,228.297,66.294,210.923,66.212C193.548,66.131,176.831,63.262,168.473,61.827L160.114,60.392" id="my-svg-L_LLM_User_0" class="edge-thickness-normal edge-pattern-solid edge-thickness-normal edge-pattern-solid flowchart-link" style=";" data-edge="true" data-et="edge" data-id="L_LLM_User_0" data-points="W3sieCI6MjY0LjM1OTM3NSwieSI6NjAuODgyMzM0MTMyNjkzODR9LHsieCI6MjEwLjI2NTYyNSwieSI6Njl9LHsieCI6MTU2LjE3MTg3NSwieSI6NTkuNzE1NjcwMTQwNzkzNTZ9XQ==" data-look="classic" marker-end="url(#my-svg_flowchart-v2-pointEnd)"/><path d="M449.375,35.282L462.904,33.568C476.432,31.855,503.49,28.427,529.887,28.516C556.284,28.604,582.021,32.208,594.889,34.01L607.757,35.812" id="my-svg-L_LLM_Agent_0" class="edge-thickness-normal edge-pattern-solid edge-thickness-normal edge-pattern-solid flowchart-link" style=";" data-edge="true" data-et="edge" data-id="L_LLM_Agent_0" 
data-points="W3sieCI6NDQ5LjM3NSwieSI6MzUuMjgyMDM4NTk0NzU1MDd9LHsieCI6NTMwLjU0Njg3NSwieSI6MjV9LHsieCI6NjExLjcxODc1LCJ5IjozNi4zNjcwNDk1Nzk3OTAxNX1d" data-look="classic" marker-end="url(#my-svg_flowchart-v2-pointEnd)"/><path d="M611.719,57.633L598.19,59.527C584.661,61.422,557.604,65.211,531.208,65.476C504.812,65.74,479.078,62.48,466.211,60.851L453.343,59.221" id="my-svg-L_Agent_LLM_0" class="edge-thickness-normal edge-pattern-solid edge-thickness-normal edge-pattern-solid flowchart-link" style=";" data-edge="true" data-et="edge" data-id="L_Agent_LLM_0" data-points="W3sieCI6NjExLjcxODc1LCJ5Ijo1Ny42MzI5NTA0MjAyMDk4NX0seyJ4Ijo1MzAuNTQ2ODc1LCJ5Ijo2OX0seyJ4Ijo0NDkuMzc1LCJ5Ijo1OC43MTc5NjE0MDUyNDQ5M31d" data-look="classic" marker-end="url(#my-svg_flowchart-v2-pointEnd)"/></g><g class="edgeLabels"><g class="edgeLabel" transform="translate(210.265625, 25)"><g class="label" data-id="L_User_LLM_0" transform="translate(-29.09375, -12)"><foreignObject width="58.1875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel"><p>prompt</p></span></div></foreignObject></g></g><g class="edgeLabel" transform="translate(210.17433, 68.98433)"><g class="label" data-id="L_LLM_User_0" transform="translate(-22.6328125, -12)"><foreignObject width="45.265625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel"><p>result</p></span></div></foreignObject></g></g><g class="edgeLabel" transform="translate(530.61789, 25.00994)"><g class="label" data-id="L_LLM_Agent_0" transform="translate(-56.171875, -12)"><foreignObject width="112.34375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: 
center;"><span class="edgeLabel"><p>tool_calls: [...]</p></span></div></foreignObject></g></g><g class="edgeLabel" transform="translate(530.546875, 69)"><g class="label" data-id="L_Agent_LLM_0" transform="translate(-40.328125, -12)"><foreignObject width="80.65625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel"><p>tool result</p></span></div></foreignObject></g></g></g><g class="nodes"><g class="node default" id="my-svg-flowchart-User-0" data-look="classic" transform="translate(82.0859375, 47)"><rect class="basic label-container" style="" x="-74.0859375" y="-39" width="148.171875" height="78"/><g class="label" style="" transform="translate(-44.0859375, -24)"><rect/><foreignObject width="88.171875" height="48"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="nodeLabel"><p>User<br />(role: user)</p></span></div></foreignObject></g></g><g class="node default" id="my-svg-flowchart-LLM-1" data-look="classic" transform="translate(356.8671875, 47)"><rect class="basic label-container" style="" x="-92.5078125" y="-39" width="185.015625" height="78"/><g class="label" style="" transform="translate(-62.5078125, -24)"><rect/><foreignObject width="125.015625" height="48"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="nodeLabel"><p>LLM<br />(role: assistant)</p></span></div></foreignObject></g></g><g class="node default" id="my-svg-flowchart-Agent-5" data-look="classic" transform="translate(687.6484375, 47)"><rect class="basic label-container" style="" x="-75.9296875" y="-39" width="151.859375" height="78"/><g class="label" style="" transform="translate(-45.9296875, -24)"><rect/><foreignObject 
width="91.859375" height="48"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="nodeLabel"><p>Agent Tools<br />(role: tool)</p></span></div></foreignObject></g></g></g></g></g><defs><filter id="my-svg-drop-shadow" height="130%" width="130%"><feDropShadow dx="4" dy="4" stdDeviation="0" flood-opacity="0.06" flood-color="#000000"/></filter></defs><defs><filter id="my-svg-drop-shadow-small" height="150%" width="150%"><feDropShadow dx="2" dy="2" stdDeviation="0" flood-opacity="0.06" flood-color="#000000"/></filter></defs></svg>
\ No newline at end of file
diff --git a/content/blog/2026-05-18-agent-guide/index.md b/content/blog/2026-05-18-agent-guide/index.md
new file mode 100644
index 0000000..4fe7fc4
--- /dev/null
+++ b/content/blog/2026-05-18-agent-guide/index.md
@@ -0,0 +1,530 @@
+---
+title: What is an AI Agent?
+author: Seth Erickson
+tags:
+  - guide
+  - ai
+  - python
+---
+
+The prolific software developer and writer on AI-assisted coding, Simon
+Willison, describes [AI agents](https://simonwillison.net/tags/ai-agents/) as
+**Large Language Models (LLMs) calling tools in a loop to achieve a goal**. It's
+a good definition, particularly if you are already familiar with the technical
+sense of the terms. If you aren't, you might be wondering: What is a "tool", and
+how does a language model "call" one? In this post, I want to add some technical
+specificity to Willison's definition by showing how to build a very simple
+agent: we'll build a program in which an LLM calls tools in a loop to achieve a
+goal.
+
+Real-world agents (for example, coding agents) can be quite complicated pieces
+of software. However, the core features of an agent are surprisingly simple to
+implement. You might be surprised at how little code it takes to build an agent
+that can do useful work! Because our goal is pedagogical, not practical, we'll
+use plain Python as much as possible. If your goal is to build a sophisticated
+agent with little effort, you should probably use one of the many agent SDKs
+designed for the purpose -- or ask your coding agent to!
+
+To follow this guide, you will need to know how to run Python scripts and have
+API access to an LLM provider. We will be using [DREAM Lab’s AI
+gateway](https://dreamlab.ucsb.edu/guides/ai-gateway.html) as our LLM provider,
+but other model providers should also work.
+
+## Using LLMs through APIs
+
+Most computer programs, like agents, that *use* LLMs do so through web-based
+APIs. Agents talk to model providers the same way your web browser talks to web
+servers: using HTTP. Instead of running models directly, the program makes HTTP
+“requests” to an LLM model provider over the web. An advantage of this approach
+is that it makes the software easier to write and run. We don’t need specialized
+hardware for running models, and we don’t need complex machine learning
+frameworks (like PyTorch). Instead, we just need an HTTP client, like Python’s
+[requests](https://pypi.org/project/requests/) library.
+
+Model providers (like OpenAI, Anthropic, Google, AWS, etc.) expect programs to
+use specific APIs to interact with their LLMs. OpenAI’s [Chat Completion
+API](https://developers.openai.com/api/reference/resources/chat) is one of the
+oldest and most widely supported APIs for interacting with LLMs--and it’s the
+API we’ll use here. There are other APIs with similar affordances, such as
+Anthropic's Messages API, but the basic concepts are the same.
+
+To make HTTP requests to an LLM provider using the Chat Completion API, you need
+four things: 
+
+1. A list of "messages" with the user prompt as the last message (described in detail below)
+2. The API’s base URL (e.g., `https://litellm.dreamlab.ucsb.edu`)
+3. The name of the model to use (e.g., `gemini-3-flash-preview`)
+4. An API access key to authenticate requests
+
+The core of our agent is a Python function, `call_llm()`, that uses the
+`requests` library to make a single HTTP request to an LLM model provider using
+the Chat Completion API. 
+
+```python
+import requests
+import os
+
+def call_llm(messages, api_base_url, api_model, api_key, tools=None):
+    """Makes a request using the Chat Completion API.
+
+    Args:
+        messages (list): A list of "message" objects, with prompt.
+        api_base_url (str): The URL of our API endpoint.
+        api_model (str): Name of the model to use.
+        api_key (str): An API key.
+        tools (list, optional): An optional list of tool definitions.
+
+    Returns:
+        dict: The first message object in the response choices.
+    """
+
+    # http request url and headers
+    request_url = f"{api_base_url}/v1/chat/completions"    
+    headers = {
+        "Authorization": f"Bearer {api_key}", 
+        "Content-Type": "application/json"
+    }
+    
+    # http request body: the data submitted to the API
+    data = {
+        "model": api_model,
+        "messages": messages,
+    }
+
+    # include "tools" only if defined
+    if tools:
+        data["tools"] = tools
+
+    # call the API and raise an exception if the server returns an error
+    response = requests.post(request_url, headers=headers, json=data)
+    response.raise_for_status() # raise an error if http response status is 4xx/5xx
+   
+    # The Chat Completion API supports multiple "choices".
+    # We only expect one: return the first message in 'choices'
+    resp = response.json()
+    return resp["choices"][0]["message"]
+```
+
+This might look complicated, but the gist of `call_llm()` is that it sends
+"messages" to a web server that understands the Chat Completion API and returns
+a new message with the LLM's response. A list of messages goes in; a single
+message comes back. Now let's take a closer look at what these "messages"
+consist of.
+
+## Chat Completion Message Structure
+
+The Chat Completion API expects a list of messages representing the conversation
+history. The message list represents the full context of a multi-turn dialogue,
+typically between a "user" and the LLM "assistant". The entire conversation
+history (the `messages` list) must be included with each request. This is how
+the LLM "remembers" the full context of the conversation.
+
+Messages are JSON objects (Python dicts) with `role` and `content` keys:
+
+- **`role`**: Specifies who is sending the message. This can be one of four main
+  roles: `user`, `assistant`, `tool`, or `system`.
+- **`content`**: The actual text content of the message.
+- Messages may include additional keys for tool calling. We'll come back to this.
+
+We'll talk about the "tool" role a little later (and we're mostly ignoring the
+"system" role in this guide). In a simple, chat-based exchange (without tool
+calls), the "messages" list consists of alternating "user" and "assistant"
+messages. To illustrate, let's use `call_llm()`, with a single prompt: "What is
+the weather in Paris?"
+
+```python
+import os
+
+# messages with initial prompt (user role)
+prompt = "What is the weather in Paris?"
+messages = [{"role": "user", "content": prompt}]
+
+# api config
+api_base_url = "https://litellm.dreamlab.ucsb.edu"
+api_model = "gemini-3-flash-preview"
+api_key = os.getenv("LLM_API_KEY")  # key stored as environment variable
+
+msg = call_llm(messages, api_base_url, api_model, api_key)
+
+# msg has assistant role with API response
+print(msg) # {"role": "assistant", "content": "The weather in Paris is ..."}
+```
+
+To continue the conversation, we would append the assistant response (`msg`) to
+the `messages` list and then add an additional user message:
+
+```python
+# messages = [{"role": "user", "content": "What is the weather in Paris?"}]
+# msg = call_llm(messages, api_base_url, api_model, api_key)
+
+# append assistant response to message list
+messages.append(msg) 
+
+# append new user prompt to message list
+messages.append({"role": "user", "content": "temperature in C and F please!"})
+
+# second assistant response
+msg = call_llm(messages, api_base_url, api_model, api_key)
+messages.append(msg)
+```
+
+The final `messages` list would include the following:
+
+| `role`      | `content`                                 |
+| :---------- | :---------------------------------------- |
+| `user`      | `"What is the weather in Paris?"`         |
+| `assistant` | `"The weather in Paris is ..."`           |
+| `user`      | `"temperature in C and F please!"`        |
+| `assistant` | `"It is 13°C (55°F) with clear skies..."` |
+
+
+## Using 'Tools' to Avoid Hallucinations
+
+When I ran the script above, with the prompt "What is the weather in Paris?", I received the response:
+
+```md
+As of right now in Paris, France:
+
+*   **Temperature:** 13°C (55°F)
+*   **Conditions:** Clear skies and sunny.
+*   **Wind:** 11 km/h (7 mph)
+*   **Humidity:** 61%
+
+**Forecast for the rest of today:**
+It is expected to stay clear and cool throughout the evening, with temperatures dropping to a low of about 7°C (45°F) overnight. 
+
+**Tomorrow's Outlook:**
+Similar weather is expected tomorrow, with mostly sunny skies and a high of 14°C (57°F).
+```
+
+At the time, this description was not accurate. In fact, running the script
+multiple times returned completely different weather conditions! That's because
+the model doesn't actually know what the weather in Paris is, so it makes up the
+answer. It "hallucinates" a plausible description of the weather. One way to
+avoid hallucinations in LLM API responses is to provide the model with "tools"
+that it can use. Tools provide LLMs with ways to access current information,
+perform tasks, and avoid having to fill in missing details with statistically
+likely text. 
+
+To illustrate how tools work, we'll create a tool called `get_weather` that
+returns current weather conditions for a given location. For now, we're not
+concerned with *implementing* the tool. First, we just want to change our
+request so that the LLM API is aware of the tool.
+
+The optional `tools` argument of our `call_llm()` function is used to provide
+the LLM API with structured descriptions of tools it can call. The structure is
+defined by the [Chat Completion
+API](https://developers.openai.com/api/reference/resources/chat). In this
+context, you can think of "tools" as metadata describing a function in terms of
+inputs and outputs. Here's how we would describe our `get_weather` tool using
+the Chat Completion API:
+
+```python
+# get_weather_schema describes the `get_weather` tool.
+get_weather_schema = {
+    "type": "function",
+    "function": {
+        "name": "get_weather",
+        "description": "Get the current weather in a given location",
+        "parameters": {
+            "type": "object",
+            "properties": {
+                "location": {
+                    "type": "string",
+                    "description": "A place name (e.g., Paris)",
+                }
+            },
+            "required": ["location"],
+        },
+    },
+}
+```
+
+Now let's see how our response changes when we include this tool (`get_weather_schema`).
+
+```python
+prompt = "What is the weather in Paris"
+messages = [{"role": "user", "content": prompt}]
+
+# same prompt, api_base_url, api_model, and api_key as before
+msg = call_llm(messages, api_base_url, api_model, api_key, tools = [get_weather_schema])
+
+# print response details
+print(msg["role"])    # "assistant"
+print(msg["content"]) # None
+print(msg["tool_calls"][0]["function"]) # {"arguments": "{\"location\": \"Paris\"}", "name": "get_weather"}
+```
+
+The response has changed in a few ways. First, it doesn't include any `content`
+(the `content` key is still present in the response message, but its value is
+`None`). Second, there is a new key, `tool_calls`, which is a list of objects,
+each with a `function` entry like this:
+
+```json
+{"arguments": "{\"location\": \"Paris\"}", "name": "get_weather"}
+```
+
+As the name suggests, "tool calls" are how the API calls (or invokes) the tools
+we included in the request. Our request included the `get_weather` tool
+definition, and the response includes a tool call to run the `get_weather`
+function with arguments `{"location": "Paris"}`. The expectation is that we will
+run `get_weather()` and make an additional request with the output
+from the tool call. 
+
+It's time to implement the `get_weather()` function so that we can call it from
+our Python code. We'll use https://wttr.in, a site that provides a simple (free)
+API for fetching current weather.
+
+```python
+# get_weather is our Python implementation of the `get_weather` tool.
+# It gets the current weather for a given location using a weather
+# API (wttr.in)
+def get_weather(location: str) -> str:
+    url = f"https://wttr.in/{location}?format=3"
+    try:
+        response = requests.get(url, timeout=10)
+        response.raise_for_status()
+        return response.text.strip()
+    except Exception as e:
+        return f"Could not get weather for {location}: {e}"
+
+# example
+get_weather("Paris") # "Paris: ☁️  +56°F"
+```
+
+Now that we have implemented `get_weather`, we can call the Python function
+using the arguments in the tool call, and then send the output back to the LLM.
+The tool call output is included in the message of a second request, using the
+`"tool"` role.
+
+
+```python
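+import json  # used below to parse the tool call arguments
+messages.append(msg)  # the assistant's tool-call message must precede the tool results
+for call in msg["tool_calls"]:  # process tool calls from response message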
+    # parse tool call function name and arguments
+    name = call["function"]["name"]
+    if name != "get_weather":
+        raise ValueError(f"unexpected function name: {name}")
+    args = json.loads(call["function"]["arguments"])
+    result = get_weather(**args)
+    
+    # message with tool call output
+    new_msg =  {
+        "role": "tool",
+        "tool_call_id": call["id"],
+        "content": str(result),
+    }
+    messages.append(new_msg)
+
+# final request with tool call results
+msg = call_llm(messages, api_base_url, api_model, api_key, tools = [get_weather_schema])
+messages.append(msg)
+print(msg["content"]) # The weather in Paris is currently 56°F and cloudy.
+```
+
+The final message sequence to/from the LLM API is represented in the table
+below. Note that the tool output is sent to the LLM API using a message with
+`"tool"` role, not the typical `"user"` role.
+
+| Role        | Content / Tool Call                                                          |
+| :---------- | :--------------------------------------------------------------------------- |
+| `user`      | "What is the weather in Paris?"                                              |
+| `assistant` | tool call: `{"arguments": "{\"location\": \"Paris\"}", "name": "get_weather"}` |
+| `tool`      | "Paris: ☁️  +56°F"                                                         |
+| `assistant` | "The weather in Paris is currently 56°F and cloudy"                          |
+
+## Calling Tools in a Loop 
+
+Let's revisit Willison's definition. AI agents are "**LLMs calling tools in a
+loop to achieve a goal**." At this point, we have a better understanding of how
+LLMs call tools: we include descriptions of available tools in our requests; the
+response may include `tool_calls`; we process tool calls locally and send the
+output back using the `"tool"` role. In the code above, we only processed the
+tool calls for a single response message. If the LLM API responded to the first
+tool call with a second (for example, if the first didn't work as expected), the
+second tool call would be ignored. We can address this by continuing to process
+tool calls, and making new requests to the LLM API with tool output, until we
+stop receiving responses with tool calls.
+
+This is the idea of "calling tools in a loop": as long as the LLM API continues
+to respond with tool calls, the agent continues to handle the calls and make new
+requests with the results. The "agent loop" (represented on the right-hand side
+of the figure below) is only broken when the LLM API stops responding with tool
+calls.
+
+![The Agent Loop](agent-loop.svg)
+
+To implement an agent in Python, we will create a function called `agent_loop()`
+that makes a request, runs tools, and makes additional requests until the LLM
+response no longer contains `tool_calls`. Notice that the `tools` argument
+expected by `agent_loop()` differs from the `tools` argument of `call_llm()`.
+While `call_llm()` only expects tool schemas (metadata) to pass to the API,
+`agent_loop()` expects a list of tuples containing both the schema *and* the
+executable Python function. The agent loop needs both because it is making API
+requests and also processing tools.
+
+```python
+import json
+
+def agent_loop(prompt, api_base_url, api_model, api_key, tools=None):
+    """
+    Run the main agent loop, interacting with the LLM and executing any requested tools.
+    Returns list of messages from the agent's interaction.
+    """
+    tools = tools or []
+
+    # Separate schemas for the API and build a dictionary of implementations
+    tool_schemas = [schema for schema, func in tools]
+    tool_funcs = {schema["function"]["name"]: func for schema, func in tools}
+
+    # messages is our full context. Initially, just the user prompt
+    messages = [{"role": "user", "content": prompt}]
+    
+    while True:
+        # Call the LLM with the current conversation history and available tool schemas
+        msg = call_llm(messages, api_base_url, api_model, api_key, tools=tool_schemas)
+        messages.append(msg)
+
+        # break the loop when the response is not a tool call
+        if not msg.get("tool_calls"):
+            break
+
+        # run all tool calls in the message and append tool call results to messages
+        for call in msg.get("tool_calls", []):
+            args = json.loads(call["function"]["arguments"])
+            name = call["function"]["name"]
+
+            if name in tool_funcs:
+                func = tool_funcs[name]
+                try:
+                    result = func(**args)
+                except Exception as e:
+                    result = f"Error executing {name}: {e}"
+            else:
+                result = f"Error: Tool {name} not found."
+
+            messages.append(
+                {"role": "tool", "tool_call_id": call["id"], "content": str(result)}
+            )
+
+    return messages
+```
+
+## Using Multiple Tools
+
+The real power of an agent loop becomes apparent when we provide the LLM with
+multiple tools. The model can then orchestrate calling these tools in sequence
+to achieve a multi-step goal. Let's add a second tool, `send_message`, which
+simulates sending a message to a specific recipient. 
+
+First, we write the tool definition for `send_message`:
+
+```python
+# Schema sent to the LLM API: describes `send_message` and its two required string arguments
+send_message_schema = {
+    "type": "function",
+    "function": {
+        "name": "send_message",
+        "description": "send a message to someone",
+        "parameters": {
+            "type": "object",
+            "properties": {
+                "to": {
+                    "type": "string",
+                    "description": "the person to send the message to",
+                },
+                "message": {
+                    "type": "string",
+                    "description": "the body of the message",
+                },
+            },
+            "required": ["to", "message"],
+        },
+    },
+}
+```
+
+Next, we provide a Python implementation of `send_message`. For demonstration
+purposes, we will simply store the messages in a dictionary acting as an inbox
+for multiple users.
+
+```python
+# A fake email inbox to store messages
+inboxes = {}
+
+def send_message(to: str, message: str):
+    to_key = to.lower()
+    if to_key not in inboxes:
+        inboxes[to_key] = []
+    inboxes[to_key].append(message)
+    return f"Message sent to {to}"
+```
+
+Now, we can give our agent a more complex prompt: *"Send a message to Tom about
+the weather in Paris."* For the agent loop, `tools` includes both the tool
+definitions and the tool implementations as tuples.
+
+```python
+prompt = "Send a message to Tom about the weather in Paris."
+tools = [  # each entry pairs a tool schema with its Python implementation
+    (get_weather_schema, get_weather),
+    (send_message_schema, send_message)
+]
+
+messages = agent_loop(prompt, api_base_url, api_model, api_key, tools=tools)
+```
+
+The complete list of messages returned from `agent_loop()` looks like this:
+
+| Role        | Content / Tool Call                                                          |
+| :---------- | :--------------------------------------------------------------------------- |
+| `user`      | "Send a message to Tom about the weather in Paris."                          |
+| `assistant` | tool call: `{"arguments": "{\"location\": \"Paris\"}", "name": "get_weather"}` |
+| `tool`      | "Paris: ☁️  🌡️+59°F 🌬️↘9mph"                                                 |
+| `assistant` | tool call: `{"arguments": "{\"to\": \"Tom\", \"message\": \"The current weather in Paris is ☁️ 59°F with a 9mph wind.\"}", "name": "send_message"}` |
+| `tool`      | "Message sent to Tom"                                                        |
+| `assistant` | "OK. I've sent that message to Tom."                                         |
+
+Reading the message list, we can see that the LLM responded to the initial
+prompt with two tool calls in a row: the first to get the weather in Paris, and
+the second to send the message to Tom. The final message from the LLM
+"assistant" confirms that the message was sent. The agent loop ends because
+this message doesn't include additional tool calls.
+
+We can also confirm that Tom received a message:
+
+```python
+print(inboxes["tom"])  # send_message() stores inbox keys in lowercase
+# ['The current weather in Paris is ☁️ 59°F with a 9mph wind.']
+```
+
+We gave the LLM a goal, we gave it relevant *tools*, and it used those
+tools to achieve that goal!
+
+## Where to go from here
+
+Agents are able to do (hopefully) useful work through the integration of LLMs and
+agent tools via an API. Modern LLMs are specifically trained to use
+tools through techniques like [reinforcement
+learning](https://en.wikipedia.org/wiki/Reinforcement_learning). The Chat
+Completion API and similar APIs, like Anthropic's Messages API, allow us to
+include tool definitions in our requests *to the LLM*, receive tool calls *from
+the LLM*, and feed results *back to the LLM*. Ultimately, the agent (our code) is
+responsible for carrying out the action by processing tool calls.
+
+Agents are largely defined by the tools they make available to the LLM. The most
+salient difference between our weather-checking agent and a sophisticated coding
+agent is the tool set. Coding agents include tools for reading and writing text
+and running shell commands. Also, real-world agents are significantly more complex
+because they have to handle a wide variety of edge cases that our simple loop
+ignores. They need to manage context limits (compaction or summarization when
+the conversation gets too long), handle interruptions from the user, deal with
+API rate limits, retry failed tool calls intelligently, and prevent the agent
+from getting stuck in infinite loops.
+
+If you are interested in exploring agent development further, you should
+probably check out an agent framework or library, such as
+[smolagents](https://github.com/huggingface/smolagents),
+[Pydantic AI](https://github.com/pydantic/pydantic-ai), or
+[LangGraph](https://github.com/langchain-ai/langgraph).