Small local agents¶
Experimenting with agents does not require access to external services, expensive hardware, or even the cloud. This short tutorial notebook is an introduction to language model-based agents using small language models, and demonstrates their use to query a database.
The code is available in a repository on GitHub: https://github.com/lgautier/local-small-language-agent
Setup¶
Local Ollama server¶
The language models we use will be served by Ollama.
The default instructions use podman to run that Ollama server in a rootless container.
If podman is not available, or if this is running on an isolated system where running ollama outside of a container is not an issue, alternative instructions follow.
This assumes that podman is installed. If that is not yet the case, the instructions are here:
https://podman.io/docs/installation
! podman run --replace -d --rm -p 11434:11434 -v dot_ollama:/root/.ollama --name ollama docker.io/ollama/ollama
ed86c9e2787467f1ee8c4c1e8996388bd48bbc189d8792e8e6be7800d06ddccc
If on a Debian-based system where sudo-ing an installation of ollama is possible, for example on Google Colab, the following instructions can be used instead. Create a new Jupyter cell with the code below, or replace the podman cell above with it.
# Derived from the Google Cloud doc:
# https://medium.com/google-cloud/gemma-3-ollama-on-colab-a-developers-quickstart-7bbf93ab8fef
! echo $(tput setaf 1)"Installing APT packages."$(tput setaf 0)
! sudo apt-get -qq update && sudo apt-get -qq install -y pciutils lshw
! echo $(tput setaf 1)"Fetching Ollama."$(tput setaf 0)
! curl -fsSL https://ollama.com/install.sh | sh
! echo $(tput setaf 1)"Starting Ollama server."$(tput setaf 0)
! nohup ollama serve > ollama.log 2>&1 &
Required Python packages¶
The Python packages ollama, langchain, and langchain_ollama are required. Make sure they are installed before continuing.
import dataclasses
import langchain
import langchain_ollama
import ollama
Utility code¶
To minimize code duplication, we encapsulate most of the Ollama model management into a class.
@dataclasses.dataclass(frozen=True)
class OllamaModel:
"""Wrapper class for models with Ollama and LangChain."""
name: str
def __str__(self) -> str:
return self.name
def has_tools(self) -> bool:
return 'tools' in self.show().capabilities
def is_pulled(self) -> bool:
for mdl in ollama.list().models:
if mdl.model == self.name:
return True
return False
def pull(self):
"""Pull the model to make it available to the local Ollama instance."""
ollama.pull(self.name)
def show(self) -> ollama._types.ShowResponse:
return ollama.show(self.name)
def new_chat(self, temperature:float = 0) -> langchain_ollama.ChatOllama:
res = langchain_ollama.ChatOllama(
model=str(self),
temperature=temperature
)
return res
Object display customization¶
We also create a convenience custom HTML render for AI responses.
import jinja2
_aimessage_template = jinja2.Template(
"""<table>
<thead><tr><td colspan="2">AI message</td></tr></thead>
<tbody>
<tr>
{% if response.content %}
<td style="vertical-align: top; border-right: 2px solid rgb(40, 40, 150); width: 6em;"><b>response:</b></td>
<td style="text-align: left; text-indent: 0px;">
<div style="white-space: pre-wrap;">
{{ response.content }}
</div>
</td>
{% endif %}
{% if response.tool_calls %}
<td style="vertical-align: top; border-right: 2px solid rgb(150, 40, 40); width: 6em;"><b>tools:</b></td>
<td style="text-align: left; text-indent: 0px;">
<div style="white-space: pre-wrap;">
{{ response.tool_calls }}
</div>
</td>
{% endif %}
</tr></tbody></table>
""")
def aimessage_html(obj):
return _aimessage_template.render(response=obj)
html_formatter = get_ipython().display_formatter.formatters['text/html']
html_formatter.for_type_by_name('langchain_core.messages.ai', 'AIMessage', aimessage_html)
def toolmessage_html(obj):
_toolmessage_template = jinja2.Template(
"""<table>
<thead><tr><td colspan="2">Tool message</td></tr></thead>
<tbody>
<tr>
{% if response.content %}
<td style="vertical-align: top; border-right: 2px solid rgb(40, 40, 150); width: 6em;"><b>response:</b></td>
<td style="text-align: left; text-indent: 0px;">
<div style="white-space: pre-wrap;">
{{ response.content }}
</div>
</td>
{% endif %}
</tr>
</tbody></table>
""")
return _toolmessage_template.render(response=obj)
html_formatter = get_ipython().display_formatter.formatters['text/html']
html_formatter.for_type_by_name('langchain_core.messages.tool', 'ToolMessage', toolmessage_html)
def highlight(text):
return f'\n\033[1m{text}\033[0m'
List of language models¶
Below is the list of all the models to use here. Be mindful of the capabilities of the system this will run on, in particular the RAM, or the VRAM if a GPU is present.
This notebook was created with gemma3:4b (Gemma3 with 4B parameters) and granite4:1b (Granite4 with 1B parameters).
MODELS = (
# OllamaModel('deepseek-r1:1.5b'),
OllamaModel('gemma3:4b'),
OllamaModel('functiongemma:270m'),
OllamaModel('granite4:1b'),
# OllamaModel('phi4-mini:3.8b'),
# OllamaModel('qwen3:4b')
)
We are ready to start. First, we ensure that the models we need are pulled locally.
for mdl in MODELS:
if mdl.is_pulled():
print(f'Model {mdl} already pulled.')
else:
print(f'Pulling model {mdl}...', end='', flush=True)
mdl.pull()
print('done.')
Model gemma3:4b already pulled. Pulling model functiongemma:270m...done. Model granite4:1b already pulled.
Language models and their limitations¶
We'll start with a simple question that demonstrates that LLMs are eerily good at the pattern-matching part of understanding, but might not be able to go beyond that.
from langchain_core.messages.human import HumanMessage
from langchain_core.messages.system import SystemMessage
from langchain_core.tools import tool
human_message = HumanMessage('Make the following calculation: 392373366237 * 562310951975')
for mdl in MODELS:
print(f'\n\033[1m{str(mdl)}\033[0m\n')
chat = mdl.new_chat()
response = chat.invoke([human_message])
display(response)
gemma3:4b
| AI message | |
| response: |
Okay, let's calculate 392373366237 * 562310951975.
This is a large multiplication, and it's best done using a calculator or a programming language. Here's the result:
**2236358838888888888888888888888888888888
|
functiongemma:270m
| AI message | |
| response: |
I apologize, but I cannot perform this calculation. The calculation tool I have access to is specialized for calculating mathematical operations related to financial calculations, such as calculating stock market valuations or stock market indices. I cannot access or perform complex financial data like this.
|
granite4:1b
| AI message | |
| response: |
The result of multiplying 392373366237 by 562310951975 is:
220,646,204,278,964,000,795
|
Is this correct? The actual answer is:
print(f'{392373366237 * 562310951975:,}')
220,635,841,098,362,793,468,075
Unless this notebook is running in a future when LLMs have learned to multiply, or this notebook became part of the training data, the LLM answer is likely not correct, OR the LLM declines to answer the question (which is the case with functiongemma).
One should not rely on current LLM technology to correctly perform mathematical operations, or more generally to evaluate expressions or run algorithms. However, LLMs have seen training data that describes steps
to resolve similar problems. They might be able to generate code (software instructions), for example a function call, to get to the answer. This can already be observed when using gemma3:4b: the answer from the LLM includes Python code that returns the correct answer when evaluated.
If we had a way to know when an LLM answer contains code, we could simply evaluate that code and consider the resulting text the answer in a dialogue. In fact, it does not even have to be a dialogue: evaluating code simply represents an action.
Additional instructions in the prompt can get us there with this example. We can add that if evaluating code seems a better path to the correct answer, only code should be returned. To facilitate the triaging of answers (the answer is text, that is the direct answer, versus the answer is code to get to the answer), we can also indicate the format to use.
answer_as_code = HumanMessage("""
IF this type of question would be better answered by evaluating code, return instead
ONLY Python code in the answer. Use the Markdown format for code snippets:
```python
<code>
```
""")
human_message = HumanMessage("""Make the following calculation: 392373366237 * 562310951975""")
for mdl in MODELS:
print(highlight(str(mdl)))
chat = mdl.new_chat()
response = chat.invoke([human_message, answer_as_code])
display(response)
gemma3:4b
| AI message | |
| response: |
```python
print(392373366237 * 562310951975)
```
|
functiongemma:270m
| AI message | |
| response: |
I apologize, but I cannot assist with generating Python code. My current capabilities are limited to assisting with mathematical calculations and data analysis using the provided tools. I cannot generate programming code.
|
granite4:1b
| AI message | |
| response: |
```python
result = 392373366237 * 562310951975
result
```
|
This is looking promising, except for functiongemma, which is adamant about being unable to generate code.
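To act on such answers we need to detect and evaluate the returned code. A minimal sketch of that step, assuming answers shaped like the gemma3:4b response above (the helper name `maybe_evaluate` is ours, not part of any library):

```python
import contextlib
import io
import re

# Match a Markdown-fenced Python block, as requested in the prompt above.
_CODE_FENCE = re.compile(r'```python\n(.*?)```', re.DOTALL)

def maybe_evaluate(answer: str) -> str:
    """If the answer contains a fenced Python block, run it and return its
    printed output; otherwise return the answer text unchanged."""
    match = _CODE_FENCE.search(answer)
    if match is None:
        return answer
    buffer = io.StringIO()
    with contextlib.redirect_stdout(buffer):
        # Caution: exec() runs arbitrary model-generated code. Sandbox it
        # in anything beyond a local experiment.
        exec(match.group(1), {})
    return buffer.getvalue().strip()

answer = '```python\nprint(392373366237 * 562310951975)\n```'
print(maybe_evaluate(answer))
```

Note that the granite4:1b snippet above ends with a bare expression rather than a `print()` call, so capturing stdout alone would miss its result; handling that case is left aside here.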
A good check to perform with LLMs is whether a new prompt causes a regression (that is, loses the ability to answer some questions correctly). To achieve this we ask a question that should be answerable without code, that is a question for which the answer was almost certainly in the training data for the model.
human_message = HumanMessage("""What is the name of the natural satellite orbiting around the earth?""")
for mdl in MODELS:
print(highlight(str(mdl)))
chat = mdl.new_chat()
response = chat.invoke([human_message, answer_as_code])
display(response)
gemma3:4b
| AI message | |
| response: |
```python
print("The name of the natural satellite orbiting around the Earth is the Moon.")
```
|
functiongemma:270m
| AI message | |
| response: |
I apologize, but I cannot assist with programming or generating Python code. My current capabilities are limited to assisting with tasks related to natural language processing and text generation. I cannot provide programming advice or code snippets.
|
granite4:1b
| AI message | |
| response: |
The name of the natural satellite orbiting around the Earth is called **the Moon**.
|
While gemma3:4b is technically correct, its answer may indicate that this model will resort to writing code more often than necessary. functiongemma is consistent in messaging that it cannot generate code.
Adding tools as context¶
Agents are language models to which the availability of tools (software functions), with a description of what they do, is specified as context. For gemma3:4b this can be achieved through a system prompt, while for models with a "tools" capability Python functions can be passed directly. This is the case with granite4:1b, for example.
Tools in prompt¶
We showed earlier that a prompt can indicate that code evaluation is available. Similarly, we can indicate that tools are available and calling a tool can be used as an answer.
If we make our multiplication a tool, a prompt can look as follows:
system_prompt_tools = """
You have access to functions.
You don't have to use tools if not necessary, but *IF* you decide to invoke any of the function(s),
you MUST put it in a valid JSON expression like:
[
{"name": function name,
"parameters": dictionary of argument name and its value}
]
You SHOULD NOT include any other text in the response if you call a function.
Functions:
[
{ "name": "multiply",
"description": "Multiply two numbers.",
"parameters": {
"type": "object",
"properties": {
"a": "number",
"b": "number"
},
"required": [
"a", "b"
]
}
}
]
"""
Tools as tools¶
The use of tools has been somewhat formalized since the early days of prompt engineering, a mere double-digit number of months in the past.
Many of the most recent language models specifically include a capability called "tools". This frees a user, or developer,
from having to write prompt sections that declare the availability of tools in a way the language model reacts to, and from parsing out whether an answer is text or code. langchain provides a wrapper for this and lets one simply declare any Python function as a tool. For the multiplication we can just plug in the Python multiplication operator.
import operator
tools = [tool(operator.mul)]
Language model opting to answer with a tool call¶
We have shown that a prompt context, or a langchain tool declaration when the model has the capability, can lead a language model to answer with code. If we ask our multiplication question again:
human_message = HumanMessage("""Make the following calculation: 392373366237 * 562310951975""")
for model in MODELS:
chat = model.new_chat()
if model.has_tools():
print(f'{highlight(model.name)} (with tools)\n')
chat = chat.bind_tools(tools)
messages = [human_message]
else:
print(f'{highlight(model.name)}\n')
messages = [SystemMessage(system_prompt_tools),
human_message]
response = chat.invoke(messages)
display(response)
gemma3:4b
| AI message | |
| response: |
```json
[
{
"name": "multiply",
"parameters": {
"a": 392373366237,
"b": 562310951975
}
}
]
```
|
functiongemma:270m (with tools)
| AI message | |
| tools: |
[{'name': 'mul', 'args': {'a': 392373366237, 'b': 562310951975}, 'id': '7c9769d1-8531-4868-866f-3d00eb598097', 'type': 'tool_call'}]
|
granite4:1b (with tools)
| AI message | |
| tools: |
[{'name': 'mul', 'args': {'a': '392373366237', 'b': '562310951975'}, 'id': '62be38a6-3878-4ad3-839d-31093d5d8d3e', 'type': 'tool_call'}]
|
All language models understand the assignment and provide correct function calls. Interestingly, creating a function call is creating code, which functiongemma is otherwise convinced it is unable to do.
Agentic linear chaining - an example¶
Database¶
We create a local database for demonstration purposes.
import sqlite3
dbcon = sqlite3.connect(':memory:', check_same_thread=False)
dbcon.execute("""
CREATE TABLE medication(
ndc STRING PRIMARY KEY,
common_name STRING,
quantity INTEGER
);
""")
for values in (
('ABCD-DEF', 'Aspirin', 3), ('ABCD-GHI', 'Aspirin', 5), ('GHIK-KLM', 'bacitracin', 10)
):
dbcon.execute("""
INSERT INTO medication(ndc, common_name, quantity) VALUES (?,?,?);
""", values)
Tools to query a database¶
Functions to query the database:
- get_ndc_code to get all NDC codes for the common name of a medication
- get_ndc_stock to get the stock for a given NDC code
def get_ndc_code(medication: str) -> tuple[str, ...]:
"""Get possible ndc codes for a medication.
Args:
medication: name of the medication for which NDC code should be returned.
"""
cursor = dbcon.cursor()
cursor.execute('SELECT ndc FROM medication WHERE common_name==?',
(medication, ))
return tuple(row[0] for row in cursor.fetchall())
def get_ndc_stock(ndc_code: str) -> int:
"""Get the number of boxes of medication in stock.
Args:
ndc_code: NDC code to retrieve stock for.
"""
cursor = dbcon.cursor()
cursor.execute('SELECT quantity FROM medication WHERE ndc==?',
(ndc_code, ))
return cursor.fetchone()[0]
Prompting an LLM to use tools (when needed)¶
The prompt may declare several available tools. A prompt context will be similar to the one we showed for the multiplication.
system_prompt_tools = """
You have access to functions.
You don't have to use tools if not necessary, but *IF* you decide to invoke any of the function(s),
you MUST put it in a valid JSON expression like:
[
{"name": function name,
"parameters": dictionary of argument name and its value}
]
You SHOULD NOT include any other text in the response if you call a function.
Functions:
[
{
"name": "get_ndc_stock",
"description": "Get the number of boxes of medication in stock.",
"parameters": {
"type": "object",
"properties": {
"ndc_code": {
"type": "string"
}
},
"required": [
"ndc_code"
]
}
},
{
"name": "get_ndc_code",
"description": "Get possible ndc codes for a medication.",
"parameters": {
"type": "object",
"properties": {
"medication": {
"type": "string"
}
},
"required": [
"medication"
]
},
}
]
"""
Whenever a model has the capability "tools", the user or developer is spared the prompt context engineering.
The decorator tool() in langchain can be used instead.
Note: langchain is essentially an abstraction layer over prompts.
It can create the equivalent of our engineered prompt contexts from Python function definitions,
feeding the LLM with information in the docstring, or in additional declarative structures
(see https://docs.langchain.com/oss/python/langchain/tools#advanced-schema-definition).
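To illustrate the idea (this is a conceptual sketch of our own, not langchain's actual implementation), most of the information needed for such a declaration can be pulled from a Python function with the standard library's inspect module:

```python
import inspect

def describe_function(func) -> dict:
    """Sketch of the information a tools wrapper can derive from a function:
    its name, the first line of its docstring, and its parameter names."""
    signature = inspect.signature(func)
    return {
        'name': func.__name__,
        'description': (func.__doc__ or '').strip().split('\n')[0],
        'parameters': {'required': list(signature.parameters)},
    }

# Stub with the same signature and docstring as the notebook's get_ndc_code,
# repeated here so the cell stands alone.
def get_ndc_code(medication: str) -> tuple:
    """Get possible ndc codes for a medication."""
    ...

print(describe_function(get_ndc_code))
# {'name': 'get_ndc_code',
#  'description': 'Get possible ndc codes for a medication.',
#  'parameters': {'required': ['medication']}}
```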
tools = [tool(get_ndc_code), tool(get_ndc_stock)]
def invoke_model(model, human_message, system_message=SystemMessage('')):
chat = model.new_chat()
if model.has_tools():
print(f'\n{highlight(model.name)} (with tools)\n')
chat = chat.bind_tools(tools)
else:
print(f'\n{highlight(model.name)}\n')
messages = [system_message,
human_message]
response = chat.invoke(messages)
return response, chat
human_message = HumanMessage('Name the first month of the year.')
for model in MODELS:
response, chat = invoke_model(model, human_message)
display(response)
gemma3:4b
| AI message | |
| response: |
January!
Do you want to play a quick game of guessing months? 😊
|
functiongemma:270m (with tools)
| AI message | |
| response: |
I apologize, but I cannot assist with retrieving the specific NDC code for the first month of the year. My current tools are designed for retrieving medication-related data and stock information. I cannot query or retrieve specific calendar or stock data for specific dates.
|
granite4:1b (with tools)
| AI message | |
| response: |
The first month of the year is **January**.
|
functiongemma:270m appears challenged by the question. Its size (just over a quarter of granite4:1b's) might be the issue.
tool_map = {tool.name: tool for tool in tools}
if len(tool_map) != len(tools):
raise ValueError("'tools' contains at least one tool name duplicate.")
human_message = HumanMessage('How many boxes of medication with NDC code ABCD-DEF do we have left?')
for model in MODELS:
response, chat = invoke_model(model, human_message, SystemMessage(system_prompt_tools))
display(response)
if response.tool_calls:
for tool_call in response.tool_calls:
print(
f' --> calling {tool_call["name"]}'
f'({", ".join("=".join((k, repr(v))) for k, v in tool_call["args"].items())})'
)
selected_tool = tool_map[tool_call['name']]
res = selected_tool.invoke(tool_call)
print(' result:')
print(f' {res.content}')
else:
print('Assessing automatically if there is a tool call is left as an exercise for the reader.')
gemma3:4b
| AI message | |
| response: |
```json
[
{
"name": "get_ndc_stock",
"parameters": {
"ndc_code": "ABCD-DEF"
}
}
]
```
|
Assessing automatically if there is a tool call is left as an exercise for the reader.
functiongemma:270m (with tools)
| AI message | |
| tools: |
[{'name': 'get_ndc_stock', 'args': {'ndc_code': 'ABCD-DEF'}, 'id': 'a63df468-8c35-4d1c-ba01-f07c58b4a29a', 'type': 'tool_call'}]
|
--> calling get_ndc_stock(ndc_code='ABCD-DEF')
result:
3
granite4:1b (with tools)
| AI message | |
| tools: |
[{'name': 'get_ndc_stock', 'args': {'ndc_code': 'ABCD-DEF'}, 'id': 'fe96a455-02c4-4f10-ab45-e64a4d3ff059', 'type': 'tool_call'}]
|
--> calling get_ndc_stock(ndc_code='ABCD-DEF')
result:
3
human_message = HumanMessage("What are possible NDC codes for the medication 'Aspirin'?")
for model in MODELS:
response, chat = invoke_model(model, human_message, SystemMessage(system_prompt_tools))
display(response)
if response.tool_calls:
print(' result:')
for tool_call in response.tool_calls:
selected_tool = tool_map[tool_call['name']]
res = selected_tool.invoke(tool_call)
print(f' {res.content}')
else:
print('Assessing automatically if there is a tool call is left as an exercise for the reader.')
gemma3:4b
| AI message | |
| response: |
```json
[
{
"name": "get_ndc_code",
"parameters": {
"medication": "Aspirin"
}
}
]
```
|
Assessing automatically if there is a tool call is left as an exercise for the reader.
functiongemma:270m (with tools)
| AI message | |
| tools: |
[{'name': 'get_ndc_code', 'args': {'medication': 'Aspirin'}, 'id': '5d987bf2-cc49-4058-b0d7-08196877a7d3', 'type': 'tool_call'}]
|
result:
["ABCD-DEF", "ABCD-GHI"]
granite4:1b (with tools)
| AI message | |
| tools: |
[{'name': 'get_ndc_code', 'args': {'medication': 'Aspirin'}, 'id': '65211877-5146-4db6-acfd-6c658edb630b', 'type': 'tool_call'}]
|
result:
["ABCD-DEF", "ABCD-GHI"]
Cool. But what exactly did we gain here? If you are a programmer or a data analyst who knows how to write SQL, arguably not much. However, what we have achieved is akin to a text user interface, or language user interface, that can be an alternative to a graphical user interface.
Reasoning in steps¶
So far we have only shown questions for which either the language model had the answer memorized from the data it was trained on, or for which the answer was one tool call away.
There are questions for which the answer requires a sequence of recalls from training data or tool calls, with the output of one step used as the input to the next. For example, asking how many Aspirin boxes are in stock would require to 1) get the NDC codes for Aspirin products, 2) query the stock for each, and finally 3) sum those values.
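Spelled out by hand with plain Python (dict stand-ins for the database tables, so the cell stands alone), the chain is:

```python
# Dict stand-ins for the demo database above.
ndc_by_name = {'Aspirin': ('ABCD-DEF', 'ABCD-GHI'),
               'bacitracin': ('GHIK-KLM',)}
stock = {'ABCD-DEF': 3, 'ABCD-GHI': 5, 'GHIK-KLM': 10}

codes = ndc_by_name['Aspirin']                # 1) NDC codes for Aspirin
quantities = [stock[code] for code in codes]  # 2) stock for each code
total = sum(quantities)                       # 3) sum the quantities
print(total)
# 8
```

The challenge for an agent is to produce this sequence of calls on its own, one step at a time.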
human_message = HumanMessage('How many boxes of Aspirin do we have in stock altogether?')
for model in MODELS:
response, chat = invoke_model(model, human_message, SystemMessage(system_prompt_tools))
display(response)
gemma3:4b
| AI message | |
| response: |
```json
[
{
"name": "get_ndc_stock",
"parameters": {
"ndc_code": "98304-600"
}
}
]
```
|
functiongemma:270m (with tools)
| AI message | |
| tools: |
[{'name': 'get_ndc_stock', 'args': {'ndc_code': 'Aspirin'}, 'id': '7d0683fa-c668-4640-86c8-2b74bc4f273f', 'type': 'tool_call'}]
|
granite4:1b (with tools)
| AI message | |
| tools: |
[{'name': 'get_ndc_code', 'args': {'medication': 'Aspirin'}, 'id': 'bf98a6fe-bc7f-4027-ae38-1a8e8a9b8c2e', 'type': 'tool_call'}]
|
Odds are that the results are not great. The bare language models used in this notebook generally do not handle this well without guidance from a prompt.
ReAct¶
The ReAct approach prompts a language model to match its answers to the following pattern:
- question
- thought: the language model's answer to the question. The answer can be the use of a tool.
- action: whenever the answer is the use of a tool, a function call, this is selected here.
- action input: the input to the action.
- observation: observe the result of performing the action.
- The sequence of steps 2 to 5 can be repeated N times
- final answer
It is derived from the empirical observation that LLMs appeared to give more "thoughtful" answers, or to better solve reasoning-oriented questions, when asked to think step by step.
ReAct can be independently achieved by adding the pattern description to a prompt and iteratively parsing language model responses and crafting new messages. However, in many scenarios this can be abstracted away through the use of a library. We use langchain again to demonstrate how it can work:
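For illustration, here is a minimal hand-rolled loop in the spirit of that pattern: invoke the model, execute any requested tool calls, feed the results back, and repeat until a plain-text answer. The model is stubbed out with a deterministic function so the sketch is self-contained and does not need an Ollama server; `Response`, `react_loop`, and `fake_invoke` are our own stand-ins, not library APIs.

```python
import dataclasses

@dataclasses.dataclass
class Response:
    """Stand-in for an AI message: text content plus requested tool calls."""
    content: str = ''
    tool_calls: list = dataclasses.field(default_factory=list)

def react_loop(invoke, tool_map, question: str, max_steps: int = 10) -> str:
    """Alternate model invocations and tool executions until the model
    answers with plain text."""
    messages = [('human', question)]
    for _ in range(max_steps):
        response = invoke(messages)
        if not response.tool_calls:
            return response.content  # final answer
        for call in response.tool_calls:
            result = tool_map[call['name']](**call['args'])
            messages.append(('tool', call['name'], result))
    raise RuntimeError('No final answer within max_steps.')

# Stubbed "model": first requests a multiplication, then phrases the result.
def fake_invoke(messages):
    if messages[-1][0] == 'human':
        return Response(tool_calls=[{'name': 'mul', 'args': {'a': 3, 'b': 5}}])
    return Response(content=f'The result is {messages[-1][2]}.')

print(react_loop(fake_invoke, {'mul': lambda a, b: a * b}, 'What is 3 * 5?'))
# The result is 15.
```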
from langchain.agents import create_agent
human_message = HumanMessage("How many boxes of Aspirin do we have in stock altogether?")
for model in MODELS:
print(highlight(model.name))
if model.has_tools():
react = create_agent(model.new_chat(), tools=tools)
r_stream = react.stream({'messages': [human_message]}, stream_mode='updates')
try:
for chunk in r_stream:
for k in chunk.keys():
for m in chunk[k]['messages']:
display(m)
except TypeError as err:
print('Error:')
print(err)
else:
print('Parsing AI messages into next actions and results is left as an exercise.')
gemma3:4b Parsing AI messages into next actions and results is left as an exercise. functiongemma:270m
| AI message | |
| tools: |
[{'name': 'get_ndc_stock', 'args': {'ndc_code': 'Aspirin'}, 'id': '0d55848c-3003-408c-846e-2ccb2238bc38', 'type': 'tool_call'}]
|
Error:
'NoneType' object is not subscriptable
granite4:1b
| AI message | |
| tools: |
[{'name': 'get_ndc_code', 'args': {'medication': 'Aspirin'}, 'id': '89afdd0e-92bf-4d6e-9270-10ec8dfb20c9', 'type': 'tool_call'}]
|
| Tool message | |
| response: |
["ABCD-DEF", "ABCD-GHI"]
|
| AI message | |
| tools: |
[{'name': 'get_ndc_stock', 'args': {'ndc_code': 'ABCD-DEF'}, 'id': '6886023e-3e2e-4ea3-a0f4-5e0a4e1b0c6a', 'type': 'tool_call'}]
|
| Tool message | |
| response: |
3
|
| AI message | |
| tools: |
[{'name': 'get_ndc_stock', 'args': {'ndc_code': 'ABCD-GHI'}, 'id': '7e28b8c2-e435-4474-86ef-e55bc82bc785', 'type': 'tool_call'}]
|
| Tool message | |
| response: |
5
|
| AI message | |
| response: |
The total number of boxes in stock for Aspirin is **8**.
|
When calling tools works without error, the answer is indeed correct.
Conclusion¶
Small language models are able to handle simple queries and chain sequences of steps to reach an answer. They can run locally, isolated, and on relatively modest hardware.