Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Passing Functions as Tools #321

Merged
merged 32 commits into from
Nov 20, 2024
Merged
Show file tree
Hide file tree
Changes from 27 commits
Commits
Show all changes
32 commits
Select commit Hold shift + click to select a range
4383603
WIP tool parsing
ParthSareen Nov 8, 2024
afe7db6
Managing multiple type options
ParthSareen Nov 9, 2024
8fee892
Add tool parsing and processing
ParthSareen Nov 11, 2024
0e5a940
Formatting and todos
ParthSareen Nov 11, 2024
1ef75a7
TODOs
ParthSareen Nov 11, 2024
93c7a63
wip
ParthSareen Nov 11, 2024
e5dc2b8
add annotations import for old tests
ParthSareen Nov 11, 2024
aa20015
Exhaustive type matching
ParthSareen Nov 11, 2024
d79538e
Ruff fix
ParthSareen Nov 11, 2024
97aa167
WIP trying tests out
ParthSareen Nov 11, 2024
8ec5123
Trying stuff out
ParthSareen Nov 11, 2024
efb775b
Multi-line docstrings and exhaustive tests
ParthSareen Nov 12, 2024
2efa54a
Walrus op for cleanup
ParthSareen Nov 12, 2024
1f089f7
Stringify return type arrays to not break server
ParthSareen Nov 13, 2024
fe8d143
WIP
ParthSareen Nov 14, 2024
67321a8
Organization, cleanup, pydantic serialization, update tests
ParthSareen Nov 14, 2024
2cc0b40
Typing fix
ParthSareen Nov 14, 2024
e68700c
Python3.8+ compatibility
ParthSareen Nov 14, 2024
f452fab
Add str -> str valid json mapping and add test
ParthSareen Nov 14, 2024
ca16670
Code cleanup and organization
ParthSareen Nov 14, 2024
7dcb598
Test unhappy parse path
ParthSareen Nov 14, 2024
7c5c294
Code cleanup + organize and add tests for type serialization
ParthSareen Nov 14, 2024
16c868a
Update to have graceful handling and not raise - added tests as well
ParthSareen Nov 15, 2024
718412a
Making good use of pydantic
ParthSareen Nov 18, 2024
e7bb55f
Add yields and test
ParthSareen Nov 18, 2024
7396ab6
Simplified parsing and fixed required - added tests
ParthSareen Nov 18, 2024
0d9eec0
Add tool.model_validate
ParthSareen Nov 18, 2024
ed3ba8a
Code style updates
ParthSareen Nov 19, 2024
a4ec34a
Add better messaging for chat
ParthSareen Nov 19, 2024
6d9c156
Addressing comments + cleanup + optional tool
ParthSareen Nov 19, 2024
c5c61a3
Better docstring parsing and some fixes
ParthSareen Nov 20, 2024
b0e0409
Bugfix/image encoding (#327)
ParthSareen Nov 20, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
20 changes: 15 additions & 5 deletions ollama/_client.py
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@

from typing import (
Any,
Callable,
Literal,
Mapping,
Optional,
Expand All @@ -22,6 +23,9 @@

import sys


from ollama._utils import convert_function_to_tool

if sys.version_info < (3, 9):
from typing import Iterator, AsyncIterator
else:
Expand Down Expand Up @@ -284,7 +288,7 @@ def chat(
model: str = '',
messages: Optional[Sequence[Union[Mapping[str, Any], Message]]] = None,
*,
tools: Optional[Sequence[Union[Mapping[str, Any], Tool]]] = None,
tools: Optional[Sequence[Union[Mapping[str, Any], Tool, Callable]]] = None,
stream: bool = False,
format: Optional[Literal['', 'json']] = None,
options: Optional[Union[Mapping[str, Any], Options]] = None,
Expand Down Expand Up @@ -750,7 +754,7 @@ async def chat(
model: str = '',
messages: Optional[Sequence[Union[Mapping[str, Any], Message]]] = None,
*,
tools: Optional[Sequence[Union[Mapping[str, Any], Tool]]] = None,
tools: Optional[Sequence[Union[Mapping[str, Any], Tool, Callable]]] = None,
stream: Literal[True] = True,
format: Optional[Literal['', 'json']] = None,
options: Optional[Union[Mapping[str, Any], Options]] = None,
Expand Down Expand Up @@ -1075,9 +1079,15 @@ def _copy_messages(messages: Optional[Sequence[Union[Mapping[str, Any], Message]
)


def _copy_tools(tools: Optional[Sequence[Union[Mapping[str, Any], Tool]]]) -> Iterator[Tool]:
  """Lazily validate every supplied tool definition into a `Tool`.

  `None` or an empty sequence produces no items. Each entry is passed through
  `Tool.model_validate` only when the generator is advanced to it.
  """
  yield from map(Tool.model_validate, tools or [])
def _copy_tools(tools: Optional[Sequence[Union[Mapping[str, Any], Tool, Callable]]] = None) -> Iterator[Tool]:
  """Yield a validated `Tool` for every entry in `tools`.

  Args:
    tools: Tool definitions given as mappings, `Tool` instances, or plain
      callables. `None` or an empty sequence produces no tools.

  Yields:
    One `Tool` per entry, in input order. Callables are converted with
    `convert_function_to_tool`; everything else goes through
    `Tool.model_validate`.

  Note:
    This is a generator, so validation errors for a malformed entry surface
    only when the generator is consumed, not when `_copy_tools` is called.
  """
  # A `return []` guard inside a generator never hands a list to the caller
  # (the value only rides on StopIteration), so the None/empty case is handled
  # by iterating over `tools or []` instead.
  for unprocessed_tool in tools or []:
    if callable(unprocessed_tool):
      yield convert_function_to_tool(unprocessed_tool)
    else:
      yield Tool.model_validate(unprocessed_tool)
ParthSareen marked this conversation as resolved.
Show resolved Hide resolved


def _as_path(s: Optional[Union[str, PathLike]]) -> Union[Path, None]:
Expand Down
26 changes: 14 additions & 12 deletions ollama/_types.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,25 +2,19 @@
from base64 import b64encode
from pathlib import Path
from datetime import datetime
from typing import (
Any,
Literal,
Mapping,
Optional,
Sequence,
Union,
)
from typing_extensions import Annotated
from typing import Any, Mapping, Optional, Union, Sequence

from typing_extensions import Annotated, Literal

from pydantic import (
BaseModel,
ByteSize,
ConfigDict,
Field,
FilePath,
Base64Str,
model_serializer,
)
from pydantic.json_schema import JsonSchemaValue


class SubscriptableBaseModel(BaseModel):
Expand Down Expand Up @@ -229,9 +223,16 @@ class Function(SubscriptableBaseModel):
description: str

class Parameters(SubscriptableBaseModel):
type: str
type: Literal['object'] = 'object'
required: Optional[Sequence[str]] = None
properties: Optional[JsonSchemaValue] = None

class Property(SubscriptableBaseModel):
model_config = ConfigDict(arbitrary_types_allowed=True)
ParthSareen marked this conversation as resolved.
Show resolved Hide resolved

type: str
description: str

properties: Optional[Mapping[str, Property]] = None

parameters: Parameters

Expand Down Expand Up @@ -335,6 +336,7 @@ class ModelDetails(SubscriptableBaseModel):

class ListResponse(SubscriptableBaseModel):
class Model(SubscriptableBaseModel):
name: Optional[str] = None
ParthSareen marked this conversation as resolved.
Show resolved Hide resolved
modified_at: Optional[datetime] = None
digest: Optional[str] = None
size: Optional[ByteSize] = None
Expand Down
103 changes: 103 additions & 0 deletions ollama/_utils.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,103 @@
from __future__ import annotations
import inspect
from typing import Callable, Union

import pydantic
from ollama._types import Tool


def _parse_docstring(doc_string: Union[str, None]) -> dict[str, str]:
parsed_docstring = {'description': ''}
ParthSareen marked this conversation as resolved.
Show resolved Hide resolved
if not doc_string:
return parsed_docstring

lowered_doc_string = doc_string.lower()
ParthSareen marked this conversation as resolved.
Show resolved Hide resolved

if 'args:' not in lowered_doc_string:
parsed_docstring['description'] = lowered_doc_string.strip()
return parsed_docstring

else:
parsed_docstring['description'] = lowered_doc_string.split('args:')[0].strip()
args_section = lowered_doc_string.split('args:')[1]

if 'returns:' in lowered_doc_string:
# Return section can be captured and used
args_section = args_section.split('returns:')[0]

if 'yields:' in lowered_doc_string:
args_section = args_section.split('yields:')[0]

cur_var = None
for line in args_section.split('\n'):
ParthSareen marked this conversation as resolved.
Show resolved Hide resolved
line = line.strip()
if not line:
continue
if ':' not in line:
# Continuation of the previous parameter's description
if cur_var:
parsed_docstring[cur_var] += f' {line}'
continue

# For the case with: `param_name (type)`: ...
if '(' in line:
param_name = line.split('(')[0]
param_desc = line.split('):')[1]

# For the case with: `param_name: ...`
else:
param_name, param_desc = line.split(':', 1)

parsed_docstring[param_name.strip()] = param_desc.strip()
cur_var = param_name.strip()

return parsed_docstring


def convert_function_to_tool(func: Callable) -> Tool:
  """Build a `Tool` definition from a function's signature and docstring.

  The function's annotations are turned into a throwaway pydantic model so that
  pydantic generates the JSON schema; the docstring supplies the tool
  description and the per-parameter descriptions.

  Args:
    func: The callable to describe. Its `__name__` becomes the tool name.

  Returns:
    A `Tool` whose parameters list every property of the generated schema.
    A parameter is marked required unless its schema type is 'null' or its
    `anyOf` alternatives include 'null'.
  """
  signature = inspect.signature(func)
  schema = type(
    func.__name__,
    (pydantic.BaseModel,),
    {
      '__annotations__': {name: param.annotation for name, param in signature.parameters.items()},
      '__signature__': signature,
      '__doc__': inspect.getdoc(func),
    },
  ).model_json_schema()

  parsed_docstring = _parse_docstring(schema.get('description'))
  properties = {}
  required = []
  for name, spec in schema.get('properties', {}).items():
    if 'anyOf' in spec:
      # Union / Optional annotation: drop the 'null' alternative and keep the rest.
      is_optional = any(t.get('type') == 'null' for t in spec['anyOf'])
      types = [t.get('type', 'string') for t in spec['anyOf'] if t.get('type') != 'null']
      # Several alternatives are stringified so the value stays a plain string.
      prop_type = types[0] if len(types) == 1 else str(types)
    else:
      # Schemas without a top-level 'type' (e.g. a `$ref`, or an unconstrained
      # value) would otherwise produce None, which a string-typed property
      # rejects; use the same 'string' fallback as the anyOf branch.
      prop_type = spec.get('type') or 'string'
      is_optional = prop_type == 'null'

    if not is_optional:
      required.append(name)

    properties[name] = {
      'description': parsed_docstring.get(name, ''),
      'type': prop_type,
    }

  tool = Tool(
    function=Tool.Function(
      name=func.__name__,
      description=parsed_docstring.get('description'),
      parameters=Tool.Function.Parameters(
        type='object',
        properties=properties,
        required=required,
      ),
    )
  )

  return Tool.model_validate(tool)
67 changes: 66 additions & 1 deletion tests/test_client.py
Original file line number Diff line number Diff line change
@@ -1,14 +1,15 @@
import os
import io
import json
from pydantic import ValidationError
import pytest
import tempfile
from pathlib import Path
from pytest_httpserver import HTTPServer, URIPattern
from werkzeug.wrappers import Request, Response
from PIL import Image

from ollama._client import Client, AsyncClient
from ollama._client import Client, AsyncClient, _copy_tools


class PrefixPattern(URIPattern):
Expand Down Expand Up @@ -982,3 +983,67 @@ def test_headers():
)
assert client._client.headers['x-custom'] == 'value'
assert client._client.headers['content-type'] == 'application/json'


def test_copy_tools():
  """`_copy_tools` converts callables, validates dict tools, and yields nothing for empty input."""

  def func1(x: int) -> str:
    """Simple function 1.
    Args:
    x (integer): A number
    """
    pass

  def func2(y: str) -> int:
    """Simple function 2.
    Args:
    y (string): A string
    """
    pass

  # Plain callables are converted in the order they were given
  converted = list(_copy_tools([func1, func2]))
  assert len(converted) == 2
  assert [tool.function.name for tool in converted] == ['func1', 'func2']

  # Omitted, None and empty inputs all produce no tools
  assert list(_copy_tools()) == []
  for empty_input in (None, []):
    assert list(_copy_tools(empty_input)) == []

  # Callables can be mixed with tool dicts, including a JSON round-tripped one
  tool_dict = {
    'type': 'function',
    'function': {
      'name': 'test',
      'description': 'Test function',
      'parameters': {
        'type': 'object',
        'properties': {'x': {'type': 'string', 'description': 'A string'}},
        'required': ['x'],
      },
    },
  }
  tool_json = json.loads(json.dumps(tool_dict))

  mixed = list(_copy_tools([func1, tool_dict, tool_json]))
  assert len(mixed) == 3
  assert [tool.function.name for tool in mixed] == ['func1', 'test', 'test']


def test_tool_validation():
# Test that malformed tool dictionaries are rejected
# Raises ValidationError when used as it is a generator
with pytest.raises(ValidationError):
invalid_tool = {'type': 'invalid_type', 'function': {'name': 'test'}}
list(_copy_tools([invalid_tool]))

# Test missing required fields
incomplete_tool = {
'type': 'function',
'function': {'name': 'test'}, # missing description and parameters
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Is parameters required?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

In the previous behavior, no.
But since the last Pydantic PR, you have to provide `parameters`. I tested both the OpenAI Python SDK with Ollama and the currently published version of ollama-python. I think it would be worthwhile to make every field on the Tool class optional so that it stays backwards compatible.

It seems function calling still works even when the tool is not a fully fledged JSON schema (I'm sure it's flaky, but that is not our job to fix).

Proposed Tool definition:

class Tool(SubscriptableBaseModel):
  type: Optional[Literal['function']] = 'function'

  class Function(SubscriptableBaseModel):
    name: Optional[str] = None
    description: Optional[str] = None

    class Parameters(SubscriptableBaseModel):
      type: Optional[Literal['object']] = 'object'
      required: Optional[Sequence[str]] = None

      class Property(SubscriptableBaseModel):
        model_config = ConfigDict(arbitrary_types_allowed=True)

        type: Optional[str] = None
        description: Optional[str] = None

      properties: Optional[Mapping[str, Property]] = None

    parameters: Optional[Parameters] = None

  function: Optional[Function] = None

}
with pytest.raises(ValidationError):
list(_copy_tools([incomplete_tool]))
83 changes: 82 additions & 1 deletion tests/test_type_serialization.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,9 @@
from base64 import b64decode, b64encode

from ollama._types import Image
import pytest


from ollama._types import Image, Tool


def test_image_serialization():
Expand All @@ -13,3 +16,81 @@ def test_image_serialization():
b64_str = 'dGVzdCBiYXNlNjQgc3RyaW5n'
img = Image(value=b64_str)
assert img.model_dump() == b64decode(b64_str).decode()


def test_tool_serialization():
  """A fully specified `Tool` dumps to the expected dict, and invalid field values are rejected."""
  # Test valid tool serialization
  tool = Tool(
    function=Tool.Function(
      name='add_two_numbers',
      description='Add two numbers together.',
      parameters=Tool.Function.Parameters(
        type='object',
        properties={
          'a': Tool.Function.Parameters.Property(
            type='integer',
            description='The first number',
          ),
          'b': Tool.Function.Parameters.Property(
            type='integer',
            description='The second number',
          ),
        },
        required=['a', 'b'],
      ),
    )
  )
  assert tool.model_dump() == {
    'type': 'function',
    'function': {
      'name': 'add_two_numbers',
      'description': 'Add two numbers together.',
      'parameters': {
        'type': 'object',
        'properties': {
          'a': {
            'type': 'integer',
            'description': 'The first number',
          },
          'b': {
            'type': 'integer',
            'description': 'The second number',
          },
        },
        'required': ['a', 'b'],
      },
    },
  }

  # Test invalid type. Only the Property construction sits inside the
  # `raises` block: it is the call that fails, and wrapping it in further
  # constructors (which would fail on their own for lacking name/description)
  # would hide a regression in Property validation.
  with pytest.raises(ValueError):
    Tool.Function.Parameters.Property(
      type=lambda x: x,  # Invalid type
      description='Invalid type',
    )

  # Test invalid parameters type. Again only the failing constructor is
  # wrapped, so the test cannot pass for an unrelated reason.
  with pytest.raises(ValueError):
    Tool.Function.Parameters(
      type='invalid_type',  # Must be 'object'
      properties={},
    )
Loading