Exported source
import inspect
from collections import abc
from fastcore.utils import *
from fastcore.docments import docments
from typing import get_origin, get_args, Dict, List, Optional, Tuple, Union
from types import UnionType
Many LLMs do function calling (aka tool use) by taking advantage of JSON schema.
We’ll use docments to make getting JSON schema from Python functions as ergonomic as possible. Each parameter (and the return value) should have a type, and a docments comment with the description of what it is. Here’s an example:
This is what docments
makes of that:
{ 'a': { 'anno': <class 'int'>,
'default': <class 'inspect._empty'>,
'docment': 'First thing to sum'},
'b': {'anno': <class 'int'>, 'default': 1, 'docment': 'Second thing to sum'},
'c': {'anno': list[int], 'default': None, 'docment': 'A pointless argument'},
'return': { 'anno': <class 'int'>,
'default': <class 'inspect._empty'>,
'docment': 'The sum of the inputs'}}
Note that this is an AttrDict so we can treat it like an object, or a dict:
def _types(t:type)->tuple[str,Optional[str]]:
"Tuple of json schema type name and (if appropriate) array item name."
if t is empty: raise TypeError('Missing type')
tmap = {int:"integer", float:"number", str:"string", bool:"boolean", list:"array", dict:"object"}
tmap.update({k.__name__: v for k, v in tmap.items()})
if getattr(t, '__origin__', None) in (list,tuple):
args = getattr(t, '__args__', None)
item_type = "object" if not args else tmap.get(t.__args__[0].__name__, "object")
return "array", item_type
# if t is a string like 'int', directly use the string as the key
elif isinstance(t, str): return tmap.get(t, "object"), None
# if t is the type itself and a container
elif get_origin(t): return tmap.get(get_origin(t).__name__, "object"), None
# if t is the type itself like int, use the __name__ representation as the key
else: return tmap.get(t.__name__, "object"), None
This internal function is needed to convert Python types into JSON schema types.
(('array', 'integer'), ('integer', None), ('integer', None))
(('array', 'integer'), ('object', None), ('object', None), ('array', 'string'))
Note the current behavior:
These and other approximations may require further refinement in the future.
Will also convert custom types to the object
type.
def _param(name, info):
"json schema parameter given `name` and `info` from docments full dict."
paramt,itemt = _types(info.anno)
pschema = dict(type=paramt, description=info.docment or "")
if itemt: pschema["items"] = {"type": itemt}
if info.default is not empty: pschema["default"] = info.default
return pschema
This private function converts a key/value pair from the docments
structure into the dict
that will be needed for the schema.
a // {'docment': 'First thing to sum', 'anno': <class 'int'>, 'default': <class 'inspect._empty'>}
{'type': 'integer', 'description': 'First thing to sum'}
({'type': 'integer'}, {'type': 'string', 'format': 'Path'})
For union and optional types, Union
covers older Union[str]
syntax while UnionType
covers 3.10+ str | None
syntax.
def _example_new_unioin(opt_tup: str | None):
pass
d = docments(_example_new_unioin, full=True)
anno1 = first(d.items())[1].anno
(anno1, get_origin(anno1), get_args(anno1))
(str | None, types.UnionType, (str, NoneType))
def _example_old_union(opt_tup: Union[str, type(None)] =None):
pass
d = docments(_example_old_union, full=True)
anno2 = first(d.items())[1].anno
(anno2, get_origin(anno2), get_args(anno2))
(typing.Optional[str], typing.Union, (str, NoneType))
Support for both union types is part of the broader container handling:
# Test primitive types
defs = {}
assert _handle_type(int, defs) == {'type': 'integer'}
assert _handle_type(str, defs) == {'type': 'string'}
assert _handle_type(bool, defs) == {'type': 'boolean'}
assert _handle_type(float, defs) == {'type': 'number'}
# Test custom class
class TestClass:
def __init__(self, x: int, y: int): store_attr()
result = _handle_type(TestClass, defs)
assert result == {'$ref': '#/$defs/TestClass'}
assert 'TestClass' in defs
assert defs['TestClass']['type'] == 'object'
assert 'properties' in defs['TestClass']
# Test primitive types in containers
assert _handle_container(list, (int,), defs) == {'type': 'array', 'items': {'type': 'integer'}}
assert _handle_container(tuple, (str,), defs) == {'type': 'array', 'items': {'type': 'string'}}
assert _handle_container(set, (str,), defs) == {'type': 'array', 'items': {'type': 'string'}, 'uniqueItems': True}
assert _handle_container(dict, (str,bool), defs) == {'type': 'object', 'additionalProperties': {'type': 'boolean'}}
result = _handle_container(list, (TestClass,), defs)
assert result == {'type': 'array', 'items': {'$ref': '#/$defs/TestClass'}}
assert 'TestClass' in defs
# Test complex nested structure
ComplexType = dict[str, list[TestClass]]
result = _handle_container(dict, (str, list[TestClass]), defs)
assert result == {
'type': 'object',
'additionalProperties': {
'type': 'array',
'items': {'$ref': '#/$defs/TestClass'}
}
}
# Test processing of a required integer property
props, req = {}, {}
class TestClass:
"Test class"
def __init__(
self,
x: int, # First thing
y: list[float], # Second thing
z: str = "default", # Third thing
): store_attr()
d = docments(TestClass, full=True)
_process_property('x', d.x, props, req, defs)
assert 'x' in props
assert props['x']['type'] == 'integer'
assert 'x' in req
# Test processing of a required list property
_process_property('y', d.y, props, req, defs)
assert 'y' in props
assert props['y']['type'] == 'array'
assert props['y']['items']['type'] == 'number'
assert 'y' in req
# Test processing of an optional string property with default
_process_property('z', d.z, props, req, defs)
assert 'z' in props
assert props['z']['type'] == 'string'
assert props['z']['default'] == "default"
assert 'z' not in req
get_schema (f:<built-infunctioncallable>, pname='input_schema')
Generate JSON schema for a class, function, or method
def get_schema(f:callable, pname='input_schema')->dict:
"Generate JSON schema for a class, function, or method"
schema = _get_nested_schema(f)
desc = f.__doc__
assert desc, "Docstring missing!"
d = docments(f, full=True)
ret = d.pop('return')
if ret.anno is not empty: desc += f'\n\nReturns:\n- type: {_types(ret.anno)[0]}'
return {"name": f.__name__, "description": desc, pname: schema}
Putting this all together, we can now test getting a schema from silly_sum
. The tool use spec doesn’t support return annotations directly, so we put that in the description instead.
Adds a + b.
Returns:
- type: integer
{'name': 'silly_sum',
'input_schema': {'type': 'object',
'properties': {'a': {'type': 'integer', 'description': 'First thing to sum'},
'b': {'type': 'integer',
'description': 'Second thing to sum',
'default': 1},
'c': {'type': 'array',
'description': 'A pointless argument',
'items': {'type': 'integer'},
'default': None}},
'title': None,
'required': ['a']}}
This also works with string annotations, e.g:
def silly_test(
a: 'int', # quoted type hint
):
"Mandatory docstring"
return a
get_schema(silly_test)
{'name': 'silly_test',
'description': 'Mandatory docstring',
'input_schema': {'type': 'object',
'properties': {'a': {'type': 'integer', 'description': 'quoted type hint'}},
'title': None,
'required': ['a']}}
This also works with instance methods:
class Dummy:
def sums(
self,
a:int, # First thing to sum
b:int=1 # Second thing to sum
) -> int: # The sum of the inputs
"Adds a + b."
print(f"Finding the sum of {a} and {b}")
return a + b
get_schema(Dummy.sums)
{'name': 'sums',
'description': 'Adds a + b.\n\nReturns:\n- type: integer',
'input_schema': {'type': 'object',
'properties': {'a': {'type': 'integer', 'description': 'First thing to sum'},
'b': {'type': 'integer',
'description': 'Second thing to sum',
'default': 1}},
'title': None,
'required': ['a']}}
get_schema
also handles more complicated structures such as nested classes. This is useful for things like structured outputs.
class Turn:
"Turn between two speakers"
def __init__(
self,
speaker_a:str, # First speaker's message
speaker_b:str, # Second speaker's message
): store_attr()
class Conversation:
"A conversation between two speakers"
def __init__(
self,
turns:list[Turn], # Turns of the conversation
): store_attr()
get_schema(Conversation)
{'name': 'Conversation',
'description': 'A conversation between two speakers',
'input_schema': {'type': 'object',
'properties': {'turns': {'type': 'array',
'description': 'Turns of the conversation',
'items': {'$ref': '#/$defs/Turn'}}},
'title': 'Conversation',
'required': ['turns'],
'$defs': {'Turn': {'type': 'object',
'properties': {'speaker_a': {'type': 'string',
'description': "First speaker's message"},
'speaker_b': {'type': 'string',
'description': "Second speaker's message"}},
'title': 'Turn',
'required': ['speaker_a', 'speaker_b']}}}}
class DictConversation:
"A conversation between two speakers"
def __init__(
self,
turns:dict[str,list[Turn]], # dictionary of topics and the Turns of the conversation
): store_attr()
get_schema(DictConversation)
{'name': 'DictConversation',
'description': 'A conversation between two speakers',
'input_schema': {'type': 'object',
'properties': {'turns': {'type': 'object',
'description': 'dictionary of topics and the Turns of the conversation',
'additionalProperties': {'type': 'array',
'items': {'$ref': '#/$defs/Turn'}}}},
'title': 'DictConversation',
'required': ['turns'],
'$defs': {'Turn': {'type': 'object',
'properties': {'speaker_a': {'type': 'string',
'description': "First speaker's message"},
'speaker_b': {'type': 'string',
'description': "Second speaker's message"}},
'title': 'Turn',
'required': ['speaker_a', 'speaker_b']}}}}
class SetConversation:
"A conversation between two speakers"
def __init__(
self,
turns:set[Turn], # the unique Turns of the conversation
): store_attr()
get_schema(SetConversation)
{'name': 'SetConversation',
'description': 'A conversation between two speakers',
'input_schema': {'type': 'object',
'properties': {'turns': {'type': 'array',
'description': 'the unique Turns of the conversation',
'items': {'$ref': '#/$defs/Turn'},
'uniqueItems': True}},
'title': 'SetConversation',
'required': ['turns'],
'$defs': {'Turn': {'type': 'object',
'properties': {'speaker_a': {'type': 'string',
'description': "First speaker's message"},
'speaker_b': {'type': 'string',
'description': "Second speaker's message"}},
'title': 'Turn',
'required': ['speaker_a', 'speaker_b']}}}}
PathArg (path:str)
Type | Details | |
---|---|---|
path | str | A filesystem path |
Paths are a special case, since they only take *args
and **kwargs
as params, but normally we’d use them in a schema by just passing a str. So we create a custom param type for that.
def path_test(
a: PathArg, # a type hint
b: PathArg # b type hint
):
"Mandatory docstring"
return a/b
get_schema(path_test)
{'name': 'path_test',
'description': 'Mandatory docstring',
'input_schema': {'type': 'object',
'properties': {'a': {'type': 'object',
'description': 'a type hint',
'$ref': '#/$defs/PathArg'},
'b': {'type': 'object',
'description': 'b type hint',
'$ref': '#/$defs/PathArg'}},
'title': None,
'required': ['a', 'b'],
'$defs': {'PathArg': {'type': 'object',
'properties': {'path': {'type': 'string',
'description': 'A filesystem path'}},
'title': None,
'required': ['path']}}}}
Alternatively, use Path
as usual, and handle the format
key in the json to use that as a callable:
def path_test2(
a: Path, # a type hint
b: Path # b type hint
):
"Mandatory docstring"
return a/b
get_schema(path_test2)
{'name': 'path_test2',
'description': 'Mandatory docstring',
'input_schema': {'type': 'object',
'properties': {'a': {'type': 'string',
'description': 'a type hint',
'format': 'Path'},
'b': {'type': 'string', 'description': 'b type hint', 'format': 'Path'}},
'title': None,
'required': ['a', 'b']}}
get_schema()
Test CasesUnion types are approximately mapped to JSON schema ‘anyOf’ with two or more value types.
def _union_test(opt_tup: Union[Tuple[int, int], str, int]=None):
"Mandatory docstring"
return ""
get_schema(_union_test)
{'name': '_union_test',
'description': 'Mandatory docstring',
'input_schema': {'type': 'object',
'properties': {'opt_tup': {'type': 'object',
'description': '',
'default': None,
'anyOf': [{'type': 'array'}, {'type': 'string'}, {'type': 'integer'}]}},
'title': None}}
The new (Python 3.10+) union syntax can also be used, producing an equivalent schema.
def _new_union_test(opt_tup: Tuple[int, int] | str | int =None):
"Mandatory docstring"
pass
get_schema(_new_union_test)
{'name': '_new_union_test',
'description': 'Mandatory docstring',
'input_schema': {'type': 'object',
'properties': {'opt_tup': {'type': 'object',
'description': '',
'default': None,
'anyOf': [{'type': 'array'}, {'type': 'string'}, {'type': 'integer'}]}},
'title': None}}
Optional is a special case of union types, limited to two types, one of which is None (mapped to null in JSON schema):
def _optional_test(opt_tup: Optional[Tuple[int, int]]=None):
"Mandatory docstring"
pass
get_schema(_optional_test)
{'name': '_optional_test',
'description': 'Mandatory docstring',
'input_schema': {'type': 'object',
'properties': {'opt_tup': {'type': 'object',
'description': '',
'default': None,
'anyOf': [{'type': 'array'}, {'type': 'null'}]}},
'title': None}}
Containers can also be used, both in their parameterized form (List[int]
) or as their unparameterized raw type (List
). In the latter case, the item type is mapped to object
in JSON schema.
{'name': '_list_test',
'description': 'Mandatory docstring',
'input_schema': {'type': 'object',
'properties': {'l': {'type': 'array',
'description': '',
'items': {'type': 'integer'}}},
'title': None,
'required': ['l']}}
{'name': '_raw_list_test',
'description': 'Mandatory docstring',
'input_schema': {'type': 'object',
'properties': {'l': {'type': 'array',
'description': '',
'items': {'type': 'object'}}},
'title': None,
'required': ['l']}}
The same applies to dictionary, which can similarly be parameterized with key/value types or specified as a raw type.
{'name': '_dict_test',
'description': 'Mandatory docstring',
'input_schema': {'type': 'object',
'properties': {'d': {'type': 'object',
'description': '',
'additionalProperties': {'type': 'integer'}}},
'title': None,
'required': ['d']}}
In language model clients it’s often useful to have a ‘code interpreter’ – this is something that runs code, and generally outputs the result of the last expression (i.e like IPython or Jupyter).
In this section we’ll create the python
function, which executes a string as Python code, with an optional timeout. If the last line is an expression, we’ll return that – just like in IPython or Jupyter, but without needing them installed.
def _copy_loc(new, orig):
"Copy location information from original node to new node and all children."
new = ast.copy_location(new, orig)
for field, o in ast.iter_fields(new):
if isinstance(o, ast.AST): setattr(new, field, _copy_loc(o, orig))
elif isinstance(o, list): setattr(new, field, [_copy_loc(value, orig) for value in o])
return new
This is an internal function that’s needed for _run
to ensure that location information is available in the abstract syntax tree (AST), since otherwise python complains.
def _run(code:str ):
"Run `code`, returning final expression (similar to IPython)"
tree = ast.parse(code)
last_node = tree.body[-1] if tree.body else None
# If the last node is an expression, modify the AST to capture the result
if isinstance(last_node, ast.Expr):
tgt = [ast.Name(id='_result', ctx=ast.Store())]
assign_node = ast.Assign(targets=tgt, value=last_node.value)
tree.body[-1] = _copy_loc(assign_node, last_node)
compiled_code = compile(tree, filename='<ast>', mode='exec')
namespace = {}
stdout_buffer = io.StringIO()
saved_stdout = sys.stdout
sys.stdout = stdout_buffer
try: exec(compiled_code, namespace)
finally: sys.stdout = saved_stdout
_result = namespace.get('_result', None)
if _result is not None: return _result
return stdout_buffer.getvalue().strip()
This is the internal function used to actually run the code – we pull off the last AST to see if it’s an expression (i.e something that returns a value), and if so, we store it to a special _result
variable so we can return it.
We now have the machinery needed to create our python
function.
python (code, timeout=5)
Executes python code
with timeout
and returning final expression (similar to IPython). Raised exceptions are returned as a string, with a stack trace.
Type | Default | Details | |
---|---|---|---|
code | Code to execute | ||
timeout | int | 5 | Maximum run time in seconds before a TimeoutError is raised |
def python(code, # Code to execute
timeout=5 # Maximum run time in seconds before a `TimeoutError` is raised
): # Result of last node, if it's an expression, or `None` otherwise
"""Executes python `code` with `timeout` and returning final expression (similar to IPython).
Raised exceptions are returned as a string, with a stack trace."""
def handler(*args): raise TimeoutError()
signal.signal(signal.SIGALRM, handler)
signal.alarm(timeout)
try: return _run(code)
except Exception as e: return traceback.format_exc()
finally: signal.alarm(0)
There’s no builtin security here – you should generally use this in a sandbox, or alternatively prompt before running code. It can handle multiline function definitions, and pretty much any other normal Python syntax.
python("""def factorial(n):
if n == 0 or n == 1: return 1
else: return n * factorial(n-1)
factorial(5)""")
120
If the code takes longer than timeout
then it raises a TimeoutError
.
Many LLM API providers offer tool calling where an LLM can choose to call a given tool. This is also helpful for structured outputs since the response from the LLM is contrained to the required arguments of the tool.
This section will be dedicated to helper functions for calling tools. We don’t want to allow LLMs to call just any possible function (that would be a security disaster!) so we create a namespace – that is, a dictionary of allowable function names to call.
mk_ns (*funcs_or_objs)
{'subs': <function __main__.Dummy.subs(a, b)>,
'mults': <bound method Dummy.mults of <class '__main__.Dummy'>>,
'Dummy': __main__.Dummy}
{'__call__': <bound method Dummy.__call__ of <__main__.Dummy object>>,
'__init__': <bound method Dummy.__init__ of <__main__.Dummy object>>,
'mults': <bound method Dummy.mults of <class '__main__.Dummy'>>,
'sums': <bound method Dummy.sums of <__main__.Dummy object>>,
'subs': <staticmethod(<function Dummy.subs>)>}
call_func (fc_name, fc_inputs, ns)
Call the function fc_name
with the given fc_inputs
using namespace ns
.
Now when we an LLM responses with the tool to use and its inputs, we can simply use the same namespace it was given to look up the tool and call it.