Commit 22a63aa

authored

Adding tool input and output guardrails (#1792)

- This PR was started from [PR 1606: ToolGuardrails](#1606)
- It adds input and output guardrails at the tool level which can trigger `ToolInputGuardrailTripwireTriggered` and `ToolOutputGuardrailTripwireTriggered` exceptions
- It includes updated documentation, a runnable example, and unit tests
- `make check` and unit tests all pass

## Edits since last review:

- Extracted nested tool running logic in `_run_impl.py`
- Added rejecting tool call or tool call output and returning a message to the model (rather than only raising an exception)
- Added the tool guardrail results to the `RunResult`
- Removed docs

1 parent c02d863, commit 22a63aa (Copy full SHA for 22a63aa)

File tree

12 files changed

+1309

-21

lines changed

docs
- guardrails.md
examples/basic
- tool_guardrails.py
src/agents
tests
- extensions/memory
  - test_advanced_sqlite_session.py
- test_result_cast.py
- test_tool_guardrails.py

12 files changed

+1309

-21

lines changed

`‎docs/guardrails.md‎`

Lines changed: 1 addition & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -151,4 +151,4 @@ async def main():`
`151`	`151`	`1. This is the actual agent's output type.`
`152`	`152`	`2. This is the guardrail's output type.`
`153`	`153`	`3. This is the guardrail function that receives the agent's output, and returns the result.`
`154`		`-4. This is the actual agent that defines the workflow.`
	`154`	`+4. This is the actual agent that defines the workflow.`

`‎examples/basic/tool_guardrails.py‎`

Lines changed: 171 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,171 @@`
	`1`	`+importasyncio`
	`2`	`+importjson`
	`3`	`+`
	`4`	`+fromagentsimport (`
	`5`	`+Agent,`
	`6`	`+Runner,`
	`7`	`+ToolGuardrailFunctionOutput,`
	`8`	`+ToolInputGuardrailData,`
	`9`	`+ToolOutputGuardrailData,`
	`10`	`+ToolOutputGuardrailTripwireTriggered,`
	`11`	`+function_tool,`
	`12`	`+tool_input_guardrail,`
	`13`	`+tool_output_guardrail,`
	`14`	`+)`
	`15`	`+`
	`16`	`+`
	`17`	`+@function_tool`
	`18`	`+defsend_email(to:str,subject:str,body:str)->str:`
	`19`	`+"""Send an email to the specified recipient."""`
	`20`	`+returnf"Email sent to{to} with subject '{subject}'"`
	`21`	`+`
	`22`	`+`
	`23`	`+@function_tool`
	`24`	`+defget_user_data(user_id:str)->dict[str,str]:`
	`25`	`+"""Get user data by ID."""`
	`26`	`+# Simulate returning sensitive data`
	`27`	`+return {`
	`28`	`+"user_id":user_id,`
	`29`	`+"name":"John Doe",`
	`30`	`+"email":"john@example.com",`
	`31`	`+"ssn":"123-45-6789",# Sensitive data that should be blocked!`
	`32`	`+"phone":"555-1234",`
	`33`	`+ }`
	`34`	`+`
	`35`	`+`
	`36`	`+@function_tool`
	`37`	`+defget_contact_info(user_id:str)->dict[str,str]:`
	`38`	`+"""Get contact info by ID."""`
	`39`	`+return {`
	`40`	`+"user_id":user_id,`
	`41`	`+"name":"Jane Smith",`
	`42`	`+"email":"jane@example.com",`
	`43`	`+"phone":"555-1234",`
	`44`	`+ }`
	`45`	`+`
	`46`	`+`
	`47`	`+@tool_input_guardrail`
	`48`	`+defreject_sensitive_words(data:ToolInputGuardrailData)->ToolGuardrailFunctionOutput:`
	`49`	`+"""Reject tool calls that contain sensitive words in arguments."""`
	`50`	`+try:`
	`51`	`+args=json.loads(data.context.tool_arguments)ifdata.context.tool_argumentselse {}`
	`52`	`+exceptjson.JSONDecodeError:`
	`53`	`+returnToolGuardrailFunctionOutput(output_info="Invalid JSON arguments")`
	`54`	`+`
	`55`	`+# Check for suspicious content`
	`56`	`+sensitive_words= [`
	`57`	`+"password",`
	`58`	`+"hack",`
	`59`	`+"exploit",`
	`60`	`+"malware",`
	`61`	`+"ACME",`
	`62`	`+ ]`
	`63`	`+forkey,valueinargs.items():`
	`64`	`+value_str=str(value).lower()`
	`65`	`+forwordinsensitive_words:`
	`66`	`+ifword.lower()invalue_str:`
	`67`	`+# Reject tool call and inform the model the function was not called`
	`68`	`+returnToolGuardrailFunctionOutput.reject_content(`
	`69`	`+message=f"🚨 Tool call blocked: contains '{word}'",`
	`70`	`+output_info={"blocked_word":word,"argument":key},`
	`71`	`+ )`
	`72`	`+`
	`73`	`+returnToolGuardrailFunctionOutput(output_info="Input validated")`
	`74`	`+`
	`75`	`+`
	`76`	`+@tool_output_guardrail`
	`77`	`+defblock_sensitive_output(data:ToolOutputGuardrailData)->ToolGuardrailFunctionOutput:`
	`78`	`+"""Block tool outputs that contain sensitive data."""`
	`79`	`+output_str=str(data.output).lower()`
	`80`	`+`
	`81`	`+# Check for sensitive data patterns`
	`82`	`+if"ssn"inoutput_stror"123-45-6789"inoutput_str:`
	`83`	`+# Use raise_exception to halt execution completely for sensitive data`
	`84`	`+returnToolGuardrailFunctionOutput.raise_exception(`
	`85`	`+output_info={"blocked_pattern":"SSN","tool":data.context.tool_name},`
	`86`	`+ )`
	`87`	`+`
	`88`	`+returnToolGuardrailFunctionOutput(output_info="Output validated")`
	`89`	`+`
	`90`	`+`
	`91`	`+@tool_output_guardrail`
	`92`	`+defreject_phone_numbers(data:ToolOutputGuardrailData)->ToolGuardrailFunctionOutput:`
	`93`	`+"""Reject function output containing phone numbers."""`
	`94`	`+output_str=str(data.output)`
	`95`	`+if"555-1234"inoutput_str:`
	`96`	`+returnToolGuardrailFunctionOutput.reject_content(`
	`97`	`+message="User data not retrieved as it contains a phone number which is restricted.",`
	`98`	`+output_info={"redacted":"phone_number"},`
	`99`	`+ )`
	`100`	`+returnToolGuardrailFunctionOutput(output_info="Phone number check passed")`
	`101`	`+`
	`102`	`+`
	`103`	`+# Apply guardrails to tools`
	`104`	`+send_email.tool_input_guardrails= [reject_sensitive_words]`
	`105`	`+get_user_data.tool_output_guardrails= [block_sensitive_output]`
	`106`	`+get_contact_info.tool_output_guardrails= [reject_phone_numbers]`
	`107`	`+`
	`108`	`+agent=Agent(`
	`109`	`+name="Secure Assistant",`
	`110`	`+instructions="You are a helpful assistant with access to email and user data tools.",`
	`111`	`+tools=[send_email,get_user_data,get_contact_info],`
	`112`	`+)`
	`113`	`+`
	`114`	`+`
	`115`	`+asyncdefmain():`
	`116`	`+print("=== Tool Guardrails Example ===\n")`
	`117`	`+`
	`118`	`+try:`
	`119`	`+# Example 1: Normal operation - should work fine`
	`120`	`+print("1. Normal email sending:")`
	`121`	`+result=awaitRunner.run(agent,"Send a welcome email to john@example.com")`
	`122`	`+print(f"✅ Successful tool execution:{result.final_output}\n")`
	`123`	`+`
	`124`	`+# Example 2: Input guardrail triggers - function tool call is rejected but execution continues`
	`125`	`+print("2. Attempting to send email with suspicious content:")`
	`126`	`+result=awaitRunner.run(`
	`127`	`+agent,"Send an email to john@example.com introducing the company ACME corp."`
	`128`	`+ )`
	`129`	`+print(f"❌ Guardrail rejected function tool call:{result.final_output}\n")`
	`130`	`+exceptExceptionase:`
	`131`	`+print(f"Error:{e}\n")`
	`132`	`+`
	`133`	`+try:`
	`134`	`+# Example 3: Output guardrail triggers - should raise exception for sensitive data`
	`135`	`+print("3. Attempting to get user data (contains SSN). Execution blocked:")`
	`136`	`+result=awaitRunner.run(agent,"Get the data for user ID user123")`
	`137`	`+print(f"✅ Successful tool execution:{result.final_output}\n")`
	`138`	`+exceptToolOutputGuardrailTripwireTriggeredase:`
	`139`	`+print("🚨 Output guardrail triggered: Execution halted for sensitive data")`
	`140`	`+print(f"Details:{e.output.output_info}\n")`
	`141`	`+`
	`142`	`+try:`
	`143`	`+# Example 4: Output guardrail triggers - reject returning function tool output but continue execution`
	`144`	`+print("4. Rejecting function tool output containing phone numbers:")`
	`145`	`+result=awaitRunner.run(agent,"Get contact info for user456")`
	`146`	`+print(f"❌ Guardrail rejected function tool output:{result.final_output}\n")`
	`147`	`+exceptExceptionase:`
	`148`	`+print(f"Error:{e}\n")`
	`149`	`+`
	`150`	`+`
	`151`	`+if__name__=="__main__":`
	`152`	`+asyncio.run(main())`
	`153`	`+`
	`154`	`+"""`
	`155`	`+Example output:`
	`156`	`+`
	`157`	`+=== Tool Guardrails Example ===`
	`158`	`+`
	`159`	`+1. Normal email sending:`
	`160`	`+✅ Successful tool execution: I've sent a welcome email to john@example.com with an appropriate subject and greeting message.`
	`161`	`+`
	`162`	`+2. Attempting to send email with suspicious content:`
	`163`	`+❌ Guardrail rejected function tool call: I'm unable to send the email as mentioning ACME Corp. is restricted.`
	`164`	`+`
	`165`	`+3. Attempting to get user data (contains SSN). Execution blocked:`
	`166`	`+🚨 Output guardrail triggered: Execution halted for sensitive data`
	`167`	`+ Details: {'blocked_pattern': 'SSN', 'tool': 'get_user_data'}`
	`168`	`+`
	`169`	`+4. Rejecting function tool output containing sensitive data:`
	`170`	`+❌ Guardrail rejected function tool output: I'm unable to retrieve the contact info for user456 because it contains restricted information.`
	`171`	`+"""`

`‎src/agents/__init__.py‎`

Lines changed: 24 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -21,6 +21,8 @@`
`21`	`21`	`ModelBehaviorError,`
`22`	`22`	`OutputGuardrailTripwireTriggered,`
`23`	`23`	`RunErrorDetails,`
	`24`	`+ToolInputGuardrailTripwireTriggered,`
	`25`	`+ToolOutputGuardrailTripwireTriggered,`
`24`	`26`	`UserError,`
`25`	`27`	`)`
`26`	`28`	`from .guardrailimport (`
`@@ -83,6 +85,17 @@`
`83`	`85`	`default_tool_error_function,`
`84`	`86`	`function_tool,`
`85`	`87`	`)`
	`88`	`+from .tool_guardrailsimport (`
	`89`	`+ToolGuardrailFunctionOutput,`
	`90`	`+ToolInputGuardrail,`
	`91`	`+ToolInputGuardrailData,`
	`92`	`+ToolInputGuardrailResult,`
	`93`	`+ToolOutputGuardrail,`
	`94`	`+ToolOutputGuardrailData,`
	`95`	`+ToolOutputGuardrailResult,`
	`96`	`+tool_input_guardrail,`
	`97`	`+tool_output_guardrail,`
	`98`	`+)`
`86`	`99`	`from .tracingimport (`
`87`	`100`	`AgentSpanData,`
`88`	`101`	`CustomSpanData,`
`@@ -191,6 +204,8 @@ def enable_verbose_stdout_logging():`
`191`	`204`	`"AgentsException",`
`192`	`205`	`"InputGuardrailTripwireTriggered",`
`193`	`206`	`"OutputGuardrailTripwireTriggered",`
	`207`	`+"ToolInputGuardrailTripwireTriggered",`
	`208`	`+"ToolOutputGuardrailTripwireTriggered",`
`194`	`209`	`"DynamicPromptFunction",`
`195`	`210`	`"GenerateDynamicPromptData",`
`196`	`211`	`"Prompt",`
`@@ -204,6 +219,15 @@ def enable_verbose_stdout_logging():`
`204`	`219`	`"GuardrailFunctionOutput",`
`205`	`220`	`"input_guardrail",`
`206`	`221`	`"output_guardrail",`
	`222`	`+"ToolInputGuardrail",`
	`223`	`+"ToolOutputGuardrail",`
	`224`	`+"ToolGuardrailFunctionOutput",`
	`225`	`+"ToolInputGuardrailData",`
	`226`	`+"ToolInputGuardrailResult",`
	`227`	`+"ToolOutputGuardrailData",`
	`228`	`+"ToolOutputGuardrailResult",`
	`229`	`+"tool_input_guardrail",`
	`230`	`+"tool_output_guardrail",`
`207`	`231`	`"handoff",`
`208`	`232`	`"Handoff",`
`209`	`233`	`"HandoffInputData",`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commit 22a63aa

File tree

12 files changed

12 files changed

`‎docs/guardrails.md‎`

`‎examples/basic/tool_guardrails.py‎`

`‎src/agents/__init__.py‎`

0 commit comments

Movatterモバイル変換

File tree

12 files changed

12 files changed

‎docs/guardrails.md‎

‎examples/basic/tool_guardrails.py‎

‎src/agents/__init__.py‎

0 commit comments

`‎docs/guardrails.md‎`

`‎examples/basic/tool_guardrails.py‎`

`‎src/agents/__init__.py‎`