From 20053acd74d5b1f1972d51c9342a57732269dc4d Mon Sep 17 00:00:00 2001 From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com> Date: Mon, 26 Jan 2026 17:16:29 +0000 Subject: [PATCH] fix: pass session_id via extra_body in agent.completions.create - Update all agent.completions.create calls to use extra_body={'session_id': session_id} instead of passing session_id as a direct kwarg - Bump version to 0.5.2 Co-Authored-By: Sudeep Pillai --- vlmrun/cli/_cli/chat.py | 8 +++++--- vlmrun/version.py | 2 +- 2 files changed, 6 insertions(+), 4 deletions(-) diff --git a/vlmrun/cli/_cli/chat.py b/vlmrun/cli/_cli/chat.py index 7790a4f..1741b1e 100644 --- a/vlmrun/cli/_cli/chat.py +++ b/vlmrun/cli/_cli/chat.py @@ -598,6 +598,7 @@ def chat( response_content = "" usage_data: Optional[Dict[str, Any]] = None response_id: Optional[str] = None + extra_body: Optional[Dict[str, Any]] = {"session_id": session_id} if session_id else None start_time = time.time() @@ -612,11 +613,12 @@ def chat( ), handle_api_errors(), ): + response = client.agent.completions.create( model=model, messages=messages, stream=False, - session_id=session_id, + extra_body=extra_body, ) else: # JSON output: no status messages, just make the API call @@ -625,7 +627,7 @@ def chat( model=model, messages=messages, stream=False, - session_id=session_id, + extra_body=extra_body, ) latency_s = time.time() - start_time @@ -683,7 +685,7 @@ def chat( model=model, messages=messages, stream=True, - session_id=session_id, + extra_body=extra_body, ) # Collect streaming content and usage data diff --git a/vlmrun/version.py b/vlmrun/version.py index dd9b22c..7225152 100644 --- a/vlmrun/version.py +++ b/vlmrun/version.py @@ -1 +1 @@ -__version__ = "0.5.1" +__version__ = "0.5.2"