mirror of
https://github.com/NousResearch/hermes-agent.git
synced 2026-05-18 04:41:56 +00:00
fix(gateway): forward image attachments to background agent tasks
When the gateway spawned a background agent (e.g. for delegation), media URLs and types from the originating message weren't forwarded — the bg agent saw the prompt but no attached images. Vision-enabled tasks effectively lost their inputs. Forwards media_urls/media_types through the bg-task spawn path and runs the same vision-enrichment step the main flow uses, so the bg agent gets image descriptions inlined into its prompt. Closes #25614. Salvage of #25603 by @oxngon (manually re-applied — original branch was severely stale against current main).
This commit is contained in:
parent
a952ca3ff6
commit
3adde245b7
1 changed files with 29 additions and 1 deletions
|
|
@ -10355,6 +10355,10 @@ class GatewayRunner:
|
|||
|
||||
event_message_id = self._reply_anchor_for_event(event)
|
||||
|
||||
# Forward image/audio attachments so the background agent can see them.
|
||||
media_urls = list(event.media_urls) if event.media_urls else []
|
||||
media_types = list(event.media_types) if event.media_types else []
|
||||
|
||||
# Fire-and-forget the background task
|
||||
_task = asyncio.create_task(
|
||||
self._run_background_task(
|
||||
|
|
@ -10362,6 +10366,8 @@ class GatewayRunner:
|
|||
source,
|
||||
task_id,
|
||||
event_message_id=event_message_id,
|
||||
media_urls=media_urls,
|
||||
media_types=media_types,
|
||||
)
|
||||
)
|
||||
self._background_tasks.add(_task)
|
||||
|
|
@ -10376,10 +10382,15 @@ class GatewayRunner:
|
|||
source: "SessionSource",
|
||||
task_id: str,
|
||||
event_message_id: Optional[str] = None,
|
||||
media_urls: Optional[List[str]] = None,
|
||||
media_types: Optional[List[str]] = None,
|
||||
) -> None:
|
||||
"""Execute a background agent task and deliver the result to the chat."""
|
||||
from run_agent import AIAgent
|
||||
|
||||
media_urls = media_urls or []
|
||||
media_types = media_types or []
|
||||
|
||||
adapter = self.adapters.get(source.platform)
|
||||
if not adapter:
|
||||
logger.warning("No adapter for platform %s in background task %s", source.platform, task_id)
|
||||
|
|
@ -10415,6 +10426,23 @@ class GatewayRunner:
|
|||
self._service_tier = self._load_service_tier()
|
||||
turn_route = self._resolve_turn_agent_config(prompt, model, runtime_kwargs)
|
||||
|
||||
# Enrich the prompt with image descriptions so the background
|
||||
# agent can see user-attached images (same as the main flow).
|
||||
enriched_prompt = prompt
|
||||
if media_urls:
|
||||
image_paths = []
|
||||
for i, path in enumerate(media_urls):
|
||||
mtype = media_types[i] if i < len(media_types) else ""
|
||||
if mtype.startswith("image/"):
|
||||
image_paths.append(path)
|
||||
if image_paths:
|
||||
try:
|
||||
enriched_prompt = await self._enrich_message_with_vision(
|
||||
prompt, image_paths,
|
||||
)
|
||||
except Exception as e:
|
||||
logger.warning("Background task vision enrichment failed: %s", e)
|
||||
|
||||
def run_sync():
|
||||
agent = AIAgent(
|
||||
model=turn_route["model"],
|
||||
|
|
@ -10446,7 +10474,7 @@ class GatewayRunner:
|
|||
)
|
||||
try:
|
||||
return agent.run_conversation(
|
||||
user_message=prompt,
|
||||
user_message=enriched_prompt,
|
||||
task_id=task_id,
|
||||
)
|
||||
finally:
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue