
    Ji/                    	   U d Z ddlZddlZddlZddlZddlZddlmZ ddlm	Z	 ddl
mZmZmZmZmZ ddlmZ ddlmZ ddlmZ dd	lmZ  ej        e          Zd
ddddddddd	Zeeef         ed<   ddddZddgiZda e!ed<   dZ"dZ#dZ$dZ% e            dz  Z&dZ'd Z(d!ed"ee!ee         f         fd#Z)d$ed"efd%Z*dd$ed'ed"efd(Z+d)ed"efd*Z, G d+ d,          Z- G d- d.          Z. G d/ d0          Z/ G d1 d2          Z0 G d3 d4          Z1 G d5 d6          Z2 G d7 d8          Z3 G d9 d:          Z4 G d; d<          Z5 G d= d>          Z6 G d? d@          Z7 G dA dB          Z8d"ee9         fdCZ:d!e9d"efdDZ;d"efdEZ<d"ee         fdFZ=d"eee         ee         f         fdGZ>ddHed"efdIZ?dHedJed"ee         fdKZ@d"eee         ee         f         fdLZAd"eee         ee         f         fdMZBd"efdNZCd"eee         ee         f         fdOZDd"efdPZEd"eee         ee         f         fdQZFd"eee         ee         f         fdRZGd"eee         ee         f         fdSZHdTed"eee         ee         f         fdUZIdVdWdXdYdZd[ZJd"eee         ee         f         fd\ZKd]efd^ZL	 	 	 	 	 dd!ed]ed_e!d`e!daedbed"eee         ee         f         fdcZMddHed"eee         ee         f         fddZNddHefdeZOdfZPd!ee         d"efdgZQd!ed"eee         ee         f         fdhZRd!ed"e!fdiZSd"ee         fdjZTd"ee         fdkZU	 	 dddddld!ee         d]ee         dmee         dnee         d_e!d"eee         ee         ee         f         fdoZVd"eee         ee         f         fdpZWdq ZXd"e9fdrZYdseZd"e9fdtZ[i Z\ee]e]f         edu<    ej^                    Z_ddvZ`dwed"dfdxZaddyZbddzZc	 	 	 	 dd!ed]ed_e!dmedned"eee         ee         f         fd{Zd	 	 	 	 	 ddHed!ed]edmedned"eeee         ee         ee         f         fd|Zed}ZfeffdHed~egd"egfdZh	 	 	 	 	 	 dd!ed]edeideeg         deeZ         deei         degdee9         dmee         d"e9fdZj	 ddddddddddd	dHed!ed]edmednedeidegdeZdeidegde9d"efdZkd"efdZl	 ddddddddddd	dHed!ed]edmednedeidegdeZdeidegde9d"efdZmdS )a=  Shared auxiliary client router for side tasks.

Provides a single resolution chain so every consumer (context compression,
session search, web extraction, vision analysis, browser vision) picks up
the best available backend without duplicating fallback logic.

Resolution order for text tasks (auto mode):
  1. OpenRouter  (OPENROUTER_API_KEY)
  2. Nous Portal (~/.hermes/auth.json active provider)
  3. Custom endpoint (config.yaml model.base_url + OPENAI_API_KEY)
  4. Codex OAuth (Responses API via chatgpt.com with gpt-5.3-codex,
     wrapped to look like a chat.completions client)
  5. Native Anthropic
  6. Direct API-key providers (z.ai/GLM, Kimi/Moonshot, MiniMax, MiniMax-CN)
  7. None

Resolution order for vision/multimodal tasks (auto mode):
  1. Selected main provider, if it is one of the supported vision backends below
  2. OpenRouter
  3. Nous Portal
  4. Codex OAuth (gpt-5.3-codex supports vision via Responses API)
  5. Native Anthropic
  6. Custom endpoint (for local vision models: Qwen-VL, LLaVA, Pixtral, etc.)
  7. None

Per-task provider overrides (e.g. AUXILIARY_VISION_PROVIDER,
CONTEXT_COMPRESSION_PROVIDER) can force a specific provider for each task.
Default "auto" follows the chains above.

Per-task model overrides (e.g. AUXILIARY_VISION_MODEL,
AUXILIARY_WEB_EXTRACT_MODEL) let callers use a different model slug
than the provider's default.

Per-task direct endpoint overrides (e.g. AUXILIARY_VISION_BASE_URL,
AUXILIARY_VISION_API_KEY) let callers route a specific auxiliary task to a
custom OpenAI-compatible endpoint without touching the main model settings.
    N)Path)SimpleNamespace)AnyDictListOptionalTuple)OpenAI)	load_pool)get_hermes_home)OPENROUTER_BASE_URLzglm-4.5-flashzkimi-k2-turbo-previewzMiniMax-M2.7-highspeedclaude-haiku-4-5-20251001zgoogle/gemini-3-flashgemini-3-flashzglm-5zgoogle/gemini-3-flash-preview)	zaizkimi-codingminimaxz
minimax-cn	anthropicz
ai-gatewayzopencode-zenzopencode-gokilocode_API_KEY_PROVIDER_AUX_MODELSz%https://hermes-agent.nousresearch.comzHermes Agentzproductivity,cli-agent)zHTTP-RefererzX-OpenRouter-TitlezX-OpenRouter-Categoriestagsproduct=hermes-agentFauxiliary_is_nousz)https://inference-api.nousresearch.com/v1zhttps://api.anthropic.comz	auth.jsonzgpt-5.2-codexz%https://chatgpt.com/backend-api/codexproviderreturnc                 R   	 t          |           }n4# t          $ r'}t                              d| |           Y d}~dS d}~ww xY w|r|                                sdS 	 d|                                fS # t          $ r'}t                              d| |           Y d}~dS d}~ww xY w)z2Return (pool_exists_for_provider, selected_entry).z0Auxiliary client: could not load pool for %s: %sN)FNTz8Auxiliary client: could not select pool entry for %s: %s)TN)r   	Exceptionloggerdebughas_credentialsselect)r   poolexcs      3/home/ubuntu/hermes-agent/agent/auxiliary_client.py_select_pool_entryr#   d   s    ""   GSVWWW{{{{{  t++-- {T[[]]""   OQY[^___zzzzzs*    
A>AA5 5
B&?B!!B&entryc                     | dS t          | dd           pt          | dd          }t          |pd                                          S )N runtime_api_keyaccess_token)getattrstrstrip)r$   keys     r"   _pool_runtime_api_keyr-   t   sN    }r %*D
1
1
WWUNTV5W5WCsyb>>!!!    r&   fallbackc                 H   | 6t          |pd                                                              d          S t          | dd           p#t          | dd           pt          | dd           p|}t          |pd                                                              d          S )Nr&   /runtime_base_urlinference_base_urlbase_url)r*   r+   rstripr)   )r$   r/   urls      r"   _pool_runtime_base_urlr7   }   s    }8>r""((**11#666 	)400 	5.55	5*d++	 	  syb>>!!((---r.   contentc                 8   t          | t                    r| S t          | t                    s| rt          |           ndS g }| D ]R}t          |t                    s|                    dd          }|dk    r-|                    d|                    dd          d           b|dk    r|                    di           }t          |t                    r|                    dd          nt          |          }d|d	}t          |t                    r|                    d
          nd}|r||d
<   |                    |           |dv r|                    |           "|                    dd          }|r|                    d|d           T|pdS )a  Convert chat.completions content to Responses API format.

    chat.completions uses:
      {"type": "text", "text": "..."}
      {"type": "image_url", "image_url": {"url": "data:image/png;base64,..."}}

    Responses API uses:
      {"type": "input_text", "text": "..."}
      {"type": "input_image", "image_url": "data:image/png;base64,..."}

    If content is a plain string, it's returned as-is (the Responses API
    accepts strings directly for text-only messages).
    r&   typetext
input_text)r:   r;   	image_urlr6   input_image)r:   r=   detailN)r<   r>   )
isinstancer*   listdictgetappend)	r8   	convertedpartptype
image_datar6   r$   r?   r;   s	            r"   _convert_content_for_responsesrI      s    '3 gt$$ /&.s7|||B.&(I G G$%% 	$$F??lDHHVR<P<PQQRRRRk!!+r22J/9*d/K/K`*..+++QTU_Q`Q`C-:$M$ME1;J1M1MWZ^^H---SWF )"(hU####333T"""" 88FB''D G  ,!E!EFFF?r.   c                   .    e Zd ZdZdedefdZdefdZdS )_CodexCompletionsAdapterzyDrop-in shim that accepts chat.completions.create() kwargs and
    routes them through the Codex Responses streaming API.real_clientmodelc                 "    || _         || _        d S N)_client_model)selfrL   rM   s      r"   __init__z!_CodexCompletionsAdapter.__init__   s    "r.   r   c                 <   |                     dg           }|                     d| j                  }|                     d          }d}g }|D ]}|                     dd          }|                     d          pd}	|d	k    r't          |	t                    r|	nt          |	          }\|                    |t          |	          d
           |||pddd
gdd}
|                     d          }|rg }|D ]}t          |t                    r|                     di           ni }|                     d          }|sG|                    d||                     dd          |                     di           d           |r||
d<   g }g }d }	  | j        j        j	        d+i |
5 }|D ]}|
                                }d d d            n# 1 swxY w Y   t          |dg           D ]}t          |dd           }|dk    rNt          |dg           D ];}t          |dd           }|dv r$|                    t          |dd                     <g|dk    ra|                    t          t          |dd          dt          t          |dd          t          |dd                                         t          |dd           }|r?t          t          |dd           t          |d!d           t          |d"d           #          }n.# t          $ r!}t                              d$|            d }~ww xY wd                    |                                          pd }	t          d%|	|pd &          }t          d ||sd'nd()          }t          |g||*          S ),NmessagesrM   temperaturezYou are a helpful assistant.roleuserr8   r&   system)rW   r8   F)rM   instructionsinputstoretoolsfunctionnamedescription
parameters)r:   r_   r`   ra   outputr:   message)output_textr;   r;   function_callcall_id	argumentsz{})r_   rg   )idr:   r^   usageinput_tokensr   output_tokenstotal_tokensprompt_tokenscompletion_tokensrl   z-Codex auxiliary Responses API call failed: %s	assistant)rW   r8   
tool_callsstoprq   indexrc   finish_reasonchoicesrM   ri    )rC   rQ   r@   r*   rD   rI   rB   rP   	responsesstreamget_final_responser)   r   r   r   r   joinr+   )rR   kwargsrU   rM   rV   rZ   
input_msgsmsgrW   r8   resp_kwargsr]   rE   tfnr_   
text_partstool_calls_rawri   rz   _eventfinalitem	item_typerF   rG   
resp_usager!   rc   choices                                 r"   createz_CodexCompletionsAdapter.create   s   ::j"--

7DK00jj//
 6+-
 		 		C7766**Dggi((.BGx*4Wc*B*BTwwG!! =gFF# #     (DV$C$C#D	'
 '
 

7## 	1I 
 
.8D.A.AIQUU:r***rvvf~~   & #%66-#<#<"$&&r":":	" "      1'0G$ !#
$&!	.'.==== 4$  F11334 4 4 4 4 4 4 4 4 4 4 4 4 4 4  x44  #D&$77		)) 'i < < I I 'fd ; ; $;;;&--gdFB.G.GHHHI /11"))/"4B77'!0!(vr!:!:&-dK&F&F" " "+ + +    !66J '")*na"H"H&-j/1&M&M!(^Q!G!G  
  	 	 	LLH#NNN	 ''*%%++--5 "%-
 
 

 !(6H&&L
 
 

 H
 
 
 	
s=   L
 &G L
 GL
 GD5L
 

L5L00L5N)	__name__
__module____qualname____doc__r
   r*   rS   r   r   rx   r.   r"   rK   rK      sb        > >F 3    j
# j
 j
 j
 j
 j
 j
r.   rK   c                       e Zd ZdZdefdZdS )_CodexChatShimz>Wraps the adapter to provide client.chat.completions.create().adapterc                     || _         d S rO   completionsrR   r   s     r"   rS   z_CodexChatShim.__init__9      "r.   N)r   r   r   r   rK   rS   rx   r.   r"   r   r   6  s6        HH# 8 # # # # # #r.   r   c                   (    e Zd ZdZdedefdZd ZdS )CodexAuxiliaryClientzOpenAI-client-compatible wrapper that routes through Codex Responses API.

    Consumers can call client.chat.completions.create(**kwargs) as normal.
    Also exposes .api_key and .base_url for introspection by async wrappers.
    rL   rM   c                     || _         t          ||          }t          |          | _        |j        | _        |j        | _        d S rO   )_real_clientrK   r   chatapi_keyr4   )rR   rL   rM   r   s       r"   rS   zCodexAuxiliaryClient.__init__D  s@    '*;>>"7++	"*#,r.   c                 8    | j                                          d S rO   )r   closerR   s    r"   r   zCodexAuxiliaryClient.closeK  s    !!!!!r.   N)r   r   r   r   r
   r*   rS   r   rx   r.   r"   r   r   =  sO         -F -3 - - - -" " " " "r.   r   c                   *    e Zd ZdZdefdZdefdZdS )_AsyncCodexCompletionsAdapterzAsync version of the Codex Responses adapter.

    Wraps the sync adapter via asyncio.to_thread() so async consumers
    (web_tools, session_search) can await it as normal.
    sync_adapterc                     || _         d S rO   _syncrR   r   s     r"   rS   z&_AsyncCodexCompletionsAdapter.__init__V      !


r.   r   c                 J   K   dd l } |j        | j        j        fi | d {V S Nr   asyncio	to_threadr   r   rR   r}   r   s      r"   r   z$_AsyncCodexCompletionsAdapter.createY  A      &W&tz'8CCFCCCCCCCCCr.   N)r   r   r   r   rK   rS   r   r   rx   r.   r"   r   r   O  s\         "%= " " " "D D D D D D Dr.   r   c                       e Zd ZdefdZdS )_AsyncCodexChatShimr   c                     || _         d S rO   r   r   s     r"   rS   z_AsyncCodexChatShim.__init___  r   r.   N)r   r   r   r   rS   rx   r.   r"   r   r   ^  s0        # = # # # # # #r.   r   c                       e Zd ZdZddZdS )AsyncCodexAuxiliaryClientzHAsync-compatible wrapper matching AsyncOpenAI.chat.completions.create().sync_wrapperr   c                     |j         j        }t          |          }t          |          | _         |j        | _        |j        | _        d S rO   )r   r   r   r   r   r4   rR   r   r   async_adapters       r"   rS   z"AsyncCodexAuxiliaryClient.__init__f  sA    #(45lCC'66	#+$-r.   N)r   r   )r   r   r   r   rS   rx   r.   r"   r   r   c  s.        RR. . . . . .r.   r   c                   4    e Zd ZdZd
dededefdZdefdZd	S )_AnthropicCompletionsAdapterz<OpenAI-client-compatible adapter for Anthropic Messages API.FrL   rM   is_oauthc                 0    || _         || _        || _        d S rO   )rP   rQ   	_is_oauth)rR   rL   rM   r   s       r"   rS   z%_AnthropicCompletionsAdapter.__init__q  s    "!r.   r   c           	      :   ddl m}m} |                    dg           }|                    d| j                  }|                    d          }|                    d          }|                    d          p|                    d          pd	}|                    d
          }	d }
t          |t                    r|}
nt          |t                    rkt          |                    dd                                                    }|dk    r*|                    di                               d          }
n|dv r|}
 |||||d |
| j	                  }|	|	|d
<    | j
        j        j        di |} ||          \  }}d }t          |d          rd|j        r]t          |j        dd          pd}t          |j        dd          pd}t          |j        dd          p||z   }t!          |||          }t!          d||          }t!          |g||          S )Nr   )build_anthropic_kwargsnormalize_anthropic_responserU   rM   r]   tool_choice
max_tokensmax_completion_tokensi  rV   r:   r&   r^   r_   >   autononerequired)rM   rU   r]   r   reasoning_configr   r   ri   rj   rk   rl   rm   rs   rv   rx   )agent.anthropic_adapterr   r   rC   rQ   r@   r*   rB   lowerr   rP   rU   r   hasattrri   r)   r   )rR   r}   r   r   rU   rM   r]   r   r   rV   normalized_tool_choicechoice_typeanthropic_kwargsresponseassistant_messageru   ri   rn   ro   rl   r   s                        r"   r   z#_AnthropicCompletionsAdapter.createv  s   ````````::j"--

7DK00

7##jj//ZZ--\<S1T1T\X\
jj//!%k3'' 	5%0""T** 	5koofb99::@@BBKj(()4R)H)H)L)LV)T)T&& <<<)4&11!!.^
 
 
 ".9]+/4<(/CC2BCC+G+G+Q+Q(=8W%% 	(. 	#HNNAFFK!M ' K K Pq"8>>1EEl-ZkJkL#+"3)  E !%'
 
 

 H
 
 
 	
r.   NF)	r   r   r   r   r   r*   boolrS   r   rx   r.   r"   r   r   n  sc        FF" "C " "t " " " "
7
# 7
 7
 7
 7
 7
 7
r.   r   c                       e Zd ZdefdZdS )_AnthropicChatShimr   c                     || _         d S rO   r   r   s     r"   rS   z_AnthropicChatShim.__init__  r   r.   N)r   r   r   r   rS   rx   r.   r"   r   r     s0        # < # # # # # #r.   r   c                   6    e Zd ZdZddededededef
dZd	 Zd
S )AnthropicAuxiliaryClientz@OpenAI-client-compatible wrapper over a native Anthropic client.FrL   rM   r   r4   r   c                 |    || _         t          |||          }t          |          | _        || _        || _        d S )Nr   )r   r   r   r   r   r4   )rR   rL   rM   r   r4   r   r   s          r"   rS   z!AnthropicAuxiliaryClient.__init__  s?    '.{EHUUU&w//	 r.   c                 h    t          | j        dd           }t          |          r |             d S d S )Nr   )r)   r   callable)rR   close_fns     r"   r   zAnthropicAuxiliaryClient.close  s?    4,gt<<H 	HJJJJJ	 	r.   Nr   )	r   r   r   r   r   r*   r   rS   r   rx   r.   r"   r   r     sf        JJ! !C ! !c !S !\` ! ! ! !    r.   r   c                   &    e Zd ZdefdZdefdZdS )!_AsyncAnthropicCompletionsAdapterr   c                     || _         d S rO   r   r   s     r"   rS   z*_AsyncAnthropicCompletionsAdapter.__init__  r   r.   r   c                 J   K   dd l } |j        | j        j        fi | d {V S r   r   r   s      r"   r   z(_AsyncAnthropicCompletionsAdapter.create  r   r.   N)r   r   r   r   rS   r   r   rx   r.   r"   r   r     sR        "%A " " " "D D D D D D Dr.   r   c                       e Zd ZdefdZdS )_AsyncAnthropicChatShimr   c                     || _         d S rO   r   r   s     r"   rS   z _AsyncAnthropicChatShim.__init__  r   r.   N)r   r   r   r   rS   rx   r.   r"   r   r     s0        # A # # # # # #r.   r   c                       e Zd ZddZdS )AsyncAnthropicAuxiliaryClientr   r   c                     |j         j        }t          |          }t          |          | _         |j        | _        |j        | _        d S rO   )r   r   r   r   r   r4   r   s       r"   rS   z&AsyncAnthropicAuxiliaryClient.__init__  sA    #(49,GG+M::	#+$-r.   N)r   r   )r   r   r   rS   rx   r.   r"   r   r     s(        . . . . . .r.   r   c                     t          d          \  } }| r|dS t          |dd          t          |dd          t          |dd          t          |t                    t          |dd          t          |dd          t          |d	d          t          |d
d          dd	S 	 t                                          sdS t          j        t                                                    }|	                    d          dk    rdS |	                    di           	                    di           }|	                    d          s|	                    d          sdS |S # t          $ r&}t                              d|           Y d}~dS d}~ww xY w)zRead and validate ~/.hermes/auth.json for an active Nous provider.

    Returns the provider state dict if Nous is active with tokens,
    otherwise None.
    nousNr(   r&   refresh_token	agent_keyportal_base_url	client_idscope
token_typeBearerr    )	r(   r   r   r3   r   r   r   r   sourceactive_provider	providerszCould not read Nous auth: %s)r#   r)   r7   _NOUS_DEFAULT_BASE_URL_AUTH_JSON_PATHis_filejsonloads	read_textrC   r   r   r   )pool_presentr$   datar   r!   s        r"   _read_nous_authr     s    -V44L% 
=4#E>2>>$UOTBB T::"8@V"W"W&u.?FF T::UGT22!%x@@

 

 
	
&&(( 	4z/33556688%&&&00488K,,00<<||K(( 	n1M1M 	4   3S999ttttts,   "E =AE AE E 
F%FFc                 X    |                      d          p|                      dd          S )z9Extract the best API key from a Nous provider state dict.r   r(   r&   )rC   r   s    r"   _nous_api_keyr     s'    <<$$H^R(H(HHr.   c                  6    t          j        dt                    S )z8Resolve the Nous inference base URL from env or default.NOUS_INFERENCE_BASE_URL)osgetenvr   rx   r.   r"   _nous_base_urlr    s    9.0FGGGr.   c                  &   t          d          \  } }| rt          |          }|pdS 	 ddlm}  |            }|                    di           }|                    d          }t          |t                    r|                                sdS 	 ddl}|	                    d          d         }|d	t          |           d
z  z  z  }t          j        |                    |                    }	|	                    dd          }
|
r4t          j                    |
k    rt                              d|
           dS n# t"          $ r Y nw xY w|                                S # t"          $ r&}t                              d|           Y d}~dS d}~ww xY w)zJRead a valid, non-expired Codex OAuth access token from Hermes auth store.openai-codexNr   )_read_codex_tokenstokensr(   .   =   expz-Codex access token expired (exp=%s), skippingz2Could not read Codex auth for auxiliary client: %s)r#   r-   hermes_cli.authr  rC   r@   r*   r+   base64splitlenr   r   urlsafe_b64decodetimer   r   r   )r   r$   tokenr  r   r  r(   r  payloadclaimsr  r!   s               r"   _read_codex_access_tokenr    s   ,^<<L% %e,,}666666!!##(B''zz.11,,, 	L4F4F4H4H 	4
	MMM"((--a0Gss7||ma/00GZ 8 8 A ABBF**UA&&C ty{{S((LcRRRt 	 	 	D	 !!###   I3OOOttttts=   A$E  B)D< ;E  <
E	E  E		E   
F*FFc                     	 ddl m} m} n+# t          $ r t                              d           Y dS w xY w|                                 D ]+\  }}|j        dk    r|dk    rt                      c S t          |          \  }}|rt          |          }|sNt          ||j                  p|j        }t                              |d          }t                              d|j        |           i }	d	|                                v rd
di|	d<   n)d|                                v rddlm}
  |
            |	d<   t'          d||d|	|fc S  ||          }t)          |                    dd                                                    }|sFt)          |                    dd                                                                        d          p|j        }t                              |d          }t                              d|j        |           i }	d	|                                v rd
di|	d<   n)d|                                v rddlm}
  |
            |	d<   t'          d||d|	|fc S dS )zTry each API-key provider in PROVIDER_REGISTRY order.

    Returns (client, model) for the first provider with usable runtime
    credentials, or (None, None) if none are configured.
    r   PROVIDER_REGISTRY$resolve_api_key_provider_credentialsz7Could not import PROVIDER_REGISTRY for API-key fallbackNNr   r   defaultz'Auxiliary text client: %s (%s) via poolapi.kimi.com
User-AgentKimiCLI/1.0default_headersapi.githubcopilot.comcopilot_default_headersr   r4   r&   r4   r1   zAuxiliary text client: %s (%s)rx   )r  r  r  ImportErrorr   r   items	auth_type_try_anthropicr#   r-   r7   r3   r   rC   r_   r   hermes_cli.modelsr"  r
   r*   r+   r5   )r  r  provider_idpconfigr   r$   r   r4   rM   extrar"  credss               r"   _resolve_api_key_providerr-  /  s   [[[[[[[[[   NOOOzz !2 7 7 9 9 'J 'JW	))+%%!#####0==e 	N+E22G -eW5OPPnT[TnH044[)LLELLBGLRWXXXE!1!111,8-+H'(((HNN,<,<<<EEEEEE+B+B+D+D'(F'HFFFFMMMM44[AAeii	2..//5577 	uyyR00117799@@EEcIc,00iHH5w|UKKKX^^----(4m'DE#$$$(8(888AAAAAA'>'>'@'@E#$BgBBEBBEIIII:s    $33taskc                     | radD ]^}t          j        | |                                  dd                                                                          }|r
|dk    r|c S _dS )a5  Read the provider override for a specific auxiliary task.

    Checks AUXILIARY_{TASK}_PROVIDER first (e.g. AUXILIARY_VISION_PROVIDER),
    then CONTEXT_{TASK}_PROVIDER (for the compression section's summary_provider),
    then falls back to "auto".  Returns one of: "auto", "openrouter", "nous", "main".
    
AUXILIARY_CONTEXT_	_PROVIDERr&   r   )r   r  upperr+   r   )r.  prefixvals      r"   _get_auxiliary_providerr7  i  sy      0 	 	F)v>tzz||>>>CCIIKKQQSSC sf}}


6r.   suffixc                     | sdS dD ]H}t          j        | |                                  d| d                                          }|r|c S IdS )zFRead an auxiliary env override from AUXILIARY_* or CONTEXT_* prefixes.Nr0  _r&   )r   r  r4  r+   )r.  r8  r5  r6  s       r"   _get_auxiliary_env_overrider;  x  sq     t,  i6:4::<<::&::B??EEGG 	JJJ	4r.   c                     t          d          \  } }| rgt          |          }|sdS t          |t                    pt          }t                              d           t          ||t                    t          fS t          j
        d          }|sdS t                              d           t          |t          t                    t          fS )N
openrouterr  z%Auxiliary client: OpenRouter via pool)r   r4   r  OPENROUTER_API_KEYzAuxiliary client: OpenRouter)r#   r-   r7   r   r   r   r
   _OR_HEADERS_OPENROUTER_MODELr   r  )r   r$   or_keyr4   s       r"   _try_openrouterrB    s    ,\::L% G&u-- 	:)%1DEE\I\<===fx'24 4 45FG 	G Y+,,F z
LL/000&+>#.0 0 01BC Cr.   c                  d   t                      } | sdS dat                              d           |                     d          dk    rdnt
          }t          t          |           t          |                     d          pt                                
                    d          	          |fS )
Nr  TzAuxiliary client: Nous Portalr   r    r   r3   r1   r#  )r   r   r   r   rC   _NOUS_MODELr
   r   r*   r  r5   )r   rM   s     r"   	_try_nousrE    s    D z
LL0111 $ 2 2f < <+E!$''"677K>;K;KLLSSTWXX	
 	
 	
 	 r.   c                     	 ddl m}   |             }|                    di           }t          |t                    r(|                                r|                                S t          |t                    rS|                    dd          }t          |t                    r(|                                r|                                S n# t          $ r Y nw xY wdS )zRead the user's configured main model from config.yaml.

    config.yaml model.default is the single source of truth for the active
    model. Environment variables are no longer consulted.
    r   load_configrM   r  r&   )hermes_cli.configrH  rC   r@   r*   r+   rB   r   )rH  cfg	model_cfgr  s       r"   _read_main_modelrL    s    111111kmmGGGR((	i%% 	%)//*;*; 	%??$$$i&& 	'mmIr22G'3'' 'GMMOO '}}&   2s   A"C %A'C 
CCc                  :   	 ddl m}   | d          }n3# t          $ r&}t                              d|           Y d}~dS d}~ww xY w|                    d          }|                    d	          }t          |t                    r|                                sdS |                                	                    d
          }d|
                                v rdS t          |t                    r|                                sd}||                                fS )zResolve the active custom/main endpoint the same way the main CLI does.

    This covers both env-driven OPENAI_BASE_URL setups and config-saved custom
    endpoints where the base URL lives in config.yaml instead of the live
    environment.
    r   )resolve_runtime_providercustom)	requestedz6Auxiliary client: custom runtime resolution failed: %sNr  r4   r   r1   zopenrouter.aino-key-required)hermes_cli.runtime_providerrN  r   r   r   rC   r@   r*   r+   r5   r   )rN  runtimer!   custom_base
custom_keys        r"   _resolve_custom_runtimerV    s=   HHHHHH**X>>>   MsSSSzzzzz ++j))KY''Jk3'' {/@/@/B/B z##%%,,S11K+++---- z j#&& 'j.>.>.@.@ '&

((****s    
AA  Ac                  ,    t                      \  } }| pdS )Nr&   )rV  )rT  r:  s     r"   _current_custom_base_urlrX    s    ,..NK"r.   c                      t                      \  } }| r|sdS t                      pd}t                              d|           t	          ||           |fS )Nr  gpt-4o-miniz&Auxiliary client: custom endpoint (%s)r#  )rV  rL  r   r   r
   )rT  rU  rM   s      r"   _try_custom_endpointr[    sc    577K j z/-E
LL95AAA*{;;;UBBr.   c                  V   t          d          \  } }| r0t          |          }|sdS t          |t                    pt          }nt	                      }|sdS t          }t
                              dt                     t          ||          }t          |t                    t          fS )Nr  r  z4Auxiliary client: Codex OAuth (%s via Responses API)r#  )
r#   r-   r7   _CODEX_AUX_BASE_URLr  r   r   _CODEX_AUX_MODELr
   r   )r   r$   codex_tokenr4   rL   s        r"   
_try_codexr`    s    ,^<<L% 	'+E22 	:)%1DEE\I\.00 	:&
LLGIYZZZx@@@K-=>>@PPPr.   c                     	 ddl m} m} n# t          $ r Y dS w xY wt	          d          \  }}|r|dS t          |          }nd } |            }|sdS |rt          |t                    nt          }	 ddlm	}  |            }|
                    d          }t          |t                    rt          |
                    d          pd                                                                          }	|	dk    r@|
                    d	          pd                                                    d
          }
|
r|
}n# t"          $ r Y nw xY wddl m}  ||          }t&          
                    dd          }t(                              d|||           	  | ||          }n# t          $ r Y dS w xY wt-          |||||          |fS )Nr   )build_anthropic_clientresolve_anthropic_tokenr  r   rG  rM   r   r&   r4   r1   )_is_oauth_tokenr   z8Auxiliary client: Anthropic native (%s) at %s (oauth=%s)r   )r   rb  rc  r$  r#   r-   r7   _ANTHROPIC_DEFAULT_BASE_URLrI  rH  rC   r@   rB   r*   r+   r   r5   r   rd  r   r   r   r   )rb  rc  r   r$   r  r4   rH  rJ  rK  cfg_providercfg_base_urlrd  r   rM   rL   s                  r"   r'  r'    sQ   [[[[[[[[[   zz -[99L% *=:%e,,'')) z
 NZz%e-HIII_zH111111kmmGGG$$	i&& 	,y}}Z88>B??EEGGMMOOL{** )j 9 9 ?RFFHHOOPSTT ,+H    877777u%%H(,,[:UVVE
LLKUT\^fggg,,UH==    zz	
 $KxRZ[[[]bbbs1    
3CD< <
E	E	F# #
F10F1forcedc                 "   | dk    r1t                      \  }}|t                              d           ||fS | dk    r1t                      \  }}|t                              d           ||fS | dk    r1t	                      \  }}|t                              d           ||fS | dk    rHt
          t          t          fD ]} |            \  }}|||fc S t                              d	           d
S t                              d|            d
S )zKResolve a specific forced provider.  Returns (None, None) if creds missing.r=  Nz<auxiliary.provider=openrouter but OPENROUTER_API_KEY not setr   zJauxiliary.provider=nous but Nous Portal not configured (run: hermes login)codexzKauxiliary.provider=codex but no Codex OAuth token found (run: hermes model)mainz>auxiliary.provider=main but no main endpoint credentials foundr  z3Unknown auxiliary.provider=%r, falling back to auto)rB  r   warningrE  r`  r[  r-  )rh  clientrM   try_fns       r"   _resolve_forced_providerro  /  s2   '))>NNYZZZu}!>NNghhhu}">NNhiiiu}+Z9RS 	% 	%F"FHHMFE!u}$$$ "WXXXz NNH&QQQ:r.   r=  r   zlocal/customr  zapi-key)rB  rE  r[  r`  r-  c            	         da g } t          t          t          t          t
          fD ]}t          |dd          }t                              ||          } |            \  }}|Y| r3t          
                    d||pdd                    |                      nt          
                    d||pd           ||fc S |                     |           t                              d	d                    |                      d
S )uY   Full auto-detection chain: OpenRouter → Nous → custom → Codex → API-key → None.Fr   unknownNu4   Auxiliary auto-detect: using %s (%s) — skipped: %sr  , z$Auxiliary auto-detect: using %s (%s)zAuxiliary auto-detect: no provider available (tried: %s). Compression, summarization, and memory flush will not work. Set OPENROUTER_API_KEY or configure a local model in config.yaml.r  )r   rB  rE  r[  r`  r-  r)   _AUTO_PROVIDER_LABELSrC   r   infor|   rD   rl  )triedrn  fn_namelabelrm  rM   s         r"   _resolve_autorx  Z  s$    E"I/C8:  &*i88%))'7;; _R!5#5Ityy7G7GI I I I BE5K]T]^^^5=   U
NN W 99U##% % % :r.   rM   c                    ddl m} t          | t                    rt	          |           |fS t          | t
                    rt          |           |fS | j        t          | j	                  d}t          | j	                  
                                }d|v rt          t                    |d<   n#d|v rddlm}  |            |d<   nd|v rd	d
i|d<    |di ||fS )zIConvert a sync client to its async counterpart, preserving Codex routing.r   )AsyncOpenAIr#  r=  r  r   r!  r  r  r  rx   )openairz  r@   r   r   r   r   r   r*   r4   r   rB   r?  r(  r"  )sync_clientrM   rz  async_kwargs
base_lowerr"  s         r"   _to_async_clientr  ~  s,   """"""+344 =(55u<<+788 A,[995@@ &,-- L [)**0022Jz!!*.{*;*;&''	 J	.	.======*A*A*C*C&''	:	%	%+7*G&';&&&&--r.   
async_mode	raw_codexexplicit_base_urlexplicit_api_keyc                    | pd                                                                 } | dk    rd} | dk    rd} | dk    rYt                      \  }}|dS |r(d|v r$|r"d|vrt                              d	||           d}|p|}|rt          ||          n||fS | d
k    rIt                      \  }}	|t                              d           dS |p|	}|rt          ||          n||fS | dk    rIt                      \  }}	|t                              d           dS |p|	}|rt          ||          n||fS | dk    r|rOt                      }
|
st                              d           dS |pt          }t          |
t                    }||fS t                      \  }}	|t                              d           dS |p|	}|rt          ||          n||fS | dk    r
|r|                                 }|pd                                 p(t          j        dd                                           pd}|st                              d           dS |pt!                      pd}t          ||          }|rt          ||          n||fS t"          t          t$          fD ]-} |            \  }}	||p|	}|rt          ||          n||fc S .t                              d           dS 	 ddlm}m} n,# t,          $ r t                              d|            Y dS w xY w|                    |           }|t                              d|            dS |j        dk    r| dk    rIt3                      \  }}|t                              d           dS |p|}|rt          ||          n||fS  ||           }t5          |                    dd                                                     }|s`t7          |j                  }| dk    r|                    d           t                              d| d                     |                     dS t5          |                    d!d                                                                         d          p|j         }tB                              | d          }|p|}i }d"|                                v rd#|d$<   n9d%|                                v r#dd&l"m#} |$                     |                       t          d,||d|rd'|ini }t                              d(| |           |rt          ||          n||fS |j        d)v rK| dk    rtK          d||          S | dk    rtK          d||          S t                              d*|            dS t                              d+|j        |            dS )-u  Central router: given a provider name and optional model, return a
    configured client with the correct auth, base URL, and API format.

    The returned client always exposes ``.chat.completions.create()`` — for
    Codex/Responses API providers, an adapter handles the translation
    transparently.

    Args:
        provider: Provider identifier.  One of:
            "openrouter", "nous", "openai-codex" (or "codex"),
            "zai", "kimi-coding", "minimax", "minimax-cn",
            "custom" (OPENAI_BASE_URL + OPENAI_API_KEY),
            "auto" (full auto-detection chain).
        model: Model slug override.  If None, uses the provider's default
               auxiliary model.
        async_mode: If True, return an async-compatible client.
        raw_codex: If True, return a raw OpenAI client for Codex providers
            instead of wrapping in CodexAuxiliaryClient.  Use this when
            the caller needs direct access to responses.stream() (e.g.,
            the main agent loop).
        explicit_base_url: Optional direct OpenAI-compatible endpoint.
        explicit_api_key: Optional API key paired with explicit_base_url.

    Returns:
        (client, resolved_model) or (None, None) if auth is unavailable.
    r   rj  r  rk  rO  Nr  r1   z\Dropping OpenRouter-format model %r for non-OpenRouter auxiliary provider (using %r instead)r=  zLresolve_provider_client: openrouter requested but OPENROUTER_API_KEY not setr   zZresolve_provider_client: nous requested but Nous Portal not configured (run: hermes login)zbresolve_provider_client: openai-codex requested but no Codex OAuth token found (run: hermes model)r#  r&   OPENAI_API_KEYrQ  zQresolve_provider_client: explicit custom endpoint requested but base_url is emptyrZ  zPresolve_provider_client: custom/main requested but no endpoint credentials foundr   r  z-hermes_cli.auth not available for provider %sz,resolve_provider_client: unknown provider %rr   r   zOresolve_provider_client: anthropic requested but no Anthropic credentials foundcopilotzgh auth tokenzJresolve_provider_client: provider %s has no API key configured (tried: %s)rr  r4   r  r  r  r   r!  r  z resolve_provider_client: %s (%s))oauth_device_codeoauth_externalzMresolve_provider_client: OAuth provider %s not directly supported, try 'auto'z6resolve_provider_client: unhandled auth_type %s for %srx   )&r+   r   rx  r   r   r  rB  rl  rE  r  r^  r
   r]  r`  r   r  rL  r[  r-  r  r  r  r$  rC   r&  r'  r*   rA   api_key_env_varsrD   r|   r5   r3   r   r(  r"  updateresolve_provider_client)r   rM   r  r  r  r  rm  resolvedfinal_modelr  r_  
raw_clientrT  rU  rn  r  r  r*  default_modelr,  r   tried_sourcesr4   headersr"  s                            r"   r  r    s   F "F))++1133H7!6 6(??>:
  	SE\\h\3h3F3FLL89>J J J E'x9C + 555k*	, <)++>NN < = = =:&w9C + 555k*	, 6#++>NN P Q Q Q:&w9C + 555k*	, >!! 
	- 344K "  T U U U!z3#3K>QRRRJ,,$,,>NN P Q Q Q:&w9C + 555k*	, 8 	0+1133K!'R..00 %9-r2288::%$ 
  ",   "zF#3#5#5FKJEEEF=G /$V[999 +.0 ,Z02 	4 	4F$fhhOFG!#.wAK 3(===$k24 4 4 " 	 ; 	< 	< 	<z[[[[[[[[[   DhOOOzz  ##H--GExPPPzI%%{""$2$4$4!FM~pqqq!z0=K=Gb$V[999fVaMbc44X>>eii	2..//5577 	 !9::M9$$$$_555LL 6!499]#;#;= = = :uyyR00117799@@EEcIc4882FF,} X^^----$1GL!!$(8(888AAAAAANN2244555 M( M M;BJ-w77M M7;OOO9C + 555k*	, 
	E	E	Ev*65*EEE~%%*>5*MMM 89A	C 	C 	Cz
NNK$h0 0 0:s   (K1 1%LLc                 T    t          | pd          \  }}}}t          ||||          S )aX  Return (client, default_model_slug) for text-only auxiliary tasks.

    Args:
        task: Optional task name ("compression", "web_extract") to check
              for a task-specific provider override.

    Callers may override the returned model with a per-task env var
    (e.g. CONTEXT_COMPRESSION_MODEL, AUXILIARY_WEB_EXTRACT_MODEL).
    N)rM   r  r  _resolve_task_provider_modelr  r.  r   rM   r4   r   s        r"   get_text_auxiliary_clientr  d  sB     *Fdld)S)S&HeXw"" 	   r.   c                 V    t          | pd          \  }}}}t          ||d||          S )a  Return (async_client, model_slug) for async consumers.

    For standard providers returns (AsyncOpenAI, model). For Codex returns
    (AsyncCodexAuxiliaryClient, model) which wraps the Responses API.
    Returns (None, None) when no provider is available.
    NTrM   r  r  r  r  r  s        r"   get_async_text_auxiliary_clientr  w  sE     *Fdld)S)S&HeXw""    r.   )r=  r   r  r   rO  c                 v    | pd                                                                 } | dk    rdS | dk    rdS | S )Nr   rj  r  rk  rO  )r+   r   r   s    r"   _normalize_vision_providerr    sI    "F))++1133H7~6xOr.   c                     t          |           } | dk    rt                      S | dk    rt                      S | dk    rt                      S | dk    rt	                      S | dk    rt                      S dS )Nr=  r   r  r   rO  r  )r  rB  rE  r`  r'  r[  r   s    r"   _resolve_strict_vision_backendr    s    )(33H<   6{{>!!||;8#%%%:r.   c                 0    t          |           d         d uS r   )r  r   s    r"    _strict_vision_backend_availabler    s    )(33A6dBBr.   c                      	 ddl m}   |             }|                    di           }t          |t                    r.t          |                    dd                    }|t          v r|S n# t          $ r Y nw xY wdS )zMReturn the selected main provider when it is also a supported vision backend.r   rG  rM   r   r&   N)rI  rH  rC   r@   rB   r  _VISION_AUTO_PROVIDER_ORDERr   )rH  configrK  r   s       r"   _preferred_main_vision_providerr    s    
111111JJw++	i&& 	 1)--
B2O2OPPH666   4s   A(A, ,
A98A9c                      t          t                    } t                      }|| v r+|                     |           |                     d|           d | D             S )a\  Return the currently available vision backends in auto-selection order.

    This is the single source of truth for setup, tool gating, and runtime
    auto-routing of vision tasks. The selected main provider is preferred when
    it is also a known-good vision backend; otherwise Hermes falls back through
    the standard conservative order.
    r   c                 0    g | ]}t          |          |S rx   )r  ).0r   s     r"   
<listcomp>z1get_available_vision_backends.<locals>.<listcomp>  s'    [[[0PQY0Z0Z[H[[[r.   )rA   r  r  removeinsert)ordered	preferreds     r"   get_available_vision_backendsr    sb     .//G/11IGy!!!q)$$$[[W[[[[r.   )r4   r   r  r4   r   c                   t          d| |||          \  }}}t          |          }dt          dt          dt          t                   ffd}|r t          d||          \  }	}
|	d	S d|	|
fS |d
k    rt          t                    }t                      }||v r+|	                    |           |
                    d|           |D ]%}t          |          \  }}| ||||          c S &t                              d           dS |t          v rt          |          \  }} ||||          S t          |          \  }	}
|	|ddfS ||	|
fS )ar  Resolve the client actually used for vision tasks.

    Direct endpoint overrides take precedence over provider selection. Explicit
    provider overrides still use the generic provider router for non-standard
    backends, so users can intentionally force experimental providers. Auto mode
    stays conservative and only tries vision backends known to work today.
    visionresolved_providerr|  r  c                 X    || d d fS p|}rt          ||          \  }}| ||fS | ||fS rO   )r  )r  r|  r  r  async_clientasync_modelr  resolved_models         r"   	_finalizez1resolve_vision_provider_client.<locals>._finalize  sW    $dD00$5 	@(8k(R(R%L+$lK?? +{::r.   rO  r  N)rO  NNr   r   z'Auxiliary vision client: none available)NNN)r  r  r*   r   r   r  rA   r  r  r  r  r  r   r   _get_cached_client)r   rM   r4   r   r  rP  resolved_base_urlresolved_api_keyr  rm  r  r  r  	candidater|  r  r  s       `           @r"   resolve_vision_provider_clientr    s    Fb(E8WF FBI~02B +955I;S ;s ;8TW= ; ; ; ; ; ; ;  
-5 !/-
 
 
 >'',,F233355	NN9%%%NN1i(((  	H 	HI)G	)R)R&K& yKGGGGG '>???///%CI%N%N"]yK???,Y
SSFK~$$$fk))r.   c                  2    t          d          \  } }}||fS )zJReturn (client, default_model_slug) for vision/multimodal auxiliary tasks.Fr  r  r:  rm  r  s      r"   get_vision_auxiliary_clientr    s$    ;uMMMAv{;r.   c                  2    t          d          \  } }}||fS )z=Return (async_client, model_slug) for async vision consumers.Tr  r  r  s      r"   !get_async_vision_auxiliary_clientr    s$    ;tLLLAv{;r.   c                  <    t           rt          t                    ni S )zReturn extra_body kwargs for auxiliary API calls.
    
    Includes Nous Portal product tags when the auxiliary client is backed
    by Nous Portal. Returns empty dict otherwise.
    )r   rB   NOUS_EXTRA_BODYrx   r.   r"   get_auxiliary_extra_bodyr    s     %6=4   2=r.   valuec                     t                      }t          j        d          }|s(t                      d|                                v rd| iS d| iS )aF  Return the correct max tokens kwarg for the auxiliary client's provider.
    
    OpenRouter and local models use 'max_tokens'. Direct OpenAI with newer
    models (gpt-4o, o-series, gpt-5+) requires 'max_completion_tokens'.
    The Codex adapter translates max_tokens internally, so we use max_tokens
    for it as well.
    r>  Napi.openai.comr   r   )rX  r   r  r   r   )r  rT  rA  s      r"   auxiliary_max_tokens_paramr  #  s`     +,,KY+,,F 0!!) K$5$5$7$777'//%  r.   _client_cachec                  T    	 ddl m}  d | _        dS # t          t          f$ r Y dS w xY w)a  Monkey-patch ``AsyncHttpxClientWrapper.__del__`` to be a no-op.

    The OpenAI SDK's ``AsyncHttpxClientWrapper.__del__`` schedules
    ``self.aclose()`` via ``asyncio.get_running_loop().create_task()``.
    When an ``AsyncOpenAI`` client is garbage-collected while
    prompt_toolkit's event loop is running (the common CLI idle state),
    the ``aclose()`` task runs on prompt_toolkit's loop but the
    underlying TCP transport is bound to a *different* loop (the worker
    thread's loop that the client was originally created on).  If that
    loop is closed or its thread is dead, the transport's
    ``self._loop.call_soon()`` raises ``RuntimeError("Event loop is
    closed")``, which prompt_toolkit surfaces as "Unhandled exception
    in event loop ... Press ENTER to continue...".

    Neutering ``__del__`` is safe because:
    - Cached clients are explicitly cleaned via ``_force_close_async_httpx``
      on stale-loop detection and ``shutdown_cached_clients`` on exit.
    - Uncached clients' TCP connections are cleaned up by the OS when the
      process exits.
    - The OpenAI SDK itself marks this as a TODO (``# TODO(someday):
      support non asyncio runtimes here``).

    Call this once at CLI startup, before any ``AsyncOpenAI`` clients are
    created.
    r   AsyncHttpxClientWrapperc                     d S rO   rx   r   s    r"   <lambda>z(neuter_async_httpx_del.<locals>.<lambda>b  s    t r.   N)openai._base_clientr  __del__r$  AttributeErrorr  s    r"   neuter_async_httpx_delr  F  sR    4??????*;*;'''(   s    ''rm  c                     	 ddl m} t          | dd          }|t          |dd          s|j        |_        dS dS dS # t
          $ r Y dS w xY w)u  Mark the httpx AsyncClient inside an AsyncOpenAI client as closed.

    This prevents ``AsyncHttpxClientWrapper.__del__`` from scheduling
    ``aclose()`` on a (potentially closed) event loop, which causes
    ``RuntimeError: Event loop is closed`` → prompt_toolkit's
    "Press ENTER to continue..." handler.

    We intentionally do NOT run the full async close path — the
    connections will be dropped by the OS when the process exits.
    r   )ClientStaterP   N	is_closedT)httpx._clientr  r)   CLOSED_stater   )rm  r  inners      r"   _force_close_async_httpxr  g  s    ------	400WUK%F%F&-ELLL    s   6> 
AAc                     ddl } t          5  t          t                                                    D ]b\  }}|d         }|t          |           	 t          |dd          }|r|                     |          s
 |             S# t          $ r Y _w xY wt          	                                 ddd           dS # 1 swxY w Y   dS )zClose all cached clients (sync and async) to prevent event-loop errors.

    Call this during CLI shutdown, *before* the event loop is closed, to
    avoid ``AsyncHttpxClientWrapper.__del__`` raising on a dead loop.
    r   Nr   )
inspect_client_cache_lockrA   r  r%  r  r)   iscoroutinefunctionr   clear)r  r,   r$   rm  r   s        r"   shutdown_cached_clientsr  {  s0    NNN	  }224455 	 	JC1XF~ %V,,,"67D99 G$?$?$I$I HJJJ   !                 s6   AB<2BB<
BB<BB<<C C c                  $   t           5  g } t                                          D ]E\  }}|\  }}}|8|                                r$t	          |           |                     |           F| D ]
}t          |= 	 ddd           dS # 1 swxY w Y   dS )uK  Force-close cached async clients whose event loop is closed.

    Call this after each agent turn to proactively clean up stale clients
    before GC can trigger ``AsyncHttpxClientWrapper.__del__`` on them.
    This is defense-in-depth — the primary fix is ``neuter_async_httpx_del``
    which disables ``__del__`` entirely.
    N)r  r  r%  r  r  rD   )
stale_keysr,   r$   rm  _defaultcached_loops         r"   cleanup_stale_async_clientsr    s     
 # #
'--// 	' 	'JC,1)FHk&;+@+@+B+B&(000!!#&&& 	# 	#Cc""	## # # # # # # # # # # # # # # # # #s   A/BB	B	c                    d}d}|r9	 ddl }|                                }t          |          }n# t          $ r Y nw xY w| ||pd|pd|f}t          5  |t
          v ret
          |         \  }	}
}|r@|,|                                rt          |	           t
          |= n$|	|p|
fcddd           S |	|p|
fcddd           S ddd           n# 1 swxY w Y   t          | ||||          \  }}|I|}t          5  |t
          vr|||ft
          |<   nt
          |         \  }}}ddd           n# 1 swxY w Y   ||p|fS )a  Get or create a cached client for the given provider.

    Async clients (AsyncOpenAI) use httpx.AsyncClient internally, which
    binds to the event loop that was current when the client was created.
    Using such a client on a *different* loop causes deadlocks or
    RuntimeError.  To prevent cross-loop issues (especially in gateway
    mode where _run_async() may spawn fresh loops in worker threads), the
    cache key for async clients includes the current event loop's identity
    so each loop gets its own client instance.
    r   Nr&   )r  r  )	r   get_event_looprh   RuntimeErrorr  r  r  r  r  )r   rM   r  r4   r   loop_idcurrent_loop_aio	cache_keycached_clientcached_defaultr  rm  r  
bound_loopr:  s                   r"   r  r    s   ( GL 	""""..00L&&GG 	 	 	D	:x~2w}"gNI	 > >%%9Fy9Q6M>; 
> *{/D/D/F/F*,];;;%i00(%*A>A> > > > > > > > %e&=~=> > > > > > > > > > > > > > > > > > > > > > > 4"   FM  "
 	D 	D--,2M:+Ni((+8+C(q		D 	D 	D 	D 	D 	D 	D 	D 	D 	D 	D 	D 	D 	D 	D
 5)M))s7   '0 
==AC/CCC:)D//D36D3c                    i }d}d}d}d}	| rF	 ddl m}
  |
            }n# t          $ r i }Y nw xY wt          |t                    r|                    di           ni }t          |t                    r|                    | i           ni }t          |t                    si }t          |                    dd                                                    pd}t          |                    dd                                                    pd}t          |                    dd                                                    pd}t          |                    d	d                                                    pd}	| d
k    r|r|dk    rt          |t                    r|                    d
i           ni }t          |t                    r|                    dd                                          pd}|p)|                    dd                                          pd}|                    d          pd}|p|                                pd}| rt          | d          nd}|p|p|}|rd|||fS |r||||fS | rat          | d          }t          | d          }|rd|||p|	fS t          |           }|dk    r||ddfS |rd|||	fS |r|dk    r||ddfS d|ddfS d|ddfS )a  Determine provider + model for a call.

    Priority:
      1. Explicit provider/model/base_url/api_key args (always win)
      2. Env var overrides (AUXILIARY_{TASK}_*, CONTEXT_{TASK}_*)
      3. Config file (auxiliary.{task}.* or compression.*)
      4. "auto" (full auto-detection chain)

    Returns (provider, model, base_url, api_key) where model may be None
    (use provider default). When base_url is set, provider is forced to
    "custom" and the task uses that direct endpoint.
    Nr   rG  	auxiliaryr   r&   rM   r4   r   compressionr   summary_providersummary_modelsummary_base_urlMODELrO  BASE_URLAPI_KEY)
rI  rH  r$  r@   rB   rC   r*   r+   r;  r7  )r.  r   rM   r4   r   r  rf  	cfg_modelrg  cfg_api_keyrH  auxtask_configcomp_sbu	env_modelr  env_base_urlenv_api_keyenv_providers                       r"   r  r    sq   & FLILK D	555555 []]FF 	 	 	FFF	 .8-E-EMfjjb)))2+5c4+@+@HcggdB'''b+t,, 	K;??:r::;;AACCKt4455;;==E	;??:r::;;AACCKt+//)R8899??AAIT
 =  , ,&:P:P4>vt4L4LT6::mR000RTD$%% D#xx(:B??EEGGO4%V/2)F)F)L)L)N)NVRV	xx 2339r+Ctzz||Ct>BL+D':::I4i49N ;7:: ;7:: 224DD1$	BB 	V^\;;U+UU.t446!!t;; 	G^\;FF 	<LF22t;;~tT11>4--s     //      >@r  c                    | s|S 	 ddl m}  |            }n# t          $ r |cY S w xY wt          |t                    r|                    di           ni }t          |t                    r|                    | i           ni }|                    d          }|'	 t          |          S # t          t          f$ r Y nw xY w|S )zPRead timeout from auxiliary.{task}.timeout in config, falling back to *default*.r   rG  r  timeout)	rI  rH  r$  r@   rB   rC   float
ValueError	TypeError)r.  r  rH  r  r  r  raws          r"   _get_task_timeoutr	  ;  s     111111   )3FD)A)A
I&**["
%
%
%rC'1#t'<'<D#''$###"K
//)
$
$C
	::I& 	 	 	D	Ns    &&B* *B>=B>rU   rV   r   r]   r  
extra_bodyc	                 J   |||d}	|||	d<   |=| dk    r2|pt                      }
d|
                                v r||	d<   n||	d<   n||	d<   |r||	d<   t          |pi           }| d	k    st          r*|                    d
g                               dg           |r||	d<   |	S )zLBuild kwargs for .chat.completions.create() with model/provider adjustments.)rM   rU   r  NrV   rO  r  r   r   r]   r   r   r   r
  )rX  r   rB   r   
setdefaultextend)r   rM   rU   rV   r   r]   r  r
  r4   r}   rT  merged_extras               r"   _build_call_kwargsr  O  s      F  +} x"@&>&@&@K;#4#4#6#6662<.//'1|$$#-F<   w 
(b))L6.++224J3KLLL ,+|Mr.   )	r   rM   r4   r   rV   r   r]   r  r
  c       
            t          | ||||          \  }}}}| dk    rpt          ||||d          \  }}}|9|dk    r3|s1t                              d|           t          d|d          \  }}}|t	          d|  d	| d
          |p|}nt          ||||          \  }}||pd                                                                }|r,|dvr(t	          d| d|                                 d          |s8t          	                    d| pd|           t          d|pt                    \  }}|t	          d|  d	| d
          |	|	nt          |           }t          t          |d|          pd          }| r-t          	                    d| |pd|pd|r	d|vrd| nd           t          ||||||||
|	  	        }	  |j        j        j        di |S # t$          $ rT}t          |          }d|v sd|v r7|                    dd           ||d<    |j        j        j        di |cY d}~S  d}~ww xY w)a  Centralized synchronous LLM call.

    Resolves provider + model (from task config, explicit args, or auto-detect),
    handles auth, request formatting, and model-specific arg adjustments.

    Args:
        task: Auxiliary task name ("compression", "vision", "web_extract",
              "session_search", "skills_hub", "mcp", "flush_memories").
              Reads provider:model from config/env. Ignored if provider is set.
        provider: Explicit provider override.
        model: Explicit model override.
        messages: Chat messages list.
        temperature: Sampling temperature (None = provider default).
        max_tokens: Max output tokens (handles max_tokens vs max_completion_tokens).
        tools: Tool definitions (for function calling).
        timeout: Request timeout in seconds (None = read from auxiliary.{task}.timeout config).
        extra_body: Additional request body fields.

    Returns:
        Response object with .choices[0].message.content

    Raises:
        RuntimeError: If no provider is configured.
    r  Fr   rM   r4   r   r  Nr   DVision provider %s unavailable, falling back to auto vision backendsr   rM   r  $No LLM provider configured for task=
 provider=. Run: hermes setup)r4   r   r&   r   r=  rO  
Provider ':' is set in config.yaml but no API key was found. Set the U_API_KEY environment variable, or switch to a different provider with `hermes model`.zAAuxiliary %s: provider %s unavailable, falling back to openroutercallr=  r4   zAuxiliary %s: using %s (%s)%sr  z at rV   r   r]   r  r
  r4   r   unsupported_parameterr   rx   )r  r  r   rl  r  r  r+   r   r4  rt  r@  r	  r*   r)   r  r   r   r   r   pop)r.  r   rM   r4   r   rU   rV   r   r]   r  r
  r  r  r  r  effective_providerrm  r  	_expliciteffective_timeout
_base_infor}   	first_errerr_strs                           r"   call_llmr%  }  s   L NjhxN2 N2J~'8:J x2P3
 3
 3
/FK >/699BS9NNV!   7U$ 7 7 73
 >%t % %GX % % %   /C2C0&$	
 
 
 > +0b7799??AAI Y.NNN"X X X*3//*;*;X X X   % G_ NF,=? ? ?&8 ."E4E'G 'G#>%t % %GX % % %& & & $+#6<Md<S<S WVZ1BCCIrJJJ c3,68Py,6a<z;Y;Y(J(((_a	c 	c 	c  ;J.:"	$ $ $F-v{&-77777   i..7""&=&H&HJJ|T***.8F*+16;*1;;F;;;;;;;;s%   
G! !
H?+AH:3H?9H::H?c                    ddl }| j        d         j        }|j        pd                                }|r<|                    dd||j        |j        z                                            }|r|S g }dD ]i}t          ||d          }|rTt          |t                    r?|                                r+||vr'|                    |                                           jt          |dd          }|rt          |t                    r|D ]}	t          |	t                    r|	                    d          p)|	                    d	          p|	                    d
          }
|
rO|
|vrK|                    t          |
t                    r|
                                nt          |
                     |rd                    |          S dS )u  Extract content from an LLM response, falling back to reasoning fields.

    Mirrors the main agent loop's behavior when a reasoning model (DeepSeek-R1,
    Qwen-QwQ, etc.) returns ``content=None`` with reasoning in structured fields.

    Resolution order:
      1. ``message.content`` — strip inline think/reasoning blocks, check for
         remaining non-whitespace text.
      2. ``message.reasoning`` / ``message.reasoning_content`` — direct
         structured reasoning fields (DeepSeek, Moonshot, Novita, etc.).
      3. ``message.reasoning_details`` — OpenRouter unified array format.

    Returns the best available text, or ``""`` if nothing found.
    r   Nr&   zj<(?:think|thinking|reasoning|REASONING_SCRATCHPAD)>.*?</(?:think|thinking|reasoning|REASONING_SCRATCHPAD)>)flags)	reasoningreasoning_contentreasoning_detailssummaryr8   r;   z

)rerw   rc   r8   r+   subDOTALL
IGNORECASEr)   r@   r*   rD   rA   rB   rC   r|   )r   r,  r   r8   cleanedreasoning_partsfieldr6  detailsr?   r+  s              r"   extract_content_or_reasoningr4    s    III

1

%C{ b''))G 	&&D ry2=8	  
 

 %'' 	  	N "$O3 0 0c5$'' 	0:c3'' 	0CIIKK 	0C<V<V""399;;///c.55G 	j:gt,, 	j 	j 	jF&$'' jJJy)) *zz),,*zz&)) 
  jwo==#**jRU>V>V+h7==???\_`g\h\hiii ,{{?+++2r.   c       
           K   t          | ||||          \  }}}}| dk    rpt          ||||d          \  }}}|9|dk    r3|s1t                              d|           t          d|d          \  }}}|t	          d|  d	| d
          |p|}nt          ||d||          \  }}||pd                                                                }|r,|dvr(t	          d| d|                                 d          |s7t                              d|           t          d|pt          d          \  }}|t	          d|  d	| d
          |	|	nt          |           }t          ||||||||
|	  	        }	  |j        j        j        di | d{V S # t          $ rZ}t!          |          }d|v sd|v r=|                    dd           ||d<    |j        j        j        di | d{V cY d}~S  d}~ww xY w)zqCentralized asynchronous LLM call.

    Same as call_llm() but async. See call_llm() for full documentation.
    r  Tr  Nr   r  r  r  r  r  )r  r4   r   r&   r  r  r  r  z3Provider %s unavailable, falling back to openrouterr=  r  r  r   r  r   rx   )r  r  r   rl  r  r  r+   r   r4  r@  r	  r  r   r   r   r   r*   r  )r.  r   rM   r4   r   rU   rV   r   r]   r  r
  r  r  r  r  r  rm  r  r   r!  r}   r#  r$  s                          r"   async_call_llmr6  .  s`     $ NjhxN2 N2J~'8:J x2P3
 3
 3
/FK >/699BS9NNV!   7U$7 7 73
 >%t % %GX % % %   /C2C0&$
 
 
 >*0b7799??AAI Y.NNN"X X X*3//*;*;X X X  
 % %T02 2 2&8 ."E4E#'% '% '%# >%t % %GX % % %& & & $+#6<Md<S<S;J.:"	$ $ $F3V[,3==f=========   i..7""&=&H&HJJ|T***.8F*+707AA&AAAAAAAAAAAAAAs%   =F 
G>$AG92G>8G99G>)r&   )NFFNNr  )r   N)NFNN)NNNNN)NNNr  NNrO   )nr   r   loggingr   	threadingr  pathlibr   typesr   typingr   r   r   r   r	   r{  r
   agent.credential_poolr   rI  r   hermes_constantsr   	getLoggerr   r   r   r*   __annotations__r?  r  r   r   r@  rD  r   re  r   r^  r]  r#   r-   r7   rI   rK   r   r   r   r   r   r   r   r   r   r   r   rB   r   r   r  r  r-  r7  r;  rB  rE  rL  rV  rX  r[  r`  r'  ro  rs  rx  r  r  r  r  r  r  r  r  r  r  r  r  r  r  intr  r  tupleLockr  r  r  r  r  r  r  _DEFAULT_AUX_TIMEOUTr  r	  rA   r  r%  r4  r6  rx   r.   r"   <module>rD     s4  $ $ $L   				            ! ! ! ! ! ! 3 3 3 3 3 3 3 3 3 3 3 3 3 3       + + + + + + - - - - - - 0 0 0 0 0 0		8	$	$ *'*,)$/
0 
0 d38n 
 
 
 <(7  234   4    4 -D 9 !/##k1 # =  tXc]/B)C     " " " " " ". .# . .c . . . .(-C -C - - - -`r
 r
 r
 r
 r
 r
 r
 r
j# # # # # # # #" " " " " " " "$D D D D D D D D# # # # # # # #
. . . . . . . .?
 ?
 ?
 ?
 ?
 ?
 ?
 ?
D# # # # # # # #
        D D D D D D D D# # # # # # # #
. . . . . . . .#$ # # # #LID IS I I I I
H H H H H
 (3-        F55&)98C=)H#I 5 5 5 5t # s    c 3 8C=    Cx/#>? C C C C&5&)8C=89    "#    *!+x}hsm'C!D !+ !+ !+ !+H#    
CeHV$4hsm$CD C C C CQE(3-#67 Q Q Q Q"-chsmXc]:; -c -c -c -c`S U8F3CXc]3R-S    F $* !*  uXf-x}<=    H. . . . .6 ! H HHH H 	H
 H H 8C=(3-'(H H H HZ C x7GRU7V1W    & #    " # 3    S U8C=(SV-;W5X    Cs Ct C C C C#     \tCy \ \ \ \" #>* #!>* >* >*sm>*C=>* sm	>*
 c]>* >* 8C=(3-#67>* >* >* >*BU8F+;Xc]+J%K      >$ > > > >!c !d ! ! ! !> %'tE5L! & & &#Y^%%    BS T    (   6# # # #* =* =*=*=* =* 	=*
 =* 8C=(3-'(=* =* =* =*B L. L.
L.L. L. 	L.
 L. 3x}hsm;<L. L. L. L.^   3G  C % 5    0 $( $ !%"+ +++ + %	+
 + D>+ + + sm+ 
+ + + +^ v v v v
v v 	v
 v v v v v v v v 	v v v vr5c 5 5 5 5r X X X X
X X 	X
 X X X X X X X X 	X X X X X Xr.   