
    i&g                       U d dl mZ d dlmZ d dlmZmZ d dlmZ d dlm	Z	m
Z
mZmZ d dlmZmZ d dlmZ ddd	Z ed
          Z ed          Zed         Zed         Z ed           G d d                      Z ed           G d d                      Z ed           G d d                      Z ed           G d d                      Zd Zi d e ed           ed           ed           ed          ddd !          d" e ed#           ed           ed$           ed%          ddd !          d& e ed'           ed(           ed)          dd*d+,          d- e ed.           ed/           ed0          dd*d+,          d1 e ed2           ed3           ed4          dd*d+,          d5 e ed6           ed7           ed8          dd*d+,          d9 e ed8           ed6           ed:          dd*d+,          d; e ed(           ed<           ed'          dd*d+,          d= e ed>           ed?           ed@          dd*d+,          dA e ed#           ed           ed$           ed%          dddB!          dC e edD           edE           edF           edG          dddB!          dH e ed           ed           ed           ed          dddB!          dI e edJ           ed)           edK           ed$          dddB!          dL e edM           edN          ddOdPQ          dR e ed@           edS          ddOdPQ          dT e ed)           ed(          ddUdVQ          dW e ed.           ed/          ddUdVQ           e ed8           ed6          ddUdVQ           e ed           ed          ddXdYQ           e ed#           ed          ddXdYQ           e ed#           ed          ddXdYQ           e edD           edE          ddXdYQ           e edD           edZ          ddXdYQ           e ed[           ed\          ddXdYQ           e ed]           edM          ddXdYQ           e ed$           ed^          dd_`           e ed$           ed^          dd_`          da
Zdbedc<   ddhZddjZ	 	 dddqZ ddtZ!dduZ"dd{Z#	 	 	 ddd}Z$dkdkd~ddZ%dkdkdkdddZ&	 	 	 dddZ'ddZ(ddZ)dkS )    )annotations)	dataclass)datetimetimezone)Decimal)AnyDictLiteralOptional)fetch_endpoint_model_metadatafetch_model_metadata)base_url_host_matchesg        )inputoutput01000000)actual	estimatedincludedunknown)provider_cost_apiprovider_generation_apiprovider_models_apiofficial_docs_snapshotuser_overridecustom_contractnoneT)frozenc                      e Zd ZU dZded<   dZded<   dZded<   dZded<   dZded<   dZ	ded	<   d
Z
ded<   edd            Zedd            Zd
S )CanonicalUsager   intinput_tokensoutput_tokenscache_read_tokenscache_write_tokensreasoning_tokens   request_countNzOptional[dict[str, Any]]	raw_usagereturnc                0    | j         | j        z   | j        z   S N)r"   r$   r%   selfs    8/home/ubuntu/.hermes/hermes-agent/agent/usage_pricing.pyprompt_tokenszCanonicalUsage.prompt_tokens&   s     4#99D<SSS    c                     | j         | j        z   S r,   )r0   r#   r-   s    r/   total_tokenszCanonicalUsage.total_tokens*   s    !D$666r1   )r*   r!   )__name__
__module____qualname__r"   __annotations__r#   r$   r%   r&   r(   r)   propertyr0   r3    r1   r/   r    r       s         LMM*.I....T T T XT 7 7 7 X7 7 7r1   r    c                  @    e Zd ZU ded<   ded<   dZded<   dZded<   dS )	BillingRoutestrprovidermodel base_urlr   billing_modeN)r4   r5   r6   r7   r@   rA   r9   r1   r/   r;   r;   /   sF         MMMJJJH!L!!!!!!r1   r;   c                      e Zd ZU dZded<   dZded<   dZded<   dZded<   dZded<   dZ	d	ed
<   dZ
ded<   dZded<   dZded<   dS )PricingEntryNOptional[Decimal]input_cost_per_millionoutput_cost_per_millioncache_read_cost_per_millioncache_write_cost_per_millionrequest_costr   
CostSourcesourceOptional[str]
source_urlpricing_versionOptional[datetime]
fetched_at)r4   r5   r6   rE   r7   rF   rG   rH   rI   rK   rM   rN   rP   r9   r1   r/   rC   rC   7   s         0444441555555999996: ::::&*L****F $J$$$$%)O))))%)J))))))r1   rC   c                  b    e Zd ZU ded<   ded<   ded<   ded<   d	Zd
ed<   d	Zded<   dZded<   d	S )
CostResultrD   
amount_usd
CostStatusstatusrJ   rK   r<   labelNrO   rP   rL   rN   r9   ztuple[str, ...]notes)r4   r5   r6   r7   rP   rN   rW   r9   r1   r/   rR   rR   D   sr         !!!!JJJ%)J))))%)O))))Er1   rR   c                 >    t          j        t          j                  S r,   )r   nowr   utcr9   r1   r/   <lambda>r[   O   s    8<-- r1   )	anthropiczclaude-opus-4-20250514z15.00z75.00z1.50z18.75r   zChttps://docs.anthropic.com/en/docs/build-with-claude/prompt-cachingz#anthropic-prompt-caching-2026-03-16)rE   rF   rG   rH   rK   rM   rN   )r\   zclaude-sonnet-4-20250514z3.00z0.30z3.75)openaizgpt-4oz2.50z10.00z1.25zhttps://openai.com/api/pricing/zopenai-pricing-2026-03-16)rE   rF   rG   rK   rM   rN   )r]   zgpt-4o-miniz0.15z0.60z0.075)r]   zgpt-4.1z2.00z8.00z0.50)r]   zgpt-4.1-miniz0.40z1.60z0.10)r]   zgpt-4.1-nanoz0.025)r]   o3z40.00)r]   zo3-miniz1.10z4.40z0.55)r\   zclaude-3-5-sonnet-20241022zanthropic-pricing-2026-03-16)r\   zclaude-3-5-haiku-20241022z0.80z4.00z0.08z1.00)r\   zclaude-3-opus-20240229)r\   zclaude-3-haiku-20240307z0.25z0.03)deepseekzdeepseek-chatz0.14z0.28z1https://api-docs.deepseek.com/quick_start/pricingzdeepseek-pricing-2026-03-16)rE   rF   rK   rM   rN   )r_   zdeepseek-reasonerz2.19)googlezgemini-2.5-prozhttps://ai.google.dev/pricingzgoogle-pricing-2026-03-16)r`   zgemini-2.5-flashz'https://aws.amazon.com/bedrock/pricing/zbedrock-pricing-2026-04z3.20z0.06z0.24z0.035z1.20zminimax-pricing-2026-04)rE   rF   rK   rN   )
)r`   zgemini-2.0-flash)bedrockzanthropic.claude-opus-4-6)ra   zanthropic.claude-sonnet-4-6)ra   zanthropic.claude-sonnet-4-5)ra   zanthropic.claude-haiku-4-5)ra   zamazon.nova-pro)ra   zamazon.nova-lite)ra   zamazon.nova-micro)minimaxminimax-m2.7)
minimax-cnrc   z#Dict[tuple[str, str], PricingEntry]_OFFICIAL_DOCS_PRICINGvaluer   r*   rD   c                f    | d S 	 t          t          |                     S # t          $ r Y d S w xY wr,   )r   r<   	Exceptionrf   s    r/   _to_decimalrj     sG    }ts5zz"""   tts   " 
00r!   c                H    	 t          | pd          S # t          $ r Y dS w xY w)Nr   )r!   rh   ri   s    r/   _to_intrl     s9    5:A   qqs    
!!N
model_namer<   r=   rL   r@   c                   |pd                                                                 }|pd                                                                 }| pd                                 }|s%d|v r!|                    dd          \  }}|dv r|}|}|dk    rt          d||pdd          S |dk    st	          |pdd	          rt          d||pdd
          S |dk    r.t          d|                    d          d         |pdd          S |dk    r.t          d|                    d          d         |pdd          S |dv r.t          ||                    d          d         |pdd          S |dv s|rd|v rt          |pd||pdd          S t          |pd|r|                    d          d         nd|pdd          S )Nr?   /r'   >   r`   r]   r\   zopenai-codexsubscription_included)r=   r>   r@   rA   
openrouterzopenrouter.aiofficial_models_apir\   r   r]   >   rb   rd   >   localcustom	localhostru   r   )striplowersplitr;   r   )rm   r=   r@   provider_namebaser>   inferred_provider
bare_models           r/   resolve_billing_router~     s   
 ^**,,2244MN!!##))++D2$$&&E SE\\(-C(;(;%: AAA-ME&&^58>WYh  A  A  A  	A$$(=hn"o(^(^$\UWf{||||##[C8H8H8LW_Wece  uM  N  N  N  	N  XU[[5E5Eb5IT\Tb`b  rJ  K  K  K  	K111]%++c:J:J2:NYaYgeg  wO  P  P  P  	P++++9L9L]%>heV^Vdbds|}}}}!;)[`Ch5;;sCSCSTVCWCWfhs{  tB  @B  QZ  [  [  [  [r1   routeOptional[PricingEntry]c                r    t                               | j        | j                                        f          S r,   )re   getr=   r>   rx   r   s    r/   _lookup_official_docs_pricingr     s+    !%%u~u{7H7H7J7J&KLLLr1   c                J    t          t                      | j        dd          S )Nz>https://openrouter.ai/docs/api/api-reference/models/get-modelszopenrouter-models-apirM   rN   )_pricing_entry_from_metadatar   r>   r   s    r/   _openrouter_pricing_entryr     s-    'S/	   r1   metadataDict[str, Dict[str, Any]]model_idrM   rN   c                  || vrd S | |                              d          pi }t          |                     d                    }t          |                     d                    }t          |                     d                    }t          |                     d          p)|                     d          p|                     d                    }t          |                     d          p)|                     d	          p|                     d
                    }	|||d S dd}
t           |
|           |
|           |
|           |
|	          |d||t                      	  	        S )Npricingprompt
completionrequest
cache_readcached_promptinput_cache_readcache_writecache_creationinput_cache_writerf   rD   r*   c                    | d S | t           z  S r,   )_ONE_MILLIONri   s    r/   _per_token_to_per_millionz?_pricing_entry_from_metadata.<locals>._per_token_to_per_million  s    =4|##r1   r   )	rE   rF   rG   rH   rI   rK   rM   rN   rP   )rf   rD   r*   rD   )r   rj   rC   _UTC_NOW)r   r   rM   rN   r   r   r   r   r   r   r   s              r/   r   r     s    xtx $$Y//52GX..//FW[[6677J'++i0011GL!! 	+;;''	+;;)** J
 M"" 	,;;'((	,;;*++ K
 ~*,t$ $ $ $
 88@@ 9 9* E E$=$=j$I$I%>%>{%K%K$'::
 
 
 
r1   api_keyc                   t          | ||          }|j        dk    r)t          t          t          t          t          dd          S |j        dk    rt          |          S |j        rMt          t          |j        |pd          |j	        |j        
                    d	           d
d          }|r|S t          |          S )Nr=   r@   rp   r   included-route)rE   rF   rG   rH   rK   rN   rq   r?   )r   ro   z/modelszopenai-compatible-models-apir   )r~   rA   rC   _ZEROr=   r   r@   r   r   r>   rstripr   rm   r=   r@   r   r   entrys         r/   get_pricing_entryr     s     "*x(SSSE444#($)(-).,
 
 
 	
 ~%%(///~ ,)%.'-RPPPK.//44===:	
 
 
  	L(///r1   )r=   api_moderesponse_usager   c                  | st                      S |pd                                                                }|pd                                                                }|dk    s|dk    rzt          t	          | dd                    }t          t	          | dd                    }t          t	          | dd                    }t          t	          | dd                    }n|d	k    rt          t	          | dd                    }	t          t	          | dd                    }t	          | d
d          }
t          |
rt	          |
dd          nd          }t          |
rt	          |
dd          nd          }t          d|	|z
  |z
            }nt          t	          | dd                    }t          t	          | dd                    }t	          | dd          }
t          |
rt	          |
dd          nd          }|st          t	          | dd                    }t          |
rt	          |
dd          nd          }|st          t	          | dd                    }t          d||z
  |z
            }d}t	          | dd          }|rt          t	          |dd                    }t          |||||          S )u  Normalize raw API response usage into canonical token buckets.

    Handles three API shapes:
    - Anthropic: input_tokens/output_tokens/cache_read_input_tokens/cache_creation_input_tokens
    - Codex Responses: input_tokens includes cache tokens; input_tokens_details.cached_tokens separates them
    - OpenAI Chat Completions: prompt_tokens includes cache tokens; prompt_tokens_details.cached_tokens separates them

    In both Codex and OpenAI modes, input_tokens is derived by subtracting cache
    tokens from the total — the API contract is that input/prompt totals include
    cached tokens and the details object breaks them out.
    r?   anthropic_messagesr\   r"   r   r#   cache_read_input_tokenscache_creation_input_tokenscodex_responsesinput_tokens_detailsNcached_tokenscache_creation_tokensr0   completion_tokensprompt_tokens_detailsr%   output_tokens_detailsr&   )r"   r#   r$   r%   r&   )r    rw   rx   rl   getattrmax)r   r=   r   rz   moder"   r#   r$   r%   input_totaldetailsprompt_totalr&   output_detailss                 r/   normalize_usager     s   "   ^**,,2244MN!!##))++D###}'C'Cw~~qIIJJ K KLL#GN<UWX$Y$YZZ$W^=Z\]%^%^__	"	"	"gnnaHHII K KLL.*@$GG#G$ZGG_a$H$H$HYZ[[$<CJGG4a888
 
 1k,==@RRSSw~JJKK8KQ O OPP.*A4HH $G$ZGG_a$H$H$HYZ[[  	_ '@Y[\(](] ^ ^$9@GGG11555a
 
 " 	!((EqII" " 1l->>ASSTT^-DdKKN S"7>;Mq#Q#QRR!#+-)   r1   r=   r@   r   usagec                  t          | ||          }|j        dk    rt          t          dddd          S t	          | |||          }|st          d ddd	
          S g }t          }|j        r|j        t          d d|j        d	
          S |j        r|j	        t          d d|j        d	
          S |j
        r |j        t          d d|j        d	d          S |j        r |j        t          d d|j        d	d          S |j        '|t          |j                  |j        z  t          z  z  }|j	        '|t          |j                  |j	        z  t          z  z  }|j        '|t          |j
                  |j        z  t          z  z  }|j        '|t          |j                  |j        z  t          z  z  }|j        &|j        r|t          |j                  |j        z  z  }d}	d|d}
|j        dk    r|t          k    rd}	d}
|j        dk    r|                    d           t          ||	|j        |
|j        |j        t-          |                    S )Nr   rp   r   r   r   )rS   rU   rK   rV   rN   r   r   zn/a)rS   rU   rK   rV   )z(cache-read pricing unavailable for route)rS   rU   rK   rV   rW   )z)cache-write pricing unavailable for router   z~$.2frq   zBOpenRouter cost is estimated from the models API until reconciled.)rS   rU   rK   rV   rP   rN   rW   )r~   rA   rR   r   r   r"   rE   rK   r#   rF   r$   rG   r%   rH   r   r   rI   r(   r=   appendrP   rN   tuple)rm   r   r=   r@   r   r   r   rW   amountrU   rV   s              r/   estimate_usage_costr   M  s    "*x(SSSE444,
 
 
 	
 j8hX_```E YT)FRWXXXXEF _e:BT)ELX]^^^^ _u<DT)ELX]^^^^ ,4 |C     -5 |D    #/'%,--0LL|[[$0'%-..1NNQ]]](4'%122U5VVYeee)5'%233e6XX[ggg%%*=%'%-..1CCC$FE|v&E//~%%YZZZ|#-Ell   r1   boolc                n    t          | ||          }|j        dk    rdS t          | |||          }|duS )u   Check whether we have pricing data for this model+route.

    Uses direct lookup instead of routing through the full estimation
    pipeline — avoids creating dummy usage objects just to check status.
    r   rp   Tr   N)r~   rA   r   r   s         r/   has_known_pricingr     sN     "*x(SSSE444tj8hX_```Er1   secondsfloatc                    | dk     r| ddS | dz  }|dk     r|ddS |dz  }|dk     r;t          |dz            }|rt          |           d| dnt          |           dS |dz  }|dd	S )
N<   .0fsm   zh h.1fd)r!   )r   minuteshoursremaining_mindayss        r/   format_duration_compactr     s    ||     lG||     bLErzzGbL))4AW#e**000000#e**GWGWGWW2:D>>>>r1   c                d   t          t          |                     }|dk     rt          t          |                     S | dk     rdnd}d}|D ]`\  }}||k    rU||z  }|dk     r|d}n|dk     r|d	}n|d
}d|v r(|                    d                              d          }| | | c S a| dS )N  r   -r?   ))i ʚ;B)i@B M)r   K
   r   d   r   r   .r   ,)absr!   r<   r   )rf   	abs_valuesignunits	thresholdsuffixscaledtexts           r/   format_token_count_compactr     s    CJJI53u::!))33DBE" + +	6	!!*F{{ #  d{{{{3''..s33*D*&***** " <<r1   )rf   r   r*   rD   )rf   r   r*   r!   )NN)rm   r<   r=   rL   r@   rL   r*   r;   )r   r;   r*   r   )
r   r   r   r<   rM   r<   rN   r<   r*   r   )NNN)
rm   r<   r=   rL   r@   rL   r   rL   r*   r   )r   r   r=   rL   r   rL   r*   r    )rm   r<   r   r    r=   rL   r@   rL   r   rL   r*   rR   )
rm   r<   r=   rL   r@   rL   r   rL   r*   r   )r   r   r*   r<   )rf   r!   r*   r<   )*
__future__r   dataclassesr   r   r   decimalr   typingr   r	   r
   r   agent.model_metadatar   r   utilsr   DEFAULT_PRICINGr   r   rT   rJ   r    r;   rC   rR   r   re   r7   rj   rl   r~   r   r   r   r   r   r   r   r   r   r9   r1   r/   <module>r      s
   " " " " " " " ! ! ! ! ! ! ' ' ' ' ' ' ' '       / / / / / / / / / / / / T T T T T T T T ' ' ' ' ' '3//wy!!AB

 $7 7 7 7 7 7 7 7$ $" " " " " " " " $	* 	* 	* 	* 	* 	* 	* 	* $                .-
i? |&ww// ' 0 0$+GFOO%,WW%5%5'X=  	i? |&wv ' 0 0$+GFOO%,WV__'X=  !i?4 |&wv ' 0 0$+GFOO'43  ;i?J |&wv '$+GG$4$4'43  Qi?` |&wv '$+GFOO'43  gi?v |&wv '$+GFOO'43  }i?L |&wv '$+GG$4$4'43  Si?b |&ww// ' 0 0$+GFOO'43  ii?x |&wv '$+GFOO'43  i?P |&wv ' 0 0$+GFOO%,WV__'X6  Wi?h |&wv '$+GFOO%,WV__'X6  oi?@ |&ww// ' 0 0$+GFOO%,WW%5%5'X6  Gi?X |&wv '$+GFOO%,WV__'X6  _i?r |&wv ''F5  yi?F |&wv ''F5  Mi?\ |&wv ' 0 0'23  ci?p |&wv ''23  wi?J |&wv ''23   |&ww// ' 0 0'<1   |&wv ' 0 0'<1   |&wv ' 0 0'<1   |&wv ''<1   |&wv ''<1   |&wv ''<1   |&ww// ''<1   |&wv ''1	   |&wv ''1	  G	i? i? i?  i i i iX	       #"[ [ [ [ [:M M M M   ) ) ) )\ #"!	0 0 0 0 0B #"	F F F F F FZ #"!L L L L L Lb #"!	    &        r1   