# HELP python_gc_objects_collected_total Objects collected during gc # TYPE python_gc_objects_collected_total counter python_gc_objects_collected_total{generation="0"} 145761.0 python_gc_objects_collected_total{generation="1"} 30373.0 python_gc_objects_collected_total{generation="2"} 2216.0 # HELP python_gc_objects_uncollectable_total Uncollectable objects found during GC # TYPE python_gc_objects_uncollectable_total counter python_gc_objects_uncollectable_total{generation="0"} 0.0 python_gc_objects_uncollectable_total{generation="1"} 0.0 python_gc_objects_uncollectable_total{generation="2"} 0.0 # HELP python_gc_collections_total Number of times this generation was collected # TYPE python_gc_collections_total counter python_gc_collections_total{generation="0"} 658.0 python_gc_collections_total{generation="1"} 59.0 python_gc_collections_total{generation="2"} 4.0 # HELP python_info Python platform information # TYPE python_info gauge python_info{implementation="CPython",major="3",minor="12",patchlevel="13",version="3.12.13"} 1.0 # HELP process_virtual_memory_bytes Virtual memory size in bytes. # TYPE process_virtual_memory_bytes gauge process_virtual_memory_bytes 7.70527232e+08 # HELP process_resident_memory_bytes Resident memory size in bytes. # TYPE process_resident_memory_bytes gauge process_resident_memory_bytes 1.20508416e+08 # HELP process_start_time_seconds Start time of the process since unix epoch in seconds. # TYPE process_start_time_seconds gauge process_start_time_seconds 1.7810241493e+09 # HELP process_cpu_seconds_total Total user and system CPU time spent in seconds. # TYPE process_cpu_seconds_total counter process_cpu_seconds_total 252.07 # HELP process_open_fds Number of open file descriptors. # TYPE process_open_fds gauge process_open_fds 17.0 # HELP process_max_fds Maximum number of open file descriptors. # TYPE process_max_fds gauge process_max_fds 65536.0 # HELP http_requests_total Total HTTP requests. # TYPE http_requests_total counter http_requests_total{method="GET",path="/",status="404"} 2635.0 http_requests_total{method="GET",path="/robots.txt",status="404"} 2.0 http_requests_total{method="GET",path="/readyz",status="200"} 2.0 http_requests_total{method="GET",path="/healthz",status="200"} 17.0 http_requests_total{method="GET",path="/metrics",status="200"} 1.0 http_requests_total{method="GET",path="/docs",status="200"} 1.0 http_requests_total{method="OPTIONS",path="/agent/run",status="200"} 1.0 http_requests_total{method="POST",path="/agent/run",status="200"} 3.0 # HELP http_requests_created Total HTTP requests. # TYPE http_requests_created gauge http_requests_created{method="GET",path="/",status="404"} 1.7810241583411422e+09 http_requests_created{method="GET",path="/robots.txt",status="404"} 1.7811373330506501e+09 http_requests_created{method="GET",path="/readyz",status="200"} 1.7811373337827494e+09 http_requests_created{method="GET",path="/healthz",status="200"} 1.7811373394346173e+09 http_requests_created{method="GET",path="/metrics",status="200"} 1.7811373423601596e+09 http_requests_created{method="GET",path="/docs",status="200"} 1.7811373449580383e+09 http_requests_created{method="OPTIONS",path="/agent/run",status="200"} 1.7811436951011987e+09 http_requests_created{method="POST",path="/agent/run",status="200"} 1.7811436953199263e+09 # HELP http_request_duration_seconds HTTP request duration, in seconds. # TYPE http_request_duration_seconds histogram http_request_duration_seconds_bucket{le="0.01",method="GET",path="/"} 2634.0 http_request_duration_seconds_bucket{le="0.05",method="GET",path="/"} 2634.0 http_request_duration_seconds_bucket{le="0.1",method="GET",path="/"} 2635.0 http_request_duration_seconds_bucket{le="0.25",method="GET",path="/"} 2635.0 http_request_duration_seconds_bucket{le="0.5",method="GET",path="/"} 2635.0 http_request_duration_seconds_bucket{le="1.0",method="GET",path="/"} 2635.0 http_request_duration_seconds_bucket{le="2.5",method="GET",path="/"} 2635.0 http_request_duration_seconds_bucket{le="5.0",method="GET",path="/"} 2635.0 http_request_duration_seconds_bucket{le="10.0",method="GET",path="/"} 2635.0 http_request_duration_seconds_bucket{le="30.0",method="GET",path="/"} 2635.0 http_request_duration_seconds_bucket{le="60.0",method="GET",path="/"} 2635.0 http_request_duration_seconds_bucket{le="+Inf",method="GET",path="/"} 2635.0 http_request_duration_seconds_count{method="GET",path="/"} 2635.0 http_request_duration_seconds_sum{method="GET",path="/"} 0.8730567271572838 http_request_duration_seconds_bucket{le="0.01",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="0.05",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="0.1",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="0.25",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="0.5",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="1.0",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="2.5",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="5.0",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="10.0",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="30.0",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="60.0",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_bucket{le="+Inf",method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_count{method="GET",path="/robots.txt"} 2.0 http_request_duration_seconds_sum{method="GET",path="/robots.txt"} 0.0006108710076659918 http_request_duration_seconds_bucket{le="0.01",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="0.05",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="0.1",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="0.25",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="0.5",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="1.0",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="2.5",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="5.0",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="10.0",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="30.0",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="60.0",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_bucket{le="+Inf",method="GET",path="/readyz"} 2.0 http_request_duration_seconds_count{method="GET",path="/readyz"} 2.0 http_request_duration_seconds_sum{method="GET",path="/readyz"} 0.0012212819856358692 http_request_duration_seconds_bucket{le="0.01",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="0.05",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="0.1",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="0.25",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="0.5",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="1.0",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="2.5",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="5.0",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="10.0",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="30.0",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="60.0",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_bucket{le="+Inf",method="GET",path="/healthz"} 17.0 http_request_duration_seconds_count{method="GET",path="/healthz"} 17.0 http_request_duration_seconds_sum{method="GET",path="/healthz"} 0.005658484034938738 http_request_duration_seconds_bucket{le="0.01",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="0.05",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="0.1",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="0.25",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="0.5",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="1.0",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="2.5",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="5.0",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="10.0",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="30.0",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="60.0",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_bucket{le="+Inf",method="GET",path="/metrics"} 1.0 http_request_duration_seconds_count{method="GET",path="/metrics"} 1.0 http_request_duration_seconds_sum{method="GET",path="/metrics"} 0.0023908029979793355 http_request_duration_seconds_bucket{le="0.01",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="0.05",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="0.1",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="0.25",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="0.5",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="1.0",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="2.5",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="5.0",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="10.0",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="30.0",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="60.0",method="GET",path="/docs"} 1.0 http_request_duration_seconds_bucket{le="+Inf",method="GET",path="/docs"} 1.0 http_request_duration_seconds_count{method="GET",path="/docs"} 1.0 http_request_duration_seconds_sum{method="GET",path="/docs"} 0.000291784992441535 http_request_duration_seconds_bucket{le="0.01",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="0.05",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="0.1",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="0.25",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="0.5",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="1.0",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="2.5",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="5.0",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="10.0",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="30.0",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="60.0",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_bucket{le="+Inf",method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_count{method="OPTIONS",path="/agent/run"} 1.0 http_request_duration_seconds_sum{method="OPTIONS",path="/agent/run"} 0.0001632329949643463 http_request_duration_seconds_bucket{le="0.01",method="POST",path="/agent/run"} 0.0 http_request_duration_seconds_bucket{le="0.05",method="POST",path="/agent/run"} 2.0 http_request_duration_seconds_bucket{le="0.1",method="POST",path="/agent/run"} 2.0 http_request_duration_seconds_bucket{le="0.25",method="POST",path="/agent/run"} 3.0 http_request_duration_seconds_bucket{le="0.5",method="POST",path="/agent/run"} 3.0 http_request_duration_seconds_bucket{le="1.0",method="POST",path="/agent/run"} 3.0 http_request_duration_seconds_bucket{le="2.5",method="POST",path="/agent/run"} 3.0 http_request_duration_seconds_bucket{le="5.0",method="POST",path="/agent/run"} 3.0 http_request_duration_seconds_bucket{le="10.0",method="POST",path="/agent/run"} 3.0 http_request_duration_seconds_bucket{le="30.0",method="POST",path="/agent/run"} 3.0 http_request_duration_seconds_bucket{le="60.0",method="POST",path="/agent/run"} 3.0 http_request_duration_seconds_bucket{le="+Inf",method="POST",path="/agent/run"} 3.0 http_request_duration_seconds_count{method="POST",path="/agent/run"} 3.0 http_request_duration_seconds_sum{method="POST",path="/agent/run"} 0.1343810440012021 # HELP http_request_duration_seconds_created HTTP request duration, in seconds. # TYPE http_request_duration_seconds_created gauge http_request_duration_seconds_created{method="GET",path="/"} 1.7810241583411791e+09 http_request_duration_seconds_created{method="GET",path="/robots.txt"} 1.7811373330506809e+09 http_request_duration_seconds_created{method="GET",path="/readyz"} 1.7811373337827837e+09 http_request_duration_seconds_created{method="GET",path="/healthz"} 1.7811373394346445e+09 http_request_duration_seconds_created{method="GET",path="/metrics"} 1.781137342360183e+09 http_request_duration_seconds_created{method="GET",path="/docs"} 1.7811373449580648e+09 http_request_duration_seconds_created{method="OPTIONS",path="/agent/run"} 1.7811436951012652e+09 http_request_duration_seconds_created{method="POST",path="/agent/run"} 1.7811436953199527e+09 # HELP nebius_tokens_total Tokens emitted by Nebius streams. # TYPE nebius_tokens_total counter nebius_tokens_total{model="meta-llama/Llama-3.3-70B-Instruct",type="output"} 246.0 # HELP nebius_tokens_created Tokens emitted by Nebius streams. # TYPE nebius_tokens_created gauge nebius_tokens_created{model="meta-llama/Llama-3.3-70B-Instruct",type="output"} 1.7811436964060102e+09 # HELP nebius_request_duration_seconds Duration of Nebius chat completion requests. # TYPE nebius_request_duration_seconds histogram nebius_request_duration_seconds_bucket{le="0.1",model="meta-llama/Llama-3.3-70B-Instruct"} 0.0 nebius_request_duration_seconds_bucket{le="0.25",model="meta-llama/Llama-3.3-70B-Instruct"} 0.0 nebius_request_duration_seconds_bucket{le="0.5",model="meta-llama/Llama-3.3-70B-Instruct"} 0.0 nebius_request_duration_seconds_bucket{le="1.0",model="meta-llama/Llama-3.3-70B-Instruct"} 0.0 nebius_request_duration_seconds_bucket{le="2.5",model="meta-llama/Llama-3.3-70B-Instruct"} 1.0 nebius_request_duration_seconds_bucket{le="5.0",model="meta-llama/Llama-3.3-70B-Instruct"} 2.0 nebius_request_duration_seconds_bucket{le="10.0",model="meta-llama/Llama-3.3-70B-Instruct"} 2.0 nebius_request_duration_seconds_bucket{le="30.0",model="meta-llama/Llama-3.3-70B-Instruct"} 3.0 nebius_request_duration_seconds_bucket{le="60.0",model="meta-llama/Llama-3.3-70B-Instruct"} 3.0 nebius_request_duration_seconds_bucket{le="120.0",model="meta-llama/Llama-3.3-70B-Instruct"} 3.0 nebius_request_duration_seconds_bucket{le="+Inf",model="meta-llama/Llama-3.3-70B-Instruct"} 3.0 nebius_request_duration_seconds_count{model="meta-llama/Llama-3.3-70B-Instruct"} 3.0 nebius_request_duration_seconds_sum{model="meta-llama/Llama-3.3-70B-Instruct"} 15.86147633602377 # HELP nebius_request_duration_seconds_created Duration of Nebius chat completion requests. # TYPE nebius_request_duration_seconds_created gauge nebius_request_duration_seconds_created{model="meta-llama/Llama-3.3-70B-Instruct"} 1.7811436953300757e+09 # HELP agent_route_total Total agent requests by selected LangGraph route. # TYPE agent_route_total counter agent_route_total{route="direct"} 1.0 agent_route_total{route="deliberate"} 2.0 # HELP agent_route_created Total agent requests by selected LangGraph route. # TYPE agent_route_created gauge agent_route_created{route="direct"} 1.7811436953286612e+09 agent_route_created{route="deliberate"} 1.7811437150951903e+09 # HELP agent_first_token_seconds Time from agent start to first streamed token. # TYPE agent_first_token_seconds histogram agent_first_token_seconds_bucket{le="0.1",route="direct"} 0.0 agent_first_token_seconds_bucket{le="0.25",route="direct"} 0.0 agent_first_token_seconds_bucket{le="0.5",route="direct"} 0.0 agent_first_token_seconds_bucket{le="1.0",route="direct"} 0.0 agent_first_token_seconds_bucket{le="1.2",route="direct"} 1.0 agent_first_token_seconds_bucket{le="1.5",route="direct"} 1.0 agent_first_token_seconds_bucket{le="2.5",route="direct"} 1.0 agent_first_token_seconds_bucket{le="5.0",route="direct"} 1.0 agent_first_token_seconds_bucket{le="10.0",route="direct"} 1.0 agent_first_token_seconds_bucket{le="30.0",route="direct"} 1.0 agent_first_token_seconds_bucket{le="60.0",route="direct"} 1.0 agent_first_token_seconds_bucket{le="+Inf",route="direct"} 1.0 agent_first_token_seconds_count{route="direct"} 1.0 agent_first_token_seconds_sum{route="direct"} 1.0862026879913174 agent_first_token_seconds_bucket{le="0.1",route="deliberate"} 0.0 agent_first_token_seconds_bucket{le="0.25",route="deliberate"} 1.0 agent_first_token_seconds_bucket{le="0.5",route="deliberate"} 1.0 agent_first_token_seconds_bucket{le="1.0",route="deliberate"} 1.0 agent_first_token_seconds_bucket{le="1.2",route="deliberate"} 1.0 agent_first_token_seconds_bucket{le="1.5",route="deliberate"} 1.0 agent_first_token_seconds_bucket{le="2.5",route="deliberate"} 2.0 agent_first_token_seconds_bucket{le="5.0",route="deliberate"} 2.0 agent_first_token_seconds_bucket{le="10.0",route="deliberate"} 2.0 agent_first_token_seconds_bucket{le="30.0",route="deliberate"} 2.0 agent_first_token_seconds_bucket{le="60.0",route="deliberate"} 2.0 agent_first_token_seconds_bucket{le="+Inf",route="deliberate"} 2.0 agent_first_token_seconds_count{route="deliberate"} 2.0 agent_first_token_seconds_sum{route="deliberate"} 2.297571634000633 # HELP agent_first_token_seconds_created Time from agent start to first streamed token. # TYPE agent_first_token_seconds_created gauge agent_first_token_seconds_created{route="direct"} 1.7811436964060488e+09 agent_first_token_seconds_created{route="deliberate"} 1.7811437171559322e+09