# HELP python_gc_objects_collected_total Objects collected during gc # TYPE python_gc_objects_collected_total counter python_gc_objects_collected_total{generation="0"} 17765.0 python_gc_objects_collected_total{generation="1"} 1951.0 python_gc_objects_collected_total{generation="2"} 20.0 # HELP python_gc_objects_uncollectable_total Uncollectable objects found during GC # TYPE python_gc_objects_uncollectable_total counter python_gc_objects_uncollectable_total{generation="0"} 0.0 python_gc_objects_uncollectable_total{generation="1"} 0.0 python_gc_objects_uncollectable_total{generation="2"} 0.0 # HELP python_gc_collections_total Number of times this generation was collected # TYPE python_gc_collections_total counter python_gc_collections_total{generation="0"} 693.0 python_gc_collections_total{generation="1"} 62.0 python_gc_collections_total{generation="2"} 5.0 # HELP python_info Python platform information # TYPE python_info gauge python_info{implementation="CPython",major="3",minor="12",patchlevel="13",version="3.12.13"} 1.0 # HELP process_virtual_memory_bytes Virtual memory size in bytes. # TYPE process_virtual_memory_bytes gauge process_virtual_memory_bytes 1.1964416e+09 # HELP process_resident_memory_bytes Resident memory size in bytes. # TYPE process_resident_memory_bytes gauge process_resident_memory_bytes 3.0148608e+08 # HELP process_start_time_seconds Start time of the process since unix epoch in seconds. # TYPE process_start_time_seconds gauge process_start_time_seconds 1.77308360706e+09 # HELP process_cpu_seconds_total Total user and system CPU time spent in seconds. # TYPE process_cpu_seconds_total counter process_cpu_seconds_total 10.31 # HELP process_open_fds Number of open file descriptors. # TYPE process_open_fds gauge process_open_fds 26.0 # HELP process_max_fds Maximum number of open file descriptors. # TYPE process_max_fds gauge process_max_fds 65536.0 # HELP ai_chat_requests_total Total chat requests # TYPE ai_chat_requests_total counter ai_chat_requests_total{brand="ruay",channel="bxlivechat",persona="customer"} 7.0 ai_chat_requests_total{brand="lotto",channel="bxlivechat",persona="cusromer_l"} 4.0 # HELP ai_chat_requests_created Total chat requests # TYPE ai_chat_requests_created gauge ai_chat_requests_created{brand="ruay",channel="bxlivechat",persona="customer"} 1.7730836558339248e+09 ai_chat_requests_created{brand="lotto",channel="bxlivechat",persona="cusromer_l"} 1.773083765137073e+09 # HELP ai_chat_errors_total Chat errors # TYPE ai_chat_errors_total counter # HELP ai_tool_calls_total Tool calls # TYPE ai_tool_calls_total counter ai_tool_calls_total{success="False",tool="web_r.find_bet_result"} 3.0 ai_tool_calls_total{success="True",tool="web_r.get_user_info_by_userdomain2"} 2.0 ai_tool_calls_total{success="True",tool="web_r.get_user_statement"} 5.0 ai_tool_calls_total{success="True",tool="web_r.get_user_finance"} 1.0 # HELP ai_tool_calls_created Tool calls # TYPE ai_tool_calls_created gauge ai_tool_calls_created{success="False",tool="web_r.find_bet_result"} 1.7730838178378322e+09 ai_tool_calls_created{success="True",tool="web_r.get_user_info_by_userdomain2"} 1.7730838193112257e+09 ai_tool_calls_created{success="True",tool="web_r.get_user_statement"} 1.7730838209021175e+09 ai_tool_calls_created{success="True",tool="web_r.get_user_finance"} 1.7730838246518042e+09 # HELP ai_handoffs_total Handoffs to human # TYPE ai_handoffs_total counter ai_handoffs_total{brand="ruay",reason="repeated_question"} 2.0 # HELP ai_handoffs_created Handoffs to human # TYPE ai_handoffs_created gauge ai_handoffs_created{brand="ruay",reason="repeated_question"} 1.7730839143063452e+09 # HELP ai_cache_hits_total Response cache hits # TYPE ai_cache_hits_total counter # HELP ai_injection_blocked_total Prompt injections blocked # TYPE ai_injection_blocked_total counter ai_injection_blocked_total 0.0 # HELP ai_injection_blocked_created Prompt injections blocked # TYPE ai_injection_blocked_created gauge ai_injection_blocked_created 1.7730836102514215e+09 # HELP ai_chat_latency_seconds Chat response latency # TYPE ai_chat_latency_seconds histogram ai_chat_latency_seconds_bucket{brand="ruay",le="0.5"} 0.0 ai_chat_latency_seconds_bucket{brand="ruay",le="1.0"} 0.0 ai_chat_latency_seconds_bucket{brand="ruay",le="2.0"} 0.0 ai_chat_latency_seconds_bucket{brand="ruay",le="5.0"} 3.0 ai_chat_latency_seconds_bucket{brand="ruay",le="10.0"} 3.0 ai_chat_latency_seconds_bucket{brand="ruay",le="30.0"} 7.0 ai_chat_latency_seconds_bucket{brand="ruay",le="+Inf"} 7.0 ai_chat_latency_seconds_count{brand="ruay"} 7.0 ai_chat_latency_seconds_sum{brand="ruay"} 68.7302517620119 ai_chat_latency_seconds_bucket{brand="lotto",le="0.5"} 0.0 ai_chat_latency_seconds_bucket{brand="lotto",le="1.0"} 0.0 ai_chat_latency_seconds_bucket{brand="lotto",le="2.0"} 4.0 ai_chat_latency_seconds_bucket{brand="lotto",le="5.0"} 4.0 ai_chat_latency_seconds_bucket{brand="lotto",le="10.0"} 4.0 ai_chat_latency_seconds_bucket{brand="lotto",le="30.0"} 4.0 ai_chat_latency_seconds_bucket{brand="lotto",le="+Inf"} 4.0 ai_chat_latency_seconds_count{brand="lotto"} 4.0 ai_chat_latency_seconds_sum{brand="lotto"} 5.599602792004589 # HELP ai_chat_latency_seconds_created Chat response latency # TYPE ai_chat_latency_seconds_created gauge ai_chat_latency_seconds_created{brand="ruay"} 1.773083667785145e+09 ai_chat_latency_seconds_created{brand="lotto"} 1.7730837667829583e+09 # HELP ai_llm_latency_seconds LLM call latency # TYPE ai_llm_latency_seconds histogram ai_llm_latency_seconds_bucket{le="0.5",model="gpt-4o"} 0.0 ai_llm_latency_seconds_bucket{le="1.0",model="gpt-4o"} 4.0 ai_llm_latency_seconds_bucket{le="2.0",model="gpt-4o"} 7.0 ai_llm_latency_seconds_bucket{le="5.0",model="gpt-4o"} 9.0 ai_llm_latency_seconds_bucket{le="10.0",model="gpt-4o"} 9.0 ai_llm_latency_seconds_bucket{le="+Inf",model="gpt-4o"} 9.0 ai_llm_latency_seconds_count{model="gpt-4o"} 9.0 ai_llm_latency_seconds_sum{model="gpt-4o"} 14.1517 # HELP ai_llm_latency_seconds_created LLM call latency # TYPE ai_llm_latency_seconds_created gauge ai_llm_latency_seconds_created{model="gpt-4o"} 1.7730837667629566e+09 # HELP ai_tool_latency_seconds Tool call latency # TYPE ai_tool_latency_seconds histogram ai_tool_latency_seconds_bucket{le="0.1",tool="web_r.find_bet_result"} 3.0 ai_tool_latency_seconds_bucket{le="0.5",tool="web_r.find_bet_result"} 3.0 ai_tool_latency_seconds_bucket{le="1.0",tool="web_r.find_bet_result"} 3.0 ai_tool_latency_seconds_bucket{le="2.0",tool="web_r.find_bet_result"} 3.0 ai_tool_latency_seconds_bucket{le="5.0",tool="web_r.find_bet_result"} 3.0 ai_tool_latency_seconds_bucket{le="+Inf",tool="web_r.find_bet_result"} 3.0 ai_tool_latency_seconds_count{tool="web_r.find_bet_result"} 3.0 ai_tool_latency_seconds_sum{tool="web_r.find_bet_result"} 0.2611 ai_tool_latency_seconds_bucket{le="0.1",tool="web_r.get_user_info_by_userdomain2"} 2.0 ai_tool_latency_seconds_bucket{le="0.5",tool="web_r.get_user_info_by_userdomain2"} 2.0 ai_tool_latency_seconds_bucket{le="1.0",tool="web_r.get_user_info_by_userdomain2"} 2.0 ai_tool_latency_seconds_bucket{le="2.0",tool="web_r.get_user_info_by_userdomain2"} 2.0 ai_tool_latency_seconds_bucket{le="5.0",tool="web_r.get_user_info_by_userdomain2"} 2.0 ai_tool_latency_seconds_bucket{le="+Inf",tool="web_r.get_user_info_by_userdomain2"} 2.0 ai_tool_latency_seconds_count{tool="web_r.get_user_info_by_userdomain2"} 2.0 ai_tool_latency_seconds_sum{tool="web_r.get_user_info_by_userdomain2"} 0.1109 ai_tool_latency_seconds_bucket{le="0.1",tool="web_r.get_user_statement"} 0.0 ai_tool_latency_seconds_bucket{le="0.5",tool="web_r.get_user_statement"} 0.0 ai_tool_latency_seconds_bucket{le="1.0",tool="web_r.get_user_statement"} 5.0 ai_tool_latency_seconds_bucket{le="2.0",tool="web_r.get_user_statement"} 5.0 ai_tool_latency_seconds_bucket{le="5.0",tool="web_r.get_user_statement"} 5.0 ai_tool_latency_seconds_bucket{le="+Inf",tool="web_r.get_user_statement"} 5.0 ai_tool_latency_seconds_count{tool="web_r.get_user_statement"} 5.0 ai_tool_latency_seconds_sum{tool="web_r.get_user_statement"} 3.7711 ai_tool_latency_seconds_bucket{le="0.1",tool="web_r.get_user_finance"} 1.0 ai_tool_latency_seconds_bucket{le="0.5",tool="web_r.get_user_finance"} 1.0 ai_tool_latency_seconds_bucket{le="1.0",tool="web_r.get_user_finance"} 1.0 ai_tool_latency_seconds_bucket{le="2.0",tool="web_r.get_user_finance"} 1.0 ai_tool_latency_seconds_bucket{le="5.0",tool="web_r.get_user_finance"} 1.0 ai_tool_latency_seconds_bucket{le="+Inf",tool="web_r.get_user_finance"} 1.0 ai_tool_latency_seconds_count{tool="web_r.get_user_finance"} 1.0 ai_tool_latency_seconds_sum{tool="web_r.get_user_finance"} 0.045200000000000004 # HELP ai_tool_latency_seconds_created Tool call latency # TYPE ai_tool_latency_seconds_created gauge ai_tool_latency_seconds_created{tool="web_r.find_bet_result"} 1.7730838178378613e+09 ai_tool_latency_seconds_created{tool="web_r.get_user_info_by_userdomain2"} 1.7730838193112683e+09 ai_tool_latency_seconds_created{tool="web_r.get_user_statement"} 1.7730838209021447e+09 ai_tool_latency_seconds_created{tool="web_r.get_user_finance"} 1.7730838246518316e+09 # HELP ai_active_sessions Active sessions # TYPE ai_active_sessions gauge # HELP ai_active_websockets Active WebSocket connections # TYPE ai_active_websockets gauge ai_active_websockets 0.0 # HELP ai_queue_size Message queue size # TYPE ai_queue_size gauge ai_queue_size 0.0 # HELP ai_llm_cost_today_usd LLM cost today in USD # TYPE ai_llm_cost_today_usd gauge ai_llm_cost_today_usd 0.0 # HELP ai_circuit_breaker_state Circuit breaker state (0=closed, 1=open, 2=half_open) # TYPE ai_circuit_breaker_state gauge