@@ -413,7 +413,7 @@ static_resources:
# File access logger for this listener. The updated ("+") format line ends with
# attempts=%UPSTREAM_REQUEST_ATTEMPT_COUNT% so each log entry also records how
# many upstream attempts were made for the request (see Envoy access-log docs).
413413 " @type " : type.googleapis.com/envoy.extensions.access_loggers.file.v3.FileAccessLog
414414 path : " /var/log/access_llm.log"
415415 format : |
416- [%START_TIME%] "%REQ(:METHOD)% %REQ(X-ENVOY-ORIGINAL-PATH?:PATH)% %PROTOCOL%" %RESPONSE_CODE% %RESPONSE_FLAGS% %BYTES_RECEIVED% %BYTES_SENT% %DURATION% %RESP(X-ENVOY-UPSTREAM-SERVICE-TIME)% "%REQ(X-FORWARDED-FOR)%" "%REQ(USER-AGENT)%" "%REQ(X-REQUEST-ID)%" "%REQ(:AUTHORITY)%" "%UPSTREAM_HOST%" "%UPSTREAM_CLUSTER%"
416+ [%START_TIME%] "%REQ(:METHOD)% %REQ(X-ENVOY-ORIGINAL-PATH?:PATH)% %PROTOCOL%" %RESPONSE_CODE% %RESPONSE_FLAGS% %BYTES_RECEIVED% %BYTES_SENT% %DURATION% %RESP(X-ENVOY-UPSTREAM-SERVICE-TIME)% "%REQ(X-FORWARDED-FOR)%" "%REQ(USER-AGENT)%" "%REQ(X-REQUEST-ID)%" "%REQ(:AUTHORITY)%" "%UPSTREAM_HOST%" "%UPSTREAM_CLUSTER%" attempts=%UPSTREAM_REQUEST_ATTEMPT_COUNT%
417417 route_config :
418418 name : local_routes
419419 virtual_hosts :
@@ -534,7 +534,7 @@ static_resources:
# File access logger for this listener. The updated ("+") format line ends with
# attempts=%UPSTREAM_REQUEST_ATTEMPT_COUNT% so each log entry also records how
# many upstream attempts were made for the request (see Envoy access-log docs).
534534 " @type " : type.googleapis.com/envoy.extensions.access_loggers.file.v3.FileAccessLog
535535 path : " /var/log/access_llm.log"
536536 format : |
537- [%START_TIME%] "%REQ(:METHOD)% %REQ(X-ENVOY-ORIGINAL-PATH?:PATH)% %PROTOCOL%" %RESPONSE_CODE% %RESPONSE_FLAGS% %BYTES_RECEIVED% %BYTES_SENT% %DURATION% %RESP(X-ENVOY-UPSTREAM-SERVICE-TIME)% "%REQ(X-FORWARDED-FOR)%" "%REQ(USER-AGENT)%" "%REQ(X-REQUEST-ID)%" "%REQ(:AUTHORITY)%" "%UPSTREAM_HOST%" "%UPSTREAM_CLUSTER%"
537+ [%START_TIME%] "%REQ(:METHOD)% %REQ(X-ENVOY-ORIGINAL-PATH?:PATH)% %PROTOCOL%" %RESPONSE_CODE% %RESPONSE_FLAGS% %BYTES_RECEIVED% %BYTES_SENT% %DURATION% %RESP(X-ENVOY-UPSTREAM-SERVICE-TIME)% "%REQ(X-FORWARDED-FOR)%" "%REQ(USER-AGENT)%" "%REQ(X-REQUEST-ID)%" "%REQ(:AUTHORITY)%" "%UPSTREAM_HOST%" "%UPSTREAM_CLUSTER%" attempts=%UPSTREAM_REQUEST_ATTEMPT_COUNT%
538538 route_config :
539539 name : local_routes
540540 virtual_hosts :
@@ -559,6 +559,16 @@ static_resources:
559559 auto_host_rewrite : true
560560 cluster : {{ llm_cluster_name }}
561561 timeout : 300s
562+ {% if llm_gateway_listener.max_retries %}
# Optional retry policy for this route: rendered only when
# llm_gateway_listener.max_retries is set to a truthy (non-zero) value, which
# is then used verbatim as num_retries.
# NOTE(review): retries re-send the request to the LLM upstream; confirm that
# repeating a request after a 5xx/reset is acceptable for these endpoints.
563+ retry_policy :
# NOTE(review): Envoy documents "5xx" as already matching every 5xx response,
# so 429 looks like the only code that retriable-status-codes adds here -- confirm.
564+ retry_on : " 5xx,connect-failure,refused-stream,reset,retriable-status-codes"
565+ num_retries : {{ llm_gateway_listener.max_retries }}
# Per-attempt limit of 30s, versus the 300s route-level timeout set just above.
# NOTE(review): confirm slow (non-streaming) completions can start responding
# within 30s, otherwise they would time out and be retried.
566+ per_try_timeout : 30s
567+ retriable_status_codes : [429, 500, 502, 503, 504]
# Back-off between attempts is bounded by base_interval and max_interval.
568+ retry_back_off :
569+ base_interval : 0.5s
570+ max_interval : 5s
571+ {% endif %}
562572 {% endfor %}
563573 - match :
564574 prefix : " /"
0 commit comments