@@ -21,7 +21,7 @@ use axum::response::sse::{Event, KeepAlive, Sse};
21
21
use axum:: response:: { IntoResponse , Response } ;
22
22
use axum:: routing:: { get, post} ;
23
23
use axum:: { http, Json , Router } ;
24
- use axum_tracing_opentelemetry:: middleware:: OtelAxumLayer ;
24
+ use axum_tracing_opentelemetry:: middleware:: { OtelAxumLayer , OtelInResponseLayer } ;
25
25
use clap:: error;
26
26
use futures:: stream:: StreamExt ;
27
27
use futures:: Stream ;
@@ -30,6 +30,7 @@ use metrics_exporter_prometheus::{Matcher, PrometheusBuilder, PrometheusHandle};
30
30
use once_cell:: sync:: OnceCell ;
31
31
use reqwest_middleware:: { ClientBuilder , ClientWithMiddleware } ;
32
32
use reqwest_retry:: { policies:: ExponentialBackoff , RetryTransientMiddleware } ;
33
+ use reqwest:: Client ;
33
34
use std:: convert:: Infallible ;
34
35
use std:: net:: SocketAddr ;
35
36
use std:: sync:: atomic:: AtomicBool ;
@@ -960,7 +961,7 @@ async fn request_logger(
960
961
tracing:: info!( "Request logging enabled, sending logs to {url_string}" ) ;
961
962
962
963
let retry_policy = ExponentialBackoff :: builder ( ) . build_with_max_retries ( 3 ) ;
963
- let client = ClientBuilder :: new ( reqwest :: Client :: new ( ) )
964
+ let client = ClientBuilder :: new ( Client :: new ( ) )
964
965
. with ( RetryTransientMiddleware :: new_with_policy ( retry_policy) )
965
966
. build ( ) ;
966
967
while let Some ( ( tokens, api_token, model_id) ) = rx. recv ( ) . await {
@@ -1256,6 +1257,7 @@ pub async fn run(
1256
1257
. layer ( Extension ( infer) )
1257
1258
. layer ( Extension ( prom_handle. clone ( ) ) )
1258
1259
. layer ( OtelAxumLayer :: default ( ) )
1260
+ . layer ( OtelInResponseLayer :: default ( ) )
1259
1261
. layer ( cors_layer)
1260
1262
. layer ( Extension ( cloned_tokenizer) ) ;
1261
1263
0 commit comments