vector/sources/util/grpc/decompression.rs
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377
use std::{
cmp,
io::Write,
mem,
pin::Pin,
task::{Context, Poll},
};
use bytes::{Buf, BufMut, BytesMut};
use flate2::write::GzDecoder;
use futures_util::FutureExt;
use http::{Request, Response};
use hyper::{
body::{HttpBody, Sender},
Body,
};
use std::future::Future;
use tokio::{pin, select};
use tonic::{body::BoxBody, metadata::AsciiMetadataValue, Status};
use tower::{Layer, Service};
use vector_lib::internal_event::{
ByteSize, BytesReceived, InternalEventHandle as _, Protocol, Registered,
};
use crate::internal_events::{GrpcError, GrpcInvalidCompressionSchemeError};
// Every gRPC message has a five byte header:
// - a compressed flag (u8, 0/1 for compressed/decompressed)
// - a length prefix, indicating the number of remaining bytes to read (u32)
const GRPC_MESSAGE_HEADER_LEN: usize = mem::size_of::<u8>() + mem::size_of::<u32>();
const GRPC_ENCODING_HEADER: &str = "grpc-encoding";
const GRPC_ACCEPT_ENCODING_HEADER: &str = "grpc-accept-encoding";
enum CompressionScheme {
Gzip,
}
impl CompressionScheme {
fn from_encoding_header(req: &Request<Body>) -> Result<Option<Self>, Status> {
req.headers()
.get(GRPC_ENCODING_HEADER)
.map(|s| {
s.to_str().map(|s| s.to_string()).map_err(|_| {
Status::unimplemented(format!(
"`{}` contains non-visible characters and is not a valid encoding",
GRPC_ENCODING_HEADER
))
})
})
.transpose()
.and_then(|value| match value {
None => Ok(None),
Some(scheme) => match scheme.as_str() {
"gzip" => Ok(Some(CompressionScheme::Gzip)),
other => Err(Status::unimplemented(format!(
"compression scheme `{}` is not supported",
other
))),
},
})
.map_err(|mut status| {
status.metadata_mut().insert(
GRPC_ACCEPT_ENCODING_HEADER,
AsciiMetadataValue::from_static("gzip,identity"),
);
status
})
}
}
enum State {
WaitingForHeader,
Forward { overall_len: usize },
Decompress { remaining: usize },
}
impl Default for State {
fn default() -> Self {
Self::WaitingForHeader
}
}
fn new_decompressor() -> GzDecoder<Vec<u8>> {
// Create the backing buffer for the decompressor and set the compression flag to false (0) and pre-allocate
// the space for the length prefix, which we'll fill out once we've finalized the decompressor.
let buf = vec![0; GRPC_MESSAGE_HEADER_LEN];
GzDecoder::new(buf)
}
async fn drive_body_decompression(
mut source: Body,
mut destination: Sender,
) -> Result<usize, Status> {
let mut state = State::default();
let mut buf = BytesMut::new();
let mut decompressor = None;
let mut bytes_received = 0;
// Drain all message chunks from the body first.
while let Some(result) = source.data().await {
let chunk = result.map_err(|_| Status::internal("failed to read from underlying body"))?;
buf.put(chunk);
let maybe_message = loop {
match state {
State::WaitingForHeader => {
// If we don't have enough data yet to even read the gRPC message header, we can't do anything yet.
if buf.len() < GRPC_MESSAGE_HEADER_LEN {
break None;
}
// Extract the compressed flag and length prefix.
let (is_compressed, message_len) = {
let header = &buf[..GRPC_MESSAGE_HEADER_LEN];
let message_len_raw: u32 = header[1..]
.try_into()
.map(u32::from_be_bytes)
.expect("there must be four bytes remaining in the header slice");
let message_len = message_len_raw
.try_into()
.expect("Vector does not support 16-bit platforms");
(header[0] == 1, message_len)
};
// Now, if the message is not compressed, then put ourselves into forward mode, where we'll wait for
// the rest of the message to come in -- decoding isn't streaming so there's no benefit there --
// before we emit it.
//
// If the message _is_ compressed, we do roughly the same thing but we shove it into the
// decompressor incrementally because there's no good reason to make both the internal buffer and
// the decompressor buffer expand if we don't have to.
if is_compressed {
// We skip the header in the buffer because it doesn't matter to the decompressor and we
// recreate it anyways.
buf.advance(GRPC_MESSAGE_HEADER_LEN);
state = State::Decompress {
remaining: message_len,
};
} else {
let overall_len = GRPC_MESSAGE_HEADER_LEN + message_len;
state = State::Forward { overall_len };
}
}
State::Forward { overall_len } => {
// All we're doing at this point is waiting until we have all the bytes for the current gRPC message
// before we emit them to the caller.
if buf.len() < overall_len {
break None;
}
// Now that we have all the bytes we need, slice them out of our internal buffer, reset our state,
// and hand the message back to the caller.
let message = buf.split_to(overall_len).freeze();
state = State::WaitingForHeader;
bytes_received += overall_len;
break Some(message);
}
State::Decompress { ref mut remaining } => {
if *remaining > 0 {
// We're waiting for `remaining` more bytes to feed to the decompressor before we finalize it and
// generate our new chunk of data. We might have data in our internal buffer, so try and drain that
// first before polling the underlying body for more.
let available = buf.len();
if available > 0 {
// Write the lesser of what the buffer has, or what is remaining for the current message, into
// the decompressor. This is _technically_ synchronous but there's really no way to do it
// asynchronously since we already have the data, and that's the only asynchronous part.
let to_take = cmp::min(available, *remaining);
let decompressor = decompressor.get_or_insert_with(new_decompressor);
if decompressor.write_all(&buf[..to_take]).is_err() {
return Err(Status::internal("failed to write to decompressor"));
}
*remaining -= to_take;
buf.advance(to_take);
} else {
break None;
}
} else {
// We don't need any more data, so consume the decompressor, finalize it by updating the length
// prefix, and then pass it back to the caller.
let result = decompressor
.take()
.expect("consumed decompressor when no decompressor was present")
.finish();
// The only I/O errors that occur during `finish` should be I/O errors from writing to the internal
// buffer, but `Vec<T>` is infallible in this regard, so this should be impossible without having
// first panicked due to memory exhaustion.
let mut buf = result.map_err(|_| {
Status::internal(
"reached impossible error during decompressor finalization",
)
})?;
bytes_received += buf.len();
// Write the length of our decompressed message in the pre-allocated slot for the message's length prefix.
let message_len_actual = buf.len() - GRPC_MESSAGE_HEADER_LEN;
let message_len = u32::try_from(message_len_actual).map_err(|_| {
Status::out_of_range("messages greater than 4GB are not supported")
})?;
let message_len_bytes = message_len.to_be_bytes();
let message_len_slot = &mut buf[1..GRPC_MESSAGE_HEADER_LEN];
message_len_slot.copy_from_slice(&message_len_bytes[..]);
// Reset our state before returning the decompressed message.
state = State::WaitingForHeader;
break Some(buf.into());
}
}
}
};
if let Some(message) = maybe_message {
// We got a decompressed (or passthrough) message chunk, so just forward it to the destination.
if destination.send_data(message).await.is_err() {
return Err(Status::internal("destination body abnormally closed"));
}
}
}
// When we've exhausted all the message chunks, we try sending any trailers that came in on the underlying body.
let result = source.trailers().await;
let maybe_trailers =
result.map_err(|_| Status::internal("error reading trailers from underlying body"))?;
if let Some(trailers) = maybe_trailers {
if destination.send_trailers(trailers).await.is_err() {
return Err(Status::internal("destination body abnormally closed"));
}
}
Ok(bytes_received)
}
async fn drive_request<F, E>(
source: Body,
destination: Sender,
inner: F,
bytes_received: Registered<BytesReceived>,
) -> Result<Response<BoxBody>, E>
where
F: Future<Output = Result<Response<BoxBody>, E>>,
E: std::fmt::Display,
{
let body_decompression = drive_body_decompression(source, destination);
pin!(inner);
pin!(body_decompression);
let mut body_eof = false;
let mut body_bytes_received = 0;
let result = loop {
select! {
biased;
// Drive the inner future, as this will be consuming the message chunks we give it.
result = &mut inner => break result,
// Drive the core decompression loop, reading chunks from the underlying body, decompressing them if needed,
// and eventually handling trailers at the end, if they're present.
result = &mut body_decompression, if !body_eof => match result {
Err(e) => break Ok(e.to_http()),
Ok(bytes_received) => {
body_bytes_received = bytes_received;
body_eof = true;
},
}
}
};
// If the response indicates success, then emit the necessary metrics
// otherwise emit the error.
match &result {
Ok(res) if res.status().is_success() => {
bytes_received.emit(ByteSize(body_bytes_received));
}
Ok(res) => {
emit!(GrpcError {
error: format!("Received {}", res.status())
});
}
Err(error) => {
emit!(GrpcError { error: &error });
}
};
result
}
#[derive(Clone)]
pub struct DecompressionAndMetrics<S> {
inner: S,
bytes_received: Registered<BytesReceived>,
}
impl<S> Service<Request<Body>> for DecompressionAndMetrics<S>
where
S: Service<Request<Body>, Response = Response<BoxBody>> + Clone + Send + 'static,
S::Future: Send + 'static,
S::Error: std::fmt::Display,
{
type Response = Response<BoxBody>;
type Error = S::Error;
type Future = Pin<Box<dyn Future<Output = Result<Self::Response, Self::Error>> + Send>>;
fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
self.inner.poll_ready(cx)
}
fn call(&mut self, req: Request<Body>) -> Self::Future {
match CompressionScheme::from_encoding_header(&req) {
// There was a header for the encoding, but it was either invalid data or a scheme we don't support.
Err(status) => {
emit!(GrpcInvalidCompressionSchemeError { status: &status });
Box::pin(async move { Ok(status.to_http()) })
}
// The request either isn't using compression, or it has indicated compression may be used and we know we
// can support decompression based on the indicated compression scheme... so wrap the body to decompress, if
// need be, and then track the bytes that flowed through.
//
// TODO: Actually use the scheme given back to us to support other compression schemes.
Ok(_) => {
let (destination, decompressed_body) = Body::channel();
let (req_parts, req_body) = req.into_parts();
let mapped_req = Request::from_parts(req_parts, decompressed_body);
let inner = self.inner.call(mapped_req);
drive_request(req_body, destination, inner, self.bytes_received.clone()).boxed()
}
}
}
}
/// A layer for decompressing Tonic request payloads and emitting telemetry for the payload sizes.
///
/// In some cases, we configure `tonic` to use compression on requests to save CPU and throughput when sending those
/// large requests. In the case of Vector-to-Vector communication, this means the Vector v2 source may deal with
/// compressed requests. The code already transparently handles decompression, but as part of our component
/// specification, we have specific goals around what event representations we pay attention to.
///
/// In the case of tracking bytes sent/received, we always want to track the number of bytes received _after_
/// decompression to faithfully represent the amount of data being processed by Vector. This poses a problem with the
/// out-of-the-box `tonic` codegen as there is no hook whatsoever to inspect the raw request payload (after
/// decompression, if it was compressed at all) prior to the payload being decoded as a Protocol Buffers payload.
///
/// This layer wraps the incoming body in our own body type, which allows us to do two things: decompress the payload
/// before it enters the decoding phase, and emit metrics based on the decompressed payload.
///
/// Since we can see the decompressed bytes, and also know if the underlying service responded successfully -- i.e. the
/// request was valid, and was processed -- we can now report the number of bytes (after decompression) that were
/// received _and_ processed correctly.
///
/// The only supported compression scheme is gzip, which is also the only supported compression scheme in `tonic` itself.
#[derive(Clone, Default)]
pub struct DecompressionAndMetricsLayer;
impl<S> Layer<S> for DecompressionAndMetricsLayer {
type Service = DecompressionAndMetrics<S>;
fn layer(&self, inner: S) -> Self::Service {
DecompressionAndMetrics {
inner,
bytes_received: register!(BytesReceived::from(Protocol::from("grpc"))),
}
}
}