refactor(tvix/store): use read_all_and_chunk in gRPC blobservice
This was the last piece of code using BlobWriter. We can also use `read_all_and_chunk`, it's just requires a bit more plumbing: - The data coming from the client (stream) needs to be mapped (we extract the .data field). - The stream needs to be turned into an (async) reader - The reader needs to be made sync, and that code using the sync reader needs to be in a `task::spawn_blocking`. Change-Id: I4e374e1a9f47d5a0933f59a8f5c121185a5f3e95 Reviewed-on: https://cl.tvl.fyi/c/depot/+/8260 Autosubmit: flokli <flokli@flokli.de> Reviewed-by: raitobezarius <tvl@lahfa.xyz> Tested-by: BuildkiteCI Reviewed-by: tazjin <tazjin@tvl.su>
This commit is contained in:
parent
7ffb2676ee
commit
c8bbddd5e5
4 changed files with 49 additions and 39 deletions
5
tvix/Cargo.lock
generated
5
tvix/Cargo.lock
generated
|
@ -2458,9 +2458,9 @@ dependencies = [
|
|||
|
||||
[[package]]
|
||||
name = "tokio-util"
|
||||
version = "0.7.4"
|
||||
version = "0.7.7"
|
||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||
checksum = "0bb2e075f03b3d66d8d8785356224ba688d2906a371015e225beeb65ca92c740"
|
||||
checksum = "5427d89453009325de0d8f342c9490009f76e999cb7672d77e46267448f7e6b2"
|
||||
dependencies = [
|
||||
"bytes",
|
||||
"futures-core",
|
||||
|
@ -2804,6 +2804,7 @@ dependencies = [
|
|||
"thiserror",
|
||||
"tokio",
|
||||
"tokio-stream",
|
||||
"tokio-util",
|
||||
"tonic",
|
||||
"tonic-build",
|
||||
"tonic-mock",
|
||||
|
|
|
@ -7004,9 +7004,9 @@ rec {
|
|||
};
|
||||
"tokio-util" = rec {
|
||||
crateName = "tokio-util";
|
||||
version = "0.7.4";
|
||||
version = "0.7.7";
|
||||
edition = "2018";
|
||||
sha256 = "0h67jb56bsxy4pi1a41pda8d52569ci5clvqv3c6cg9vy1sy1chb";
|
||||
sha256 = "1cp6yx4789j6gvbp4xnbk7lpd7q0j2a2qd4g1pg2b4q0afadh9sl";
|
||||
authors = [
|
||||
"Tokio Contributors <team@tokio.rs>"
|
||||
];
|
||||
|
@ -7062,7 +7062,7 @@ rec {
|
|||
"time" = [ "tokio/time" "slab" ];
|
||||
"tracing" = [ "dep:tracing" ];
|
||||
};
|
||||
resolvedDefaultFeatures = [ "codec" "default" "tracing" ];
|
||||
resolvedDefaultFeatures = [ "codec" "default" "io" "io-util" "tracing" ];
|
||||
};
|
||||
"toml" = rec {
|
||||
crateName = "toml";
|
||||
|
@ -8356,6 +8356,11 @@ rec {
|
|||
name = "tokio-stream";
|
||||
packageId = "tokio-stream";
|
||||
}
|
||||
{
|
||||
name = "tokio-util";
|
||||
packageId = "tokio-util";
|
||||
features = [ "io" "io-util" ];
|
||||
}
|
||||
{
|
||||
name = "tonic";
|
||||
packageId = "tonic";
|
||||
|
|
|
@ -26,6 +26,7 @@ tonic = "0.8.2"
|
|||
tracing = "0.1.37"
|
||||
tracing-subscriber = { version = "0.3.16", features = ["json"] }
|
||||
walkdir = "2.3.2"
|
||||
tokio-util = { version = "0.7.7", features = ["io", "io-util"] }
|
||||
|
||||
[dependencies.tonic-reflection]
|
||||
optional = true
|
||||
|
|
|
@ -1,14 +1,15 @@
|
|||
use std::collections::VecDeque;
|
||||
|
||||
use crate::{
|
||||
blobservice::BlobService,
|
||||
chunkservice::{update_hasher, ChunkService},
|
||||
chunkservice::{read_all_and_chunk, update_hasher, ChunkService},
|
||||
Error,
|
||||
};
|
||||
use data_encoding::BASE64;
|
||||
use std::io::{BufWriter, Write};
|
||||
use tokio::{sync::mpsc::channel, task};
|
||||
use tokio_stream::wrappers::ReceiverStream;
|
||||
use tokio_stream::{wrappers::ReceiverStream, StreamExt};
|
||||
use tonic::{async_trait, Request, Response, Status, Streaming};
|
||||
use tracing::{debug, error, instrument, warn};
|
||||
use tracing::{debug, instrument, warn};
|
||||
|
||||
pub struct GRPCBlobServiceWrapper<BS: BlobService, CS: ChunkService> {
|
||||
blob_service: BS,
|
||||
|
@ -163,38 +164,40 @@ impl<
|
|||
&self,
|
||||
request: Request<Streaming<super::BlobChunk>>,
|
||||
) -> Result<Response<super::PutBlobResponse>, Status> {
|
||||
let mut req_inner = request.into_inner();
|
||||
let req_inner = request.into_inner();
|
||||
|
||||
// instantiate a [BlobWriter] to write all data received with a client,
|
||||
// but wrap it in a pretty large (1MiB) [BufWriter] to prevent
|
||||
// excessive useless chunk attempts.
|
||||
let mut blob_writer = crate::BlobWriter::new(&self.chunk_service);
|
||||
{
|
||||
let mut blob_writer_buffered = BufWriter::with_capacity(1024 * 1024, &mut blob_writer);
|
||||
let data_stream = req_inner.map(|x| {
|
||||
x.map(|x| VecDeque::from(x.data))
|
||||
.map_err(|e| std::io::Error::new(std::io::ErrorKind::InvalidInput, e))
|
||||
});
|
||||
|
||||
// receive data from the client, and write them all to the blob_writer.
|
||||
while let Some(blob_chunk) = req_inner.message().await? {
|
||||
if let Err(e) = blob_writer_buffered.write_all(&blob_chunk.data) {
|
||||
error!(e=%e,"unable to write blob data");
|
||||
return Err(Status::internal("unable to write blob data"));
|
||||
}
|
||||
}
|
||||
blob_writer_buffered.flush()?;
|
||||
}
|
||||
let data_reader = tokio_util::io::StreamReader::new(data_stream);
|
||||
|
||||
// run finalize
|
||||
let (blob_digest, blob_meta) = blob_writer
|
||||
.finalize()
|
||||
.map_err(|_| Status::internal("unable to finalize blob"))?;
|
||||
// TODO: can we get rid of this clone?
|
||||
let chunk_service = self.chunk_service.clone();
|
||||
|
||||
// check if we have the received blob in the [BlobService] already.
|
||||
let resp = self.blob_service.stat(&super::StatBlobRequest {
|
||||
let (blob_digest, blob_meta) =
|
||||
task::spawn_blocking(move || -> Result<(Vec<u8>, super::BlobMeta), Error> {
|
||||
// feed read_all_and_chunk a (sync) reader to the data retrieved from the stream.
|
||||
read_all_and_chunk(
|
||||
&chunk_service,
|
||||
tokio_util::io::SyncIoBridge::new(data_reader),
|
||||
)
|
||||
})
|
||||
.await
|
||||
.map_err(|e| Status::internal(e.to_string()))??;
|
||||
|
||||
// upload blobmeta if not there yet
|
||||
if self
|
||||
.blob_service
|
||||
.stat(&super::StatBlobRequest {
|
||||
digest: blob_digest.to_vec(),
|
||||
..Default::default()
|
||||
})?;
|
||||
|
||||
// if not, store.
|
||||
if resp.is_none() {
|
||||
include_chunks: false,
|
||||
include_bao: false,
|
||||
})?
|
||||
.is_none()
|
||||
{
|
||||
// upload blobmeta
|
||||
self.blob_service.put(&blob_digest, blob_meta)?;
|
||||
}
|
||||
|
||||
|
|
Loading…
Reference in a new issue