feat(tvix/store): implement PathInfoService with sled

This uses [sled](https://github.com/spacejam/sled) to store PathInfo
objects.

Change-Id: I12e8032e5562af8f884efa23a78049fd1108fdbc
Reviewed-on: https://cl.tvl.fyi/c/depot/+/7726
Reviewed-by: tazjin <tazjin@tvl.su>
Tested-by: BuildkiteCI
This commit is contained in:
Florian Klink 2022-12-29 21:39:28 +01:00 committed by flokli
parent cfa42fd19a
commit 43f6aec384
9 changed files with 652 additions and 40 deletions

View file

@ -1,35 +0,0 @@
use crate::proto::path_info_service_server::PathInfoService;
use crate::proto::CalculateNarResponse;
use crate::proto::GetPathInfoRequest;
use crate::proto::Node;
use crate::proto::PathInfo;
use tonic::{Request, Response, Result, Status};
use tracing::{instrument, warn};
pub struct DummyPathInfoService {}
const NOT_IMPLEMENTED_MSG: &str = "not implemented";
#[tonic::async_trait]
impl PathInfoService for DummyPathInfoService {
#[instrument(skip(self))]
async fn get(&self, _request: Request<GetPathInfoRequest>) -> Result<Response<PathInfo>> {
warn!(NOT_IMPLEMENTED_MSG);
Err(Status::unimplemented(NOT_IMPLEMENTED_MSG))
}
#[instrument(skip(self))]
async fn put(&self, _request: Request<PathInfo>) -> Result<Response<PathInfo>> {
warn!(NOT_IMPLEMENTED_MSG);
Err(Status::unimplemented(NOT_IMPLEMENTED_MSG))
}
#[instrument(skip(self))]
async fn calculate_nar(
&self,
_request: Request<Node>,
) -> Result<Response<CalculateNarResponse>> {
warn!(NOT_IMPLEMENTED_MSG);
Err(Status::unimplemented(NOT_IMPLEMENTED_MSG))
}
}

View file

@ -4,7 +4,7 @@ pub mod store_path;
pub mod dummy_blob_service;
pub mod dummy_directory_service;
pub mod dummy_path_info_service;
pub mod sled_path_info_service;
#[cfg(test)]
mod tests;

View file

@ -36,7 +36,8 @@ async fn main() -> Result<(), Box<dyn std::error::Error>> {
let blob_service = tvix_store::dummy_blob_service::DummyBlobService {};
let directory_service = tvix_store::dummy_directory_service::DummyDirectoryService {};
let path_info_service = tvix_store::dummy_path_info_service::DummyPathInfoService {};
let path_info_service =
tvix_store::sled_path_info_service::SledPathInfoService::new("pathinfo.sled".into())?;
let mut router = server
.add_service(BlobServiceServer::new(blob_service))

View file

@ -0,0 +1,89 @@
use prost::Message;
use std::path::PathBuf;
use crate::proto::get_path_info_request::ByWhat;
use crate::proto::path_info_service_server::PathInfoService;
use crate::proto::CalculateNarResponse;
use crate::proto::GetPathInfoRequest;
use crate::proto::Node;
use crate::proto::PathInfo;
use crate::store_path::DIGEST_SIZE;
use tonic::{Request, Response, Result, Status};
use tracing::{instrument, warn};
const NOT_IMPLEMENTED_MSG: &str = "not implemented";
/// SledPathInfoService stores PathInfo in a [sled](https://github.com/spacejam/sled).
///
/// The PathInfo messages are stored as encoded protos, and keyed by their output hash,
/// as that's currently the only request type available.
pub struct SledPathInfoService {
db: sled::Db,
}
impl SledPathInfoService {
pub fn new(p: PathBuf) -> Result<Self, anyhow::Error> {
let config = sled::Config::default().use_compression(true).path(p);
let db = config.open()?;
Ok(Self { db })
}
}
#[tonic::async_trait]
impl PathInfoService for SledPathInfoService {
#[instrument(skip(self))]
async fn get(&self, request: Request<GetPathInfoRequest>) -> Result<Response<PathInfo>> {
match request.into_inner().by_what {
None => Err(Status::unimplemented("by_what needs to be specified")),
Some(ByWhat::ByOutputHash(digest)) => {
if digest.len() != DIGEST_SIZE {
return Err(Status::invalid_argument("invalid digest length"));
}
match self.db.get(digest) {
Ok(None) => Err(Status::not_found("PathInfo not found")),
Ok(Some(data)) => match PathInfo::decode(&*data) {
Ok(path_info) => Ok(Response::new(path_info)),
Err(e) => {
warn!("failed to decode stored PathInfo: {}", e);
Err(Status::internal("failed to decode stored PathInfo"))
}
},
Err(e) => {
warn!("failed to retrieve PathInfo: {}", e);
Err(Status::internal("error during PathInfo lookup"))
}
}
}
}
}
#[instrument(skip(self))]
async fn put(&self, request: Request<PathInfo>) -> Result<Response<PathInfo>> {
let path_info = request.into_inner();
// Call validate on the received PathInfo message.
match path_info.validate() {
Err(e) => Err(Status::invalid_argument(e.to_string())),
// In case the PathInfo is valid, and we were able to extract a NixPath, store it in the database.
// This overwrites existing PathInfo objects.
Ok(nix_path) => match self.db.insert(nix_path.digest, path_info.encode_to_vec()) {
Ok(_) => Ok(Response::new(path_info)),
Err(e) => {
warn!("failed to insert PathInfo: {}", e);
Err(Status::internal("failed to insert PathInfo"))
}
},
}
}
#[instrument(skip(self))]
async fn calculate_nar(
&self,
_request: Request<Node>,
) -> Result<Response<CalculateNarResponse>> {
warn!(NOT_IMPLEMENTED_MSG);
Err(Status::unimplemented(NOT_IMPLEMENTED_MSG))
}
}

View file

@ -1,6 +1,7 @@
use crate::proto::{Directory, DirectoryNode, FileNode, SymlinkNode, ValidateDirectoryError};
use lazy_static::lazy_static;
mod path_info_service;
mod pathinfo;
lazy_static! {

View file

@ -0,0 +1,74 @@
use tempfile::TempDir;
use crate::proto::path_info_service_server::PathInfoService;
use crate::proto::GetPathInfoRequest;
use crate::proto::{get_path_info_request, PathInfo};
use crate::sled_path_info_service::SledPathInfoService;
use lazy_static::lazy_static;
lazy_static! {
static ref DUMMY_OUTPUT_HASH: Vec<u8> = vec![
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
0x00, 0x00, 0x00, 0x00, 0x00
];
}
/// Trying to get a non-existent PathInfo should return a not found error.
#[tokio::test]
async fn not_found() -> anyhow::Result<()> {
let service = SledPathInfoService::new(TempDir::new()?.path().to_path_buf())?;
let resp = service
.get(tonic::Request::new(GetPathInfoRequest {
by_what: Some(get_path_info_request::ByWhat::ByOutputHash(
DUMMY_OUTPUT_HASH.to_vec(),
)),
}))
.await;
match resp {
Err(status) => {
assert_eq!(status.code(), tonic::Code::NotFound);
}
Ok(_) => panic!("must fail"),
};
Ok(())
}
/// Put a PathInfo into the store, get it back.
#[tokio::test]
async fn put_get() -> anyhow::Result<()> {
let service = SledPathInfoService::new(TempDir::new()?.path().to_path_buf())?;
let path_info = PathInfo {
node: Some(crate::proto::Node {
node: Some(crate::proto::node::Node::Symlink(
crate::proto::SymlinkNode {
name: "00000000000000000000000000000000-foo".to_string(),
target: "doesntmatter".to_string(),
},
)),
}),
..Default::default()
};
let resp = service.put(tonic::Request::new(path_info.clone())).await;
assert!(resp.is_ok());
assert_eq!(resp.expect("must succeed").into_inner(), path_info);
let resp = service
.get(tonic::Request::new(GetPathInfoRequest {
by_what: Some(get_path_info_request::ByWhat::ByOutputHash(
DUMMY_OUTPUT_HASH.to_vec(),
)),
}))
.await;
assert!(resp.is_ok());
assert_eq!(resp.expect("must succeed").into_inner(), path_info);
Ok(())
}