diff options
author | Florian Klink <flokli@flokli.de> | 2023-01-20T22·40+0100 |
---|---|---|
committer | flokli <flokli@flokli.de> | 2023-01-21T10·48+0000 |
commit | 90979d39f330d788f50528056a5180912973831b (patch) | |
tree | ba3920cbdedc041408738e3c0c8d98ae4c13ffef /tvix/store/src/sled_directory_service.rs | |
parent | d8e0fa8e5e67c7cc21a72cad545789914adcc798 (diff) |
feat(tvix/store/directory): validate Directory and sizes r/5724
This calls out to Directory::validate() for all received Directory messages, and also makes sure the sizes we refer a Directory message as matches the sizes that have been calculated. Change-Id: I316f9191d5872ee4ba6d78b9a4326f069b22fa63 Reviewed-on: https://cl.tvl.fyi/c/depot/+/7882 Tested-by: BuildkiteCI Reviewed-by: tazjin <tazjin@tvl.su>
Diffstat (limited to 'tvix/store/src/sled_directory_service.rs')
-rw-r--r-- | tvix/store/src/sled_directory_service.rs | 46 |
1 files changed, 37 insertions, 9 deletions
diff --git a/tvix/store/src/sled_directory_service.rs b/tvix/store/src/sled_directory_service.rs index 3d56b8ef3e6a..4b2c6ed54d62 100644 --- a/tvix/store/src/sled_directory_service.rs +++ b/tvix/store/src/sled_directory_service.rs @@ -1,4 +1,5 @@ use data_encoding::BASE64; +use std::collections::HashMap; use std::collections::HashSet; use std::collections::VecDeque; use std::path::PathBuf; @@ -131,20 +132,47 @@ fn insert_directories( txn: &sled::transaction::TransactionalTree, directories: &Vec<Directory>, ) -> Result<Vec<u8>, Status> { - // This keeps track of the seen directory keys. + // This keeps track of the seen directory keys, and their size. + // This is used to validate the size field of a reference to a previously sent directory. // We don't need to keep the contents around, they're stored in the DB. - let mut seen_directory_dgsts: HashSet<Vec<u8>> = HashSet::new(); + let mut seen_directories_sizes: HashMap<Vec<u8>, u32> = HashMap::new(); let mut last_directory_dgst: Option<Vec<u8>> = None; for directory in directories { + // validate the directory itself. + if let Err(e) = directory.validate() { + return Err(Status::invalid_argument(format!( + "directory {} failed validation: {}", + BASE64.encode(&directory.digest()), + e, + ))); + } + // for each child directory this directory refers to, we need - // to ensure it has been seen already in this stream. + // to ensure it has been seen already in this stream, and that the size + // matches what we recorded. for child_directory in &directory.directories { - if !seen_directory_dgsts.contains(&child_directory.digest) { - return Err(Status::invalid_argument(format!( - "referred child directory {} not seen yet", - BASE64.encode(&child_directory.digest) - ))); + match seen_directories_sizes.get(&child_directory.digest) { + None => { + return Err(Status::invalid_argument(format!( + "child directory '{}' ({}) in directory '{}' not seen yet", + child_directory.name, + BASE64.encode(&child_directory.digest), + BASE64.encode(&directory.digest()), + ))); + } + Some(seen_child_directory_size) => { + if seen_child_directory_size != &child_directory.size { + return Err(Status::invalid_argument(format!( + "child directory '{}' ({}) in directory '{}' referred with wrong size, expected {}, actual {}", + child_directory.name, + BASE64.encode(&child_directory.digest), + BASE64.encode(&directory.digest()), + seen_child_directory_size, + child_directory.size, + ))); + } + } } } @@ -153,7 +181,7 @@ fn insert_directories( // disconnected graphs at the same time… let dgst = directory.digest(); - seen_directory_dgsts.insert(dgst.clone()); + seen_directories_sizes.insert(dgst.clone(), directory.size()); last_directory_dgst = Some(dgst.clone()); // check if the directory already exists in the database. We can skip |