Skip to content

Commit

Permalink
feature: implement hamt writing (#603)
Browse files Browse the repository at this point in the history
* feature: implement hamt writing

* fix: consider link size when sending data

The real fix is of course to make this a streaming request... But that will
come later.

* test: add test for a truly large directory

* refactor: cleanup

* refactor: properly handle hash collisions

I could not find an actual collision, so I just added twice the exact same
name for a test, which currently has the same effect.
  • Loading branch information
rklaehn authored Dec 16, 2022
1 parent 2640522 commit 5f2d87f
Show file tree
Hide file tree
Showing 4 changed files with 293 additions and 86 deletions.
4 changes: 2 additions & 2 deletions iroh-api/src/store.rs
Original file line number Diff line number Diff line change
Expand Up @@ -61,11 +61,11 @@ fn add_blocks_to_store_chunked<S: Store>(
) -> impl Stream<Item = Result<(Cid, u64)>> {
let mut chunk = Vec::new();
let mut chunk_size = 0u64;
const MAX_CHUNK_SIZE: u64 = 1024 * 1024 * 16;
const MAX_CHUNK_SIZE: u64 = 1024 * 1024;
stream! {
while let Some(block) = blocks.next().await {
let block = block?;
let block_size = block.data().len() as u64;
let block_size = block.data().len() as u64 + block.links().len() as u64 * 128;
let cid = *block.cid();
let raw_data_size = block.raw_data_size().unwrap_or_default();
tracing::info!("adding chunk of {} bytes", chunk_size);
Expand Down
58 changes: 49 additions & 9 deletions iroh-resolver/tests/roundtrip.rs
Original file line number Diff line number Diff line change
Expand Up @@ -27,8 +27,11 @@ type TestDir = BTreeMap<String, TestDirEntry>;

/// builds an unixfs directory out of a TestDir
#[async_recursion(?Send)]
async fn build_directory(name: &str, dir: &TestDir) -> Result<Directory> {
async fn build_directory(name: &str, dir: &TestDir, hamt: bool) -> Result<Directory> {
let mut builder = DirectoryBuilder::new().name(name);
if hamt {
builder = builder.hamt();
}
for (name, entry) in dir {
match entry {
TestDirEntry::File(content) => {
Expand All @@ -40,7 +43,7 @@ async fn build_directory(name: &str, dir: &TestDir) -> Result<Directory> {
builder = builder.add_file(file);
}
TestDirEntry::Directory(dir) => {
let dir = build_directory(name, dir).await?;
let dir = build_directory(name, dir, hamt).await?;
builder = builder.add_dir(dir)?;
}
}
Expand Down Expand Up @@ -110,8 +113,8 @@ async fn build_testdir(
}

/// a roundtrip test that converts a dir to an unixfs DAG and back
async fn dir_roundtrip_test(dir: TestDir) -> Result<bool> {
let directory = build_directory("", &dir).await?;
async fn dir_roundtrip_test(dir: TestDir, hamt: bool) -> Result<bool> {
let directory = build_directory("", &dir, hamt).await?;
let stream = directory.encode();
let (root, resolver) = stream_to_resolver(stream).await?;
let stream =
Expand All @@ -121,11 +124,11 @@ async fn dir_roundtrip_test(dir: TestDir) -> Result<bool> {
}

/// sync version of dir_roundtrip_test for use in proptest
fn dir_roundtrip_test_sync(dir: TestDir) -> bool {
fn dir_roundtrip_test_sync(dir: TestDir, hamt: bool) -> bool {
tokio::runtime::Builder::new_current_thread()
.build()
.unwrap()
.block_on(dir_roundtrip_test(dir))
.block_on(dir_roundtrip_test(dir, hamt))
.unwrap()
}

Expand Down Expand Up @@ -183,13 +186,14 @@ fn file_roundtrip_test_sync(data: Bytes, chunk_size: usize, degree: usize) -> bo

fn arb_test_dir() -> impl Strategy<Value = TestDir> {
// create an arbitrary nested directory structure
// zero size file names are not generated, since they are not allowed and don't work with hamt directories
fn arb_dir_entry() -> impl Strategy<Value = TestDirEntry> {
let leaf = any::<Vec<u8>>().prop_map(|x| TestDirEntry::File(Bytes::from(x)));
leaf.prop_recursive(3, 64, 10, |inner| {
prop::collection::btree_map(".*", inner, 0..10).prop_map(TestDirEntry::Directory)
prop::collection::btree_map(".+", inner, 0..10).prop_map(TestDirEntry::Directory)
})
}
prop::collection::btree_map(".*", arb_dir_entry(), 0..10)
prop::collection::btree_map(".+", arb_dir_entry(), 0..10)
}

fn arb_degree() -> impl Strategy<Value = usize> {
Expand All @@ -210,8 +214,44 @@ proptest! {

#[test]
fn test_dir_roundtrip(data in arb_test_dir()) {
assert!(dir_roundtrip_test_sync(data));
assert!(dir_roundtrip_test_sync(data, false));
}

#[test]
fn test_dir_roundtrip_hamt(data in arb_test_dir()) {
assert!(dir_roundtrip_test_sync(data, true));
}
}

#[test]
fn test_hamt_roundtrip_1() {
let mut dir = TestDir::new();
dir.insert("foo".to_string(), TestDirEntry::File(Bytes::from("bar")));
dir.insert("fnord".to_string(), TestDirEntry::File(Bytes::from("baz")));
assert!(dir_roundtrip_test_sync(dir, true));
}

#[test]
fn test_hamt_roundtrip_2() {
let mut dir = TestDir::new();
dir.insert("foo".to_string(), TestDirEntry::File(Bytes::from("bar")));
assert!(dir_roundtrip_test_sync(dir, true));
}

#[test]
fn test_hamt_roundtrip_3() {
let mut dir = TestDir::new();
dir.insert("a".to_string(), TestDirEntry::File(Bytes::from("bar")));
assert!(dir_roundtrip_test_sync(dir, true));
}

#[tokio::test(flavor = "multi_thread")]
async fn test_hamt_roundtrip_large() {
let mut dir = TestDir::new();
for i in 0..10000 {
dir.insert(format!("file_{}", i), TestDirEntry::File(Bytes::new()));
}
assert!(dir_roundtrip_test(dir, true).await.unwrap());
}

#[tokio::test]
Expand Down
Loading

0 comments on commit 5f2d87f

Please sign in to comment.