From 19d061db2feb8eac51f4db86ab81e70544296818 Mon Sep 17 00:00:00 2001 From: Bob Callaway Date: Tue, 27 Aug 2024 13:36:57 -0400 Subject: [PATCH] dedup leafidentityhash values ahead of SQL lookup of existing leaves (#3607) Signed-off-by: Bob Callaway --- storage/mysql/log_storage.go | 11 +++++++++-- storage/mysql/log_storage_test.go | 7 +++++++ 2 files changed, 16 insertions(+), 2 deletions(-) diff --git a/storage/mysql/log_storage.go b/storage/mysql/log_storage.go index 1c3795d5c6..b3f10f7818 100644 --- a/storage/mysql/log_storage.go +++ b/storage/mysql/log_storage.go @@ -476,11 +476,18 @@ func (t *logTreeTX) QueueLeaves(ctx context.Context, leaves []*trillian.LogLeaf, return existingLeaves, nil } - // For existing leaves, we need to retrieve the contents. First collate the desired LeafIdentityHash values. + // For existing leaves, we need to retrieve the contents. First collate the desired LeafIdentityHash values + // We deduplicate the hashes to address https://github.com/google/trillian/issues/3603 but will be mapped + // back to the existingLeaves slice below + uniqueLeafMap := make(map[string]struct{}, len(existingLeaves)) var toRetrieve [][]byte for _, existing := range existingLeaves { if existing != nil { - toRetrieve = append(toRetrieve, existing.LeafIdentityHash) + key := string(existing.LeafIdentityHash) + if _, ok := uniqueLeafMap[key]; !ok { + uniqueLeafMap[key] = struct{}{} + toRetrieve = append(toRetrieve, existing.LeafIdentityHash) + } } } results, err := t.getLeafDataByIdentityHash(ctx, toRetrieve) diff --git a/storage/mysql/log_storage_test.go b/storage/mysql/log_storage_test.go index d0cfc50e41..b67035bd30 100644 --- a/storage/mysql/log_storage_test.go +++ b/storage/mysql/log_storage_test.go @@ -139,6 +139,7 @@ func TestQueueDuplicateLeaf(t *testing.T) { leaves := createTestLeaves(int64(count), 10) leaves2 := createTestLeaves(int64(count), 12) leaves3 := createTestLeaves(3, 100) + leaves4 := createTestLeaves(3, 105) // Note that tests accumulate queued leaves on top of each other. tests := []struct { @@ -161,6 +162,12 @@ func TestQueueDuplicateLeaf(t *testing.T) { leaves: []*trillian.LogLeaf{leaves[0], leaves3[0], leaves[1], leaves3[1], leaves[2]}, want: []*trillian.LogLeaf{leaves[0], nil, leaves[1], nil, leaves[2]}, }, + { + // we explictly reuse tests that have already been integrated to test issue 3603 + desc: "[100, 100, 106, 101, 107]", + leaves: []*trillian.LogLeaf{leaves3[0], leaves3[0], leaves4[1], leaves3[1], leaves4[2]}, + want: []*trillian.LogLeaf{leaves3[0], leaves3[0], leaves4[1], leaves3[1], leaves4[2]}, + }, } for _, test := range tests {