diff --git a/local-cluster/tests/local_cluster.rs b/local-cluster/tests/local_cluster.rs index c0635e7f24f830..35d7191a3f7556 100644 --- a/local-cluster/tests/local_cluster.rs +++ b/local-cluster/tests/local_cluster.rs @@ -3129,13 +3129,13 @@ fn run_test_load_program_accounts(scan_commitment: CommitmentConfig) { #[test] #[serial] fn test_no_optimistic_confirmation_violation_with_tower() { - do_test_optimistic_confirmation_violation_with_or_without_tower(true); + do_test_lockout_violation_with_or_without_tower(true); } #[test] #[serial] fn test_optimistic_confirmation_violation_without_tower() { - do_test_optimistic_confirmation_violation_with_or_without_tower(false); + do_test_lockout_violation_with_or_without_tower(false); } // A bit convoluted test case; but this roughly follows this test theoretical scenario: @@ -3173,7 +3173,7 @@ fn test_optimistic_confirmation_violation_without_tower() { // With the persisted tower: // `A` should not be able to generate a switching proof. // -fn do_test_optimistic_confirmation_violation_with_or_without_tower(with_tower: bool) { +fn do_test_lockout_violation_with_or_without_tower(with_tower: bool) { solana_logger::setup_with("info"); // First set up the cluster with 4 nodes @@ -3184,21 +3184,15 @@ fn do_test_optimistic_confirmation_violation_with_or_without_tower(with_tower: b 33 * DEFAULT_NODE_STAKE, ]; - let base_slot: Slot = 26; // S2 - let next_slot_on_a: Slot = 27; // S3 + let validator_b_last_leader_slot: Slot = 8; let truncated_slots: Slot = 100; // just enough to purge all following slots after the S2 and S3 - // Each pubkeys are prefixed with A, B, C and D. - // D is needed to: - // 1) Propagate A's votes for S2 to validator C after A shuts down so that - // C can avoid NoPropagatedConfirmation errors and continue to generate blocks - // 2) Provide gossip discovery for `A` when it restarts because `A` will restart - // at a different gossip port than the entrypoint saved in C's gossip table + // Each pubkeys are prefixed with A, B, C + let validator_keys = [ "28bN3xyvrP4E8LwEgtLjhnkb7cY4amQb6DrYAbAYjgRV4GAGgkVM2K7wnxnAS7WDneuavza7x21MiafLu1HkwQt4", "2saHBBoTkLMmttmPQP8KfBkcCw45S5cwtV3wTdGCscRC8uxdgvHxpHiWXKx4LvJjNJtnNcbSv5NdheokFFqnNDt8", "4mx9yoFBeYasDKBGDWCTWGJdWuJCKbgqmuP8bN9umybCh5Jzngw7KQxe99Rf5uzfyzgba1i65rJW4Wqk7Ab5S8ye", - "3zsEPEDsjfEay7te9XqNjRTCE7vwuT6u4DHzBJC19yp7GS8BuNRMRjnpVrKCBzb3d44kxc4KPGSHkCmk6tEfswCg", ] .iter() .map(|s| (Arc::new(Keypair::from_base58_string(s)), true)) @@ -3220,15 +3214,21 @@ fn do_test_optimistic_confirmation_violation_with_or_without_tower(with_tower: b // // 2. Validator A doesn't vote past `next_slot_on_a` before we can kill it. This is essential // because if validator A votes past `next_slot_on_a`, and then we copy over validator B's ledger - // below only for slots <= `next_slot_on_a`, validator A will not know how it's last vote chains + // below only for slots <= `next_slot_on_a`, validator A will not know how its last vote chains // to the other forks, and may violate switching proofs on restart. let mut default_config = ValidatorConfig::default_for_test(); - // Ensure B can make leader blocks up till the fork slot, and give the remaining slots to C. + // Ensure B can make leader blocks up till the fork slot, and give the remaining slots to C. This is + // also important so `C` doesn't run into NoPropagatedConfirmation errors on making its first forked + // slot, since `A` will be making a simulated vote that's not actually present in gossip. + // // Don't give validator A any slots because it's going to be deleting its ledger, so it may create // versions of slots it's already created, but on a different fork. let validator_to_slots = vec![ // Ensure validator b is leader for slots <= `next_slot_on_a` - (validator_b_pubkey, next_slot_on_a as usize + 1), + ( + validator_b_pubkey, + validator_b_last_leader_slot as usize + 1, + ), (validator_c_pubkey, DEFAULT_SLOTS_PER_EPOCH as usize), ]; // Trick C into not producing any blocks, in case its leader slots come up before it gets killed @@ -3236,7 +3236,7 @@ fn do_test_optimistic_confirmation_violation_with_or_without_tower(with_tower: b let c_leader_schedule = create_custom_leader_schedule(c_validator_to_slots.into_iter()); let leader_schedule = create_custom_leader_schedule(validator_to_slots.into_iter()); - for slot in 0..=next_slot_on_a { + for slot in 0..=validator_b_last_leader_slot { assert_eq!(leader_schedule[slot], validator_b_pubkey); } @@ -3246,9 +3246,8 @@ fn do_test_optimistic_confirmation_violation_with_or_without_tower(with_tower: b let mut validator_configs = make_identical_validator_configs(&default_config, node_stakes.len()); - // Disable voting on validators C, and D + // Disable voting on validator C validator_configs[2].voting_disabled = true; - validator_configs[3].voting_disabled = true; // C should not produce any blocks at this time validator_configs[2].fixed_leader_schedule = Some(FixedSchedule { leader_schedule: Arc::new(c_leader_schedule), @@ -3283,55 +3282,38 @@ fn do_test_optimistic_confirmation_violation_with_or_without_tower(with_tower: b validator_c_pubkey, val_c_ledger_path ); - // Immediately kill validator C. No need to kill validator A because - // 1) It has no slots in the leader schedule, so no way to make forks - // 2) We need it to vote info!("Exiting validator C"); let mut validator_c_info = cluster.exit_node(&validator_c_pubkey); - // Step 1: - // Let validator A, B, (D) run. Wait for both `A` and `B` to have voted on `next_slot_on_a` or - // one of its descendants - info!( - "Waiting on both validators A and B to vote on fork at slot {}", - next_slot_on_a - ); - let now = Instant::now(); - let mut last_b_vote = 0; - let mut last_a_vote = 0; - loop { - let elapsed = now.elapsed(); - assert!( - elapsed <= Duration::from_secs(30), - "One of the validators failed to vote on a slot >= {} in {} secs, - last validator A vote: {}, - last validator B vote: {}", - next_slot_on_a, - elapsed.as_secs(), - last_a_vote, - last_b_vote, - ); - sleep(Duration::from_millis(100)); - - if let Some((last_vote, _)) = last_vote_in_tower(&val_b_ledger_path, &validator_b_pubkey) { - last_b_vote = last_vote; - if last_vote < next_slot_on_a { - continue; - } - } + info!("Waiting on validator A to vote"); + // Step 1: Wait for validator A to vote so the tower file exists, and so we can determine the + // `base_slot` and `next_slot_on_a` + loop { if let Some((last_vote, _)) = last_vote_in_tower(&val_a_ledger_path, &validator_a_pubkey) { - last_a_vote = last_vote; - if last_vote >= next_slot_on_a { + // The vote needs to have a parent so that we validator C can create a fork + if last_vote >= 1 { break; } } + + sleep(Duration::from_millis(100)); } // kill A and B let _validator_b_info = cluster.exit_node(&validator_b_pubkey); let validator_a_info = cluster.exit_node(&validator_a_pubkey); + let next_slot_on_a = last_vote_in_tower(&val_a_ledger_path, &validator_a_pubkey) + .unwrap() + .0; // S3 + let base_slot = next_slot_on_a - 1; // S2 + + info!( + "base slot: {}, next_slot_on_a: {}", + base_slot, next_slot_on_a + ); + // Step 2: // Truncate ledger, copy over B's ledger to C info!("Create validator C's ledger"); @@ -3345,33 +3327,19 @@ fn do_test_optimistic_confirmation_violation_with_or_without_tower(with_tower: b remove_tower(&val_c_ledger_path, &validator_b_pubkey); let blockstore = open_blockstore(&val_c_ledger_path); - purge_slots_with_count(&blockstore, base_slot + 1, truncated_slots); + purge_slots_with_count(&blockstore, next_slot_on_a, truncated_slots); } info!("Create validator A's ledger"); { - // Find latest vote in B, and wait for it to reach blockstore - let b_last_vote = - wait_for_last_vote_in_tower_to_land_in_ledger(&val_b_ledger_path, &validator_b_pubkey) - .unwrap(); - // Now we copy these blocks to A let b_blockstore = open_blockstore(&val_b_ledger_path); let a_blockstore = open_blockstore(&val_a_ledger_path); - copy_blocks(b_last_vote, &b_blockstore, &a_blockstore, false); + copy_blocks(next_slot_on_a, &b_blockstore, &a_blockstore, false); // Purge uneccessary slots purge_slots_with_count(&a_blockstore, next_slot_on_a + 1, truncated_slots); } - // This should be guaranteed because we waited for validator `A` to vote on a slot > `next_slot_on_a` - // before killing it earlier. - info!("Checking A's tower for a vote on slot descended from slot `next_slot_on_a`"); - let last_vote_slot = last_vote_in_tower(&val_a_ledger_path, &validator_a_pubkey) - .unwrap() - .0; - assert!(last_vote_slot >= next_slot_on_a); - info!("Success, A voted on slot {}", last_vote_slot); - { let blockstore = open_blockstore(&val_a_ledger_path); if !with_tower {