Skip to content

Commit

Permalink
Add support for persistent state in separate virtual memory (#2321)
Browse files Browse the repository at this point in the history
This PR adds support for the storage layout `v9` which keeps the
persistent state in a separate virtual memory.
The PR does _not_ include any migration. Existing II installations will
keep layout `v8`.
  • Loading branch information
Frederik Rothenberger authored Feb 28, 2024
1 parent 2c26130 commit a22e5ec
Show file tree
Hide file tree
Showing 7 changed files with 284 additions and 119 deletions.
16 changes: 15 additions & 1 deletion src/internet_identity/src/state.rs
Original file line number Diff line number Diff line change
Expand Up @@ -12,8 +12,10 @@ use candid::{CandidType, Deserialize};
use canister_sig_util::signature_map::SignatureMap;
use ic_cdk::api::time;
use ic_cdk::trap;
use ic_stable_structures::DefaultMemoryImpl;
use ic_stable_structures::storable::Bound;
use ic_stable_structures::{DefaultMemoryImpl, Storable};
use internet_identity_interface::internet_identity::types::*;
use std::borrow::Cow;
use std::cell::{Cell, RefCell};
use std::collections::HashMap;
use std::ops::{Deref, DerefMut};
Expand Down Expand Up @@ -115,6 +117,18 @@ impl Default for PersistentState {
}
}

impl Storable for PersistentState {
fn to_bytes(&self) -> Cow<[u8]> {
Cow::Owned(candid::encode_one(self).expect("failed to serialize persistent state"))
}

fn from_bytes(bytes: Cow<[u8]>) -> Self {
candid::decode_one(&bytes).expect("failed to deserialize persistent state")
}

const BOUND: Bound = Bound::Unbounded;
}

#[derive(Clone, Debug, CandidType, Deserialize)]
pub struct RateLimitState {
// Number of tokens available for calls, where each call will deduct one token. If tokens reaches
Expand Down
106 changes: 71 additions & 35 deletions src/internet_identity/src/storage.rs
Original file line number Diff line number Diff line change
Expand Up @@ -68,16 +68,14 @@
//! ## Persistent State
//!
//! In order to keep state across upgrades that is not related to specific anchors (such as archive
//! information) Internet Identity will serialize the [PersistentState] into the first unused memory
//! location (after the anchor record of the highest allocated anchor number). The [PersistentState]
//! will be read in `post_upgrade` after which the data can be safely overwritten by the next anchor
//! to be registered.
//! information) Internet Identity will serialize the [PersistentState] on upgrade and restore it
//! again after the upgrade.
//!
//! The [PersistentState] is serialized at the end of stable memory to allow for variable sized data
//! without the risk of running out of space (which might easily happen if the RESERVED_HEADER_BYTES
//! were used instead).
//! The storage layout v8 and earlier use the first unused memory
//! location (after the anchor record of the highest allocated anchor number) to store it.
//! The storage layout v9 uses a separate virtual memory.
//!
//! ### Archive buffer memory
//! ## Archive buffer memory
//!
//! The archive buffer memory is entirely owned by a [StableBTreeMap] used to store the buffered
//! entries. The entries are indexed by their sequence number.
Expand All @@ -97,7 +95,7 @@ use ic_stable_structures::memory_manager::{MemoryId, MemoryManager, VirtualMemor
use ic_stable_structures::reader::{BufferedReader, Reader};
use ic_stable_structures::storable::Bound;
use ic_stable_structures::writer::{BufferedWriter, Writer};
use ic_stable_structures::{Memory, RestrictedMemory, StableBTreeMap, Storable};
use ic_stable_structures::{Memory, RestrictedMemory, StableBTreeMap, StableCell, Storable};
use internet_identity_interface::archive::types::BufferedEntry;

use internet_identity_interface::internet_identity::types::*;
Expand All @@ -116,8 +114,9 @@ mod tests;
/// * version 0: invalid
/// * version 1-7: no longer supported
/// * version 8: 4KB anchors, candid anchor record layout, persistent state with archive pull config,
/// with memory manager (from 2nd page on), archive entries buffer in stable memory
const SUPPORTED_LAYOUT_VERSIONS: RangeInclusive<u8> = 8..=8;
/// with memory manager (from 2nd page on), archive entries buffer in stable memory1
/// * version 9: same as 8, but with persistent state in separate virtual memory
const SUPPORTED_LAYOUT_VERSIONS: RangeInclusive<u8> = 8..=9;

const DEFAULT_ENTRY_SIZE: u16 = 4096;
const EMPTY_SALT: [u8; 32] = [0; 32];
Expand All @@ -128,8 +127,10 @@ const PERSISTENT_STATE_MAGIC: [u8; 4] = *b"IIPS"; // II Persistent State
/// MemoryManager parameters.
const ANCHOR_MEMORY_INDEX: u8 = 0u8;
const ARCHIVE_BUFFER_MEMORY_INDEX: u8 = 1u8;
const PERSISTENT_STATE_MEMORY_INDEX: u8 = 2u8;
const ANCHOR_MEMORY_ID: MemoryId = MemoryId::new(ANCHOR_MEMORY_INDEX);
const ARCHIVE_BUFFER_MEMORY_ID: MemoryId = MemoryId::new(ARCHIVE_BUFFER_MEMORY_INDEX);
const PERSISTENT_STATE_MEMORY_ID: MemoryId = MemoryId::new(PERSISTENT_STATE_MEMORY_INDEX);
// The bucket size 128 is relatively low, to avoid wasting memory when using
// multiple virtual memories for smaller amounts of data.
// This value results in 256 GB of total managed memory, which should be enough
Expand All @@ -145,7 +146,7 @@ pub const MAX_ENTRIES: u64 = (MAX_MANAGED_WASM_PAGES - BUCKET_SIZE_IN_PAGES as u

pub type Salt = [u8; 32];

type ArchiveBufferMemory<M> = RestrictedMemory<VirtualMemory<RestrictedMemory<M>>>;
type SingleBucketMemory<M> = RestrictedMemory<VirtualMemory<RestrictedMemory<M>>>;

/// The [BufferedEntry] is wrapped to allow this crate to implement [Storable].
#[derive(Clone, Debug, CandidType, Deserialize)]
Expand Down Expand Up @@ -173,8 +174,17 @@ pub struct Storage<M: Memory> {
/// This memory is entirely owned by the [archive_entries_buffer] and must never be written to.
/// The only reason it is stored here is to have a reference to it so that we can provide stats
/// about its size.
archive_buffer_memory: ArchiveBufferMemory<M>,
archive_entries_buffer: StableBTreeMap<u64, BufferedEntryWrapper, ArchiveBufferMemory<M>>,
///
/// A single archive entry takes on average 476 bytes of space.
/// To have space for 10_000 entries (accounting for ~10% overhead) we need 82 pages or ~5 MB.
/// Since the memory manager allocates memory in buckets of 128 pages, we round up to 128 pages.
archive_buffer_memory: SingleBucketMemory<M>,
archive_entries_buffer: StableBTreeMap<u64, BufferedEntryWrapper, SingleBucketMemory<M>>,
/// This memory is entirely owned by the [persistent_state] and must never be written to.
/// The only reason it is stored here is to have a reference to it so that we can provide stats
/// about its size.
persistent_state_memory: SingleBucketMemory<M>,
persistent_state: StableCell<PersistentState, SingleBucketMemory<M>>,
}

#[repr(packed)]
Expand Down Expand Up @@ -205,7 +215,7 @@ impl<M: Memory + Clone> Storage<M> {
"id range [{id_range_lo}, {id_range_hi}) is too large for a single canister (max {MAX_ENTRIES} entries)",
));
}
let version: u8 = 8;
let version: u8 = 9;
let header = Header {
magic: *b"IIC",
version,
Expand All @@ -228,14 +238,18 @@ impl<M: Memory + Clone> Storage<M> {
BUCKET_SIZE_IN_PAGES,
);
let anchor_memory = memory_manager.get(ANCHOR_MEMORY_ID);
let archive_buffer_memory = Self::init_archive_buffer_memory(&memory_manager);

let archive_buffer_memory = single_bucket_memory(&memory_manager, ARCHIVE_BUFFER_MEMORY_ID);
let persistent_state_memory =
single_bucket_memory(&memory_manager, PERSISTENT_STATE_MEMORY_ID);
Self {
header,
header_memory,
anchor_memory,
archive_buffer_memory: archive_buffer_memory.clone(),
archive_entries_buffer: StableBTreeMap::init(archive_buffer_memory),
persistent_state_memory: persistent_state_memory.clone(),
persistent_state: StableCell::init(persistent_state_memory, PersistentState::default())
.expect("failed to initialize persistent state"),
}
}

Expand Down Expand Up @@ -452,28 +466,28 @@ impl<M: Memory + Clone> Storage<M> {
record_number as u64 * self.header.entry_size as u64
}

fn init_archive_buffer_memory(
memory_manager: &MemoryManager<RestrictedMemory<M>>,
) -> ArchiveBufferMemory<M> {
// A single archive entry takes on average 476 bytes of space.
// To have space for 10_000 entries (accounting for ~10% overhead) we need 82 pages or 5 MB.
// Since the memory manager allocates memory in buckets of 128 pages, we round up to 128 pages.
RestrictedMemory::new(
memory_manager.get(ARCHIVE_BUFFER_MEMORY_ID),
0..BUCKET_SIZE_IN_PAGES as u64,
)
}

/// Returns the address of the first byte not yet allocated to a anchor.
/// This address exists even if the max anchor number has been reached, because there is a memory
/// reserve at the end of stable memory.
fn unused_memory_start(&self) -> u64 {
self.record_address(self.header.num_anchors)
}

/// Writes the persistent state to stable memory just outside of the space allocated to the highest anchor number.
/// This is only used to _temporarily_ save state during upgrades. It will be overwritten on next anchor registration.
pub fn write_persistent_state(&mut self, state: &PersistentState) {
match self.version() {
8 => self.write_persistent_state_v8(state),
9 => {
self.persistent_state
.set(state.clone())
.expect("failed to write persistent state");
}
version => trap(&format!("unsupported version: {}", version)),
};
}

/// Writes the persistent state to stable memory just outside the space allocated to the highest anchor number.
/// This is only used to _temporarily_ save state during upgrades. It will be overwritten on next anchor registration.
fn write_persistent_state_v8(&mut self, state: &PersistentState) {
let address = self.unused_memory_start();

// In practice, candid encoding is infallible. The Result is an artifact of the serde API.
Expand All @@ -492,12 +506,19 @@ impl<M: Memory + Clone> Storage<M> {
writer.write_all(&encoded_state).unwrap();
}

/// Reads the persistent state from stable memory just outside of the space allocated to the highest anchor number.
/// This is only used to restore state in `post_upgrade`.
pub fn read_persistent_state(&self) -> Result<PersistentState, PersistentStateError> {
const WASM_PAGE_SIZE: u64 = 65536;
match self.version() {
8 => self.read_persistent_state_v8(),
9 => Ok(self.persistent_state.get().clone()),
version => trap(&format!("unsupported version: {}", version)),
}
}

/// Reads the persistent state from stable memory just outside the space allocated to the highest anchor number.
/// This is only used to restore state in `post_upgrade`.
fn read_persistent_state_v8(&self) -> Result<PersistentState, PersistentStateError> {
let address = self.unused_memory_start();
if address > self.anchor_memory.size() * WASM_PAGE_SIZE {
if address > self.anchor_memory.size() * WASM_PAGE_SIZE_IN_BYTES as u64 {
// the address where the persistent state would be is not allocated yet
return Err(PersistentStateError::NotFound);
}
Expand Down Expand Up @@ -544,10 +565,25 @@ impl<M: Memory + Clone> Storage<M> {
"archive_buffer".to_string(),
self.archive_buffer_memory.size(),
),
(
"persistent_state".to_string(),
self.persistent_state_memory.size(),
),
])
}
}

/// Creates a new virtual memory corresponding to the given ID that is limited to a single bucket.
fn single_bucket_memory<M: Memory>(
memory_manager: &MemoryManager<RestrictedMemory<M>>,
memory_id: MemoryId,
) -> SingleBucketMemory<M> {
RestrictedMemory::new(
memory_manager.get(memory_id),
0..BUCKET_SIZE_IN_PAGES as u64,
)
}

#[derive(Debug)]
pub enum PersistentStateError {
CandidError(candid::error::Error),
Expand Down
56 changes: 49 additions & 7 deletions src/internet_identity/src/storage/tests.rs
Original file line number Diff line number Diff line change
Expand Up @@ -29,16 +29,16 @@ fn should_report_max_number_of_entries_for_256gb() {
}

#[test]
fn should_serialize_header_v8() {
fn should_serialize_header_v9() {
let memory = VectorMemory::default();
let mut storage = Storage::new((1, 2), memory.clone());
storage.update_salt([5u8; 32]);
storage.flush();

assert_eq!(storage.version(), 8);
assert_eq!(storage.version(), 9);
let mut buf = vec![0; HEADER_SIZE];
memory.read(0, &mut buf);
assert_eq!(buf, hex::decode("49494308000000000100000000000000020000000000000000100505050505050505050505050505050505050505050505050505050505050505").unwrap());
assert_eq!(buf, hex::decode("49494309000000000100000000000000020000000000000000100505050505050505050505050505050505050505050505050505050505050505").unwrap());
}

#[test]
Expand All @@ -54,6 +54,19 @@ fn should_recover_header_from_memory_v8() {
assert_eq!(storage.version(), 8);
}

#[test]
fn should_recover_header_from_memory_v9() {
let memory = VectorMemory::default();
memory.grow(1);
memory.write(0, &hex::decode("494943090500000040e2010000000000f1fb090000000000000843434343434343434343434343434343434343434343434343434343434343430002000000000000000000000000000000000000000000000000").unwrap());

let storage = Storage::from_memory(memory);
assert_eq!(storage.assigned_anchor_number_range(), (123456, 654321));
assert_eq!(storage.salt().unwrap(), &[67u8; 32]);
assert_eq!(storage.anchor_count(), 5);
assert_eq!(storage.version(), 9);
}

#[test]
fn should_read_previous_write() {
let memory = VectorMemory::default();
Expand Down Expand Up @@ -104,19 +117,32 @@ fn should_save_and_restore_persistent_state() {
}

#[test]
fn should_not_find_persistent_state_if_it_does_not_exist() {
fn should_not_find_persistent_state_if_it_does_not_exist_v8() {
let memory = VectorMemory::default();
let mut storage = Storage::new((10_000, 3_784_873), memory);
memory.grow(1);
memory.write(0, &hex::decode("494943080500000040e2010000000000f1fb090000000000000843434343434343434343434343434343434343434343434343434343434343430002000000000000000000000000000000000000000000000000").unwrap());
let mut storage = Storage::from_memory(memory.clone());
storage.flush();

let result = storage.read_persistent_state();
assert!(matches!(result, Err(PersistentStateError::NotFound)))
}

#[test]
fn should_overwrite_persistent_state_with_next_anchor() {
fn should_always_find_persistent_state_v9() {
let memory = VectorMemory::default();
let mut storage = Storage::new((10_000, 3_784_873), memory.clone());
let mut storage = Storage::new((10_000, 3_784_873), memory);
storage.flush();

assert!(storage.read_persistent_state().is_ok());
}

#[test]
fn should_overwrite_persistent_state_with_next_anchor_v8() {
let memory = VectorMemory::default();
memory.grow(1);
memory.write(0, &hex::decode("494943080500000040e2010000000000f1fb090000000000000843434343434343434343434343434343434343434343434343434343434343430002000000000000000000000000000000000000000000000000").unwrap());
let mut storage = Storage::from_memory(memory.clone());
storage.flush();

storage.allocate_anchor().unwrap();
Expand All @@ -130,6 +156,22 @@ fn should_overwrite_persistent_state_with_next_anchor() {
assert!(matches!(result, Err(PersistentStateError::NotFound)));
}

#[test]
fn should_not_overwrite_persistent_state_with_next_anchor_v9() {
let memory = VectorMemory::default();
let mut storage = Storage::new((10_000, 3_784_873), memory.clone());
storage.flush();

storage.allocate_anchor().unwrap();
storage.write_persistent_state(&sample_persistent_state());
assert!(storage.read_persistent_state().is_ok());

let anchor = storage.allocate_anchor().unwrap();
storage.write(anchor).unwrap();

assert!(storage.read_persistent_state().is_ok());
}

fn sample_device() -> Device {
Device {
pubkey: ByteBuf::from("hello world, I am a public key"),
Expand Down
2 changes: 2 additions & 0 deletions src/internet_identity/stable_memory/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,8 @@ These tests serve two purposes:

The following stable memory backups are currently used:
* `buffered_archive_entries_v8.bin.gz`: a backup with buffered archive entries.
* `clean_init_v8.bin.gz`: a clean initial state with storage layout v8. Used to test that II can be upgraded from v8
storage layout.
* `genesis-layout-migrated-to-v8.bin.gz`: a backup initially created with the first version of the stable memory layout and then incrementally migrated to the v8 layout. It contains a few well-known identities / devices, see `known_devices` in `tests/integration/stable_memory.rs`.
* `genesis-memory-layout.bin`: a backup of the initial memory layout. Not migrated. Mainly used to test behavior with respect to outdated / unsupported memory layouts.
* `multiple-recovery-phrases-v8.bin.gz`: a backup with an identity that has multiple recovery phrases. The input validation does no longer allow to create such an identity (only one recovery phrase is allowed). However, legacy users that are in that state need a way to make their identity consistent again. This backup is used to test exactly that.
Expand Down
Binary file not shown.
Loading

0 comments on commit a22e5ec

Please sign in to comment.