chipsalliance · swenson · Oct 8, 2024 · Oct 8, 2024 · Oct 9, 2024 · Oct 9, 2024
diff --git a/Cargo.lock b/Cargo.lock
diff --git a/api/src/mailbox.rs b/api/src/mailbox.rs
@@ -764,6 +764,8 @@ impl Response for FipsVersionResp {}
 
 // FW_INFO
 // No command-specific input args
+// Safety: Okay to derive PartialEq and Eq because is being sent
+// and we aren't doing sensitive comparisons to its contents.
 #[repr(C)]
 #[derive(Debug, AsBytes, FromBytes, PartialEq, Eq)]
 pub struct FwInfoResp {

diff --git a/builder/src/lib.rs b/builder/src/lib.rs
@@ -20,7 +20,7 @@ use caliptra_image_elf::ElfExecutable;
 use caliptra_image_gen::{
     ImageGenerator, ImageGeneratorConfig, ImageGeneratorOwnerConfig, ImageGeneratorVendorConfig,
 };
-use caliptra_image_types::{ImageBundle, ImageRevision, RomInfo};
+use caliptra_image_types::{ImageBundle, ImageRevision, RomInfo, IMAGE_REVISION_BYTE_SIZE};
 use elf::endian::LittleEndian;
 use nix::fcntl::FlockArg;
 use zerocopy::AsBytes;
@@ -509,7 +509,7 @@ fn image_revision() -> io::Result<ImageRevision> {
     if std::env::var_os("CALIPTRA_IMAGE_NO_GIT_REVISION").is_some() {
         // Sometimes needed to build a consistent ROM image from different
         // commits.
-        Ok(*b"~~~~~NO_GIT_REVISION")
+        Ok(ImageRevision(*b"~~~~~NO_GIT_REVISION"))
     } else {
         image_revision_from_git_repo()
     }
@@ -525,7 +525,7 @@ fn image_revision_from_str(commit_id_str: &str, is_clean: bool) -> io::Result<Im
     // (dirtdirtdirtdirtdirt)
     const DIRTY_SUFFIX: [u8; 10] = [0xd1, 0x47, 0xd1, 0x47, 0xd1, 0x47, 0xd1, 0x47, 0xd1, 0x47];
 
-    let mut commit_id = ImageRevision::default();
+    let mut commit_id = [0u8; IMAGE_REVISION_BYTE_SIZE];
     hex::decode_to_slice(commit_id_str.trim(), &mut commit_id).map_err(|e| {
         other_err(format!(
             "Unable to decode git commit {commit_id_str:?}: {e}"
@@ -536,7 +536,7 @@ fn image_revision_from_str(commit_id_str: &str, is_clean: bool) -> io::Result<Im
         // spoil the revision because the git client is dirty
         commit_id[10..].copy_from_slice(&DIRTY_SUFFIX);
     }
-    Ok(commit_id)
+    Ok(ImageRevision(commit_id))
 }
 
 #[cfg(test)]
@@ -582,24 +582,24 @@ mod test {
     fn test_image_revision_from_str() {
         assert_eq!(
             image_revision_from_str("d6a462a63a9cf2dafa5bbc6cf78b1fccc308009a", true).unwrap(),
-            [
+            ImageRevision([
                 0xd6, 0xa4, 0x62, 0xa6, 0x3a, 0x9c, 0xf2, 0xda, 0xfa, 0x5b, 0xbc, 0x6c, 0xf7, 0x8b,
                 0x1f, 0xcc, 0xc3, 0x08, 0x00, 0x9a
-            ]
+            ])
         );
         assert_eq!(
             image_revision_from_str("d6a462a63a9cf2dafa5bbc6cf78b1fccc308009a\n", true).unwrap(),
-            [
+            ImageRevision([
                 0xd6, 0xa4, 0x62, 0xa6, 0x3a, 0x9c, 0xf2, 0xda, 0xfa, 0x5b, 0xbc, 0x6c, 0xf7, 0x8b,
                 0x1f, 0xcc, 0xc3, 0x08, 0x00, 0x9a
-            ]
+            ])
         );
         assert_eq!(
             image_revision_from_str("d6a462a63a9cf2dafa5bbc6cf78b1fccc308009a", false).unwrap(),
-            [
+            ImageRevision([
                 0xd6, 0xa4, 0x62, 0xa6, 0x3a, 0x9c, 0xf2, 0xda, 0xfa, 0x5b, 0xd1, 0x47, 0xd1, 0x47,
                 0xd1, 0x47, 0xd1, 0x47, 0xd1, 0x47
-            ]
+            ])
         );
         assert_eq!(
             image_revision_from_str("d6a462a63a9cf2dafa5bbc6cf78b1fccc30800", false).unwrap_err().to_string(),

diff --git a/cfi/lib/src/cfi.rs b/cfi/lib/src/cfi.rs
@@ -177,8 +177,8 @@ macro_rules! cfi_assert_macro {
     };
 }
 
-cfi_assert_macro!(cfi_assert_eq, ==, Eq, PartialEq, AssertEqFail);
-cfi_assert_macro!(cfi_assert_ne, !=, Eq, PartialEq, AssertNeFail);
+cfi_assert_macro!(cfi_assert_eq, ==, PartialEq, PartialEq, AssertEqFail);
+cfi_assert_macro!(cfi_assert_ne, !=, PartialEq, PartialEq, AssertNeFail);
 cfi_assert_macro!(cfi_assert_gt, >, Ord, PartialOrd, AssertGtFail);
 cfi_assert_macro!(cfi_assert_lt, <, Ord, PartialOrd, AssertLtFail);
 cfi_assert_macro!(cfi_assert_ge, >=, Ord, PartialOrd, AssertGeFail);

diff --git a/cfi/lib/src/lib.rs b/cfi/lib/src/lib.rs
@@ -13,10 +13,12 @@ extern crate core;
 
 mod cfi;
 mod cfi_counter;
+mod secmem;
 mod xoshiro;
 
 pub use cfi::*;
 pub use cfi_counter::{CfiCounter, CfiInt};
+pub use secmem::memeq;
 pub use xoshiro::Xoshiro128;
 
 #[repr(C)]

diff --git a/cfi/lib/src/secmem.rs b/cfi/lib/src/secmem.rs
@@ -0,0 +1,212 @@
+/*++
+
+Licensed under the Apache-2.0 license.
+
+File Name:
+
+    secmem.rs
+
+Abstract:
+
+    File contains support routines and macros for secure memory operations.
+
+--*/
+
+use core::ptr;
+
+use crate::{cfi_assert_eq, cfi_assert_ne, cfi_launder};
+
+// Adapted from https://github.com/lowRISC/opentitan/blob/7a61300cf7c409fa68fd892942c1d7b58a7cd4c0/sw/device/lib/base/hardened_asm.h
+// and https://github.com/lowRISC/opentitan/blob/7a61300cf7c409fa68fd892942c1d7b58a7cd4c0/sw/device/lib/base/hardened_memory.c
+// which are:
+// Copyright lowRISC contributors.
+
+/// Values for a hardened boolean type.
+///
+/// The intention is that this is used instead of `<stdbool.h>`'s #bool, where a
+/// higher hamming distance is required between the truthy and the falsey value.
+///
+/// The values below were chosen at random, with some specific restrictions. They
+/// have a Hamming Distance of 8, and they are 11-bit values so they can be
+/// materialized with a single instruction on RISC-V. They are also specifically
+/// not the complement of each other.
+pub type HardenedBool = u32;
+pub const HARDENED_BOOL_TRUE: HardenedBool = 0x739;
+pub const HARDENED_BOOL_FALSE: HardenedBool = 0x1d4;
+
+struct RandomOrder {
+    state: u32,
+    max: u32,
+}
+
+/// Context for a random traversal order.
+///
+/// A "random traversal order" specifies a random order to walk through some
+/// buffer of length `n`, which is an important building block for
+/// constant-power code. Given `n`, the random order emits integers in the
+/// range `0..m`, where `m` is an implementation-defined, per-random-order
+/// value greater than `n`. The order is guaranteed to visit each integer in
+/// `0..n` at least once, but with some caveats:
+/// - Values greater than `n` may be returned.
+/// - The same value may be returned multiple times.
+///
+/// Users must be mindful of these constraints when using `RandomOrder`.
+/// These caveats are intended to allow for implementation flexibility, such as
+/// intentionally adding decoys to the sequence.
+impl RandomOrder {
+    /// Constructs a new, randomly-seeded traversal order,
+    /// running from `0` to at least `min_len`.
+    ///
+    /// This function does not take a seed as input; instead, the seed is
+    /// extracted, in some manner or another, from the hardware by this function.
+    ///
+    /// @param min_len The minimum length this traversal order must visit.
+    fn new(min_len: u32) -> RandomOrder {
+        RandomOrder {
+            state: 0,
+            max: min_len * 2,
+        }
+    }
+
+    /// Returns the length of the sequence represented by `ctx`.
+    ///
+    /// This value may be greater than `min_len` specified in
+    /// `random_order_init()`, but the sequence is guaranteed to contain every
+    /// integer in `0..min_len`.
+    ///
+    /// This value represents the number of times `random_order_advance()` may be
+    /// called.
+    ///
+    /// @param ctx The context to query.
+    /// @return The length of the sequence.
+    fn len(&self) -> u32 {
+        self.max
+    }
+
+    /// Returns the next element in the sequence represented by `ctx`.
+    ///
+    /// See `random_order_len()` for discovering how many times this function can
+    /// be called.
+    ///
+    /// @param ctx The context to advance.
+    /// @return The next value in the sequence.
+    fn advance(&mut self) -> u32 {
+        // TODO: The current implementation is just a skeleton, and currently just
+        // traverses from 0 to `min_len * 2`.
+        let s = self.state;
+        self.state += 1;
+        s
+    }
+}
+
+#[inline(always)]
+pub fn memeq(lhs: &[u32], rhs: &[u32]) -> bool {
+    hardened_memeq(lhs, rhs) == HARDENED_BOOL_TRUE
+}
+
+#[inline(never)]
+pub fn hardened_memeq(lhs: &[u32], rhs: &[u32]) -> HardenedBool {
+    let word_len = lhs.len();
+    //assert_eq!(word_len, rhs.len());
+    if word_len != rhs.len() {
+        return HARDENED_BOOL_FALSE;
+    }
+
+    let mut order = RandomOrder::new(word_len as u32);
+
+    let mut count = 0;
+    let expected_count = order.len();
+
+    let lhs_addr = lhs.as_ptr() as usize;
+    let rhs_addr = rhs.as_ptr() as usize;
+
+    // `decoys` is a small stack array that is filled with values with a Hamming weight
+    // of around 16, which is the most common Hamming weight among 32-bit words.
+    //
+    // It is scratch space for us to do "extra" operations, when the number of
+    // iteration indices the chosen random order is different from `word_len`.
+    //
+    // These extra operations also introduce noise that an attacker must do work
+    // to filter, such as by applying side-channel analysis to obtain an address
+    // trace.
+    const DECOYS: usize = 8;
+    let decoys: [u32; DECOYS] = [0xaaaaaaaa; DECOYS];
+    let decoy_addr = decoys.as_ptr() as usize;
+
+    let mut zeros = 0;
+    let mut ones = u32::MAX;
+
+    let byte_len = word_len * core::mem::size_of::<u32>();
+    while count < expected_count {
+        // The order values themselves are in units of words, but we need `byte_idx`
+        // to be in units of bytes.
+        //
+        // The value obtained from `advance()` is laundered to prevent
+        // implementation details from leaking across procedures.
+        let byte_idx = cfi_launder(order.advance()) as usize * core::mem::size_of::<u32>();
+
+        // Prevent the compiler from reordering the loop; this ensures a
+        // happens-before among indices consistent with `order`.
+        barrier(byte_idx as u32);
+
+        // Compute putative offsets into `src`, `dest`, and `decoys`. Some of these
+        // may go off the end of `src` and `dest`, but they will not be cast to
+        // pointers in that case. (Note that casting out-of-range addresses to
+        // pointers is UB.)
+        let ap = lhs_addr + byte_idx;
+        let bp = rhs_addr + byte_idx;
+        let decoy1 = decoy_addr + (byte_idx % core::mem::size_of_val(&decoys));
+        let decoy2 = decoy_addr
+            + ((byte_idx + core::mem::size_of_val(&decoys) / 2) % core::mem::size_of_val(&decoys));
+
+        // Branchlessly select whether to do a "real" comparison or a decoy comparison,
+        // depending on whether we've gone off the end of the array or not.
+        //
+        // Pretty much everything needs to be laundered: we need to launder
+        // `byte_idx` for obvious reasons, and we need to launder the result of the
+        // select, so that the compiler cannot delete the resulting loads and
+        // stores. This is similar to having used `volatile uint32_t *`.
+        let av = if byte_idx < byte_len { ap } else { decoy1 } as *const u32;
+        let bv = if byte_idx < byte_len { bp } else { decoy2 } as *const u32;
+
+        let a = unsafe { ptr::read_volatile(av) };
+        let b = unsafe { ptr::read_volatile(bv) };
+
+        // Launder one of the operands so that the compiler cannot cache the result
+        // of the xor for use in the next operation.
+        //
+        // We launder `zeroes` so that compiler cannot learn that `zeroes` has
+        // strictly more bits set at the end of the loop.
+        zeros = cfi_launder(zeros) | (cfi_launder(a) ^ b);
+
+        // Same as above. The compiler can cache the value of `a[offset]` but it
+        // has no chance to strength-reduce this operation.
+        ones = cfi_launder(ones) & (cfi_launder(a) ^ !b);
+
+        // We need to launder `count` so that the SW.LOOP-COMPLETION check is not
+        // deleted by the compiler.
+        count = cfi_launder(count) + 1;
+    }
+
+    if cfi_launder(zeros) == 0 {
+        cfi_assert_eq(ones, u32::MAX);
+        if ones == u32::MAX {
+            return HARDENED_BOOL_TRUE;
+        }
+    }
+
+    cfi_assert_ne(ones, u32::MAX);
+    HARDENED_BOOL_FALSE
+}
+
+#[allow(asm_sub_register)] // otherwise x86 complains about the no-op asm
+pub fn barrier(val: u32) {
+    if cfg!(feature = "cfi") {
+        unsafe {
+            core::arch::asm!(
+                "/* {t} */",
+                t = in(reg) val,
+            );
+        }
+    }
+}