From 5f965d12c3fdad0b873dc9a786fd7113450ab7bb Mon Sep 17 00:00:00 2001 From: Sahil Bondre Date: Fri, 29 Dec 2023 17:00:45 +0000 Subject: [PATCH] ffdb-006: add Segment implementation --- .../sahilbondre/firefly/model/Segment.java | 131 +++++++++++++ .../firefly/model/SegmentTest.java | 173 ++++++++++++++++++ 2 files changed, 304 insertions(+) create mode 100644 src/main/java/com/sahilbondre/firefly/model/Segment.java create mode 100644 src/test/java/com/sahilbondre/firefly/model/SegmentTest.java diff --git a/src/main/java/com/sahilbondre/firefly/model/Segment.java b/src/main/java/com/sahilbondre/firefly/model/Segment.java new file mode 100644 index 0000000..13b02c0 --- /dev/null +++ b/src/main/java/com/sahilbondre/firefly/model/Segment.java @@ -0,0 +1,131 @@ +package com.sahilbondre.firefly.model; + +public class Segment { + + private static final int CRC_LENGTH = 2; + private static final int KEY_SIZE_LENGTH = 2; + private static final int VALUE_SIZE_LENGTH = 4; + /** + * Class representing a segment of the log file. + *

+ * Two big decisions here to save on performance: + * 1. We're using byte[] instead of ByteBuffer. + * 2. We're trusting that the byte[] is immutable and hence avoiding copying it. + *

+ *

+ * 2 bytes: CRC + * 2 bytes: Key Size + * 4 bytes: Value Size + * n bytes: Key + * m bytes: Value + *

+ * Note: Value size is four bytes because we're using a 32-bit integer to store the size. + * Int is 32-bit signed, so we can only store 2^31 - 1 bytes in the value. + * Hence, the maximum size of the value is 2,147,483,647 bytes or 2.14 GB. + */ + private final byte[] bytes; + + private Segment(byte[] bytes) { + this.bytes = bytes; + } + + public static Segment fromByteArray(byte[] data) { + return new Segment(data); + } + + public static Segment fromKeyValuePair(byte[] key, byte[] value) { + int keySize = key.length; + int valueSize = value.length; + int totalSize = CRC_LENGTH + KEY_SIZE_LENGTH + VALUE_SIZE_LENGTH + keySize + valueSize; + + byte[] segment = new byte[totalSize]; + + // Set key size + segment[2] = (byte) ((keySize >> 8) & 0xFF); + segment[3] = (byte) (keySize & 0xFF); + + // Set value size + segment[4] = (byte) ((valueSize >> 24) & 0xFF); + segment[5] = (byte) ((valueSize >> 16) & 0xFF); + segment[6] = (byte) ((valueSize >> 8) & 0xFF); + segment[7] = (byte) (valueSize & 0xFF); + + System.arraycopy(key, 0, segment, CRC_LENGTH + KEY_SIZE_LENGTH + VALUE_SIZE_LENGTH, keySize); + + System.arraycopy(value, 0, segment, CRC_LENGTH + KEY_SIZE_LENGTH + VALUE_SIZE_LENGTH + keySize, valueSize); + + byte[] crc = new Segment(segment).crc16(); + segment[0] = crc[0]; + segment[1] = crc[1]; + + return new Segment(segment); + } + + public byte[] getBytes() { + return bytes; + } + + public byte[] getKey() { + int keySize = getKeySize(); + return extractBytes(CRC_LENGTH + KEY_SIZE_LENGTH + VALUE_SIZE_LENGTH, keySize); + } + + public byte[] getValue() { + int keySize = getKeySize(); + int valueSize = getValueSize(); + return extractBytes(CRC_LENGTH + KEY_SIZE_LENGTH + VALUE_SIZE_LENGTH + keySize, valueSize); + } + + public int getKeySize() { + return ((bytes[2] & 0xff) << 8) | (bytes[3] & 0xff); + } + + public int getValueSize() { + return ((bytes[4] & 0xff) << 24) | ((bytes[5] & 0xff) << 16) | + ((bytes[6] & 0xff) << 8) | (bytes[7] & 0xff); + } + + public byte[] getCrc() { + return extractBytes(0, CRC_LENGTH); + } + + public boolean isChecksumValid() { + byte[] crc = crc16(); + return crc[0] == bytes[0] && crc[1] == bytes[1]; + } + + public boolean isSegmentValid() { + return isChecksumValid() && getKeySize() > 0 && getValueSize() >= 0 + && bytes.length == CRC_LENGTH + KEY_SIZE_LENGTH + VALUE_SIZE_LENGTH + getKeySize() + getValueSize(); + } + + private byte[] extractBytes(int offset, int length) { + byte[] result = new byte[length]; + System.arraycopy(bytes, offset, result, 0, length); + return result; + } + + private byte[] crc16(byte[] segment) { + int crc = 0xFFFF; // Initial CRC value + int polynomial = 0x1021; // CRC-16 polynomial + + for (int index = CRC_LENGTH; index < segment.length; index++) { + byte b = segment[index]; + crc ^= (b & 0xFF) << 8; + + for (int i = 0; i < 8; i++) { + if ((crc & 0x8000) != 0) { + crc = (crc << 1) ^ polynomial; + } else { + crc <<= 1; + } + } + } + + return new byte[]{(byte) ((crc >> 8) & 0xFF), (byte) (crc & 0xFF)}; + } + + private byte[] crc16() { + return crc16(bytes); + } +} diff --git a/src/test/java/com/sahilbondre/firefly/model/SegmentTest.java b/src/test/java/com/sahilbondre/firefly/model/SegmentTest.java new file mode 100644 index 0000000..effe8a2 --- /dev/null +++ b/src/test/java/com/sahilbondre/firefly/model/SegmentTest.java @@ -0,0 +1,173 @@ +package com.sahilbondre.firefly.model; + +import org.junit.jupiter.api.Test; + +import static org.junit.jupiter.api.Assertions.*; + +class SegmentTest { + + @Test + void givenByteArray_whenCreatingSegment_thenAccessorsReturnCorrectValues() { + // Given + byte[] testData = new byte[]{ + (byte) -83, (byte) 64, + 0x00, 0x05, // Key Size + 0x00, 0x00, 0x00, 0x05, // Value Size + 0x48, 0x65, 0x6C, 0x6C, 0x6F, // Key: "Hello" + 0x57, 0x6F, 0x72, 0x6C, 0x64 // Value: "World" + }; + + // When + Segment segment = Segment.fromByteArray(testData); + + // Then + assertArrayEquals(testData, segment.getBytes()); + assertArrayEquals("Hello".getBytes(), segment.getKey()); + assertArrayEquals("World".getBytes(), segment.getValue()); + assertEquals(5, segment.getKeySize()); + assertEquals(5, segment.getValueSize()); + assertEquals(-83, segment.getCrc()[0]); + assertEquals(64, segment.getCrc()[1]); + assertTrue(segment.isSegmentValid()); + assertTrue(segment.isChecksumValid()); + } + + @Test + void givenCorruptedKeySizeSegment_whenCheckingChecksum_thenIsChecksumValidReturnsFalse() { + // Given + byte[] testData = new byte[]{ + (byte) -83, (byte) 64, + 0x01, 0x45, // Key Size (Bit Flipped) + 0x00, 0x00, 0x00, 0x05, // Value Size + 0x48, 0x65, 0x6C, 0x6C, 0x6F, // Key: "Hello" + 0x57, 0x6F, 0x72, 0x6C, 0x64 // Value: "World" + }; + + // When + Segment corruptedSegment = Segment.fromByteArray(testData); + + // Then + assertFalse(corruptedSegment.isChecksumValid()); + assertFalse(corruptedSegment.isSegmentValid()); + } + + @Test + void givenCorruptedValueSizeSegment_whenCheckingChecksum_thenIsChecksumValidReturnsFalse() { + // Given + byte[] testData = new byte[]{ + (byte) -83, (byte) 64, + 0x00, 0x05, // Key Size + 0x00, 0x00, 0x01, 0x05, // Value Size (Bit Flipped) + 0x48, 0x65, 0x6C, 0x6C, 0x6F, // Key: "Hello" + 0x57, 0x6F, 0x72, 0x6C, 0x64 // Value: "World" + }; + + // When + Segment corruptedSegment = Segment.fromByteArray(testData); + + // Then + assertFalse(corruptedSegment.isChecksumValid()); + assertFalse(corruptedSegment.isSegmentValid()); + } + + @Test + void givenCorruptedKeySegment_whenCheckingChecksum_thenIsChecksumValidReturnsFalse() { + // Given + byte[] testData = new byte[]{ + (byte) -83, (byte) 64, + 0x00, 0x05, // Key Size + 0x00, 0x00, 0x00, 0x05, // Value Size + 0x48, 0x65, 0x6C, 0x6C, 0x6E, // Key: "Hello" (Bit Flipped) + 0x57, 0x6F, 0x72, 0x6C, 0x64 // Value: "World" + }; + + // When + Segment corruptedSegment = Segment.fromByteArray(testData); + + // Then + assertFalse(corruptedSegment.isChecksumValid()); + assertFalse(corruptedSegment.isSegmentValid()); + } + + @Test + void givenCorruptedValueSegment_whenCheckingChecksum_thenIsChecksumValidReturnsFalse() { + // Given + byte[] testData = new byte[]{ + (byte) -83, (byte) 64, + 0x00, 0x05, // Key Size + 0x00, 0x00, 0x00, 0x05, // Value Size + 0x48, 0x65, 0x6C, 0x6C, 0x6F, // Key: "Hello" + 0x57, 0x6F, 0x62, 0x6C, 0x65 // Value: "World" (Bit Flipped) + }; + + // When + Segment corruptedSegment = Segment.fromByteArray(testData); + + // Then + assertFalse(corruptedSegment.isChecksumValid()); + assertFalse(corruptedSegment.isSegmentValid()); + } + + @Test + void givenIncorrectValueLengthSegment_whenCheckingSegmentValid_thenIsSegmentValidReturnsFalse() { + // Given + byte[] testData = new byte[]{ + (byte) -43, (byte) -70, + 0x00, 0x05, // Key Size + 0x00, 0x00, 0x00, 0x06, // Value Size (Incorrect) + 0x48, 0x65, 0x6C, 0x6C, 0x6F, // Key: "Hello" + 0x57, 0x6F, 0x72, 0x6C, 0x64 // Value: "World" + }; + + // When + Segment corruptedSegment = Segment.fromByteArray(testData); + + // Then + assertTrue(corruptedSegment.isChecksumValid()); + assertFalse(corruptedSegment.isSegmentValid()); + } + + @Test + void givenKeyValuePair_whenCreatingSegment_thenAccessorsReturnCorrectValues() { + // Given + byte[] key = "Hello".getBytes(); + byte[] value = "World".getBytes(); + byte[] expectedSegment = new byte[]{ + (byte) -83, (byte) 64, + 0x00, 0x05, // Key Size + 0x00, 0x00, 0x00, 0x05, // Value Size + 0x48, 0x65, 0x6C, 0x6C, 0x6F, // Key: "Hello" + 0x57, 0x6F, 0x72, 0x6C, 0x64 // Value: "World" + }; + + // When + Segment segment = Segment.fromKeyValuePair(key, value); + + // Then + assertArrayEquals("Hello".getBytes(), segment.getKey()); + assertArrayEquals("World".getBytes(), segment.getValue()); + assertEquals(5, segment.getKeySize()); + assertEquals(5, segment.getValueSize()); + assertEquals(-83, segment.getCrc()[0]); + assertEquals(64, segment.getCrc()[1]); + assertTrue(segment.isSegmentValid()); + assertTrue(segment.isChecksumValid()); + assertArrayEquals(expectedSegment, segment.getBytes()); + } + + @Test + void givenKeyAndValue_whenCreatingSegment_thenSegmentIsCreatedWithCorrectSizes() { + // Given + byte[] key = "Hello".getBytes(); + byte[] value = "World".getBytes(); + + // When + Segment segment = Segment.fromKeyValuePair(key, value); + + // Then + assertArrayEquals(key, segment.getKey()); + assertArrayEquals(value, segment.getValue()); + assertEquals(key.length, segment.getKeySize()); + assertEquals(value.length, segment.getValueSize()); + } +}